{"id":"https://openalex.org/W3095903821","doi":"https://doi.org/10.21437/interspeech.2020-2919","title":"Lattice-Free Maximum Mutual Information Training of Multilingual Speech Recognition Systems","display_name":"Lattice-Free Maximum Mutual Information Training of Multilingual Speech Recognition Systems","publication_year":2020,"publication_date":"2020-10-25","ids":{"openalex":"https://openalex.org/W3095903821","doi":"https://doi.org/10.21437/interspeech.2020-2919","mag":"3095903821"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2020-2919","pdf_url":null,"source":{"id":"https://openalex.org/S4363604309","display_name":"Interspeech 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084521938","display_name":"Srikanth Madikeri","orcid":"https://orcid.org/0000-0002-4361-784X"},"institutions":[{"id":"https://openalex.org/I7495430","display_name":"Idiap Research Institute","ror":"https://ror.org/05932h694","country_code":"CH","type":"facility","lineage":["https://openalex.org/I7495430"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Srikanth Madikeri","raw_affiliation_strings":["Idiap Research Institute, Martigny, Switzerland"],"affiliations":[{"raw_affiliation_string":"Idiap Research Institute, Martigny, Switzerland","institution_ids":["https://openalex.org/I7495430"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076301534","display_name":"Banriskhem K. Khonglah","orcid":null},"institutions":[{"id":"https://openalex.org/I7495430","display_name":"Idiap Research Institute","ror":"https://ror.org/05932h694","country_code":"CH","type":"facility","lineage":["https://openalex.org/I7495430"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Banriskhem K. Khonglah","raw_affiliation_strings":["Idiap Research Institute, Martigny, Switzerland"],"affiliations":[{"raw_affiliation_string":"Idiap Research Institute, Martigny, Switzerland","institution_ids":["https://openalex.org/I7495430"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077304441","display_name":"Sibo Tong","orcid":null},"institutions":[{"id":"https://openalex.org/I7495430","display_name":"Idiap Research Institute","ror":"https://ror.org/05932h694","country_code":"CH","type":"facility","lineage":["https://openalex.org/I7495430"]},{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"funder","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Sibo Tong","raw_affiliation_strings":["Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Switzerland","Idiap Research Institute, Martigny, Switzerland"],"affiliations":[{"raw_affiliation_string":"Idiap Research Institute, Martigny, Switzerland","institution_ids":["https://openalex.org/I7495430"]},{"raw_affiliation_string":"Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Switzerland","institution_ids":["https://openalex.org/I5124864"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076409146","display_name":"Petr Motl\u00ed\u010dek","orcid":"https://orcid.org/0000-0001-6467-1119"},"institutions":[{"id":"https://openalex.org/I7495430","display_name":"Idiap Research Institute","ror":"https://ror.org/05932h694","country_code":"CH","type":"facility","lineage":["https://openalex.org/I7495430"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Petr Motlicek","raw_affiliation_strings":["Idiap Research Institute, Martigny, Switzerland"],"affiliations":[{"raw_affiliation_string":"Idiap Research Institute, Martigny, Switzerland","institution_ids":["https://openalex.org/I7495430"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108187466","display_name":"Herv\u00e9 Bourlard","orcid":null},"institutions":[{"id":"https://openalex.org/I7495430","display_name":"Idiap Research Institute","ror":"https://ror.org/05932h694","country_code":"CH","type":"facility","lineage":["https://openalex.org/I7495430"]},{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"funder","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Herv\u00e9 Bourlard","raw_affiliation_strings":["Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Switzerland","Idiap Research Institute, Martigny, Switzerland"],"affiliations":[{"raw_affiliation_string":"Idiap Research Institute, Martigny, Switzerland","institution_ids":["https://openalex.org/I7495430"]},{"raw_affiliation_string":"Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Switzerland","institution_ids":["https://openalex.org/I5124864"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5084286453","display_name":"Daniel Povey","orcid":"https://orcid.org/0000-0002-0611-3634"},"institutions":[{"id":"https://openalex.org/I862669128","display_name":"Xiaomi (China)","ror":"https://ror.org/029f7bn57","country_code":"CN","type":"company","lineage":["https://openalex.org/I862669128"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Daniel Povey","raw_affiliation_strings":["Xiaomi Technology, China"],"affiliations":[{"raw_affiliation_string":"Xiaomi Technology, China","institution_ids":["https://openalex.org/I862669128"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.753,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":10,"citation_normalized_percentile":{"value":0.707884,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":85,"max":86},"biblio":{"volume":null,"issue":null,"first_page":"4746","last_page":"4750"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9988,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9946,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/extractor","display_name":"Extractor","score":0.5863408},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.5351269},{"id":"https://openalex.org/keywords/sequence-labeling","display_name":"Sequence labeling","score":0.4457185}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8016794},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.71575356},{"id":"https://openalex.org/C152139883","wikidata":"https://www.wikidata.org/wiki/Q252973","display_name":"Mutual information","level":2,"score":0.6742983},{"id":"https://openalex.org/C117978034","wikidata":"https://www.wikidata.org/wiki/Q5422192","display_name":"Extractor","level":2,"score":0.5863408},{"id":"https://openalex.org/C155635449","wikidata":"https://www.wikidata.org/wiki/Q4674699","display_name":"Acoustic model","level":3,"score":0.5684196},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.5351269},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.53034294},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5055175},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48166287},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.452638},{"id":"https://openalex.org/C35639132","wikidata":"https://www.wikidata.org/wiki/Q7452468","display_name":"Sequence labeling","level":3,"score":0.4457185},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.42022339},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.25443208},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.13526362},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.13305643},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.10919982},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C21880701","wikidata":"https://www.wikidata.org/wiki/Q2144042","display_name":"Process engineering","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2020-2919","pdf_url":null,"source":{"id":"https://openalex.org/S4363604309","display_name":"Interspeech 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":25,"referenced_works":["https://openalex.org/W1524333225","https://openalex.org/W1892788530","https://openalex.org/W1970890968","https://openalex.org/W1975550806","https://openalex.org/W1994606281","https://openalex.org/W2025198378","https://openalex.org/W2038810952","https://openalex.org/W2091746061","https://openalex.org/W2106440210","https://openalex.org/W2114016253","https://openalex.org/W2123798005","https://openalex.org/W2131342762","https://openalex.org/W2146168991","https://openalex.org/W2147590749","https://openalex.org/W2397721308","https://openalex.org/W2402146185","https://openalex.org/W2514741789","https://openalex.org/W2586412610","https://openalex.org/W2726599793","https://openalex.org/W2808939837","https://openalex.org/W2889282842","https://openalex.org/W2890843555","https://openalex.org/W2891816510","https://openalex.org/W2936547119","https://openalex.org/W4289329396"],"related_works":["https://openalex.org/W4386794561","https://openalex.org/W4205820553","https://openalex.org/W3116273293","https://openalex.org/W3021690593","https://openalex.org/W2916997151","https://openalex.org/W2781555308","https://openalex.org/W2251441308","https://openalex.org/W2163537793","https://openalex.org/W2126322296","https://openalex.org/W2125343999"],"abstract_inverted_index":{"Multilingual":[0],"acoustic":[1,62,85,105],"model":[2,55,74,86,106],"training":[3,21,33],"combines":[4],"data":[5,22],"from":[6,64],"multiple":[7],"languages":[8,66],"to":[9,51,59,82,101,123,144,152],"train":[10,52,83,102],"an":[11,84],"automatic":[12],"speech":[13,168],"recognition":[14,169],"system.Such":[15],"a":[16,24,42,53,69,79,98,108,163],"system":[17],"is":[18,27,58,75,121,130,159],"beneficial":[19],"when":[20,150],"for":[23,87,112],"target":[25,89],"language":[26,90],"limited.Lattice-Free":[28],"Maximum":[29],"Mutual":[30],"Information":[31],"(LF-MMI)":[32],"performs":[34],"sequence":[35],"discrimination":[36],"by":[37],"introducing":[38],"competing":[39],"hypotheses":[40],"through":[41],"denominator":[43,71,119],"graph":[44],"in":[45,146],"the":[46,61,88,103,113,125,153,166],"cost":[47,126],"function.The":[48,127],"standard":[49],"approach":[50,100,129],"multilingual":[54,104,134],"with":[56],"LF-MMI":[57,114,156],"combine":[60],"units":[63],"all":[65],"and":[67,139],"use":[68],"common":[70],"graph.The":[72],"resulting":[73],"either":[76],"used":[77,122],"as":[78,162],"feature":[80],"extractor":[81],"or":[91],"directly":[92],"fine-tuned.In":[93],"this":[94],"work,":[95],"we":[96],"propose":[97],"scalable":[99],"using":[107,137],"typical":[109,133],"multitask":[110],"network":[111],"framework.A":[115],"set":[116],"of":[117,165],"language-dependent":[118],"graphs":[120],"compute":[124],"proposed":[128],"evaluated":[131],"under":[132],"ASR":[135],"tasks":[136],"GlobalPhone":[138],"BABEL":[140],"datasets.Relative":[141],"improvements":[142],"up":[143],"13.2%":[145],"WER":[147],"are":[148],"obtained":[149],"compared":[151],"corresponding":[154],"monolingual":[155],"baselines.The":[157],"implementation":[158],"made":[160],"available":[161],"part":[164],"Kaldi":[167],"toolkit.":[170]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W3095903821","counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":2}],"updated_date":"2025-04-16T12:59:49.607298","created_date":"2020-11-09"}