{"id":"https://openalex.org/W4391021790","doi":"https://doi.org/10.1109/asru57964.2023.10389677","title":"Consistency Based Unsupervised Self-Training for ASR Personalisation","display_name":"Consistency Based Unsupervised Self-Training for ASR Personalisation","publication_year":2023,"publication_date":"2023-12-16","ids":{"openalex":"https://openalex.org/W4391021790","doi":"https://doi.org/10.1109/asru57964.2023.10389677"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru57964.2023.10389677","pdf_url":null,"source":{"id":"https://openalex.org/S4363606113","display_name":"2021 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2401.12085","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008123626","display_name":"Jisi Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210117523","display_name":"Samsung (United Kingdom)","ror":"https://ror.org/01w6gjq94","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210117523"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Jisi Zhang","raw_affiliation_strings":["Samsung Research UK, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Samsung Research UK, United Kingdom","institution_ids":["https://openalex.org/I4210117523"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071287333","display_name":"Vandana Rajan","orcid":"https://orcid.org/0000-0002-2250-1688"},"institutions":[{"id":"https://openalex.org/I4210117523","display_name":"Samsung (United Kingdom)","ror":"https://ror.org/01w6gjq94","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210117523"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Vandana Rajan","raw_affiliation_strings":["Samsung Research UK, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Samsung Research UK, United Kingdom","institution_ids":["https://openalex.org/I4210117523"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063935505","display_name":"Haaris Mehmood","orcid":null},"institutions":[{"id":"https://openalex.org/I4210117523","display_name":"Samsung (United Kingdom)","ror":"https://ror.org/01w6gjq94","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210117523"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Haaris Mehmood","raw_affiliation_strings":["Samsung Research UK, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Samsung Research UK, United Kingdom","institution_ids":["https://openalex.org/I4210117523"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030185505","display_name":"David Tuckey","orcid":null},"institutions":[{"id":"https://openalex.org/I4210117523","display_name":"Samsung (United Kingdom)","ror":"https://ror.org/01w6gjq94","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210117523"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"David Tuckey","raw_affiliation_strings":["Samsung Research UK, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Samsung Research UK, United Kingdom","institution_ids":["https://openalex.org/I4210117523"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060097629","display_name":"Pablo Peso Parada","orcid":null},"institutions":[{"id":"https://openalex.org/I4210117523","display_name":"Samsung (United Kingdom)","ror":"https://ror.org/01w6gjq94","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210117523"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Pablo Peso Parada","raw_affiliation_strings":["Samsung Research UK, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Samsung Research UK, United Kingdom","institution_ids":["https://openalex.org/I4210117523"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113981675","display_name":"Md Asif Jalal","orcid":null},"institutions":[{"id":"https://openalex.org/I4210117523","display_name":"Samsung (United Kingdom)","ror":"https://ror.org/01w6gjq94","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210117523"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Md Asif Jalal","raw_affiliation_strings":["Samsung Research UK, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Samsung Research UK, United Kingdom","institution_ids":["https://openalex.org/I4210117523"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104088631","display_name":"Karthikeyan Saravanan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210117523","display_name":"Samsung (United Kingdom)","ror":"https://ror.org/01w6gjq94","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210117523"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Karthikeyan Saravanan","raw_affiliation_strings":["Samsung Research UK, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Samsung Research UK, United Kingdom","institution_ids":["https://openalex.org/I4210117523"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114121755","display_name":"Gil Ho Lee","orcid":null},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Gil Ho Lee","raw_affiliation_strings":["AI R&D Group, Samsung Electronics,Suwon,South Korea"],"affiliations":[{"raw_affiliation_string":"AI R&D Group, Samsung Electronics,Suwon,South Korea","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004902602","display_name":"Jungin Lee","orcid":"https://orcid.org/0000-0003-0390-119X"},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jungin Lee","raw_affiliation_strings":["AI R&D Group, Samsung Electronics,Suwon,South Korea"],"affiliations":[{"raw_affiliation_string":"AI R&D Group, Samsung Electronics,Suwon,South Korea","institution_ids":["https://openalex.org/I2250650973"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057180394","display_name":"Seokyeong Jung","orcid":null},"institutions":[{"id":"https://openalex.org/I2250650973","display_name":"Samsung (South Korea)","ror":"https://ror.org/04w3jy968","country_code":"KR","type":"company","lineage":["https://openalex.org/I2250650973"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Seokyeong Jung","raw_affiliation_strings":["AI R&D Group, Samsung Electronics,Suwon,South Korea"],"affiliations":[{"raw_affiliation_string":"AI R&D Group, Samsung Electronics,Suwon,South Korea","institution_ids":["https://openalex.org/I2250650973"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":67},"biblio":{"volume":"33","issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9913,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9906,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7406691},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.6634258},{"id":"https://openalex.org/C183003079","wikidata":"https://www.wikidata.org/wiki/Q1000371","display_name":"Personalization","level":2,"score":0.63604295},{"id":"https://openalex.org/C8038995","wikidata":"https://www.wikidata.org/wiki/Q1152135","display_name":"Unsupervised learning","level":2,"score":0.47878158},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4414489},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.15195099}],"mesh":[],"locations_count":2,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru57964.2023.10389677","pdf_url":null,"source":{"id":"https://openalex.org/S4363606113","display_name":"2021 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2401.12085","pdf_url":"http://arxiv.org/pdf/2401.12085","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2401.12085","pdf_url":"http://arxiv.org/pdf/2401.12085","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":33,"referenced_works":["https://openalex.org/W1494198834","https://openalex.org/W1795658042","https://openalex.org/W1828163288","https://openalex.org/W1904365287","https://openalex.org/W2296167893","https://openalex.org/W2431080869","https://openalex.org/W2641129314","https://openalex.org/W2799674897","https://openalex.org/W2889374926","https://openalex.org/W2936774411","https://openalex.org/W2973051376","https://openalex.org/W2990138404","https://openalex.org/W3008008574","https://openalex.org/W3015995734","https://openalex.org/W3026041220","https://openalex.org/W3034218934","https://openalex.org/W3094721881","https://openalex.org/W3096273170","https://openalex.org/W3097777922","https://openalex.org/W3112702554","https://openalex.org/W3125118953","https://openalex.org/W3162638900","https://openalex.org/W3163169798","https://openalex.org/W3194334755","https://openalex.org/W3206798603","https://openalex.org/W4221153728","https://openalex.org/W4283654390","https://openalex.org/W4296069270","https://openalex.org/W4297841489","https://openalex.org/W4319862444","https://openalex.org/W4322731129","https://openalex.org/W4372266975","https://openalex.org/W4385823503"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W4391210591","https://openalex.org/W3172493050","https://openalex.org/W2748952813","https://openalex.org/W2466832359","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2109940557","https://openalex.org/W1582019636","https://openalex.org/W1499005795"],"abstract_inverted_index":{"On-device":[0],"Automatic":[1],"Speech":[2],"Recognition":[3],"(ASR)":[4],"models":[5],"trained":[6],"on":[7,118,124],"speech":[8],"data":[9,30,55,69,76,82,121,126],"of":[10,62,87,116],"a":[11,25,48,98,109,129],"large":[12],"population":[13],"might":[14],"underperform":[15],"for":[16,70],"individuals":[17],"unseen":[18],"during":[19],"training.":[20],"This":[21,91],"is":[22,47,77],"due":[23,79],"to":[24,52,56,80,128],"domain":[26],"shift":[27],"between":[28],"user":[29,54,68],"and":[31,41,84,122,132],"the":[32,134],"original":[33],"training":[34,102,120],"data,":[35],"differed":[36],"by":[37,96],"user's":[38],"speaking":[39],"characteristics":[40],"environmental":[42],"acoustic":[43],"conditions.":[44],"ASR":[45,63],"personalisation":[46,64,95],"solution":[49],"that":[50],"aims":[51],"exploit":[53],"improve":[57],"model":[58],"robustness.":[59],"The":[60],"majority":[61],"methods":[65],"assume":[66],"labelled":[67,75],"supervision.":[71],"Personalisation":[72],"without":[73],"any":[74],"challenging":[78],"limited":[81],"size":[83],"poor":[85],"quality":[86],"recorded":[88],"audio":[89],"samples.":[90],"work":[92],"addresses":[93],"unsupervised":[94],"developing":[97],"novel":[99],"consistency":[100],"based":[101],"method":[103,107],"via":[104],"pseudo-labelling.":[105],"Our":[106],"achieves":[108],"relative":[110],"Word":[111],"Error":[112],"Rate":[113],"Reduction":[114],"(WERR)":[115],"17.3%":[117],"unlabelled":[119],"8.1%":[123],"held-out":[125],"compared":[127],"pre-trained":[130],"model,":[131],"outperforms":[133],"current":[135],"state-of-the":[136],"art":[137],"methods.":[138]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4391021790","counts_by_year":[],"updated_date":"2025-01-04T13:16:34.485839","created_date":"2024-01-20"}