{"id":"https://openalex.org/W4391158951","doi":"https://doi.org/10.48550/arxiv.2401.12085","title":"Consistency Based Unsupervised Self-training For ASR Personalisation","display_name":"Consistency Based Unsupervised Self-training For ASR Personalisation","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4391158951","doi":"https://doi.org/10.48550/arxiv.2401.12085"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2401.12085","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2401.12085","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008123626","display_name":"Jisi Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Jisi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071287333","display_name":"Vandana Rajan","orcid":"https://orcid.org/0000-0002-2250-1688"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rajan, Vandana","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063935505","display_name":"Haaris Mehmood","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mehmood, Haaris","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030185505","display_name":"David Tuckey","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tuckey, David","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060097629","display_name":"Pablo Peso Parada","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Parada, Pablo Peso","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113981675","display_name":"Md Asif Jalal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jalal, Md Asif","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104088631","display_name":"Karthikeyan Saravanan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Saravanan, Karthikeyan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114121755","display_name":"Gil Ho Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Gil Ho","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004902602","display_name":"Jungin Lee","orcid":"https://orcid.org/0000-0003-0390-119X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Jungin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5057180394","display_name":"Seokyeong Jung","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jung, Seokyeong","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":84},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9971,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9954,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness","score":0.65440786},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.54184},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.49680236}],"concepts":[{"id":"https://openalex.org/C183003079","wikidata":"https://www.wikidata.org/wiki/Q1000371","display_name":"Personalization","level":2,"score":0.87038314},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.73034996},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.65440786},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.57610095},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.54184},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.49680236},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.4879579},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.45643437},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42246813},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.4197095},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3535934},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.10933587},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2401.12085","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2401.12085","pdf_url":"http://arxiv.org/pdf/2401.12085","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2401.12085","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2401.12085","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4312814274","https://openalex.org/W4285370786","https://openalex.org/W3207760230","https://openalex.org/W2536018345","https://openalex.org/W2296488620","https://openalex.org/W2146197305","https://openalex.org/W2134950286","https://openalex.org/W17155033","https://openalex.org/W1590307681","https://openalex.org/W1496222301"],"abstract_inverted_index":{"On-device":[0],"Automatic":[1],"Speech":[2],"Recognition":[3],"(ASR)":[4],"models":[5],"trained":[6],"on":[7,118,124],"speech":[8],"data":[9,30,55,69,76,82,121,126],"of":[10,62,87,116],"a":[11,25,48,98,109,129],"large":[12],"population":[13],"might":[14],"underperform":[15],"for":[16,70],"individuals":[17],"unseen":[18],"during":[19],"training.":[20],"This":[21,91],"is":[22,47,77],"due":[23,79],"to":[24,52,56,80,128],"domain":[26],"shift":[27],"between":[28],"user":[29,54,68],"and":[31,41,84,122,132],"the":[32,134],"original":[33],"training":[34,102,120],"data,":[35],"differed":[36],"by":[37,96],"user's":[38],"speaking":[39],"characteristics":[40],"environmental":[42],"acoustic":[43],"conditions.":[44],"ASR":[45,63],"personalisation":[46,64,95],"solution":[49],"that":[50],"aims":[51],"exploit":[53],"improve":[57],"model":[58],"robustness.":[59],"The":[60],"majority":[61],"methods":[65],"assume":[66],"labelled":[67,75],"supervision.":[71],"Personalisation":[72],"without":[73],"any":[74],"challenging":[78],"limited":[81],"size":[83],"poor":[85],"quality":[86],"recorded":[88],"audio":[89],"samples.":[90],"work":[92],"addresses":[93],"unsupervised":[94],"developing":[97],"novel":[99],"consistency":[100],"based":[101],"method":[103,107],"via":[104],"pseudo-labelling.":[105],"Our":[106],"achieves":[108],"relative":[110],"Word":[111],"Error":[112],"Rate":[113],"Reduction":[114],"(WERR)":[115],"17.3%":[117],"unlabelled":[119],"8.1%":[123],"held-out":[125],"compared":[127],"pre-trained":[130],"model,":[131],"outperforms":[133],"current":[135],"state-of-the":[136],"art":[137],"methods.":[138]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4391158951","counts_by_year":[],"updated_date":"2024-12-15T14:21:04.263413","created_date":"2024-01-24"}