{"id":"https://openalex.org/W4385895585","doi":"https://doi.org/10.21437/interspeech.2023-1050","title":"Unsupervised Code-switched Text Generation from Parallel Text","display_name":"Unsupervised Code-switched Text Generation from Parallel Text","publication_year":2023,"publication_date":"2023-08-14","ids":{"openalex":"https://openalex.org/W4385895585","doi":"https://doi.org/10.21437/interspeech.2023-1050"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2023-1050","pdf_url":null,"source":{"id":"https://openalex.org/S4363604309","display_name":"Interspeech 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://www.research.ed.ac.uk/files/370167176/Unsupervised_Code_switched_CHI_DOA17052023_AFV_CC_BY.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086425896","display_name":"Jie Chi","orcid":null},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Jie Chi","raw_affiliation_strings":["Centre for Speech Technology Research, University of Edinburgh"],"affiliations":[{"raw_affiliation_string":"Centre for Speech Technology Research, University of Edinburgh","institution_ids":["https://openalex.org/I98677209"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108923519","display_name":"Brian Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I145311948","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95","country_code":"US","type":"education","lineage":["https://openalex.org/I145311948"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Brian Lu","raw_affiliation_strings":["Center for Language and Speech Processing, Johns Hopkins University"],"affiliations":[{"raw_affiliation_string":"Center for Language and Speech Processing, Johns Hopkins University","institution_ids":["https://openalex.org/I145311948"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052467896","display_name":"Jason Eisner","orcid":null},"institutions":[{"id":"https://openalex.org/I145311948","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95","country_code":"US","type":"education","lineage":["https://openalex.org/I145311948"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jason Eisner","raw_affiliation_strings":["Center for Language and Speech Processing, Johns Hopkins University"],"affiliations":[{"raw_affiliation_string":"Center for Language and Speech Processing, Johns Hopkins University","institution_ids":["https://openalex.org/I145311948"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110121346","display_name":"Peter M. Bell","orcid":null},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Peter Bell","raw_affiliation_strings":["Centre for Speech Technology Research, University of Edinburgh"],"affiliations":[{"raw_affiliation_string":"Centre for Speech Technology Research, University of Edinburgh","institution_ids":["https://openalex.org/I98677209"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036738038","display_name":"Preethi Jyothi","orcid":null},"institutions":[{"id":"https://openalex.org/I162827531","display_name":"Indian Institute of Technology Bombay","ror":"https://ror.org/02qyf5152","country_code":"IN","type":"education","lineage":["https://openalex.org/I162827531"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Preethi Jyothi","raw_affiliation_strings":["Department of Computer Science, Indian Institute of Technology Bombay"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Indian Institute of Technology Bombay","institution_ids":["https://openalex.org/I162827531"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100693435","display_name":"Ahmed Ali","orcid":"https://orcid.org/0000-0002-9186-7544"},"institutions":[],"countries":["QA"],"is_corresponding":false,"raw_author_name":"Ahmed M. Ali","raw_affiliation_strings":["Qatar Computing Research Institute, HBKU, Qatar"],"affiliations":[{"raw_affiliation_string":"Qatar Computing Research Institute, HBKU, Qatar","institution_ids":[]}]}],"institution_assertions":[],"countries_distinct_count":4,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5086425896"],"corresponding_institution_ids":["https://openalex.org/I98677209"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":68},"biblio":{"volume":null,"issue":null,"first_page":"1419","last_page":"1423"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9992,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9992,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9989,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.998,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.61135995},{"id":"https://openalex.org/keywords/mandarin-chinese","display_name":"Mandarin Chinese","score":0.5381343},{"id":"https://openalex.org/keywords/forcing","display_name":"Forcing (mathematics)","score":0.4245038}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.81816727},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.61135995},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.60608846},{"id":"https://openalex.org/C138954614","wikidata":"https://www.wikidata.org/wiki/Q9192","display_name":"Mandarin Chinese","level":2,"score":0.5381343},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5053816},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.45686245},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.45123535},{"id":"https://openalex.org/C197115733","wikidata":"https://www.wikidata.org/wiki/Q1003136","display_name":"Forcing (mathematics)","level":2,"score":0.4245038},{"id":"https://openalex.org/C18552078","wikidata":"https://www.wikidata.org/wiki/Q255615","display_name":"Code-switching","level":2,"score":0.42105773},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.20624506},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.13781708},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0},{"id":"https://openalex.org/C49204034","wikidata":"https://www.wikidata.org/wiki/Q52139","display_name":"Climatology","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2023-1050","pdf_url":null,"source":{"id":"https://openalex.org/S4363604309","display_name":"Interspeech 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"https://www.research.ed.ac.uk/en/publications/171128de-62cf-4da4-9885-cc26b53e4d26","pdf_url":"https://www.research.ed.ac.uk/files/370167176/Unsupervised_Code_switched_CHI_DOA17052023_AFV_CC_BY.pdf","source":{"id":"https://openalex.org/S4306400320","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":["University of Edinburgh"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"acceptedVersion","is_accepted":true,"is_published":false},{"is_oa":true,"landing_page_url":"https://www.pure.ed.ac.uk/ws/files/370167176/Unsupervised_Code_switched_CHI_DOA17052023_AFV_CC_BY.pdf","pdf_url":"https://www.pure.ed.ac.uk/ws/files/370167176/Unsupervised_Code_switched_CHI_DOA17052023_AFV_CC_BY.pdf","source":{"id":"https://openalex.org/S4306400321","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":["University of Edinburgh"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"acceptedVersion","is_accepted":true,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://www.research.ed.ac.uk/en/publications/171128de-62cf-4da4-9885-cc26b53e4d26","pdf_url":"https://www.research.ed.ac.uk/files/370167176/Unsupervised_Code_switched_CHI_DOA17052023_AFV_CC_BY.pdf","source":{"id":"https://openalex.org/S4306400320","display_name":"Edinburgh Research Explorer (University of Edinburgh)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98677209","host_organization_name":"University of Edinburgh","host_organization_lineage":["https://openalex.org/I98677209"],"host_organization_lineage_names":["University of Edinburgh"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"acceptedVersion","is_accepted":true,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":29,"referenced_works":["https://openalex.org/W197277712","https://openalex.org/W2038116248","https://openalex.org/W2075201173","https://openalex.org/W2126725946","https://openalex.org/W2252095989","https://openalex.org/W2262393948","https://openalex.org/W2550821151","https://openalex.org/W2798348125","https://openalex.org/W2883989418","https://openalex.org/W2884096449","https://openalex.org/W2963084773","https://openalex.org/W2963242190","https://openalex.org/W2963257891","https://openalex.org/W2964029788","https://openalex.org/W2966263504","https://openalex.org/W2972417954","https://openalex.org/W2972702443","https://openalex.org/W2973082572","https://openalex.org/W2973730088","https://openalex.org/W3035547806","https://openalex.org/W3096615836","https://openalex.org/W3097634649","https://openalex.org/W3100155399","https://openalex.org/W3101648800","https://openalex.org/W3104723404","https://openalex.org/W3122044994","https://openalex.org/W3197295304","https://openalex.org/W4225308107","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W2990005675","https://openalex.org/W2394766824","https://openalex.org/W2393726922","https://openalex.org/W2386292991","https://openalex.org/W2374317326","https://openalex.org/W2366752344","https://openalex.org/W2364440891","https://openalex.org/W2361574037","https://openalex.org/W2078713291","https://openalex.org/W1603321096"],"abstract_inverted_index":{"There":[0],"has":[1],"been":[2,62],"great":[3],"interest":[4],"in":[5,31,54],"developing":[6],"automatic":[7],"speech":[8,17],"recognition":[9],"(ASR)":[10],"systems":[11],"that":[12,95,111],"can":[13],"handle":[14],"code-switched":[15],"(CS)":[16],"to":[18,37,45,64,101],"meet":[19],"the":[20,46,55,72,114],"needs":[21],"of":[22,48,74,89,117],"a":[23,57,86,91],"growing":[24],"bilingual":[25],"population.However,":[26],"existing":[27],"datasets":[28],"are":[29,80],"limited":[30],"size.It":[32],"is":[33],"expensive":[34],"and":[35,50,121],"difficult":[36],"collect":[38],"real":[39],"transcribed":[40],"spoken":[41],"CS":[42,52,67,75,103,125,131],"data":[43,53,76,100],"due":[44],"challenges":[47],"finding":[49],"identifying":[51],"wild.As":[56],"result,":[58],"many":[59],"attempts":[60],"have":[61],"made":[63],"generate":[65,102],"synthetic":[66],"data.Existing":[68],"methods":[69],"either":[70],"require":[71],"existence":[73],"during":[77],"training,":[78],"or":[79],"driven":[81],"by":[82],"linguistic":[83],"knowledge.We":[84],"introduce":[85],"novel":[87],"approach":[88],"forcing":[90],"multilingual":[92],"MT":[93],"system":[94],"was":[96],"trained":[97],"on":[98],"non-CS":[99],"translations.Comparing":[104],"against":[105],"two":[106,118],"prior":[107],"methods,":[108],"we":[109],"show":[110],"simply":[112],"leveraging":[113],"shared":[115],"representations":[116],"languages":[119],"(Mandarin":[120],"English)":[122],"yields":[123],"better":[124,130],"text":[126],"generation":[127],"and,":[128],"ultimately,":[129],"ASR.":[132]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4385895585","counts_by_year":[],"updated_date":"2024-12-15T17:15:31.805032","created_date":"2023-08-18"}