{"id":"https://openalex.org/W4392903597","doi":"https://doi.org/10.1109/icassp48485.2024.10445934","title":"Probability-Aware Word-Confusion-Network-To-Text Alignment Approach for Intent Classification","display_name":"Probability-Aware Word-Confusion-Network-To-Text Alignment Approach for Intent Classification","publication_year":2024,"publication_date":"2024-03-18","ids":{"openalex":"https://openalex.org/W4392903597","doi":"https://doi.org/10.1109/icassp48485.2024.10445934"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10445934","pdf_url":null,"source":{"id":"https://openalex.org/S4363607702","display_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":"https://doi.org/10.1109/icassp48485.2024.10445934","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075765823","display_name":"Esa\u00fa Villatoro-Tello","orcid":"https://orcid.org/0000-0002-1322-0358"},"institutions":[{"id":"https://openalex.org/I7495430","display_name":"Idiap Research Institute","ror":"https://ror.org/05932h694","country_code":"CH","type":"facility","lineage":["https://openalex.org/I7495430"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Esa\u00fa Villatoro-Tello","raw_affiliation_strings":["Idiap Research Institute, Martigny, Switzerland"],"affiliations":[{"raw_affiliation_string":"Idiap Research Institute, Martigny, Switzerland","institution_ids":["https://openalex.org/I7495430"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084521938","display_name":"Srikanth Madikeri","orcid":"https://orcid.org/0000-0002-4361-784X"},"institutions":[{"id":"https://openalex.org/I7495430","display_name":"Idiap Research Institute","ror":"https://ror.org/05932h694","country_code":"CH","type":"facility","lineage":["https://openalex.org/I7495430"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Srikanth Madikeri","raw_affiliation_strings":["Idiap Research Institute, Martigny, Switzerland"],"affiliations":[{"raw_affiliation_string":"Idiap Research Institute, Martigny, Switzerland","institution_ids":["https://openalex.org/I7495430"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067433878","display_name":"Bidisha Sharma","orcid":"https://orcid.org/0000-0002-4195-3532"},"institutions":[],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bidisha Sharma","raw_affiliation_strings":["Uniphore Software Systems Inc., Palo Alto, CA, USA"],"affiliations":[{"raw_affiliation_string":"Uniphore Software Systems Inc., Palo Alto, CA, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027738812","display_name":"Driss Khalil","orcid":null},"institutions":[{"id":"https://openalex.org/I7495430","display_name":"Idiap Research Institute","ror":"https://ror.org/05932h694","country_code":"CH","type":"facility","lineage":["https://openalex.org/I7495430"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Driss Khalil","raw_affiliation_strings":["Idiap Research Institute, Martigny, Switzerland"],"affiliations":[{"raw_affiliation_string":"Idiap Research Institute, Martigny, Switzerland","institution_ids":["https://openalex.org/I7495430"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107893868","display_name":"Shashi Kumar","orcid":null},"institutions":[{"id":"https://openalex.org/I7495430","display_name":"Idiap Research Institute","ror":"https://ror.org/05932h694","country_code":"CH","type":"facility","lineage":["https://openalex.org/I7495430"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Shashi Kumar","raw_affiliation_strings":["Idiap Research Institute, Martigny, Switzerland"],"affiliations":[{"raw_affiliation_string":"Idiap Research Institute, Martigny, Switzerland","institution_ids":["https://openalex.org/I7495430"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021226188","display_name":"Iuliia Nigmatulina","orcid":"https://orcid.org/0000-0002-5111-1873"},"institutions":[{"id":"https://openalex.org/I7495430","display_name":"Idiap Research Institute","ror":"https://ror.org/05932h694","country_code":"CH","type":"facility","lineage":["https://openalex.org/I7495430"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Iuliia Nigmatulina","raw_affiliation_strings":["Idiap Research Institute, Martigny, Switzerland"],"affiliations":[{"raw_affiliation_string":"Idiap Research Institute, Martigny, Switzerland","institution_ids":["https://openalex.org/I7495430"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076409146","display_name":"Petr Motl\u00ed\u010dek","orcid":"https://orcid.org/0000-0001-6467-1119"},"institutions":[{"id":"https://openalex.org/I7495430","display_name":"Idiap Research Institute","ror":"https://ror.org/05932h694","country_code":"CH","type":"facility","lineage":["https://openalex.org/I7495430"]},{"id":"https://openalex.org/I60587646","display_name":"Brno University of Technology","ror":"https://ror.org/03613d656","country_code":"CZ","type":"education","lineage":["https://openalex.org/I60587646"]}],"countries":["CH","CZ"],"is_corresponding":false,"raw_author_name":"Petr Motlicek","raw_affiliation_strings":["Brno University of Technology, Brno, Czech Republic","Idiap Research Institute, Martigny, Switzerland"],"affiliations":[{"raw_affiliation_string":"Idiap Research Institute, Martigny, Switzerland","institution_ids":["https://openalex.org/I7495430"]},{"raw_affiliation_string":"Brno University of Technology, Brno, Czech Republic","institution_ids":["https://openalex.org/I60587646"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083410051","display_name":"Aravind Ganapathiraju","orcid":null},"institutions":[],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aravind Ganapathiraju","raw_affiliation_strings":["Uniphore Software Systems Inc., Palo Alto, CA, USA"],"affiliations":[{"raw_affiliation_string":"Uniphore Software Systems Inc., Palo Alto, CA, USA","institution_ids":[]}]}],"institution_assertions":[],"countries_distinct_count":3,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":83},"biblio":{"volume":null,"issue":null,"first_page":"12617","last_page":"12621"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9992,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/software-portability","display_name":"Software portability","score":0.8432583},{"id":"https://openalex.org/keywords/confusion","display_name":"Confusion","score":0.48167953}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8593252},{"id":"https://openalex.org/C63000827","wikidata":"https://www.wikidata.org/wiki/Q3080428","display_name":"Software portability","level":2,"score":0.8432583},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5609266},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.51106536},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.49024493},{"id":"https://openalex.org/C2781140086","wikidata":"https://www.wikidata.org/wiki/Q557945","display_name":"Confusion","level":2,"score":0.48167953},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.48138312},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4496029},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4433568},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.44214836},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.4170714},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.40972283},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.08461425},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07477102},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C11171543","wikidata":"https://www.wikidata.org/wiki/Q41630","display_name":"Psychoanalysis","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10445934","pdf_url":null,"source":{"id":"https://openalex.org/S4363607702","display_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10445934","pdf_url":null,"source":{"id":"https://openalex.org/S4363607702","display_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[],"grants":[{"funder":"https://openalex.org/F4320321408","funder_display_name":"Ministry of Education","award_id":null}],"datasets":[],"versions":[],"referenced_works_count":32,"referenced_works":["https://openalex.org/W1554439802","https://openalex.org/W1649407914","https://openalex.org/W1989996186","https://openalex.org/W1993721840","https://openalex.org/W2007261869","https://openalex.org/W2125336414","https://openalex.org/W2397078722","https://openalex.org/W2405622356","https://openalex.org/W2407610416","https://openalex.org/W2594610113","https://openalex.org/W2802390314","https://openalex.org/W2949676527","https://openalex.org/W2963288440","https://openalex.org/W2972584841","https://openalex.org/W3006901707","https://openalex.org/W3008912312","https://openalex.org/W3015237657","https://openalex.org/W3035390927","https://openalex.org/W3095711142","https://openalex.org/W3097798370","https://openalex.org/W3100460087","https://openalex.org/W3163044982","https://openalex.org/W3197326126","https://openalex.org/W3198484663","https://openalex.org/W4226232334","https://openalex.org/W4284702538","https://openalex.org/W4286849919","https://openalex.org/W4287645199","https://openalex.org/W4296068780","https://openalex.org/W4372259765","https://openalex.org/W4385245566","https://openalex.org/W4385572995"],"related_works":["https://openalex.org/W4388155270","https://openalex.org/W4367156293","https://openalex.org/W2994151208","https://openalex.org/W2944691285","https://openalex.org/W28826848","https://openalex.org/W2750549761","https://openalex.org/W2122272819","https://openalex.org/W1872724644","https://openalex.org/W1584537303","https://openalex.org/W107105315"],"abstract_inverted_index":{"Spoken":[0],"Language":[1],"Understanding":[2],"(SLU)":[3],"technologies":[4],"have":[5],"greatly":[6],"improved":[7],"due":[8],"to":[9,25,66,114,137],"the":[10,23,120,127],"effective":[11],"pretraining":[12],"of":[13,19],"speech":[14],"representations.":[15],"A":[16],"common":[17],"requirement":[18],"industry-based":[20],"solutions":[21],"is":[22,93],"portability":[24],"deploy":[26],"SLU":[27],"models":[28,39],"in":[29],"voice-assistant":[30],"devices.":[31],"Thus,":[32],"distilling":[33],"knowledge":[34],"from":[35,71],"large":[36],"text-based":[37,88],"language":[38],"has":[40],"become":[41],"an":[42],"attractive":[43],"solution":[44],"for":[45],"achieving":[46],"good":[47],"performance":[48],"and":[49,84],"guaranteeing":[50],"portability.":[51],"In":[52],"this":[53],"paper,":[54],"we":[55],"introduce":[56],"a":[57,62,72,96,132,138],"novel":[58],"architecture":[59],"that":[60,78],"uses":[61],"cross-modal":[63],"attention":[64],"mechanism":[65],"extract":[67],"bin-level":[68],"contextual":[69,89],"embeddings":[70],"word-confusion":[73],"network":[74],"(WNC)":[75],"encoding":[76],"such":[77],"these":[79],"can":[80],"be":[81],"directly":[82],"compared":[83,136],"aligned":[85],"with":[86],"traditional":[87],"embeddings.":[90],"This":[91],"alignment":[92],"achieved":[94],"using":[95],"recently":[97],"proposed":[98],"tokenwise":[99],"constrastive":[100],"loss":[101],"function.":[102],"We":[103],"validate":[104],"our":[105,110],"architecture's":[106],"effectiveness":[107],"by":[108],"fine-tuning":[109],"WCN-based":[111],"pretrained":[112],"model":[113],"do":[115],"intent":[116],"classification":[117],"(IC)":[118],"on":[119,126],"well-known":[121],"SLURP":[122],"dataset.":[123],"Obtained":[124],"accuracy":[125],"IC":[128],"task":[129],"(81%),":[130],"depicts":[131],"9.4%":[133],"relative":[134],"improvement":[135],"recent/equivalent":[139],"E2E":[140],"method.":[141]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4392903597","counts_by_year":[],"updated_date":"2025-01-09T07:28:38.032646","created_date":"2024-03-19"}