{"id":"https://openalex.org/W4205654098","doi":"https://doi.org/10.1109/lsp.2022.3143036","title":"Neural Acoustic-Phonetic Approach for Speaker Verification With Phonetic Attention Mask","display_name":"Neural Acoustic-Phonetic Approach for Speaker Verification With Phonetic Attention Mask","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4205654098","doi":"https://doi.org/10.1109/lsp.2022.3143036"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1109/lsp.2022.3143036","pdf_url":"https://ieeexplore.ieee.org/ielx7/97/9686799/09681187.pdf","source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://ieeexplore.ieee.org/ielx7/97/9686799/09681187.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013047791","display_name":"Tianchi Liu","orcid":"https://orcid.org/0000-0003-3472-0703"},"institutions":[{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]},{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]},{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Tianchi Liu","raw_affiliation_strings":["Department of Electrical and Computer Engineering, National University of Singapore, Singapore","Institute for Infocomm Research, A*STAR, Singapore"],"affiliations":[{"raw_affiliation_string":"Institute for Infocomm Research, A*STAR, Singapore","institution_ids":["https://openalex.org/I115228651","https://openalex.org/I3005327000"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029637694","display_name":"Rohan Kumar Das","orcid":"https://orcid.org/0000-0002-1332-3357"},"institutions":[],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Rohan Kumar Das","raw_affiliation_strings":["Fortemedia, Singapore"],"affiliations":[{"raw_affiliation_string":"Fortemedia, Singapore","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004287909","display_name":"Kong Aik Lee","orcid":"https://orcid.org/0000-0001-9133-3000"},"institutions":[{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]},{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Kong Aik Lee","raw_affiliation_strings":["Institute for Infocomm Research, A*STAR, Singapore"],"affiliations":[{"raw_affiliation_string":"Institute for Infocomm Research, A*STAR, Singapore","institution_ids":["https://openalex.org/I3005327000","https://openalex.org/I115228651"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5032690182","display_name":"Haizhou Li","orcid":"https://orcid.org/0000-0001-9158-9401"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Haizhou Li","raw_affiliation_strings":["Department of Electrical and Computer Engineering, National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.733,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":10,"citation_normalized_percentile":{"value":0.99997,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":92},"biblio":{"volume":"29","issue":null,"first_page":"782","last_page":"786"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9986,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9985,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.61558175},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.4229438}],"concepts":[{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7959086},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.75693965},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.61558175},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.47642002},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.4628019},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43676233},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.4229438},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.41069698},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.34859902},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1109/lsp.2022.3143036","pdf_url":"https://ieeexplore.ieee.org/ielx7/97/9686799/09681187.pdf","source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1109/lsp.2022.3143036","pdf_url":"https://ieeexplore.ieee.org/ielx7/97/9686799/09681187.pdf","source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"score":0.66,"display_name":"Gender equality","id":"https://metadata.un.org/sdg/5"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":43,"referenced_works":["https://openalex.org/W1521002338","https://openalex.org/W1600744878","https://openalex.org/W1647671624","https://openalex.org/W1677182931","https://openalex.org/W1836465849","https://openalex.org/W1974727132","https://openalex.org/W1996512145","https://openalex.org/W2069976350","https://openalex.org/W2095705004","https://openalex.org/W2127141656","https://openalex.org/W2129244720","https://openalex.org/W2143612262","https://openalex.org/W2154278880","https://openalex.org/W2265811614","https://openalex.org/W2369576693","https://openalex.org/W2398826216","https://openalex.org/W2514080268","https://openalex.org/W2549754302","https://openalex.org/W2640876020","https://openalex.org/W2747249235","https://openalex.org/W2751695221","https://openalex.org/W2801514793","https://openalex.org/W2888782552","https://openalex.org/W2888911591","https://openalex.org/W2889151164","https://openalex.org/W2889182547","https://openalex.org/W2889492015","https://openalex.org/W2916979304","https://openalex.org/W2922306975","https://openalex.org/W2936386404","https://openalex.org/W2944012040","https://openalex.org/W2962979137","https://openalex.org/W2964214551","https://openalex.org/W2964273407","https://openalex.org/W2973003853","https://openalex.org/W2993724474","https://openalex.org/W2999547272","https://openalex.org/W3097073596","https://openalex.org/W3097659012","https://openalex.org/W3168542456","https://openalex.org/W3197848469","https://openalex.org/W4234330420","https://openalex.org/W79762229"],"related_works":["https://openalex.org/W3135230428","https://openalex.org/W2886454286","https://openalex.org/W2171933535","https://openalex.org/W2069095950","https://openalex.org/W2061778110","https://openalex.org/W2022349254","https://openalex.org/W1970482590","https://openalex.org/W1598508708","https://openalex.org/W1589515751","https://openalex.org/W1577485118"],"abstract_inverted_index":{"Traditional":[0],"acoustic-phonetic":[1,44,69,99],"approach":[2,45],"makes":[3],"use":[4],"of":[5,15,27,72,110,131],"both":[6],"spectral":[7,54],"and":[8,79,133,137],"phonetic":[9,18,25,63,90],"information":[10,91],"when":[11],"comparing":[12],"the":[13,24,85,89,96,102,117],"voice":[14],"speakers.":[16],"While":[17],"units":[19],"are":[20],"not":[21],"equally":[22],"informative,":[23],"context":[26],"speech":[28,82],"plays":[29],"an":[30,126],"important":[31],"role":[32],"in":[33],"speaker":[34],"verification":[35],"(SV).":[36],"In":[37],"this":[38],"paper,":[39],"we":[40,87],"propose":[41],"a":[42,62],"neural":[43,68,98],"that":[46,108,116],"learns":[47],"to":[48,53],"dynamically":[49],"assign":[50],"differentiated":[51,59],"weights":[52,60],"features":[55],"for":[56,77,81,92,135],"SV.":[57,93],"Such":[58],"form":[61],"attention":[64],"mask":[65],"(PAM).":[66],"The":[67],"framework":[70,100,119],"consists":[71,109],"two":[73],"training":[74],"pipelines,":[75],"one":[76],"SV":[78],"another":[80],"recognition.":[83],"Through":[84],"PAM,":[86],"leverage":[88],"We":[94,114],"evaluate":[95],"proposed":[97,118],"on":[101],"RSR2015":[103],"database":[104],"Part":[105],"III":[106],"corpus,":[107],"random":[111],"digit":[112],"strings.":[113],"show":[115],"with":[120,125],"PAM":[121],"consistently":[122],"outperforms":[123],"baseline":[124],"equal":[127],"error":[128],"rate":[129],"reduction":[130],"13.45%":[132],"10.20%":[134],"female":[136],"male":[138],"data,":[139],"respectively.":[140]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4205654098","counts_by_year":[{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":4}],"updated_date":"2024-12-07T07:20:41.073665","created_date":"2022-01-26"}