{"id":"https://openalex.org/W2123012529","doi":"https://doi.org/10.1109/icassp.2008.4518797","title":"Detecting tone errors in continuous Mandarin speech","display_name":"Detecting tone errors in continuous Mandarin speech","publication_year":2008,"publication_date":"2008-03-01","ids":{"openalex":"https://openalex.org/W2123012529","doi":"https://doi.org/10.1109/icassp.2008.4518797","mag":"2123012529"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2008.4518797","pdf_url":null,"source":{"id":"https://openalex.org/S4210167542","display_name":"Proceedings of the ... IEEE International Conference on Acoustics, Speech, and Signal Processing","issn_l":"1520-6149","issn":["1520-6149","2379-190X"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100392899","display_name":"Bin Zhang","orcid":"https://orcid.org/0000-0003-0633-2930"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]},{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"education","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"None Yan-Bin Zhang","raw_affiliation_strings":["Information technology Institute, Beijing Jiaotong University, Beijing, China","Microsoft Research Asia, China"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Asia, China","institution_ids":["https://openalex.org/I4210113369"]},{"raw_affiliation_string":"Information technology Institute, Beijing Jiaotong University, Beijing, China","institution_ids":["https://openalex.org/I21193070"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104229610","display_name":"Min Chu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"None Min Chu","raw_affiliation_strings":["Microsoft research Asia, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Microsoft research Asia, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101464820","display_name":"Chao Huang","orcid":"https://orcid.org/0000-0002-3147-1951"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"None Chao Huang","raw_affiliation_strings":["Microsoft research Asia, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Microsoft research Asia, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102925435","display_name":"Mangui Liang","orcid":"https://orcid.org/0000-0001-9492-8261"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"education","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"None Man-Gui Liang","raw_affiliation_strings":["Information technology Institute, Beijing Jiaotong University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Information technology Institute, Beijing Jiaotong University, Beijing, China","institution_ids":["https://openalex.org/I21193070"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.707,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":12,"citation_normalized_percentile":{"value":0.805787,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":84,"max":85},"biblio":{"volume":null,"issue":null,"first_page":"5065","last_page":"5068"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9984,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mandarin-chinese","display_name":"Mandarin Chinese","score":0.9264739},{"id":"https://openalex.org/keywords/tone","display_name":"Tone (literature)","score":0.8170312},{"id":"https://openalex.org/keywords/pronunciation","display_name":"Pronunciation","score":0.7051793},{"id":"https://openalex.org/keywords/divergence","display_name":"Divergence (linguistics)","score":0.62405324},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.49216026}],"concepts":[{"id":"https://openalex.org/C138954614","wikidata":"https://www.wikidata.org/wiki/Q9192","display_name":"Mandarin Chinese","level":2,"score":0.9264739},{"id":"https://openalex.org/C2780583480","wikidata":"https://www.wikidata.org/wiki/Q1366327","display_name":"Tone (literature)","level":2,"score":0.8170312},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7584741},{"id":"https://openalex.org/C2780844864","wikidata":"https://www.wikidata.org/wiki/Q184377","display_name":"Pronunciation","level":2,"score":0.7051793},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6404791},{"id":"https://openalex.org/C207390915","wikidata":"https://www.wikidata.org/wiki/Q1230525","display_name":"Divergence (linguistics)","level":2,"score":0.62405324},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5842174},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.51946753},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.49216026},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35186046},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.1007376},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2008.4518797","pdf_url":null,"source":{"id":"https://openalex.org/S4210167542","display_name":"Proceedings of the ... IEEE International Conference on Acoustics, Speech, and Signal Processing","issn_l":"1520-6149","issn":["1520-6149","2379-190X"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality education","score":0.49}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":12,"referenced_works":["https://openalex.org/W105558132","https://openalex.org/W1523358955","https://openalex.org/W1585763212","https://openalex.org/W1606774179","https://openalex.org/W1608344791","https://openalex.org/W2045459610","https://openalex.org/W2099111195","https://openalex.org/W2123438540","https://openalex.org/W2152321560","https://openalex.org/W2158513796","https://openalex.org/W2166823384","https://openalex.org/W39287039"],"related_works":["https://openalex.org/W2481138693","https://openalex.org/W2393887907","https://openalex.org/W2388826840","https://openalex.org/W2386691339","https://openalex.org/W2379831327","https://openalex.org/W2365805939","https://openalex.org/W2347443630","https://openalex.org/W2287147624","https://openalex.org/W2163874654","https://openalex.org/W156219719"],"abstract_inverted_index":{"This":[0],"paper":[1],"proposes":[2],"a":[3,73,80],"new":[4],"approach":[5],"for":[6],"detecting":[7],"tone":[8,18,44,55,61,76],"errors":[9],"in":[10,33],"continuous":[11],"Mandarin":[12],"speech.":[13],"In":[14,37,83],"the":[15,38,41,53,58,64,67,75,84,89],"training":[16],"phase,":[17,40],"variations":[19],"are":[20],"modeled":[21],"with":[22],"context-depended":[23],"MSD-HMM":[24],"which":[25],"considers":[26],"six":[27],"contextual":[28],"factors":[29],"instead":[30],"of":[31,43],"two":[32,68],"traditional":[34],"triphone":[35],"HMM.":[36],"evaluation":[39],"goodness":[42],"pronunciation":[45,81],"is":[46,70,77],"measured":[47],"by":[48],"Kullback-Leibler":[49],"divergence":[50],"(KLD)":[51],"between":[52,66],"expected":[54],"model":[56],"and":[57],"most":[59],"representative":[60],"model.":[62],"When":[63],"KLD":[65],"models":[69],"larger":[71],"than":[72],"threshold,":[74],"detected":[78],"as":[79],"error.":[82],"ROC":[85],"curve,":[86],"we":[87],"get":[88],"equal":[90],"error":[91],"rate":[92],"at":[93],"2.6%.":[94]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2123012529","counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2012,"cited_by_count":2}],"updated_date":"2024-12-09T03:21:56.190519","created_date":"2016-06-24"}