{"id":"https://openalex.org/W4251158933","doi":"https://doi.org/10.1002/scj.20354","title":"Incorporating a mixed excitation model and postfilter into HMM-based text-to-speech synthesis","display_name":"Incorporating a mixed excitation model and postfilter into HMM-based text-to-speech synthesis","publication_year":2005,"publication_date":"2005-01-01","ids":{"openalex":"https://openalex.org/W4251158933","doi":"https://doi.org/10.1002/scj.20354"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1002/scj.20354","pdf_url":null,"source":{"id":"https://openalex.org/S58208175","display_name":"Systems and Computers in Japan","issn_l":"0882-1666","issn":["0882-1666","1520-684X"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101886410","display_name":"Takayoshi Yoshimura","orcid":"https://orcid.org/0000-0002-1812-6491"},"institutions":[{"id":"https://openalex.org/I4210165351","display_name":"Toyota Central Research and Development Laboratories (Japan)","ror":"https://ror.org/05mjgqe69","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210125472","https://openalex.org/I4210165351"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takayoshi Yoshimura","raw_affiliation_strings":["Research-Domain 21, Toyota Central R&D Labs., Inc., Aichi, 480-1192 Japan"],"affiliations":[{"raw_affiliation_string":"Research-Domain 21, Toyota Central R&D Labs., Inc., Aichi, 480-1192 Japan","institution_ids":["https://openalex.org/I4210165351"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103023678","display_name":"Keiichi Tokuda","orcid":"https://orcid.org/0000-0001-6143-0133"},"institutions":[{"id":"https://openalex.org/I197274945","display_name":"Nagoya Institute of Technology","ror":"https://ror.org/055yf1005","country_code":"JP","type":"education","lineage":["https://openalex.org/I197274945"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Keiichi Tokuda","raw_affiliation_strings":["Department of Computer Science, Nagoya Institute of Technology, Nagoya, 466-8555 Japan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Nagoya Institute of Technology, Nagoya, 466-8555 Japan","institution_ids":["https://openalex.org/I197274945"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064866374","display_name":"Takashi Masuko","orcid":"https://orcid.org/0000-0002-2410-2007"},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takashi Masuko","raw_affiliation_strings":["Interdisciplinary Graduate School of Science and Engineering, Tokyo Institute of Technology, Yokohama, 226-8502 Japan"],"affiliations":[{"raw_affiliation_string":"Interdisciplinary Graduate School of Science and Engineering, Tokyo Institute of Technology, Yokohama, 226-8502 Japan","institution_ids":["https://openalex.org/I114531698"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022405100","display_name":"Takao Kobayashi","orcid":"https://orcid.org/0000-0003-0387-8030"},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takao Kobayashi","raw_affiliation_strings":["Interdisciplinary Graduate School of Science and Engineering, Tokyo Institute of Technology, Yokohama, 226-8502 Japan"],"affiliations":[{"raw_affiliation_string":"Interdisciplinary Graduate School of Science and Engineering, Tokyo Institute of Technology, Yokohama, 226-8502 Japan","institution_ids":["https://openalex.org/I114531698"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059137996","display_name":"Tadashi Kitamura","orcid":null},"institutions":[{"id":"https://openalex.org/I197274945","display_name":"Nagoya Institute of Technology","ror":"https://ror.org/055yf1005","country_code":"JP","type":"education","lineage":["https://openalex.org/I197274945"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tadashi Kitamura","raw_affiliation_strings":["Department of Computer Science, Nagoya Institute of Technology, Nagoya, 466-8555 Japan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Nagoya Institute of Technology, Nagoya, 466-8555 Japan","institution_ids":["https://openalex.org/I197274945"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":24,"citation_normalized_percentile":{"value":0.84805,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":88,"max":89},"biblio":{"volume":"36","issue":"12","first_page":"43","last_page":"50"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9957,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9957,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.953,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9385,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/narrowband","display_name":"Narrowband","score":0.55701715}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.72029126},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6874511},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.60169184},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.5975964},{"id":"https://openalex.org/C2776096036","wikidata":"https://www.wikidata.org/wiki/Q1140483","display_name":"Narrowband","level":2,"score":0.55701715},{"id":"https://openalex.org/C112633086","wikidata":"https://www.wikidata.org/wiki/Q381287","display_name":"White noise","level":2,"score":0.48947227},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.4887695},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4513461},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.41738117},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.33590972},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.24870911},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.1326125},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.09623331},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1002/scj.20354","pdf_url":null,"source":{"id":"https://openalex.org/S58208175","display_name":"Systems and Computers in Japan","issn_l":"0882-1666","issn":["0882-1666","1520-684X"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":3,"referenced_works":["https://openalex.org/W1495721037","https://openalex.org/W2097544856","https://openalex.org/W2109189270"],"related_works":["https://openalex.org/W2904846757","https://openalex.org/W2899084033","https://openalex.org/W2735765216","https://openalex.org/W2688184458","https://openalex.org/W2364370872","https://openalex.org/W2147186888","https://openalex.org/W2132687327","https://openalex.org/W2097963413","https://openalex.org/W2038801705","https://openalex.org/W2025614924"],"abstract_inverted_index":{"In":[0,25,54,187,208],"this":[1,121,132,164,226],"paper":[2,133],"we":[3,28,57,76,134,177,189],"introduce":[4,190],"a":[5,31,59,79,114,123,136,142,149,156,191,196],"mixed":[6,137,220],"excitation":[7,64,98,138,165,221],"model":[8,45,61,66,139,166,222],"into":[9],"an":[10,117],"HMM-based":[11],"speech":[12,37,40,106,128,161,185],"synthesis":[13,33,70],"system":[14,34,56],"with":[15,152,155],"the":[16,20,63,69,202,205,210,216,219],"objective":[17],"of":[18,22,87,97,125,204,212,218],"improving":[19],"quality":[21,203],"synthesized":[23,36,127,206],"speech.":[24,207],"previous":[26],"work":[27],"have":[29],"proposed":[30],"text-to-speech":[32],"that":[35,44,55,95,111,147,179],"by":[38],"outputting":[39],"parameters":[41],"using":[42,94],"HMMs":[43],"Mel":[46],"frequency":[47],"ceptral":[48],"coefficients,":[49],"fundamental":[50],"frequencies,":[51],"and":[52,82,89,116,120,223],"duration.":[53],"used":[58,193],"simple":[60],"as":[62,108,173,175],"source":[65],"for":[67,85,184],"exciting":[68],"filter":[71],"(an":[72],"MLSA":[73],"filter)":[74],"whereby":[75],"switched":[77],"between":[78],"pulse":[80,150],"sequence":[81],"white":[83,153],"noise":[84,154],"intervals":[86],"voiced":[88,109],"unvoiced":[90],"speech,":[91],"respectively.":[92],"When":[93],"type":[96],"model,":[99],"it":[100,180],"is":[101,122],"not":[102],"possible":[103],"to":[104,158,170,200],"synthesize":[105],"such":[107],"fricatives":[110],"contains":[112],"both":[113],"periodic":[115],"aperiodic":[118],"component,":[119],"cause":[124],"poor":[126],"quality.":[129],"Therefore,":[130],"in":[131,198,225,241],"incorporate":[135],"based":[140],"on":[141],"narrowband":[143],"vocoding":[144,172,194],"method":[145],"MELP":[146],"combines":[148],"stream":[151],"view":[157],"realizing":[159],"high-quality":[160],"synthesis.":[162,186],"Since":[163],"can":[167],"be":[168],"applied":[169],"wideband":[171],"well":[174],"narrowband,":[176],"anticipate":[178],"will":[181],"prove":[182],"effective":[183],"addition,":[188,209],"widely":[192],"method,":[195],"postfilter,":[197],"order":[199],"improve":[201],"results":[211],"subjective":[213],"evaluation":[214],"show":[215],"effectiveness":[217],"postfilter":[224],"system.":[227],"\u00a9":[228],"2005":[229],"Wiley":[230,242],"Periodicals,":[231],"Inc.":[232],"Syst":[233],"Comp":[234],"Jpn,":[235],"36(12):":[236],"43\u201350,":[237],"2005;":[238],"Published":[239],"online":[240],"InterScience":[243],"(www.interscience.wiley.com).":[244],"DOI":[245],"10.1002/scj.20354":[246]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4251158933","counts_by_year":[{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":5},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2025-01-20T07:57:46.933464","created_date":"2022-05-12"}