{"id":"https://openalex.org/W1250452774","doi":"https://doi.org/10.21437/eurospeech.2003-136","title":"Combining non-uniform unit selection with diphone based synthesis","display_name":"Combining non-uniform unit selection with diphone based synthesis","publication_year":2003,"publication_date":"2003-09-01","ids":{"openalex":"https://openalex.org/W1250452774","doi":"https://doi.org/10.21437/eurospeech.2003-136","mag":"1250452774"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.21437/eurospeech.2003-136","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088212404","display_name":"Michael Pucher","orcid":"https://orcid.org/0000-0002-5374-1342"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Michael Pucher","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026459289","display_name":"Friedrich Neubarth","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Friedrich Neubarth","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074433345","display_name":"Erhard Rank","orcid":null},"institutions":[{"id":"https://openalex.org/I4210121626","display_name":"Signal Processing (United States)","ror":"https://ror.org/021gzyw51","country_code":"US","type":"company","lineage":["https://openalex.org/I4210121626"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Erhard Rank","raw_affiliation_strings":["Institute of Signal Processing and Speech Communication (4420)"],"affiliations":[{"raw_affiliation_string":"Institute of Signal Processing and Speech Communication (4420)","institution_ids":["https://openalex.org/I4210121626"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009725070","display_name":"Georg Niklfeld","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Georg Niklfeld","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5101851275","display_name":"Qi Guan","orcid":"https://orcid.org/0000-0003-4165-461X"},"institutions":[{"id":"https://openalex.org/I1325886976","display_name":"Siemens (Germany)","ror":"https://ror.org/059mq0909","country_code":"DE","type":"funder","lineage":["https://openalex.org/I1325886976"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Qi Guan","raw_affiliation_strings":["Siemens"],"affiliations":[{"raw_affiliation_string":"Siemens","institution_ids":["https://openalex.org/I1325886976"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.465,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.496455,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":74,"max":76},"biblio":{"volume":null,"issue":null,"first_page":"1329","last_page":"1332"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9984,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.994,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/selection-algorithm","display_name":"Selection algorithm","score":0.5715735}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.80998313},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.7763773},{"id":"https://openalex.org/C122637931","wikidata":"https://www.wikidata.org/wiki/Q118084","display_name":"Unit (ring theory)","level":2,"score":0.715731},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.62561816},{"id":"https://openalex.org/C2775973920","wikidata":"https://www.wikidata.org/wiki/Q3252726","display_name":"Selection algorithm","level":3,"score":0.5715735},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.51647353},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4294988},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.39039233},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0875566},{"id":"https://openalex.org/C145420912","wikidata":"https://www.wikidata.org/wiki/Q853077","display_name":"Mathematics education","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.21437/eurospeech.2003-136","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality education","score":0.46}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":8,"referenced_works":["https://openalex.org/W1536452104","https://openalex.org/W1543527380","https://openalex.org/W2068804781","https://openalex.org/W2131058166","https://openalex.org/W2150658333","https://openalex.org/W2285365380","https://openalex.org/W2404028712","https://openalex.org/W67398698"],"related_works":["https://openalex.org/W629290331","https://openalex.org/W617685022","https://openalex.org/W611386996","https://openalex.org/W4395469854","https://openalex.org/W4205762803","https://openalex.org/W2535856026","https://openalex.org/W2371343292","https://openalex.org/W2265065644","https://openalex.org/W1788667622","https://openalex.org/W127416991"],"abstract_inverted_index":{"This":[0,68],"paper":[1],"describes":[2],"the":[3,14,53,56,61,64],"unit":[4,22,32,65,74],"selection":[5,66,75],"algorithm":[6,25,69],"of":[7,37,72],"a":[8,20,38,48],"speech":[9,50,81],"synthesis":[10],"system,":[11],"which":[12],"selects":[13],"k-best":[15],"paths":[16],"over":[17],"units":[18],"from":[19,63],"relational":[21],"database.":[23],"The":[24],"uses":[26],"words":[27],"and":[28,77],"diphones":[29],"as":[30],"basic":[31],"types.":[33],"It":[34],"is":[35],"part":[36],"customisable":[39],"textto-speech":[40],"system":[41],"designed":[42],"for":[43],"generating":[44],"new":[45],"prompts":[46],"using":[47],"recorded":[49],"corpus,":[51],"with":[52],"option":[54],"that":[55],"user":[57],"can":[58],"interactively":[59],"optimise":[60],"results":[62],"algorithm.":[67],"combines":[70],"advantages":[71],"nonuniform":[73],"algorithms":[76],"diphone":[78],"inventory":[79],"based":[80],"synthesis.":[82]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W1250452774","counts_by_year":[],"updated_date":"2025-02-17T21:28:59.303117","created_date":"2016-06-24"}