{"id":"https://openalex.org/W2159748844","doi":"https://doi.org/10.1109/tsa.2004.828641","title":"Language Model and Speaking Rate Adaptation for Spontaneous Presentation Speech Recognition","display_name":"Language Model and Speaking Rate Adaptation for Spontaneous Presentation Speech Recognition","publication_year":2004,"publication_date":"2004-06-21","ids":{"openalex":"https://openalex.org/W2159748844","doi":"https://doi.org/10.1109/tsa.2004.828641","mag":"2159748844"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsa.2004.828641","pdf_url":null,"source":{"id":"https://openalex.org/S202446260","display_name":"IEEE Transactions on Speech and Audio Processing","issn_l":"1063-6676","issn":["1063-6676","1558-2353"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://repository.kulib.kyoto-u.ac.jp/dspace/bitstream/2433/128905/1/TSA.2004.828641.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5089538393","display_name":"H. Nanjo","orcid":"https://orcid.org/0000-0003-0703-103X"},"institutions":[{"id":"https://openalex.org/I39012071","display_name":"Kyoto College of Graduate Studies for Informatics","ror":"https://ror.org/05mzj8a56","country_code":"JP","type":"education","lineage":["https://openalex.org/I39012071"]},{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"funder","lineage":["https://openalex.org/I22299242"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"H. Nanjo","raw_affiliation_strings":["Graduate School of Informatics, Kyoto University, Kyoto, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Informatics, Kyoto University, Kyoto, Japan","institution_ids":["https://openalex.org/I39012071","https://openalex.org/I22299242"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038044080","display_name":"Tatsuya Kawahara","orcid":"https://orcid.org/0000-0002-2686-2296"},"institutions":[{"id":"https://openalex.org/I39012071","display_name":"Kyoto College of Graduate Studies for Informatics","ror":"https://ror.org/05mzj8a56","country_code":"JP","type":"education","lineage":["https://openalex.org/I39012071"]},{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"funder","lineage":["https://openalex.org/I22299242"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"T. Kawahara","raw_affiliation_strings":["Graduate School of Informatics, Kyoto University, Kyoto, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Informatics, Kyoto University, Kyoto, Japan","institution_ids":["https://openalex.org/I39012071","https://openalex.org/I22299242"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":5.311,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":50,"citation_normalized_percentile":{"value":0.930013,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":92,"max":93},"biblio":{"volume":"12","issue":"4","first_page":"391","last_page":"400"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9931,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9903,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/perplexity","display_name":"Perplexity","score":0.916904},{"id":"https://openalex.org/keywords/pronunciation","display_name":"Pronunciation","score":0.6962926},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.67094755},{"id":"https://openalex.org/keywords/transcription","display_name":"Transcription","score":0.4351086}],"concepts":[{"id":"https://openalex.org/C100279451","wikidata":"https://www.wikidata.org/wiki/Q372193","display_name":"Perplexity","level":3,"score":0.916904},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.80531347},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7251142},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.7181357},{"id":"https://openalex.org/C2780844864","wikidata":"https://www.wikidata.org/wiki/Q184377","display_name":"Pronunciation","level":2,"score":0.6962926},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.6866309},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.67094755},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.5003054},{"id":"https://openalex.org/C2778707766","wikidata":"https://www.wikidata.org/wiki/Q202064","display_name":"Phone","level":2,"score":0.46401724},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45186713},{"id":"https://openalex.org/C179926584","wikidata":"https://www.wikidata.org/wiki/Q207714","display_name":"Transcription (linguistics)","level":2,"score":0.4351086},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.416945},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.1687221},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.09562713},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.08281264},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsa.2004.828641","pdf_url":null,"source":{"id":"https://openalex.org/S202446260","display_name":"IEEE Transactions on Speech and Audio Processing","issn_l":"1063-6676","issn":["1063-6676","1558-2353"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"https://hdl.handle.net/2433/128905","pdf_url":"https://repository.kulib.kyoto-u.ac.jp/dspace/bitstream/2433/128905/1/TSA.2004.828641.pdf","source":{"id":"https://openalex.org/S4306401454","display_name":"Kyoto University Research Information Repository (Kyoto University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I22299242","host_organization_name":"Kyoto University","host_organization_lineage":["https://openalex.org/I22299242"],"host_organization_lineage_names":["Kyoto University"],"type":"repository"},"license":"mit","license_id":"https://openalex.org/licenses/mit","version":"publishedVersion","is_accepted":true,"is_published":true}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://hdl.handle.net/2433/128905","pdf_url":"https://repository.kulib.kyoto-u.ac.jp/dspace/bitstream/2433/128905/1/TSA.2004.828641.pdf","source":{"id":"https://openalex.org/S4306401454","display_name":"Kyoto University Research Information Repository (Kyoto University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I22299242","host_organization_name":"Kyoto University","host_organization_lineage":["https://openalex.org/I22299242"],"host_organization_lineage_names":["Kyoto University"],"type":"repository"},"license":"mit","license_id":"https://openalex.org/licenses/mit","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"display_name":"Quality education","id":"https://metadata.un.org/sdg/4","score":0.55}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":35,"referenced_works":["https://openalex.org/W110463742","https://openalex.org/W150420562","https://openalex.org/W1513946950","https://openalex.org/W1517982047","https://openalex.org/W1549285799","https://openalex.org/W1577618146","https://openalex.org/W1590070522","https://openalex.org/W1665921526","https://openalex.org/W1675297740","https://openalex.org/W173400130","https://openalex.org/W1764939238","https://openalex.org/W1806349385","https://openalex.org/W187680888","https://openalex.org/W2096375461","https://openalex.org/W2096774922","https://openalex.org/W2100734170","https://openalex.org/W2115501357","https://openalex.org/W2117903328","https://openalex.org/W212398887","https://openalex.org/W2130628335","https://openalex.org/W2146871184","https://openalex.org/W2159518412","https://openalex.org/W2167915960","https://openalex.org/W2169518243","https://openalex.org/W2169941844","https://openalex.org/W2171907819","https://openalex.org/W2280630092","https://openalex.org/W2402326842","https://openalex.org/W24068691","https://openalex.org/W26527944","https://openalex.org/W3034729383","https://openalex.org/W3141224204","https://openalex.org/W50249030","https://openalex.org/W87954838","https://openalex.org/W93383444"],"related_works":["https://openalex.org/W4322096525","https://openalex.org/W4281893144","https://openalex.org/W2787311093","https://openalex.org/W2551914602","https://openalex.org/W2252095989","https://openalex.org/W2169518243","https://openalex.org/W2151348424","https://openalex.org/W2105076537","https://openalex.org/W2050138804","https://openalex.org/W1494910745"],"abstract_inverted_index":{"The":[0,188],"paper":[1],"addresses":[2],"adaptation":[3,62,103,195],"methods":[4,58,104,177,196],"to":[5,63,122,173,185],"language":[6,60],"model":[7,61],"and":[8,35,50,67,80,83,105,111,132,169,180],"speaking":[9],"rate":[10],"(SR)":[11],"of":[12,23,37,48,59,88,145,191,202],"individual":[13],"speakers":[14],"which":[15],"are":[16,178],"two":[17,193],"major":[18],"problems":[19],"in":[20,33,200],"automatic":[21],"transcription":[22,201],"spontaneous":[24,126],"presentation":[25],"speech.":[26],"To":[27],"cope":[28],"with":[29],"a":[30,64,68,118,135,156],"large":[31],"variation":[32],"expression":[34],"pronunciation":[36,52],"words":[38],"depending":[39],"on":[40,76],"the":[41,46,77,89,109,123,162,174,192],"speaker,":[42],"firstly,":[43],"we":[44,55,154],"investigate":[45],"effect":[47,190],"statistical":[49],"context-dependent":[51],"modeling.":[53],"Secondly,":[54],"present":[56,117],"unsupervised":[57],"specific":[65],"speaker":[66],"topic":[69],"by":[70],"1)":[71],"selecting":[72],"similar":[73],"texts":[74],"based":[75],"word":[78,112],"perplexity":[79,110],"TF-IDF":[81],"measure":[82],"2)":[84],"making":[85],"direct":[86],"use":[87],"initial":[90],"recognition":[91],"result":[92],"for":[93,143],"generating":[94],"an":[95],"enhanced":[96],"model.":[97],"We":[98,115,137],"confirm":[99],"that":[100,160],"all":[101],"proposed":[102,194],"their":[106,181],"combinations":[107],"reduce":[108],"error":[113,141],"rate.":[114],"also":[116,138,198],"decoding":[119,158,170],"strategy":[120,159],"adapted":[121],"SR.":[124,175],"In":[125],"speech,":[127],"SR":[128],"is":[129,149,197],"generally":[130],"fast":[131,150],"may":[133],"vary":[134],"lot.":[136],"observe":[139],"different":[140],"tendencies":[142],"portions":[144],"presentations":[146],"where":[147],"speech":[148],"or":[151],"slow.":[152],"Therefore,":[153],"propose":[155],"SR-dependent":[157],"applies":[161],"most":[163],"appropriate":[164],"acoustic":[165],"analysis,":[166],"phone":[167],"models,":[168],"parameters":[171],"according":[172],"Several":[176],"investigated":[179],"selective":[182],"application":[183],"leads":[184],"improved":[186],"accuracy.":[187],"combined":[189],"confirmed":[199],"real":[203],"academic":[204],"presentation.":[205]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2159748844","counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":5},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":3},{"year":2012,"cited_by_count":4}],"updated_date":"2025-04-18T03:18:42.946435","created_date":"2016-06-24"}