{"id":"https://openalex.org/W2055285859","doi":"https://doi.org/10.1109/icassp.2010.5495610","title":"Using online model comparison in the Variational Bayes framework for online unsupervised Voice Activity Detection","display_name":"Using online model comparison in the Variational Bayes framework for online unsupervised Voice Activity Detection","publication_year":2010,"publication_date":"2010-01-01","ids":{"openalex":"https://openalex.org/W2055285859","doi":"https://doi.org/10.1109/icassp.2010.5495610","mag":"2055285859"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2010.5495610","pdf_url":null,"source":{"id":"https://openalex.org/S4363607879","display_name":"IEEE International Conference on Acoustics Speech and Signal Processing","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023051838","display_name":"David Cournapeau","orcid":null},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"David Cournapeau","raw_affiliation_strings":["School of Informatics, Kyoto University Sakyo-ku, 606-8501, Japan"],"affiliations":[{"raw_affiliation_string":"School of Informatics, Kyoto University Sakyo-ku, 606-8501, Japan","institution_ids":["https://openalex.org/I22299242"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001291873","display_name":"Shinji Watanabe","orcid":"https://orcid.org/0000-0002-5970-8631"},"institutions":[],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Shinji Watanabe","raw_affiliation_strings":["NTT Communication Science Labs, 2-4 Hikaridai, Seika-cho, Soraku-gun, Kyoto 619-0237, Japan#TAB#"],"affiliations":[{"raw_affiliation_string":"NTT Communication Science Labs, 2-4 Hikaridai, Seika-cho, Soraku-gun, Kyoto 619-0237, Japan#TAB#","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018620798","display_name":"Atsushi Nakamura","orcid":"https://orcid.org/0000-0003-0788-2221"},"institutions":[],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Atsushi Nakamura","raw_affiliation_strings":["NTT Communication Science Labs, 2-4 Hikaridai, Seika-cho, Soraku-gun, Kyoto 619-0237, Japan#TAB#"],"affiliations":[{"raw_affiliation_string":"NTT Communication Science Labs, 2-4 Hikaridai, Seika-cho, Soraku-gun, Kyoto 619-0237, Japan#TAB#","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038044080","display_name":"Tatsuya Kawahara","orcid":"https://orcid.org/0000-0002-2686-2296"},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tatsuya Kawahara","raw_affiliation_strings":["School of Informatics, Kyoto University Sakyo-ku, 606-8501, Japan"],"affiliations":[{"raw_affiliation_string":"School of Informatics, Kyoto University Sakyo-ku, 606-8501, Japan","institution_ids":["https://openalex.org/I22299242"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.592,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":2,"citation_normalized_percentile":{"value":0.37984,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":71,"max":75},"biblio":{"volume":"7","issue":null,"first_page":"4462","last_page":"4465"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech Enhancement Techniques","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech Enhancement Techniques","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition Technology","score":0.9993,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Audio Signal Classification and Analysis","score":0.9991,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speaker-verification","display_name":"Speaker Verification","score":0.56201},{"id":"https://openalex.org/keywords/audio-visual-speech-recognition","display_name":"Audio-Visual Speech Recognition","score":0.557719},{"id":"https://openalex.org/keywords/audio-event-detection","display_name":"Audio Event Detection","score":0.556838},{"id":"https://openalex.org/keywords/acoustic-modeling","display_name":"Acoustic Modeling","score":0.540275},{"id":"https://openalex.org/keywords/environmental-sound-recognition","display_name":"Environmental Sound Recognition","score":0.521779},{"id":"https://openalex.org/keywords/online-model","display_name":"Online model","score":0.50473225},{"id":"https://openalex.org/keywords/signal","display_name":"SIGNAL (programming language)","score":0.44392952}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7664997},{"id":"https://openalex.org/C207201462","wikidata":"https://www.wikidata.org/wiki/Q182505","display_name":"Bayes' theorem","level":3,"score":0.7492569},{"id":"https://openalex.org/C52001869","wikidata":"https://www.wikidata.org/wiki/Q812530","display_name":"Naive Bayes classifier","level":3,"score":0.6585222},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.62717843},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.59545857},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.54884964},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.51796544},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5124355},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.50671893},{"id":"https://openalex.org/C2777851325","wikidata":"https://www.wikidata.org/wiki/Q7094102","display_name":"Online model","level":2,"score":0.50473225},{"id":"https://openalex.org/C204201278","wikidata":"https://www.wikidata.org/wiki/Q1332614","display_name":"Voice activity detection","level":3,"score":0.4764995},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.44392952},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.40721625},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.40326893},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.39262745},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.31764287},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.2293934},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.18120998},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.11500758},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.102586985},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2010.5495610","pdf_url":null,"source":{"id":"https://openalex.org/S4363607879","display_name":"IEEE International Conference on Acoustics Speech and Signal Processing","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, justice, and strong institutions","score":0.74,"id":"https://metadata.un.org/sdg/16"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":12,"referenced_works":["https://openalex.org/W1560013842","https://openalex.org/W1570770495","https://openalex.org/W1686266550","https://openalex.org/W2049633694","https://openalex.org/W2119535101","https://openalex.org/W2129120544","https://openalex.org/W2132214951","https://openalex.org/W2138561666","https://openalex.org/W2166607750","https://openalex.org/W2171911691","https://openalex.org/W3141736179","https://openalex.org/W629338568"],"related_works":["https://openalex.org/W4220802396","https://openalex.org/W2726838704","https://openalex.org/W2537862391","https://openalex.org/W2417174640","https://openalex.org/W2394466068","https://openalex.org/W2393473353","https://openalex.org/W2373790322","https://openalex.org/W2171665309","https://openalex.org/W1987683558","https://openalex.org/W1599183102"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"the":[3,23,58,74,78,81,92,99,107],"use":[4],"of":[5,38],"online":[6,11,51,69],"Variational":[7,59],"Bayes":[8,60],"method":[9,109],"for":[10,48,73,80],"Voice":[12],"Activity":[13],"Detection":[14],"(VAD)":[15],"in":[16,70],"an":[17],"unsupervised":[18],"context.":[19],"In":[20,62],"conventional":[21,112],"VAD,":[22],"final":[24],"step":[25],"often":[26],"relies":[27],"on":[28,91,98],"state":[29],"machines":[30],"whose":[31],"parameters":[32],"are":[33,67],"heuristically":[34],"tuned.":[35],"The":[36,84],"goal":[37],"this":[39,63],"study":[40],"is":[41,55,87],"to":[42,111],"propose":[43],"a":[44,103],"solid":[45],"statistical":[46,113],"scheme":[47],"VAD":[49,85,114],"using":[50],"model":[52],"comparison":[53],"which":[54],"provided":[56],"from":[57],"framework.":[61],"scheme,":[64],"two":[65],"models":[66],"estimated":[68],"parallel:":[71],"one":[72],"noise-only":[75],"situation,":[76],"and":[77],"other":[79],"noise-plus-signal":[82],"situation":[83],"decision":[86],"done":[88],"automatically":[89],"depending":[90],"selected":[93],"model.":[94],"An":[95],"experimental":[96],"evaluation":[97],"CENSREC-1-C":[100],"database":[101],"shows":[102],"significant":[104],"improvement":[105],"by":[106],"proposed":[108],"compared":[110],"methods.":[115]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2055285859","counts_by_year":[{"year":2012,"cited_by_count":1}],"updated_date":"2024-11-21T13:02:22.595370","created_date":"2016-06-24"}