{"id":"https://openalex.org/W2034213230","doi":"https://doi.org/10.1109/icassp.2010.5495973","title":"Automatic audio tagging using covariate shift adaptation","display_name":"Automatic audio tagging using covariate shift adaptation","publication_year":2010,"publication_date":"2010-01-01","ids":{"openalex":"https://openalex.org/W2034213230","doi":"https://doi.org/10.1109/icassp.2010.5495973","mag":"2034213230"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2010.5495973","pdf_url":null,"source":{"id":"https://openalex.org/S4363607879","display_name":"IEEE International Conference on Acoustics Speech and Signal Processing","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086940921","display_name":"Gordon Wichern","orcid":"https://orcid.org/0000-0002-8597-6795"},"institutions":[{"id":"https://openalex.org/I55732556","display_name":"Arizona State University","ror":"https://ror.org/03efmqc40","country_code":"US","type":"funder","lineage":["https://openalex.org/I55732556"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gordon Wichern","raw_affiliation_strings":["SenSIP Center, School of ECEE & School of Arts, Media, and Engineering, Arizona State University, USA"],"affiliations":[{"raw_affiliation_string":"SenSIP Center, School of ECEE & School of Arts, Media, and Engineering, Arizona State University, USA","institution_ids":["https://openalex.org/I55732556"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046358579","display_name":"Makoto Yamada","orcid":"https://orcid.org/0000-0001-7508-5094"},"institutions":[{"id":"https://openalex.org/I92446798","display_name":"Colorado State University","ror":"https://ror.org/03k1gpj17","country_code":"US","type":"funder","lineage":["https://openalex.org/I92446798"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Makoto Yamada","raw_affiliation_strings":["Colorado State University, Japan"],"affiliations":[{"raw_affiliation_string":"Colorado State University, Japan","institution_ids":["https://openalex.org/I92446798"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062801525","display_name":"Harvey Thornburg","orcid":null},"institutions":[{"id":"https://openalex.org/I55732556","display_name":"Arizona State University","ror":"https://ror.org/03efmqc40","country_code":"US","type":"funder","lineage":["https://openalex.org/I55732556"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Harvey Thornburg","raw_affiliation_strings":["SenSIP Center, School of ECEE & School of Arts, Media, and Engineering, Arizona State University, USA"],"affiliations":[{"raw_affiliation_string":"SenSIP Center, School of ECEE & School of Arts, Media, and Engineering, Arizona State University, USA","institution_ids":["https://openalex.org/I55732556"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072744508","display_name":"Masashi Sugiyama","orcid":"https://orcid.org/0000-0001-6658-6743"},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"funder","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Masashi Sugiyama","raw_affiliation_strings":["Department of Computer Science, Tokyo Institute of Technology & JST, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Tokyo Institute of Technology & JST, Japan","institution_ids":["https://openalex.org/I114531698"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074371899","display_name":"Andreas Spanias","orcid":"https://orcid.org/0000-0003-0306-9348"},"institutions":[{"id":"https://openalex.org/I55732556","display_name":"Arizona State University","ror":"https://ror.org/03efmqc40","country_code":"US","type":"funder","lineage":["https://openalex.org/I55732556"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andreas Spanias","raw_affiliation_strings":["SenSIP Center, School of ECEE & School of Arts, Media, and Engineering, Arizona State University, USA"],"affiliations":[{"raw_affiliation_string":"SenSIP Center, School of ECEE & School of Arts, Media, and Engineering, Arizona State University, USA","institution_ids":["https://openalex.org/I55732556"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.294,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":6,"citation_normalized_percentile":{"value":0.601354,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":81,"max":82},"biblio":{"volume":null,"issue":null,"first_page":"253","last_page":"256"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9992,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5623631},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.43729168},{"id":"https://openalex.org/keywords/sound-quality","display_name":"Sound Quality","score":0.42237598}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8338733},{"id":"https://openalex.org/C119043178","wikidata":"https://www.wikidata.org/wiki/Q320723","display_name":"Covariate","level":2,"score":0.7017344},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5623631},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.53724384},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.4968398},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4814043},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.45800328},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.43729168},{"id":"https://openalex.org/C167310288","wikidata":"https://www.wikidata.org/wiki/Q7564808","display_name":"Sound quality","level":2,"score":0.42237598},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.41273934},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.37432152},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.34546986},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.24942261},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2010.5495973","pdf_url":null,"source":{"id":"https://openalex.org/S4363607879","display_name":"IEEE International Conference on Acoustics Speech and Signal Processing","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","score":0.53,"display_name":"Industry, innovation and infrastructure"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":13,"referenced_works":["https://openalex.org/W189742998","https://openalex.org/W2010486494","https://openalex.org/W2034368206","https://openalex.org/W2075978670","https://openalex.org/W2098766654","https://openalex.org/W2103851188","https://openalex.org/W2116373735","https://openalex.org/W2123587156","https://openalex.org/W2139949258","https://openalex.org/W2146664010","https://openalex.org/W2148388310","https://openalex.org/W2150322163","https://openalex.org/W2152322845"],"related_works":["https://openalex.org/W4206042385","https://openalex.org/W2994787386","https://openalex.org/W2985746494","https://openalex.org/W2923628599","https://openalex.org/W2511384863","https://openalex.org/W2296317756","https://openalex.org/W2096089271","https://openalex.org/W2080773131","https://openalex.org/W2051519658","https://openalex.org/W2014100433"],"abstract_inverted_index":{"Automatically":[0],"annotating":[1],"or":[2],"tagging":[3,148],"unlabeled":[4],"audio":[5,31,69,109],"files":[6,37,70,138],"has":[7],"several":[8],"applications,":[9],"such":[10],"as":[11,112],"database":[12,135],"organization":[13],"and":[14,51,90,140],"recommender":[15],"systems.":[16],"We":[17],"are":[18,48,85],"interested":[19],"in":[20,76,87],"the":[21,24,36,45,68,77,82,88,94,125],"case":[22],"where":[23],"system":[25],"is":[26],"trained":[27],"using":[28],"clean":[29],"high-quality":[30],"files,":[32],"but":[33,93],"most":[34],"of":[35,97,117,127,136],"that":[38],"need":[39],"to":[40,114,123],"be":[41],"automatically":[42],"tagged":[43],"during":[44],"test":[46,91],"phase":[47],"heavily":[49],"compressed":[50],"noisy,":[52],"for":[53],"instance":[54],"if":[55],"they":[56],"were":[57],"captured":[58],"on":[59,131],"a":[60,72,106,115,132],"mobile":[61],"device.":[62],"In":[63],"this":[64],"situation":[65],"we":[66],"assume":[67],"follow":[71],"covariate":[73,128],"shift":[74],"model":[75],"acoustic":[78],"feature":[79,83],"space,":[80],"i.e.,":[81],"distributions":[84],"different":[86],"training":[89],"phases,":[92],"conditional":[95],"distribution":[96],"labels":[98],"given":[99],"features":[100],"remains":[101],"unchanged.":[102],"Our":[103],"method":[104],"uses":[105],"specially":[107],"designed":[108],"similarity":[110],"measure":[111],"input":[113],"set":[116],"weighted":[118],"logistic":[119],"regressors,":[120],"which":[121],"attempt":[122],"alleviate":[124],"influence":[126],"shift.":[129],"Results":[130],"freely":[133],"available":[134],"sound":[137],"contributed":[139],"labeled":[141],"by":[142],"non-expert":[143],"users,":[144],"demonstrate":[145],"effective":[146],"automatic":[147],"performance.":[149]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2034213230","counts_by_year":[{"year":2021,"cited_by_count":2},{"year":2017,"cited_by_count":2},{"year":2014,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2025-04-18T21:18:31.547339","created_date":"2016-06-24"}