{"id":"https://openalex.org/W2123702935","doi":"https://doi.org/10.1109/icassp.2012.6288970","title":"Noise and speaker compensation in the Log filter bank domain","display_name":"Noise and speaker compensation in the Log filter bank domain","publication_year":2012,"publication_date":"2012-03-01","ids":{"openalex":"https://openalex.org/W2123702935","doi":"https://doi.org/10.1109/icassp.2012.6288970","mag":"2123702935"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2012.6288970","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019937451","display_name":"Vikas Joshi","orcid":"https://orcid.org/0000-0003-4467-3621"},"institutions":[{"id":"https://openalex.org/I24676775","display_name":"Indian Institute of Technology Madras","ror":"https://ror.org/03v0r5n49","country_code":"IN","type":"funder","lineage":["https://openalex.org/I24676775"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Vikas Joshi","raw_affiliation_strings":["[Department of electrical engineering, Indian Institute of Technology Madras, India]"],"affiliations":[{"raw_affiliation_string":"[Department of electrical engineering, Indian Institute of Technology Madras, India]","institution_ids":["https://openalex.org/I24676775"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059221392","display_name":"Raghavendra Bilgi","orcid":null},"institutions":[{"id":"https://openalex.org/I24676775","display_name":"Indian Institute of Technology Madras","ror":"https://ror.org/03v0r5n49","country_code":"IN","type":"funder","lineage":["https://openalex.org/I24676775"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Raghavendra Bilgi","raw_affiliation_strings":["[Department of electrical engineering, Indian Institute of Technology Madras, India]"],"affiliations":[{"raw_affiliation_string":"[Department of electrical engineering, Indian Institute of Technology Madras, India]","institution_ids":["https://openalex.org/I24676775"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085660348","display_name":"S. Umesh","orcid":"https://orcid.org/0000-0002-5957-1444"},"institutions":[{"id":"https://openalex.org/I24676775","display_name":"Indian Institute of Technology Madras","ror":"https://ror.org/03v0r5n49","country_code":"IN","type":"funder","lineage":["https://openalex.org/I24676775"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"S. Umesh","raw_affiliation_strings":["[Department of electrical engineering, Indian Institute of Technology Madras, India]"],"affiliations":[{"raw_affiliation_string":"[Department of electrical engineering, Indian Institute of Technology Madras, India]","institution_ids":["https://openalex.org/I24676775"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013746163","display_name":"Luz Garc\u00eda","orcid":"https://orcid.org/0000-0001-5904-5412"},"institutions":[{"id":"https://openalex.org/I173304897","display_name":"Universidad de Granada","ror":"https://ror.org/04njjy449","country_code":"ES","type":"funder","lineage":["https://openalex.org/I173304897"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"L. Garcia","raw_affiliation_strings":["Dept of Signal Theory, Telematics & Communications. University of Granada, Spain"],"affiliations":[{"raw_affiliation_string":"Dept of Signal Theory, Telematics & Communications. University of Granada, Spain","institution_ids":["https://openalex.org/I173304897"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5032065113","display_name":"Carmen Ben\u0131\u0301tez","orcid":"https://orcid.org/0000-0002-5407-8335"},"institutions":[{"id":"https://openalex.org/I173304897","display_name":"Universidad de Granada","ror":"https://ror.org/04njjy449","country_code":"ES","type":"funder","lineage":["https://openalex.org/I173304897"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"C. Benitez","raw_affiliation_strings":["Dept of Signal Theory, Telematics & Communications. University of Granada, Spain"],"affiliations":[{"raw_affiliation_string":"Dept of Signal Theory, Telematics & Communications. University of Granada, Spain","institution_ids":["https://openalex.org/I173304897"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.209,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":1,"citation_normalized_percentile":{"value":0.218827,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":64,"max":72},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9977,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.6851744},{"id":"https://openalex.org/keywords/vocal-tract","display_name":"Vocal tract","score":0.6527956},{"id":"https://openalex.org/keywords/cepstrum","display_name":"Cepstrum","score":0.5061094},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization","score":0.47475913}],"concepts":[{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.6851744},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6655029},{"id":"https://openalex.org/C47401133","wikidata":"https://www.wikidata.org/wiki/Q748953","display_name":"Vocal tract","level":2,"score":0.6527956},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6476367},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5262151},{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.5061094},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.47475913},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.45692965},{"id":"https://openalex.org/C2221639","wikidata":"https://www.wikidata.org/wiki/Q2877","display_name":"Discrete cosine transform","level":3,"score":0.42750293},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.42608392},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3503654},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.18988451},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.08349475},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2012.6288970","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.72,"display_name":"Peace, justice, and strong institutions"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":9,"referenced_works":["https://openalex.org/W2126597753","https://openalex.org/W2127144047","https://openalex.org/W2139246688","https://openalex.org/W2164931619","https://openalex.org/W2168101424","https://openalex.org/W2406196148","https://openalex.org/W2408673298","https://openalex.org/W257179395","https://openalex.org/W2964579"],"related_works":["https://openalex.org/W3162157266","https://openalex.org/W3044757496","https://openalex.org/W2548564146","https://openalex.org/W2162084437","https://openalex.org/W2108727544","https://openalex.org/W2100012411","https://openalex.org/W2087669554","https://openalex.org/W1997579527","https://openalex.org/W1911592522","https://openalex.org/W1482212662"],"abstract_inverted_index":{"In":[0],"this":[1,87],"paper,":[2],"we":[3,32,138],"propose":[4],"a":[5,83,154],"method":[6],"to":[7,26,146],"compensate":[8],"for":[9],"noise":[10,27,147],"and":[11,28,44,99,148],"speaker-variability":[12],"directly":[13,140],"in":[14,39,49,69,111],"the":[15,40,50,78,97,100,119,129,135],"Log":[16,41,51,70],"filter-bank":[17],"(FB)":[18],"domain,":[19,43],"so":[20],"that":[21,133,143],"MFCC":[22,141],"features":[23,142],"are":[24,144],"robust":[25,145],"speaker-variations.":[29,149],"For":[30,61],"noise-compensation,":[31],"use":[33],"Vector":[34],"Taylor":[35],"Series":[36],"(VTS)":[37],"approach":[38,80,131],"FB":[42,52,71],"speaker-normalization":[45],"is":[46,67,132],"also":[47,108],"done":[48,68,110],"domain":[53,72,113],"using":[54,73,92,105],"Linear":[55],"Vocal":[56],"tract":[57],"length":[58],"(VTLN)":[59],"matrices.":[60],"VTLN,":[62],"optimal":[63],"selection":[64,104],"of":[65,128,158],"warp-factor":[66,103],"canonical":[74],"GMM":[75,98,106],"model,":[76],"avoiding":[77],"two-pass":[79],"needed":[81],"by":[82,114],"HMM":[84],"model.":[85],"Further,":[86],"can":[88,107],"be":[89,109],"efficiently":[90],"implemented":[91],"sufficient":[93],"statistics":[94],"obtained":[95],"from":[96],"FB-VTLN-matrices.":[101],"The":[102,126,150],"cepstral":[112],"applying":[115],"DCT":[116],"matrices":[117],"without":[118],"usual":[120],"approximations":[121],"associated":[122],"with":[123],"conventional":[124],"linear-VTLN.":[125],"elegance":[127],"proposed":[130,151],"given":[134],"speech":[136],"data,":[137],"obtain":[139],"approach,":[152],"show":[153],"significant":[155],"relative":[156],"improvement":[157],"31%":[159],"over":[160],"baseline":[161],"on":[162],"Aurora-4":[163],"task.":[164]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2123702935","counts_by_year":[{"year":2014,"cited_by_count":1}],"updated_date":"2025-03-25T04:13:04.094927","created_date":"2016-06-24"}