{"id":"https://openalex.org/W2166706387","doi":"https://doi.org/10.1109/tasl.2006.885921","title":"Audio Signal Feature Extraction and Classification Using Local Discriminant Bases","display_name":"Audio Signal Feature Extraction and Classification Using Local Discriminant Bases","publication_year":2007,"publication_date":"2007-04-25","ids":{"openalex":"https://openalex.org/W2166706387","doi":"https://doi.org/10.1109/tasl.2006.885921","mag":"2166706387"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/tasl.2006.885921","pdf_url":null,"source":{"id":"https://openalex.org/S199497470","display_name":"IEEE Transactions on Audio Speech and Language Processing","issn_l":"1558-7916","issn":["1558-7916","1558-7924"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101630545","display_name":"Karthikeyan Umapathy","orcid":"https://orcid.org/0000-0002-0152-6472"},"institutions":[{"id":"https://openalex.org/I125749732","display_name":"Western University","ror":"https://ror.org/02grkyz14","country_code":"CA","type":"education","lineage":["https://openalex.org/I125749732"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Karthikeyan Umapathy","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Western Ontario, London, ONT, Canada"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Western Ontario, London, ONT, Canada","institution_ids":["https://openalex.org/I125749732"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086845888","display_name":"Sridhar Krishnan","orcid":"https://orcid.org/0000-0002-4659-564X"},"institutions":[{"id":"https://openalex.org/I530967","display_name":"Toronto Metropolitan University","ror":"https://ror.org/05g13zd79","country_code":"CA","type":"education","lineage":["https://openalex.org/I530967"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Sridhar Krishnan","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Ryerson University, Toronto, ONT, Canada"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Ryerson University, Toronto, ONT, Canada","institution_ids":["https://openalex.org/I530967"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042759215","display_name":"Raveendra K. Rao","orcid":"https://orcid.org/0000-0001-5442-347X"},"institutions":[{"id":"https://openalex.org/I125749732","display_name":"Western University","ror":"https://ror.org/02grkyz14","country_code":"CA","type":"education","lineage":["https://openalex.org/I125749732"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Raveendra K. Rao","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Western Ontario, London, ONT, Canada"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Western Ontario, London, ONT, Canada","institution_ids":["https://openalex.org/I125749732"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":5.918,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":89,"citation_normalized_percentile":{"value":0.97696,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":"15","issue":"4","first_page":"1236","last_page":"1246"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9984,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9621,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/natural-sounds","display_name":"Natural sounds","score":0.507793},{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.4192072}],"concepts":[{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.6872347},{"id":"https://openalex.org/C69738355","wikidata":"https://www.wikidata.org/wiki/Q1228929","display_name":"Linear discriminant analysis","level":2,"score":0.6807833},{"id":"https://openalex.org/C4060165","wikidata":"https://www.wikidata.org/wiki/Q11405","display_name":"Flute","level":2,"score":0.65965056},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.6235987},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6049392},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.57387644},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.54463255},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5155706},{"id":"https://openalex.org/C2780646970","wikidata":"https://www.wikidata.org/wiki/Q6980787","display_name":"Natural sounds","level":2,"score":0.507793},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.49685934},{"id":"https://openalex.org/C127220857","wikidata":"https://www.wikidata.org/wiki/Q2719318","display_name":"Audio signal processing","level":4,"score":0.48539174},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.47884727},{"id":"https://openalex.org/C12362212","wikidata":"https://www.wikidata.org/wiki/Q728435","display_name":"Linear subspace","level":2,"score":0.4383327},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.4192072},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.20406774},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.12138194},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.086269975},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/tasl.2006.885921","pdf_url":null,"source":{"id":"https://openalex.org/S199497470","display_name":"IEEE Transactions on Audio Speech and Language Processing","issn_l":"1558-7916","issn":["1558-7916","1558-7924"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.56,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":33,"referenced_works":["https://openalex.org/W2017608891","https://openalex.org/W2035071469","https://openalex.org/W2058189943","https://openalex.org/W2100488848","https://openalex.org/W2114708606","https://openalex.org/W2115755118","https://openalex.org/W2126049200","https://openalex.org/W2126224661","https://openalex.org/W2127177652","https://openalex.org/W2127489974","https://openalex.org/W2127503407","https://openalex.org/W2129244720","https://openalex.org/W2129316790","https://openalex.org/W2131981197","https://openalex.org/W2132549764","https://openalex.org/W2133401807","https://openalex.org/W2133824856","https://openalex.org/W2135346934","https://openalex.org/W2136246403","https://openalex.org/W2137343183","https://openalex.org/W2139435939","https://openalex.org/W2140623795","https://openalex.org/W2158836148","https://openalex.org/W2161036973","https://openalex.org/W2164024160","https://openalex.org/W2168441989","https://openalex.org/W2168629236","https://openalex.org/W2169790300","https://openalex.org/W3146003712","https://openalex.org/W3146177989","https://openalex.org/W34415881","https://openalex.org/W4236557323","https://openalex.org/W4298266977"],"related_works":["https://openalex.org/W4315836293","https://openalex.org/W4243888788","https://openalex.org/W4231351862","https://openalex.org/W4212794605","https://openalex.org/W3004352674","https://openalex.org/W2970176078","https://openalex.org/W2769884427","https://openalex.org/W2555630001","https://openalex.org/W2289868279","https://openalex.org/W1975359510"],"abstract_inverted_index":{"Audio":[0],"feature":[1,31,60],"extraction":[2,61],"plays":[3],"an":[4,58,199],"important":[5],"role":[6],"in":[7,86,195],"analyzing":[8],"and":[9,19,62,94,133,154,185,198,211,222,228,232,242,248,254,262,308],"characterizing":[10],"audio":[11,22,45,59,117,127,191],"content.":[12],"Auditory":[13],"scene":[14],"analysis,":[15],"content-based":[16],"retrieval,":[17],"indexing,":[18],"fingerprinting":[20],"of":[21,25,44,89,116,137,167,189,203],"are":[23],"few":[24],"the":[26,41,75,87,91,123,126,138,146,164,168,172,206,217,235,271,280,284,294,300,305,311],"applications":[27],"that":[28,39,67],"require":[29],"efficient":[30],"extraction.":[32],"The":[33,99,157,288],"key":[34],"to":[35,48,105,144,270],"extract":[36],"strong":[37],"features":[38,96,101,282,296],"characterize":[40],"complex":[42],"nature":[43],"signals":[46,118,128,192],"is":[47],"identify":[49],"their":[50],"discriminatory":[51,71],"subspaces.":[52],"In":[53,122,268],"this":[54,196],"paper,":[55],"we":[56],"propose":[57],"a":[63,106,112,273],"multigroup":[64],"classification":[65,115,201,275,290],"scheme":[66],"focuses":[68],"on":[69],"identifying":[70],"time-frequency":[72],"subspaces":[73],"using":[74,293],"local":[76],"discriminant":[77,108],"bases":[78],"(LDB)":[79],"technique.":[80],"Two":[81],"dissimilarity":[82],"measures":[83],"were":[84,102,129,142,193,266,297],"used":[85,194],"process":[88],"selecting":[90],"LDB":[92,281],"nodes":[93],"extracting":[95],"from":[97],"them.":[98],"extracted":[100],"then":[103],"fed":[104],"linear":[107],"analysis-based":[109],"classifier":[110],"for":[111,205,216,234,299,304,310],"three-level":[113],"hierarchical":[114],"into":[119,131,171],"ten":[120,174],"classes.":[121],"first":[124,139,207,301],"level,":[125,302,307],"grouped":[130],"artificial":[132,210],"natural":[134,213],"sounds.":[135,156],"Each":[136],"level":[140,148,159,170,208,219,237,313],"groups":[141,149,166,175],"subdivided":[143],"form":[145],"second":[147,169,218,306],"viz.":[150],"instrumental,":[151],"automobile,":[152],"human,":[153],"nonhuman":[155,230],"third":[158,236,312],"was":[160,276],"formed":[161],"by":[162],"subdividing":[163],"four":[165],"final":[173],"(drums,":[176],"flute,":[177,241],"piano,":[178],"aircraft,":[179],"helicopter,":[180],"male,":[181],"female,":[182],"animals,":[183,259],"birds":[184,261],"insects).":[186],"A":[187],"database":[188],"213":[190],"study":[197],"average":[200,289],"accuracy":[202],"83%":[204],"(113":[209],"100":[212],"sounds),":[214,231],"92%":[215],"(73":[220],"instrumental":[221],"40":[223,226],"automobile":[224],"sounds;":[225,245,251],"human":[227],"60":[229],"89%":[233],"(27":[238],"drums,":[239],"15":[240],"31":[243],"piano":[244],"23":[246],"aircraft":[247],"17":[249],"helicopter":[250],"20":[252,255,258,260,263],"male":[253],"female":[256],"speech;":[257],"insects":[264],"sounds)":[265],"achieved.":[267],"addition":[269],"above,":[272],"separate":[274],"also":[277],"performed":[278],"combining":[279],"with":[283],"mel-frequency":[285],"cepstral":[286],"coefficients.":[287],"accuracies":[291],"achieved":[292],"combined":[295],"91%":[298],"99%":[303],"95%":[309]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2166706387","counts_by_year":[{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":9},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":6},{"year":2014,"cited_by_count":9},{"year":2013,"cited_by_count":8},{"year":2012,"cited_by_count":5}],"updated_date":"2024-12-08T22:59:44.129502","created_date":"2016-06-24"}