{"id":"https://openalex.org/W4390533658","doi":"https://doi.org/10.1007/s43926-023-00049-y","title":"Comparative analysis of audio classification with MFCC and STFT features using machine learning techniques","display_name":"Comparative analysis of audio classification with MFCC and STFT features using machine learning techniques","publication_year":2024,"publication_date":"2024-01-03","ids":{"openalex":"https://openalex.org/W4390533658","doi":"https://doi.org/10.1007/s43926-023-00049-y"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1007/s43926-023-00049-y","pdf_url":"https://link.springer.com/content/pdf/10.1007/s43926-023-00049-y.pdf","source":{"id":"https://openalex.org/S4210230675","display_name":"Discover Internet of Things","issn_l":"2730-7239","issn":["2730-7239"],"is_oa":true,"is_in_doaj":true,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://link.springer.com/content/pdf/10.1007/s43926-023-00049-y.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5042779633","display_name":"Mahendra Kumar Gourisaria","orcid":"https://orcid.org/0000-0002-1785-8586"},"institutions":[{"id":"https://openalex.org/I67357951","display_name":"KIIT University","ror":"https://ror.org/00k8zt527","country_code":"IN","type":"funder","lineage":["https://openalex.org/I67357951"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Mahendra Kumar Gourisaria","raw_affiliation_strings":["School of Computer Engineering, KIIT Deemed to Be University, Bhubaneswar, Odisha, 751024, India"],"affiliations":[{"raw_affiliation_string":"School of Computer Engineering, KIIT Deemed to Be University, Bhubaneswar, Odisha, 751024, India","institution_ids":["https://openalex.org/I67357951"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103855547","display_name":"Rakshit Agrawal","orcid":null},"institutions":[{"id":"https://openalex.org/I67357951","display_name":"KIIT University","ror":"https://ror.org/00k8zt527","country_code":"IN","type":"funder","lineage":["https://openalex.org/I67357951"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Rakshit Agrawal","raw_affiliation_strings":["School of Computer Engineering, KIIT Deemed to Be University, Bhubaneswar, Odisha, 751024, India"],"affiliations":[{"raw_affiliation_string":"School of Computer Engineering, KIIT Deemed to Be University, Bhubaneswar, Odisha, 751024, India","institution_ids":["https://openalex.org/I67357951"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048143999","display_name":"Manoj Sahni","orcid":"https://orcid.org/0000-0001-7949-9147"},"institutions":[{"id":"https://openalex.org/I33586908","display_name":"Pandit Deendayal Petroleum University","ror":"https://ror.org/02nsv5p42","country_code":"IN","type":"education","lineage":["https://openalex.org/I33586908"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Manoj Sahni","raw_affiliation_strings":["Department of Mathematics, Pandit Deendayal Energy University, Gandhinagar, Gujarat, 382426, India"],"affiliations":[{"raw_affiliation_string":"Department of Mathematics, Pandit Deendayal Energy University, Gandhinagar, Gujarat, 382426, India","institution_ids":["https://openalex.org/I33586908"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054183825","display_name":"Pradeep Kumar Singh","orcid":"https://orcid.org/0000-0002-7676-9014"},"institutions":[{"id":"https://openalex.org/I4210142231","display_name":"Central University of Jammu","ror":"https://ror.org/03nw1rg94","country_code":"IN","type":"education","lineage":["https://openalex.org/I4210142231"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Pradeep Kumar Singh","raw_affiliation_strings":["Central University of Jammu, Bagla Suchani, Jammu & Kashmir, India"],"affiliations":[{"raw_affiliation_string":"Central University of Jammu, Bagla Suchani, Jammu & Kashmir, India","institution_ids":["https://openalex.org/I4210142231"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5054183825"],"corresponding_institution_ids":["https://openalex.org/I4210142231"],"apc_list":{"value":990,"currency":"EUR","value_usd":1067},"apc_paid":{"value":990,"currency":"EUR","value_usd":1067},"fwci":17.021,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":12,"citation_normalized_percentile":{"value":0.999844,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"4","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9973,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9838,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.79695654},{"id":"https://openalex.org/keywords/audio-analyzer","display_name":"Audio analyzer","score":0.42304924}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8193666},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.79695654},{"id":"https://openalex.org/C2778738651","wikidata":"https://www.wikidata.org/wiki/Q16546687","display_name":"Novelty","level":2,"score":0.48854145},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46122673},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4559177},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4379897},{"id":"https://openalex.org/C166386157","wikidata":"https://www.wikidata.org/wiki/Q1477735","display_name":"Short-time Fourier transform","level":4,"score":0.43121225},{"id":"https://openalex.org/C160372630","wikidata":"https://www.wikidata.org/wiki/Q4819855","display_name":"Audio analyzer","level":5,"score":0.42304924},{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.393418},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3658272},{"id":"https://openalex.org/C127220857","wikidata":"https://www.wikidata.org/wiki/Q2719318","display_name":"Audio signal processing","level":4,"score":0.337714},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2997958},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.19307026},{"id":"https://openalex.org/C102519508","wikidata":"https://www.wikidata.org/wiki/Q6520159","display_name":"Fourier transform","level":2,"score":0.19240862},{"id":"https://openalex.org/C203024314","wikidata":"https://www.wikidata.org/wiki/Q1365258","display_name":"Fourier analysis","level":3,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C27206212","wikidata":"https://www.wikidata.org/wiki/Q34178","display_name":"Theology","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1007/s43926-023-00049-y","pdf_url":"https://link.springer.com/content/pdf/10.1007/s43926-023-00049-y.pdf","source":{"id":"https://openalex.org/S4210230675","display_name":"Discover Internet of Things","issn_l":"2730-7239","issn":["2730-7239"],"is_oa":true,"is_in_doaj":true,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1007/s43926-023-00049-y","pdf_url":"https://link.springer.com/content/pdf/10.1007/s43926-023-00049-y.pdf","source":{"id":"https://openalex.org/S4210230675","display_name":"Discover Internet of Things","issn_l":"2730-7239","issn":["2730-7239"],"is_oa":true,"is_in_doaj":true,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"score":0.52,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":42,"referenced_works":["https://openalex.org/W1996160964","https://openalex.org/W2032360374","https://openalex.org/W2038484192","https://openalex.org/W2054371124","https://openalex.org/W2059652044","https://openalex.org/W2083837083","https://openalex.org/W2104890527","https://openalex.org/W2107495852","https://openalex.org/W2113278353","https://openalex.org/W2114294947","https://openalex.org/W2118344753","https://openalex.org/W2130640900","https://openalex.org/W2139435939","https://openalex.org/W2140227114","https://openalex.org/W2154252319","https://openalex.org/W2263313801","https://openalex.org/W2296748324","https://openalex.org/W2583165630","https://openalex.org/W2751841560","https://openalex.org/W2794150026","https://openalex.org/W2883651221","https://openalex.org/W2895807593","https://openalex.org/W2944702657","https://openalex.org/W2981689685","https://openalex.org/W3007385536","https://openalex.org/W3037146579","https://openalex.org/W3039519447","https://openalex.org/W3040775664","https://openalex.org/W3041548722","https://openalex.org/W3046095786","https://openalex.org/W3082587889","https://openalex.org/W3083566224","https://openalex.org/W3090494684","https://openalex.org/W3097079238","https://openalex.org/W3113043802","https://openalex.org/W3152750834","https://openalex.org/W3155610073","https://openalex.org/W3164769453","https://openalex.org/W3174527197","https://openalex.org/W3196108907","https://openalex.org/W4248229790","https://openalex.org/W47831154"],"related_works":["https://openalex.org/W4387698063","https://openalex.org/W4382560817","https://openalex.org/W4214771044","https://openalex.org/W3110605476","https://openalex.org/W3004352674","https://openalex.org/W2766269877","https://openalex.org/W2494533082","https://openalex.org/W2363106653","https://openalex.org/W2098934641","https://openalex.org/W1975359510"],"abstract_inverted_index":{"Abstract":[0],"In":[1],"the":[2,18,87,102,118,122,129,164,176,183,219,237,244,249,254,257,260,263,273,277,283],"era":[3,32],"of":[4,17,120,124,143,179,185,201,256,285],"automated":[5,126,160],"and":[6,54,61,75,90,112,134,161,173,182,197,215,230,233,247,267,287],"digitalized":[7],"information,":[8],"advanced":[9,125],"computer":[10],"applications":[11],"deal":[12],"with":[13,282],"a":[14,30,82],"major":[15],"part":[16],"data":[19],"that":[20,156,272],"comprises":[21],"audio-related":[22],"information.":[23,64],"Advancements":[24],"in":[25,29,68,85,101,106],"technology":[26],"have":[27,241],"ushered":[28],"new":[31],"where":[33],"cutting-edge":[34],"devices":[35],"can":[36,157],"deliver":[37],"comprehensive":[38],"insights":[39],"into":[40,222],"audio":[41,72,76,153,189,210,220,238,280],"content,":[42],"leveraging":[43],"sophisticated":[44],"algorithms":[45],"such":[46,47],"as":[48],"Mel":[49],"Frequency":[50],"Cepstral":[51],"Coefficients":[52],"(MFCCs)":[53],"Short-Time":[55],"Fourier":[56],"Transform":[57],"(STFT)":[58],"to":[59,147,194,206],"extract":[60],"provide":[62],"pertinent":[63],"Our":[65,269],"study":[66],"helps":[67],"not":[69],"only":[70],"efficient":[71,152,196],"file":[73,77],"management":[74],"retrievals":[78],"but":[79],"also":[80,242],"plays":[81],"vital":[83],"role":[84],"security,":[86],"robotics":[88],"industry,":[89],"investigations.":[91],"Beyond":[92],"its":[93],"industrial":[94,165],"applications,":[95],"our":[96,144,187,202],"model":[97,191,275],"exhibits":[98],"remarkable":[99],"versatility":[100],"corporate":[103,138],"sector,":[104,166],"particularly":[105],"tasks":[107],"like":[108],"siren":[109],"sound":[110],"detection":[111],"more.":[113],"Embracing":[114],"this":[115],"capability":[116],"holds":[117],"promise":[119],"catalyzing":[121],"development":[123],"systems,":[127],"paving":[128],"way":[130],"for":[131,170,252],"increased":[132],"efficiency":[133],"safety":[135],"across":[136],"various":[137,226],"domains.":[139],"The":[140,199],"primary":[141],"aim":[142],"experiment":[145,270],"is":[146],"focus":[148],"on":[149,259,289],"creating":[150],"highly":[151],"classification":[154,190],"models":[155,281],"be":[158,195],"seamlessly":[159],"deployed":[162],"within":[163],"addressing":[167],"critical":[168],"needs":[169],"enhanced":[171],"productivity":[172],"performance.":[174],"Despite":[175],"dynamic":[177],"nature":[178],"environmental":[180],"sounds":[181],"presence":[184],"noises,":[186],"presented":[188],"comes":[192],"out":[193],"accurate.":[198],"novelty":[200],"research":[203],"work":[204],"reclines":[205],"compare":[207],"two":[208],"different":[209],"datasets":[211],"having":[212],"similar":[213],"characteristics":[214],"revolves":[216],"around":[217],"classifying":[218],"signals":[221],"several":[223],"categories":[224],"using":[225],"machine":[227],"learning":[228],"techniques":[229],"extracting":[231],"MFCCs":[232],"STFTs":[234],"features":[235],"from":[236],"signals.":[239],"We":[240],"tested":[243],"results":[245,261],"after":[246],"before":[248],"noise":[250,258],"removal":[251],"analyzing":[253],"effect":[255],"including":[262],"precision,":[264],"recall,":[265],"specificity,":[266],"F1-score.":[268],"shows":[271],"ANN":[274],"outperforms":[276],"other":[278],"six":[279],"accuracy":[284],"91.41%":[286],"91.27%":[288],"respective":[290],"datasets.":[291]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4390533658","counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":9}],"updated_date":"2025-04-25T06:09:26.756818","created_date":"2024-01-04"}