{"id":"https://openalex.org/W2887793820","doi":"https://doi.org/10.23919/wac.2018.8430295","title":"Speaker Recognition for Robotic Control via an IoT Device","display_name":"Speaker Recognition for Robotic Control via an IoT Device","publication_year":2018,"publication_date":"2018-06-01","ids":{"openalex":"https://openalex.org/W2887793820","doi":"https://doi.org/10.23919/wac.2018.8430295","mag":"2887793820"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.23919/wac.2018.8430295","pdf_url":null,"source":{"id":"https://openalex.org/S4363606418","display_name":"2022 World Automation Congress (WAC)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5076372105","display_name":"Zhanibek Kozhirbayev","orcid":"https://orcid.org/0000-0003-4235-9049"},"institutions":[{"id":"https://openalex.org/I10232997","display_name":"L. N. Gumilyov Eurasian National University","ror":"https://ror.org/0242cby63","country_code":"KZ","type":"education","lineage":["https://openalex.org/I10232997"]}],"countries":["KZ"],"is_corresponding":false,"raw_author_name":"Zhanibek Kozhirbayev","raw_affiliation_strings":["Faculty of Information Technologies, L.N.Gumilyov Eurasian National University, Astana, Kazakhstan"],"affiliations":[{"raw_affiliation_string":"Faculty of Information Technologies, L.N.Gumilyov Eurasian National University, Astana, Kazakhstan","institution_ids":["https://openalex.org/I10232997"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091418584","display_name":"Berat A. Erol","orcid":"https://orcid.org/0000-0001-5734-4865"},"institutions":[{"id":"https://openalex.org/I45438204","display_name":"The University of Texas at San Antonio","ror":"https://ror.org/01kd65564","country_code":"US","type":"education","lineage":["https://openalex.org/I45438204"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Berat A. Erol","raw_affiliation_strings":["Autonomous Control Engineering Laboratories, The University of Texas at San Antonio, San Antonio, TX, USA"],"affiliations":[{"raw_affiliation_string":"Autonomous Control Engineering Laboratories, The University of Texas at San Antonio, San Antonio, TX, USA","institution_ids":["https://openalex.org/I45438204"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073789263","display_name":"Altynbek Sharipbay","orcid":"https://orcid.org/0000-0001-5334-1253"},"institutions":[{"id":"https://openalex.org/I10232997","display_name":"L. N. Gumilyov Eurasian National University","ror":"https://ror.org/0242cby63","country_code":"KZ","type":"education","lineage":["https://openalex.org/I10232997"]}],"countries":["KZ"],"is_corresponding":false,"raw_author_name":"Altynbek Sharipbay","raw_affiliation_strings":["Faculty of Information Technologies, L.N.Gumilyov Eurasian National University, Astana, Kazakhstan"],"affiliations":[{"raw_affiliation_string":"Faculty of Information Technologies, L.N.Gumilyov Eurasian National University, Astana, Kazakhstan","institution_ids":["https://openalex.org/I10232997"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5113537394","display_name":"Mo Jamshidi","orcid":null},"institutions":[{"id":"https://openalex.org/I45438204","display_name":"The University of Texas at San Antonio","ror":"https://ror.org/01kd65564","country_code":"US","type":"education","lineage":["https://openalex.org/I45438204"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mo Jamshidi","raw_affiliation_strings":["Autonomous Control Engineering Laboratories, The University of Texas at San Antonio, San Antonio, TX, USA"],"affiliations":[{"raw_affiliation_string":"Autonomous Control Engineering Laboratories, The University of Texas at San Antonio, San Antonio, TX, USA","institution_ids":["https://openalex.org/I45438204"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.737,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":23,"citation_normalized_percentile":{"value":0.857952,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":92},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9993,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9929,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.8183694},{"id":"https://openalex.org/keywords/speaker-identification","display_name":"Speaker identification","score":0.5023229},{"id":"https://openalex.org/keywords/identification","display_name":"Identification","score":0.4505936},{"id":"https://openalex.org/keywords/utterance","display_name":"Utterance","score":0.41701642}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.83122706},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.8183694},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.6991186},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.68049407},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.55116564},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5207577},{"id":"https://openalex.org/C2986627078","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker identification","level":3,"score":0.5023229},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.4505936},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.44686973},{"id":"https://openalex.org/C2775852435","wikidata":"https://www.wikidata.org/wiki/Q258403","display_name":"Utterance","level":2,"score":0.41701642},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.38337502},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.23919/wac.2018.8430295","pdf_url":null,"source":{"id":"https://openalex.org/S4363606418","display_name":"2022 World Automation Congress (WAC)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6,"display_name":"Quality education"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":24,"referenced_works":["https://openalex.org/W1493163583","https://openalex.org/W1504478957","https://openalex.org/W1758466134","https://openalex.org/W1979786508","https://openalex.org/W2006012472","https://openalex.org/W2008957275","https://openalex.org/W2040514520","https://openalex.org/W2045956438","https://openalex.org/W2087992518","https://openalex.org/W2120097768","https://openalex.org/W2123107571","https://openalex.org/W2125572684","https://openalex.org/W2153514218","https://openalex.org/W2160564400","https://openalex.org/W2162905435","https://openalex.org/W2165880886","https://openalex.org/W2295754094","https://openalex.org/W2395750323","https://openalex.org/W2407452468","https://openalex.org/W2529077967","https://openalex.org/W2612380871","https://openalex.org/W2752901856","https://openalex.org/W2791286349","https://openalex.org/W2793150943"],"related_works":["https://openalex.org/W4317383455","https://openalex.org/W4293232884","https://openalex.org/W4234190324","https://openalex.org/W3204851989","https://openalex.org/W3119288895","https://openalex.org/W2548511587","https://openalex.org/W2548162870","https://openalex.org/W2422472940","https://openalex.org/W2185075503","https://openalex.org/W2019475500"],"abstract_inverted_index":{"Speaker":[0],"Recognition":[1],"is":[2,60],"considered":[3],"as":[4,30],"one":[5],"of":[6,65,74,77,118],"the":[7,14,34,56,63,91,115,119,136,147,151],"primary":[8],"tasks":[9],"in":[10,26,105],"speech":[11,37],"processing.":[12],"Nowadays,":[13],"speaker":[15,78,122],"identification":[16,79],"method":[17,49],"has":[18],"been":[19],"extensively":[20],"appealing":[21],"for":[22],"its":[23],"broad":[24],"application":[25],"many":[27],"fields,":[28],"such":[29],"smart":[31],"environments,":[32],"securing":[33],"cyber-physical":[35],"systems,":[36],"communications,":[38],"and":[39],"robotic":[40],"controls.":[41],"Researchers":[42],"are":[43,80],"targeting":[44],"to":[45,54,62,69,113,129],"perform":[46],"an":[47],"effective":[48],"that":[50,59],"makes":[51],"it":[52],"possible":[53],"obtain":[55],"recognition":[57,116,123,148],"ability":[58],"close":[61],"hearing":[64],"human.":[66],"In":[67],"order":[68],"get":[70],"high":[71],"accuracy,":[72],"challenges":[73],"large-scale":[75],"applications":[76],"overcome":[81],"through":[82],"applying":[83],"techniques":[84],"not":[85],"only":[86],"traditional":[87],"models":[88],"based":[89],"on":[90,135],"GMM,":[92],"but":[93],"also":[94],"deep":[95],"learning":[96],"methods.":[97],"Aiming":[98],"at":[99],"effectively":[100],"dealing":[101],"with":[102],"this":[103,106],"challenge,":[104],"paper,":[107],"we":[108],"present":[109],"a":[110,127,131],"novel":[111],"model":[112,155],"increase":[114],"accuracy":[117],"short":[120],"utterance":[121],"system.":[124],"We":[125],"developed":[126],"technique":[128],"train":[130],"Neural":[132],"Network":[133],"(NN)":[134],"extracted":[137],"Mel-Frequency":[138],"Cepstral":[139],"Coefficient":[140],"(MFCC)":[141],"features":[142],"from":[143],"audio":[144],"samples.":[145],"Therefore,":[146],"system":[149],"gains":[150],"significant":[152],"accuracy.":[153],"The":[154],"was":[156],"trained":[157],"using":[158],"open-source":[159],"high-level":[160],"neural":[161],"networks":[162],"API":[163],"Keras.":[164]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2887793820","counts_by_year":[{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":4}],"updated_date":"2024-12-28T20:56:55.064312","created_date":"2018-08-22"}