{"id":"https://openalex.org/W4391621171","doi":"https://doi.org/10.1109/jiot.2024.3363176","title":"A Multimodal Driver Emotion Recognition Algorithm Based on the Audio and Video Signals in Internet of Vehicles Platform","display_name":"A Multimodal Driver Emotion Recognition Algorithm Based on the Audio and Video Signals in Internet of Vehicles Platform","publication_year":2024,"publication_date":"2024-02-07","ids":{"openalex":"https://openalex.org/W4391621171","doi":"https://doi.org/10.1109/jiot.2024.3363176"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2024.3363176","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101487553","display_name":"Na Ying","orcid":"https://orcid.org/0000-0003-1631-551X"},"institutions":[{"id":"https://openalex.org/I50760025","display_name":"Hangzhou Dianzi University","ror":"https://ror.org/0576gt767","country_code":"CN","type":"education","lineage":["https://openalex.org/I50760025"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Na Ying","raw_affiliation_strings":["School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, China","institution_ids":["https://openalex.org/I50760025"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102614711","display_name":"Yinhe Jiang","orcid":"https://orcid.org/0009-0005-1764-3816"},"institutions":[{"id":"https://openalex.org/I50760025","display_name":"Hangzhou Dianzi University","ror":"https://ror.org/0576gt767","country_code":"CN","type":"education","lineage":["https://openalex.org/I50760025"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yinhe Jiang","raw_affiliation_strings":["School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, China","institution_ids":["https://openalex.org/I50760025"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062010713","display_name":"Chunsheng Guo","orcid":"https://orcid.org/0000-0002-5965-7133"},"institutions":[{"id":"https://openalex.org/I50760025","display_name":"Hangzhou Dianzi University","ror":"https://ror.org/0576gt767","country_code":"CN","type":"education","lineage":["https://openalex.org/I50760025"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chunsheng Guo","raw_affiliation_strings":["School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, China","institution_ids":["https://openalex.org/I50760025"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101674730","display_name":"Di Zhou","orcid":"https://orcid.org/0000-0003-1765-3705"},"institutions":[{"id":"https://openalex.org/I4210106357","display_name":"Zhejiang Energy Research Institute","ror":"https://ror.org/01fqrb109","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210106357"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Di Zhou","raw_affiliation_strings":["Research Institute, Zhejiang Uniview Technologies Company Ltd., Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Research Institute, Zhejiang Uniview Technologies Company Ltd., Hangzhou, China","institution_ids":["https://openalex.org/I4210106357"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5115076567","display_name":"Jian Zhao","orcid":"https://orcid.org/0009-0009-1330-3012"},"institutions":[{"id":"https://openalex.org/I50760025","display_name":"Hangzhou Dianzi University","ror":"https://ror.org/0576gt767","country_code":"CN","type":"education","lineage":["https://openalex.org/I50760025"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Zhao","raw_affiliation_strings":["School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, China","institution_ids":["https://openalex.org/I50760025"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":10.218,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.99995,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"11","issue":"22","first_page":"35812","last_page":"35824"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11373","display_name":"Sleep and Work-Related Fatigue","score":0.998,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10429","display_name":"EEG and Brain-Computer Interfaces","score":0.9854,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.60820985},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.47366577}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8596822},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.60820985},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.47366577},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.46702364},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.45797038},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4332973},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2024.3363176","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.66,"display_name":"Reduced inequalities"}],"grants":[{"funder":"https://openalex.org/F4320338464","funder_display_name":"Natural Science Foundation of Zhejiang Province","award_id":"LTGS23F010001"}],"datasets":[],"versions":[],"referenced_works_count":31,"referenced_works":["https://openalex.org/W2046056978","https://openalex.org/W2047905903","https://openalex.org/W2143350951","https://openalex.org/W2157331557","https://openalex.org/W2481681431","https://openalex.org/W2785627692","https://openalex.org/W2896070351","https://openalex.org/W3005716209","https://openalex.org/W3010526965","https://openalex.org/W3013449349","https://openalex.org/W3013709764","https://openalex.org/W3042183479","https://openalex.org/W3044867770","https://openalex.org/W3081192838","https://openalex.org/W3095435288","https://openalex.org/W3135221627","https://openalex.org/W3139165098","https://openalex.org/W3154740307","https://openalex.org/W3165570722","https://openalex.org/W3165809733","https://openalex.org/W3171335274","https://openalex.org/W3209494353","https://openalex.org/W3213458668","https://openalex.org/W3216153120","https://openalex.org/W4206128048","https://openalex.org/W4206139378","https://openalex.org/W4220829848","https://openalex.org/W4285125856","https://openalex.org/W4312292725","https://openalex.org/W4322706756","https://openalex.org/W4377700521"],"related_works":["https://openalex.org/W4389116644","https://openalex.org/W4205463238","https://openalex.org/W3103844505","https://openalex.org/W2965546495","https://openalex.org/W2761785940","https://openalex.org/W259157601","https://openalex.org/W2521627374","https://openalex.org/W2153315159","https://openalex.org/W2110523656","https://openalex.org/W1482209366"],"abstract_inverted_index":{"Driving":[0],"can":[1,232],"take":[2],"up":[3],"a":[4,21,75,105,112,124,141,151,167,172,182,273],"substantial":[5],"part":[6],"of":[7,44,122,126,192,206,246,260,275,302,312,325],"daily":[8],"life":[9],"and":[10,42,59,74,85,171,211,216,263,266,293,304,316,327],"frequently":[11],"trigger":[12],"negative":[13],"emotions":[14],"like":[15],"anger":[16],"or":[17],"anxiety,":[18],"which":[19,139,231],"have":[20],"significant":[22],"adverse":[23],"impact":[24],"on":[25,252,290,314,318],"driving":[26],"safety":[27,41],"as":[28,30],"well":[29],"long-term":[31],"human":[32],"health.":[33],"To":[34],"identify":[35],"driver":[36,98,199,240],"emotions,":[37],"thereby":[38],"improving":[39],"the":[40,52,91,237,291],"humanization":[43],"intelligent":[45],"driving,":[46],"we":[47,188],"explore":[48],"how":[49],"to":[50,94,116,155,180,225,279],"model":[51,154,160,286],"discriminative":[53,184],"emotion":[54,78,99,200,241],"features":[55,87,146],"from":[56,229],"both":[57,166],"speech":[58,77],"facial":[60,72],"expressions":[61],"in":[62],"this":[63,247,283],"work.":[64],"More":[65],"specifically,":[66],"an":[67,190],"effective":[68],"attention-based":[69],"network":[70,79],"for":[71,198,236],"expression":[73],"lightweight":[76],"are":[80,88,147],"proposed,":[81],"separately.":[82],"Then,":[83],"audio":[84,107],"video":[86,185],"combined":[89],"at":[90],"feature":[92,108,143],"level":[93],"construct":[95],"our":[96],"multimodal":[97,227,239,254,285],"recognition":[100,242,298],"model.":[101],"This":[102,159],"paper":[103],"proposes":[104],"new":[106],"extractor":[109],"that":[110],"uses":[111,223],"multi-scale":[113],"residual":[114],"structure":[115],"extract":[117],"spectrogram":[118],"features.":[119],"In":[120],"terms":[121],"video,":[123],"set":[125],"frame":[127],"sequences":[128],"using":[129,272],"Local":[130],"Binary":[131],"Pattern":[132],"Histograms":[133],"(LBPH)":[134],"is":[135,161,250],"obtained":[136],"through":[137],"preprocessing,":[138],"generates":[140],"fixed-dimensional":[142],"representation.":[144,186],"These":[145],"then":[148],"input":[149],"into":[150],"fine-tuned":[152],"ResNet18":[153],"analyze":[156],"spatial":[157],"information.":[158],"further":[162],"augmented":[163],"by":[164],"integrating":[165],"temporal":[168],"attention":[169],"module":[170],"Gated":[173],"Recurrent":[174],"Unit":[175],"(GRU),":[176],"enhancing":[177],"its":[178],"capability":[179],"create":[181],"highly":[183],"Additionally,":[187,307],"propose":[189],"Internet":[191],"Vehicles":[193],"(IoV)":[194],"platform,":[195],"specifically":[196],"designed":[197],"recognition.":[201],"The":[202,220,244],"IoV":[203,221],"platform":[204,222],"consists":[205],"sensor":[207],"layer,":[208,213],"data":[209,217,228,234],"acquisition":[210],"transport":[212],"server":[214],"layer":[215],"application":[218],"layer.":[219],"sensors":[224],"collect":[226],"drivers,":[230],"provide":[233],"support":[235],"proposed":[238,248,284],"algorithm.":[243],"performance":[245,276],"algorithm":[249],"evaluated":[251],"two":[253],"emotional":[255],"datasets,":[256,295],"Ryerson":[257],"Audio-Visual":[258,268],"Dataset":[259],"Emotional":[261],"Speech":[262],"Song":[264],"(RAVDESS)":[265],"Surrey":[267],"Expressed":[269],"Emotion":[270],"(SAVEE),":[271],"variety":[274],"indicators.":[277],"Compared":[278],"other":[280],"baseline":[281],"methods,":[282],"achieves":[287],"state-of-the-art":[288],"results":[289],"RAVDESS":[292,315],"SAVEE":[294],"demonstrating":[296],"superior":[297],"accuracy":[299],"with":[300,321],"rates":[301],"0.93":[303,313],"0.99,":[305],"respectively.":[306,329],"it":[308],"exhibits":[309],"precision":[310],"scores":[311,324],"0.99":[317,326],"SAVEE,":[319],"along":[320],"exceptional":[322],"specificity":[323],"1.00,":[328]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4391621171","counts_by_year":[{"year":2024,"cited_by_count":4}],"updated_date":"2024-12-12T09:55:31.322235","created_date":"2024-02-08"}