{"id":"https://openalex.org/W4396788678","doi":"https://doi.org/10.48550/arxiv.2405.01828","title":"FER-YOLO-Mamba: Facial Expression Detection and Classification Based on\n Selective State Space","display_name":"FER-YOLO-Mamba: Facial Expression Detection and Classification Based on\n Selective State Space","publication_year":2024,"publication_date":"2024-05-02","ids":{"openalex":"https://openalex.org/W4396788678","doi":"https://doi.org/10.48550/arxiv.2405.01828"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2405.01828","pdf_url":"https://arxiv.org/pdf/2405.01828","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2405.01828","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101642586","display_name":"Hui Ma","orcid":"https://orcid.org/0000-0001-8072-4348"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Hui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101004415","display_name":"Sen Lei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lei, Sen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049945687","display_name":"Turgay \u00c7elik","orcid":"https://orcid.org/0000-0001-6925-6010"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Celik, Turgay","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5015155189","display_name":"Heng-Chao Li","orcid":"https://orcid.org/0000-0002-9735-570X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Heng-Chao","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":84},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.8106,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.8106,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/facial-expression-recognition","display_name":"Facial expression recognition","score":0.4448076}],"concepts":[{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.51060516},{"id":"https://openalex.org/C195704467","wikidata":"https://www.wikidata.org/wiki/Q327968","display_name":"Facial expression","level":2,"score":0.48795313},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45033577},{"id":"https://openalex.org/C2987714656","wikidata":"https://www.wikidata.org/wiki/Q1185804","display_name":"Facial expression recognition","level":4,"score":0.4448076},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.43837684},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.40940827},{"id":"https://openalex.org/C31510193","wikidata":"https://www.wikidata.org/wiki/Q1192553","display_name":"Facial recognition system","level":3,"score":0.12947321},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.050216764}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2405.01828","pdf_url":"https://arxiv.org/pdf/2405.01828","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2405.01828","pdf_url":"https://arxiv.org/pdf/2405.01828","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4323520705","https://openalex.org/W4205986151","https://openalex.org/W2356663679","https://openalex.org/W2355913164","https://openalex.org/W2168968280","https://openalex.org/W2162992774","https://openalex.org/W2116055069","https://openalex.org/W2042327336","https://openalex.org/W2033914206","https://openalex.org/W1153638794"],"abstract_inverted_index":{"Facial":[0],"Expression":[1],"Recognition":[2],"(FER)":[3],"plays":[4],"a":[5,42,109],"pivotal":[6],"role":[7],"in":[8,58,95,121,134],"understanding":[9],"human":[10],"emotional":[11],"cues.":[12],"However,":[13],"traditional":[14],"FER":[15,53],"methods":[16],"based":[17],"on":[18,170],"visual":[19],"information":[20],"have":[21],"some":[22],"limitations,":[23],"such":[24],"as":[25],"preprocessing,":[26],"feature":[27,123],"extraction,":[28],"and":[29,69,88,100,156,175],"multi-stage":[30],"classification":[31],"procedures.":[32],"These":[33],"not":[34],"only":[35],"increase":[36],"computational":[37,74],"complexity":[38],"but":[39],"also":[40],"require":[41],"significant":[43],"amount":[44],"of":[45,86,118,129,141,162],"computing":[46],"resources.":[47],"Considering":[48],"Convolutional":[49],"Neural":[50],"Network":[51],"(CNN)-based":[52],"schemes":[54],"frequently":[55],"prove":[56],"inadequate":[57],"identifying":[59],"the":[60,70,79,84,103,115,126,139,146,160,163,182],"deep,":[61],"long-distance":[62,136],"dependencies":[63],"embedded":[64],"within":[65],"facial":[66,96,153],"expression":[67,97,154],"images,":[68],"Transformer's":[71],"inherent":[72,116],"quadratic":[73],"complexity,":[75],"this":[76,144],"paper":[77],"presents":[78],"FER-YOLO-Mamba":[80,104,165,183],"model,":[81,105,166],"which":[82,113],"integrates":[83],"principles":[85],"Mamba":[87,149],"YOLO":[89],"technologies":[90],"to":[91,189],"facilitate":[92],"efficient":[93],"coordination":[94],"image":[98],"recognition":[99],"localization.":[101],"Within":[102],"we":[106,167],"further":[107],"devise":[108],"FER-YOLO-VSS":[110],"dual-branch":[111],"module,":[112],"combines":[114],"strengths":[117],"convolutional":[119],"layers":[120],"local":[122],"extraction":[124],"with":[125],"exceptional":[127],"capability":[128],"State":[130],"Space":[131],"Models":[132],"(SSMs)":[133],"revealing":[135],"dependencies.":[137],"To":[138,158],"best":[140],"our":[142],"knowledge,":[143],"is":[145,194],"first":[147],"Vision":[148],"model":[150,184],"designed":[151],"for":[152],"detection":[155],"classification.":[157],"evaluate":[159],"performance":[161],"proposed":[164],"conducted":[168],"experiments":[169],"two":[171],"benchmark":[172],"datasets,":[173],"RAF-DB":[174],"SFEW.":[176],"The":[177,192],"experimental":[178],"results":[179,187],"indicate":[180],"that":[181],"achieved":[185],"better":[186],"compared":[188],"other":[190],"models.":[191],"code":[193],"available":[195],"from":[196],"https://github.com/SwjtuMa/FER-YOLO-Mamba.":[197]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4396788678","counts_by_year":[],"updated_date":"2024-12-06T23:41:48.903322","created_date":"2024-05-11"}