{"id":"https://openalex.org/W4282838846","doi":"https://doi.org/10.1002/cav.2090","title":"SCANET: Improving multimodal representation and fusion with sparse\u2010 and cross\u2010attention for multimodal sentiment analysis","display_name":"SCANET: Improving multimodal representation and fusion with sparse\u2010 and cross\u2010attention for multimodal sentiment analysis","publication_year":2022,"publication_date":"2022-06-01","ids":{"openalex":"https://openalex.org/W4282838846","doi":"https://doi.org/10.1002/cav.2090"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1002/cav.2090","pdf_url":null,"source":{"id":"https://openalex.org/S100062975","display_name":"Computer Animation and Virtual Worlds","issn_l":"1546-4261","issn":["1546-4261","1546-427X"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5083999219","display_name":"Hao Wang","orcid":"https://orcid.org/0000-0001-9866-972X"},"institutions":[{"id":"https://openalex.org/I4387153335","display_name":"China Telecom","ror":"https://ror.org/05p67dv18","country_code":null,"type":"company","lineage":["https://openalex.org/I4387153335"]},{"id":"https://openalex.org/I4210136246","display_name":"China Telecom (China)","ror":"https://ror.org/03jgnzt20","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210136246"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hao Wang","raw_affiliation_strings":["Institute of Big Data and Artificial Intelligence, China Telecom Corporation Limited Beijing Research Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Big Data and Artificial Intelligence, China Telecom Corporation Limited Beijing Research Institute, Beijing, China","institution_ids":["https://openalex.org/I4387153335","https://openalex.org/I4210136246"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037042612","display_name":"Mingchuan Yang","orcid":"https://orcid.org/0000-0003-1511-4265"},"institutions":[{"id":"https://openalex.org/I4387153335","display_name":"China Telecom","ror":"https://ror.org/05p67dv18","country_code":null,"type":"company","lineage":["https://openalex.org/I4387153335"]},{"id":"https://openalex.org/I4210136246","display_name":"China Telecom (China)","ror":"https://ror.org/03jgnzt20","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210136246"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingchuan Yang","raw_affiliation_strings":["Institute of Big Data and Artificial Intelligence, China Telecom Corporation Limited Beijing Research Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Big Data and Artificial Intelligence, China Telecom Corporation Limited Beijing Research Institute, Beijing, China","institution_ids":["https://openalex.org/I4387153335","https://openalex.org/I4210136246"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100415030","display_name":"Zheng Li","orcid":"https://orcid.org/0000-0002-9165-6878"},"institutions":[{"id":"https://openalex.org/I25254941","display_name":"Beijing Normal University","ror":"https://ror.org/022k4wk35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I25254941"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zheng Li","raw_affiliation_strings":["Center for Cognition and Neuroergonomics, State Key Laboratory of Cognitive Neuroscience and Learning, Beijing Normal University at Zhuhai, Guangdong, China"],"affiliations":[{"raw_affiliation_string":"Center for Cognition and Neuroergonomics, State Key Laboratory of Cognitive Neuroscience and Learning, Beijing Normal University at Zhuhai, Guangdong, China","institution_ids":["https://openalex.org/I25254941"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100420220","display_name":"Zhenhua Liu","orcid":"https://orcid.org/0000-0003-2760-3621"},"institutions":[{"id":"https://openalex.org/I4387153335","display_name":"China Telecom","ror":"https://ror.org/05p67dv18","country_code":null,"type":"company","lineage":["https://openalex.org/I4387153335"]},{"id":"https://openalex.org/I4210136246","display_name":"China Telecom (China)","ror":"https://ror.org/03jgnzt20","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210136246"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhenhua Liu","raw_affiliation_strings":["Institute of Big Data and Artificial Intelligence, China Telecom Corporation Limited Beijing Research Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Big Data and Artificial Intelligence, China Telecom Corporation Limited Beijing Research Institute, Beijing, China","institution_ids":["https://openalex.org/I4387153335","https://openalex.org/I4210136246"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066864248","display_name":"Jie Hu","orcid":null},"institutions":[{"id":"https://openalex.org/I4387153335","display_name":"China Telecom","ror":"https://ror.org/05p67dv18","country_code":null,"type":"company","lineage":["https://openalex.org/I4387153335"]},{"id":"https://openalex.org/I4210136246","display_name":"China Telecom (China)","ror":"https://ror.org/03jgnzt20","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210136246"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Hu","raw_affiliation_strings":["Institute of Big Data and Artificial Intelligence, China Telecom Corporation Limited Beijing Research Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Big Data and Artificial Intelligence, China Telecom Corporation Limited Beijing Research Institute, Beijing, China","institution_ids":["https://openalex.org/I4387153335","https://openalex.org/I4210136246"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016048145","display_name":"Ziwang Fu","orcid":"https://orcid.org/0000-0001-7347-6702"},"institutions":[{"id":"https://openalex.org/I4387153335","display_name":"China Telecom","ror":"https://ror.org/05p67dv18","country_code":null,"type":"company","lineage":["https://openalex.org/I4387153335"]},{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"funder","lineage":["https://openalex.org/I139759216"]},{"id":"https://openalex.org/I4210136246","display_name":"China Telecom (China)","ror":"https://ror.org/03jgnzt20","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210136246"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziwang Fu","raw_affiliation_strings":["Institute of Big Data and Artificial Intelligence, China Telecom Corporation Limited Beijing Research Institute, Beijing, China","School of Computer Science, Beijing University of Post and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Big Data and Artificial Intelligence, China Telecom Corporation Limited Beijing Research Institute, Beijing, China","institution_ids":["https://openalex.org/I4387153335","https://openalex.org/I4210136246"]},{"raw_affiliation_string":"School of Computer Science, Beijing University of Post and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5085891781","display_name":"Feng Liu","orcid":"https://orcid.org/0000-0002-5289-5761"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"funder","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Feng Liu","raw_affiliation_strings":["Institute of AI for Education, East China Normal University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of AI for Education, East China Normal University, Shanghai, China","institution_ids":["https://openalex.org/I66867065"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5083999219"],"corresponding_institution_ids":["https://openalex.org/I4387153335","https://openalex.org/I4210136246"],"apc_list":{"value":3040,"currency":"USD","value_usd":3040},"apc_paid":null,"fwci":2.541,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.549215,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":92,"max":93},"biblio":{"volume":"33","issue":"3-4","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9986,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9986,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12032","display_name":"Multisensory perception and integration","score":0.9916,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9872,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.87702024},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.70793676},{"id":"https://openalex.org/keywords/representation","display_name":"Representation","score":0.6675836},{"id":"https://openalex.org/keywords/multimodality","display_name":"Multimodality","score":0.5264521},{"id":"https://openalex.org/keywords/multimodal-learning","display_name":"Multimodal learning","score":0.51402867},{"id":"https://openalex.org/keywords/sentiment-analysis","display_name":"Sentiment Analysis","score":0.47557107}],"concepts":[{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.87702024},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8404394},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.70793676},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6675836},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6117913},{"id":"https://openalex.org/C124066611","wikidata":"https://www.wikidata.org/wiki/Q28684319","display_name":"Sparse approximation","level":2,"score":0.5398592},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.5264521},{"id":"https://openalex.org/C2780660688","wikidata":"https://www.wikidata.org/wiki/Q25052564","display_name":"Multimodal learning","level":2,"score":0.51402867},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.49055976},{"id":"https://openalex.org/C66402592","wikidata":"https://www.wikidata.org/wiki/Q2271421","display_name":"Sentiment analysis","level":2,"score":0.47557107},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3822385},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.35089153},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.33686304},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.09570351},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1002/cav.2090","pdf_url":null,"source":{"id":"https://openalex.org/S100062975","display_name":"Computer Animation and Virtual Worlds","issn_l":"1546-4261","issn":["1546-4261","1546-427X"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":26,"referenced_works":["https://openalex.org/W2095176743","https://openalex.org/W2098689807","https://openalex.org/W2103104224","https://openalex.org/W2122563357","https://openalex.org/W2395639500","https://openalex.org/W2556418146","https://openalex.org/W2883409523","https://openalex.org/W2883430806","https://openalex.org/W2964010806","https://openalex.org/W2964051877","https://openalex.org/W2964110616","https://openalex.org/W2964260444","https://openalex.org/W2964346351","https://openalex.org/W3034266838","https://openalex.org/W3037572520","https://openalex.org/W3093051361","https://openalex.org/W3128412859","https://openalex.org/W3169801598","https://openalex.org/W3177318507","https://openalex.org/W3194765442","https://openalex.org/W3209710747","https://openalex.org/W3214432797","https://openalex.org/W4205727320","https://openalex.org/W4212774754","https://openalex.org/W4287704453","https://openalex.org/W4385270240"],"related_works":["https://openalex.org/W4390136517","https://openalex.org/W4387316634","https://openalex.org/W4381827277","https://openalex.org/W3167558523","https://openalex.org/W3157841754","https://openalex.org/W3120825179","https://openalex.org/W3093803775","https://openalex.org/W3013953798","https://openalex.org/W2563212008","https://openalex.org/W2477990774"],"abstract_inverted_index":{"Abstract":[0],"Learning":[1],"unimodal":[2,61],"representations":[3],"and":[4,42,56,76,84,102,133,136],"improving":[5],"multimodal":[6,12,54,89],"fusion":[7,90,97],"are":[8],"two":[9,74],"cores":[10],"of":[11,53,73,82],"sentiment":[13],"analysis":[14],"(MSA).":[15],"However,":[16],"previous":[17],"methods":[18],"ignore":[19],"the":[20,60,70,78,88,111,131],"information":[21,105],"differences":[22],"between":[23,125],"different":[24],"modalities:":[25],"Text":[26],"modality":[27,104],"has":[28,47],"high\u2010order":[29],"semantic":[30],"features":[31,81,124],"than":[32],"other":[33],"modalities.":[34,86,126],"In":[35,87],"this":[36],"article,":[37],"we":[38,64,92],"propose":[39],"a":[40],"sparse\u2010":[41],"cross\u2010attention":[43],"(SCANET)":[44],"framework":[45],"which":[46,99],"asymmetric":[48,96],"architecture":[49],"to":[50,68,109,120],"improve":[51,69],"performance":[52],"representation":[55,62,71],"fusion.":[57],"Specifically,":[58],"in":[59],"stage,":[63,91],"use":[65],"sparse":[66],"attention":[67],"efficiency":[72],"modalities":[75],"reduce":[77],"low\u2010order":[79],"redundant":[80],"audio":[83,101],"visual":[85,103],"design":[93],"an":[94],"innovative":[95],"module,":[98],"utilizes":[100],"matrix":[106],"as":[107],"weights":[108],"strengthen":[110],"target":[112],"text":[113],"modality.":[114],"We":[115,127],"also":[116],"introduce":[117],"contrastive":[118],"learning":[119],"effectively":[121],"enhance":[122],"complementary":[123],"apply":[128],"SCANET":[129],"on":[130],"CMU\u2010MOSI":[132],"CMU\u2010MOSEI":[134],"datasets,":[135],"experimental":[137],"results":[138],"show":[139],"that":[140],"our":[141],"proposed":[142],"method":[143],"achieves":[144],"state\u2010of\u2010the\u2010art":[145],"performance.":[146]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4282838846","counts_by_year":[{"year":2024,"cited_by_count":8},{"year":2023,"cited_by_count":5}],"updated_date":"2025-02-20T08:50:17.973168","created_date":"2022-06-15"}