{"id":"https://openalex.org/W4390189773","doi":"https://doi.org/10.1109/dasc/picom/cbdcom/cy59711.2023.10361383","title":"MERGE: Multi-Entity Relational Reasoning Based Explanation in Visual Question Answering","display_name":"MERGE: Multi-Entity Relational Reasoning Based Explanation in Visual Question Answering","publication_year":2023,"publication_date":"2023-11-14","ids":{"openalex":"https://openalex.org/W4390189773","doi":"https://doi.org/10.1109/dasc/picom/cbdcom/cy59711.2023.10361383"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/dasc/picom/cbdcom/cy59711.2023.10361383","pdf_url":null,"source":{"id":"https://openalex.org/S4363605881","display_name":"2021 IEEE Intl Conf on Dependable, Autonomic and Secure Computing, Intl Conf on Pervasive Intelligence and Computing, Intl Conf on Cloud and Big Data Computing, Intl Conf on Cyber Science and Technology Congress (DASC/PiCom/CBDCom/CyberSciTech)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111099890","display_name":"Mengzhu Pan","orcid":null},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"funder","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mengzhu Pan","raw_affiliation_strings":["Nanjing University of Science and Technology, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090335612","display_name":"Qianmu Li","orcid":"https://orcid.org/0000-0002-0998-1517"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"funder","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qianmu Li","raw_affiliation_strings":["Nanjing University of Science and Technology, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101653417","display_name":"Tian Qiu","orcid":"https://orcid.org/0000-0002-8608-5863"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"funder","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiu Tian","raw_affiliation_strings":["Nanjing University of Science and Technology, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":66},"biblio":{"volume":null,"issue":null,"first_page":"1122","last_page":"1129"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.991,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9869,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/merge","display_name":"Merge (version control)","score":0.83445156},{"id":"https://openalex.org/keywords/visual-reasoning","display_name":"Visual reasoning","score":0.6753553},{"id":"https://openalex.org/keywords/spatial-relation","display_name":"Spatial relation","score":0.4835384}],"concepts":[{"id":"https://openalex.org/C197129107","wikidata":"https://www.wikidata.org/wiki/Q1921621","display_name":"Merge (version control)","level":2,"score":0.83445156},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.77313757},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.69461393},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.6753553},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.583802},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5117709},{"id":"https://openalex.org/C27511587","wikidata":"https://www.wikidata.org/wiki/Q2178623","display_name":"Spatial relation","level":2,"score":0.4835384},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.42358145},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37537056}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/dasc/picom/cbdcom/cy59711.2023.10361383","pdf_url":null,"source":{"id":"https://openalex.org/S4363605881","display_name":"2021 IEEE Intl Conf on Dependable, Autonomic and Secure Computing, Intl Conf on Pervasive Intelligence and Computing, Intl Conf on Cloud and Big Data Computing, Intl Conf on Cyber Science and Technology Congress (DASC/PiCom/CBDCom/CyberSciTech)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":48,"referenced_works":["https://openalex.org/W1956340063","https://openalex.org/W2101105183","https://openalex.org/W2154652894","https://openalex.org/W2277195237","https://openalex.org/W2506483933","https://openalex.org/W2600463316","https://openalex.org/W2745461083","https://openalex.org/W2890531016","https://openalex.org/W2936695845","https://openalex.org/W2944851425","https://openalex.org/W2946299408","https://openalex.org/W2947380532","https://openalex.org/W2948519073","https://openalex.org/W2955124656","https://openalex.org/W2962779575","https://openalex.org/W2963150162","https://openalex.org/W2963176022","https://openalex.org/W2963383024","https://openalex.org/W2963521239","https://openalex.org/W2963609017","https://openalex.org/W2963644680","https://openalex.org/W2963717374","https://openalex.org/W2963907629","https://openalex.org/W2963954913","https://openalex.org/W2963991868","https://openalex.org/W2964067226","https://openalex.org/W2964072591","https://openalex.org/W2970019270","https://openalex.org/W2970785793","https://openalex.org/W2973009097","https://openalex.org/W2983256121","https://openalex.org/W2998631105","https://openalex.org/W3004349648","https://openalex.org/W3010535384","https://openalex.org/W3035497460","https://openalex.org/W3035520037","https://openalex.org/W3090449556","https://openalex.org/W3104788521","https://openalex.org/W3133696297","https://openalex.org/W3161801106","https://openalex.org/W3201957104","https://openalex.org/W3204138855","https://openalex.org/W3204924011","https://openalex.org/W3213504576","https://openalex.org/W4226136952","https://openalex.org/W4299522971","https://openalex.org/W4312695920","https://openalex.org/W4320002812"],"related_works":["https://openalex.org/W4390241396","https://openalex.org/W4390091918","https://openalex.org/W4389682534","https://openalex.org/W4309397398","https://openalex.org/W3093385053","https://openalex.org/W3045060014","https://openalex.org/W2964061310","https://openalex.org/W2963477107","https://openalex.org/W2231285690","https://openalex.org/W2138707363"],"abstract_inverted_index":{"To":[0,58,133],"handle":[1],"VQA":[2,29],"tasks":[3],"in":[4,40,107],"complex":[5],"scenarios":[6],"involving":[7],"multiple":[8],"entities":[9,106],"and":[10,25,45,56,75,82,100,120,124,150,158],"obtain":[11],"reliable":[12],"explanations,":[13],"models":[14],"need":[15],"to":[16,53,67,127],"fully":[17],"understand":[18],"the":[19,33,54,69,77,95,104,135,166,174],"high-level":[20],"semantic":[21],"information":[22],"of":[23,35,72,79,97,137,169,176],"visual":[24,64,111],"textual":[26,131],"features.":[27],"Existing":[28],"methods":[30],"usually":[31],"lack":[32],"exploration":[34],"entity":[36],"relation":[37],"features,":[38],"resulting":[39],"insufficient":[41],"answer":[42,125,156,177],"prediction":[43],"accuracy":[44,78,157,175],"generated":[46],"explanations":[47,170],"that":[48,165],"are":[49,113],"not":[50],"sufficiently":[51],"relevant":[52],"image":[55,73],"question.":[57],"address":[59],"this":[60],"issue,":[61],"we":[62,140],"use":[63],"relational":[65],"reasoning":[66],"enhance":[68],"overall":[70],"understanding":[71],"scenes":[74],"improve":[76,173],"predicted":[80],"answers":[81],"explanations.":[83,132,160],"Our":[84],"proposed":[85],"method,":[86,139],"named":[87],"Multi-Entity":[88],"Relational":[89],"Reasoning":[90],"based":[91],"Explanation":[92],"(MERGE),":[93],"leverages":[94],"construction":[96],"action,":[98],"spatial,":[99],"attribute":[101],"relations":[102],"among":[103],"question-related":[105],"images.":[108],"The":[109,152],"contextual":[110],"features":[112],"encoded":[114],"through":[115],"a":[116],"graph":[117],"attention":[118],"mechanism":[119],"fused":[121],"with":[122],"question":[123],"embeddings":[126],"generate":[128],"more":[129],"accurate":[130],"validate":[134],"effectiveness":[136],"our":[138,162],"conducted":[141],"extensive":[142],"experiments":[143],"on":[144],"seven":[145],"datasets,":[146],"including":[147],"VQA-CP,":[148],"VQA-X,":[149],"CLEVR-X.":[151],"results":[153,163],"demonstrate":[154],"improved":[155],"high-quality":[159],"Furthermore,":[161],"show":[164],"supervisory":[167],"role":[168],"can":[171],"quantitatively":[172],"prediction.":[178]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4390189773","counts_by_year":[],"updated_date":"2025-02-19T14:01:14.858826","created_date":"2023-12-26"}