{"id":"https://openalex.org/W3137069976","doi":"https://doi.org/10.1109/access.2021.3067607","title":"Multi-Gate Attention Network for Image Captioning","display_name":"Multi-Gate Attention Network for Image Captioning","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3137069976","doi":"https://doi.org/10.1109/access.2021.3067607","mag":"3137069976"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3067607","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/9312710/09382255.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/9312710/09382255.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5042991224","display_name":"Weitao Jiang","orcid":"https://orcid.org/0000-0002-7168-9357"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"funder","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weitao Jiang","raw_affiliation_strings":["School of Electronic and Information Technology, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic and Information Technology, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077419230","display_name":"Xiying Li","orcid":"https://orcid.org/0000-0002-4753-8022"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"funder","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiying Li","raw_affiliation_strings":["School of Intelligent Systems Engineering, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Intelligent Systems Engineering, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056953478","display_name":"Haifeng Hu","orcid":"https://orcid.org/0000-0002-4884-323X"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"funder","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haifeng Hu","raw_affiliation_strings":["School of Electronic and Information Technology, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic and Information Technology, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090328879","display_name":"Qiang Lu","orcid":"https://orcid.org/0000-0002-6071-4481"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"funder","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiang Lu","raw_affiliation_strings":["School of Intelligent Systems Engineering, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Intelligent Systems Engineering, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016566450","display_name":"Bohong Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"funder","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bohong Liu","raw_affiliation_strings":["School of Electronic and Information Technology, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic and Information Technology, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":1.978,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":20,"citation_normalized_percentile":{"value":0.622706,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":92,"max":93},"biblio":{"volume":"9","issue":null,"first_page":"69700","last_page":"69709"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9964,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9962,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.8152303},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.45197767},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.4301899}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.8152303},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8084456},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.60864246},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.56720775},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5136623},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.45197767},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.4301899},{"id":"https://openalex.org/C27158222","wikidata":"https://www.wikidata.org/wiki/Q5532422","display_name":"Generalizability theory","level":2,"score":0.42323732},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3769893},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3676859},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3667162},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07656053},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3067607","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/9312710/09382255.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":false,"landing_page_url":"https://doaj.org/article/b0cad34a3a074e79a713e9645b3628e1","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3067607","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/9312710/09382255.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"score":0.47,"id":"https://metadata.un.org/sdg/4","display_name":"Quality education"}],"grants":[{"funder":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China","award_id":"U1611461"},{"funder":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China","award_id":"2018YFB1601101"},{"funder":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China","award_id":"2018YFB1601100"}],"datasets":[],"versions":[],"referenced_works_count":64,"referenced_works":["https://openalex.org/W1514535095","https://openalex.org/W1522301498","https://openalex.org/W1861492603","https://openalex.org/W1895577753","https://openalex.org/W1897761818","https://openalex.org/W1905882502","https://openalex.org/W1956340063","https://openalex.org/W1968001820","https://openalex.org/W1969616664","https://openalex.org/W2101105183","https://openalex.org/W2108598243","https://openalex.org/W2116492146","https://openalex.org/W2149172860","https://openalex.org/W2154652894","https://openalex.org/W2185175083","https://openalex.org/W2194775991","https://openalex.org/W2255466643","https://openalex.org/W2277195237","https://openalex.org/W2296385829","https://openalex.org/W2302086703","https://openalex.org/W2412393473","https://openalex.org/W2506483933","https://openalex.org/W2550553598","https://openalex.org/W2552161745","https://openalex.org/W2558834163","https://openalex.org/W2564898401","https://openalex.org/W2567070169","https://openalex.org/W2575842049","https://openalex.org/W2604522653","https://openalex.org/W2607768201","https://openalex.org/W2613718673","https://openalex.org/W2742141965","https://openalex.org/W2745461083","https://openalex.org/W2794576774","https://openalex.org/W2795151422","https://openalex.org/W2885013662","https://openalex.org/W2890531016","https://openalex.org/W2949376505","https://openalex.org/W2950178297","https://openalex.org/W2962706528","https://openalex.org/W2963084599","https://openalex.org/W2963403868","https://openalex.org/W2963717374","https://openalex.org/W2963807318","https://openalex.org/W2963954913","https://openalex.org/W2963970792","https://openalex.org/W2964018924","https://openalex.org/W2964110616","https://openalex.org/W2964121744","https://openalex.org/W2981992760","https://openalex.org/W2986670728","https://openalex.org/W2990818246","https://openalex.org/W2997945091","https://openalex.org/W3026446890","https://openalex.org/W3034733309","https://openalex.org/W3034772996","https://openalex.org/W3035160838","https://openalex.org/W3035284526","https://openalex.org/W3093272873","https://openalex.org/W3107848485","https://openalex.org/W4385245566","https://openalex.org/W639708223","https://openalex.org/W8316075","https://openalex.org/W956551720"],"related_works":["https://openalex.org/W4388184981","https://openalex.org/W4323777661","https://openalex.org/W4310447809","https://openalex.org/W4210416330","https://openalex.org/W4200243030","https://openalex.org/W3209117276","https://openalex.org/W3088136942","https://openalex.org/W2963177403","https://openalex.org/W2800782462","https://openalex.org/W2775506363"],"abstract_inverted_index":{"Self-attention":[0],"mechanism,":[1],"which":[2,47,80],"has":[3],"been":[4],"successfully":[5],"applied":[6],"to":[7,16,43,104,107,116,147,158],"current":[8,56,133],"encoder-decoder":[9],"framework":[10],"of":[11,211,227],"image":[12,23,134,149,169,182],"captioning,":[13],"is":[14,114],"used":[15],"enhance":[17],"the":[18,22,27,32,60,67,82,101,108,118,124,138,160,181,188,207,212,225],"feature":[19,129,170],"representation":[20],"in":[21,127],"encoder":[24,183],"and":[25,64,94,122,163,184,214],"capture":[26],"most":[28,36,109,132,210],"relevant":[29],"information":[30,126],"for":[31,142,168],"language":[33,144,189],"decoder.":[34],"However,":[35],"existing":[37],"methods":[38,136,219],"will":[39],"assign":[40],"attention":[41,62,102,120],"weights":[42,103],"all":[44,51],"candidate":[45],"vectors,":[46],"implicitly":[48],"hypothesizes":[49],"that":[50,206],"vectors":[52],"are":[53],"relevant.":[54],"Moreover,":[55],"self-attention":[57,84],"mechanisms":[58],"ignore":[59],"intra-object":[61,119],"distribution,":[63],"only":[65],"consider":[66,117],"inter-object":[68],"relationships.":[69],"In":[70],"this":[71],"paper,":[72],"we":[73,153,191],"propose":[74,154],"a":[75,155,193],"Multi-Gate":[76,195],"Attention":[77,89,196],"(MGA)":[78],"block,":[79],"expands":[81],"traditional":[83],"by":[85],"equipping":[86],"with":[87,176,221],"additional":[88],"Weight":[90],"Gate":[91],"(AWG)":[92],"module":[93,186],"Self-Gated":[95],"(SG)":[96],"module.":[97],"The":[98,112,199],"former":[99],"constrains":[100],"be":[105],"assigned":[106],"contributive":[110],"objects.":[111],"latter":[113],"adopted":[115],"distribution":[121],"eliminate":[123],"irrelevant":[125],"object":[128],"vector.":[130],"Furthermore,":[131],"captioning":[135],"apply":[137],"original":[139],"transformer":[140,157,161,178],"designed":[141],"natural":[143],"processing":[145],"task,":[146],"refine":[148],"features":[150],"directly.":[151],"Therefore,":[152],"pre-layernorm":[156,177],"simplify":[159],"architecture":[162,179],"make":[164],"it":[165],"more":[166],"efficient":[167],"enhancement.":[171],"By":[172],"integrating":[173],"MGA":[174,222],"block":[175],"into":[180,187],"AWG":[185],"decoder,":[190],"present":[192],"novel":[194],"Network":[197],"(MGAN).":[198],"experiments":[200,216],"on":[201,217],"MS":[202],"COCO":[203],"dataset":[204],"indicate":[205],"MGAN":[208],"outperforms":[209],"state-of-the-art,":[213],"further":[215],"other":[218],"combined":[220],"blocks":[223],"demonstrate":[224],"generalizability":[226],"our":[228],"proposal.":[229]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W3137069976","counts_by_year":[{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":11},{"year":2022,"cited_by_count":3}],"updated_date":"2025-05-04T06:16:19.107230","created_date":"2021-03-29"}