{"id":"https://openalex.org/W3170767867","doi":"https://doi.org/10.1145/3447548.3467206","title":"M6: Multi-Modality-to-Multi-Modality Multitask Mega-transformer for Unified Pretraining","display_name":"M6: Multi-Modality-to-Multi-Modality Multitask Mega-transformer for Unified Pretraining","publication_year":2021,"publication_date":"2021-08-13","ids":{"openalex":"https://openalex.org/W3170767867","doi":"https://doi.org/10.1145/3447548.3467206","mag":"3170767867"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/3447548.3467206","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100612233","display_name":"Junyang Lin","orcid":"https://orcid.org/0000-0001-9931-383X"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junyang Lin","raw_affiliation_strings":["Alibaba Group, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Beijing, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004626105","display_name":"Rui Men","orcid":"https://orcid.org/0000-0002-4429-3461"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rui Men","raw_affiliation_strings":["Alibaba Group, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Hangzhou, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100459627","display_name":"Yang An","orcid":"https://orcid.org/0000-0002-6529-1609"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"An Yang","raw_affiliation_strings":["Alibaba Group, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Beijing, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102025315","display_name":"Chang Zhou","orcid":"https://orcid.org/0000-0001-9241-702X"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chang Zhou","raw_affiliation_strings":["Alibaba Group, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Beijing, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013763116","display_name":"Yichang Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yichang Zhang","raw_affiliation_strings":["Alibaba Group, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Beijing, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100396097","display_name":"Peng Wang","orcid":"https://orcid.org/0000-0002-9218-9132"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng Wang","raw_affiliation_strings":["Alibaba Group, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Beijing, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057864403","display_name":"Jingren Zhou","orcid":"https://orcid.org/0000-0002-4220-2634"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingren Zhou","raw_affiliation_strings":["Alibaba Group, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Hangzhou, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044791875","display_name":"Jie Tang","orcid":"https://orcid.org/0000-0003-3487-4593"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"funder","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Tang","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5082599714","display_name":"Hongxia Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongxia Yang","raw_affiliation_strings":["Alibaba Group, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Hangzhou, China","institution_ids":["https://openalex.org/I45928872"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.195,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.836516,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":93,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"3251","last_page":"3261"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9944,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9833,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.78337944},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.6364167},{"id":"https://openalex.org/keywords/multimodal-learning","display_name":"Multimodal learning","score":0.55628824},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.51954204}],"concepts":[{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.78337944},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7426979},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.6364167},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.595485},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.59486246},{"id":"https://openalex.org/C2780660688","wikidata":"https://www.wikidata.org/wiki/Q25052564","display_name":"Multimodal learning","level":2,"score":0.55628824},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.51954204},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.48542485},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.39515105},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/3447548.3467206","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality education","score":0.63,"id":"https://metadata.un.org/sdg/4"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":5,"referenced_works":["https://openalex.org/W2549139847","https://openalex.org/W2970231061","https://openalex.org/W3035485997","https://openalex.org/W3096609285","https://openalex.org/W3102995547"],"related_works":["https://openalex.org/W73545470","https://openalex.org/W4320153225","https://openalex.org/W4307407935","https://openalex.org/W4293261942","https://openalex.org/W4224266612","https://openalex.org/W3125968744","https://openalex.org/W2383394264","https://openalex.org/W2167701463","https://openalex.org/W2110287964","https://openalex.org/W203959209"],"abstract_inverted_index":{"Multimodal":[0],"pretraining":[1,32,44,84],"has":[2,58],"demonstrated":[3],"success":[4],"in":[5,33,45,138,150,171],"the":[6,18,40,86,115,126,134,148,164,172],"downstream":[7,154],"tasks":[8,113,155],"of":[9,27,49,88,120,153,174],"cross-modal":[10],"representation":[11],"learning.":[12,176],"However,":[13],"it":[14],"is":[15,23,96],"limited":[16],"to":[17,78,128],"English":[19],"data,":[20],"and":[21,53,91,122,132,160,163],"there":[22],"still":[24],"a":[25,73,151],"lack":[26],"large-scale":[28],"dataset":[29,42,57],"for":[30,43,82],"multimodal":[31],"Chinese.":[34,139],"In":[35],"this":[36],"work,":[37],"we":[38,71],"propose":[39,72],"largest":[41,135],"Chinese,":[46],"which":[47],"consists":[48],"over":[50,61],"1.9TB":[51],"images":[52],"292GB":[54],"texts.":[55],"The":[56,94,112],"large":[59],"coverage":[60],"domains,":[62],"including":[63,102],"encyclopedia,":[64],"question":[65],"answering,":[66],"forum":[67],"discussion,":[68],"etc.":[69],"Besides,":[70],"method":[74],"called":[75],"M6,":[76],"referring":[77],"Multi-Modality-to-Multi-Modality":[79],"Multitask":[80],"Mega-transformer,":[81],"unified":[83],"on":[85],"data":[87],"single":[89,158],"modality":[90,159],"multiple":[92,161],"modalities.":[93],"model":[95,116,127,137,167],"pretrained":[97,136,166],"with":[98,117],"our":[99,144],"proposed":[100,145],"tasks,":[101],"text-to-text":[103],"transfer,":[104,106],"image-to-text":[105],"as":[107,109],"well":[108],"multi-modality-to-text":[110],"transfer.":[111],"endow":[114],"strong":[118,169],"capability":[119],"understanding":[121],"generation.":[123],"We":[124],"scale":[125],"10":[129],"billion":[130],"parameters,":[131],"build":[133],"Experimental":[140],"results":[141],"show":[142],"that":[143],"M6":[146],"outperforms":[147],"baseline":[149],"number":[152],"concerning":[156],"both":[157],"modalities,":[162],"10B-parameter":[165],"demonstrates":[168],"potential":[170],"setting":[173],"zero-shot":[175]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W3170767867","counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":17},{"year":2022,"cited_by_count":2}],"updated_date":"2025-04-16T17:00:41.964494","created_date":"2021-06-22"}