{"id":"https://openalex.org/W4311001273","doi":"https://doi.org/10.48550/arxiv.2212.04408","title":"OFASys: A Multi-Modal Multi-Task Learning System for Building Generalist Models","display_name":"OFASys: A Multi-Modal Multi-Task Learning System for Building Generalist Models","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4311001273","doi":"https://doi.org/10.48550/arxiv.2212.04408"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2212.04408","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2212.04408","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5063334231","display_name":"Jinze Bai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bai, Jinze","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004626105","display_name":"Rui Men","orcid":"https://orcid.org/0000-0002-4429-3461"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Men, Rui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111385619","display_name":"Yang Hao","orcid":"https://orcid.org/0000-0002-9949-7226"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Hao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049239373","display_name":"Xuancheng Ren","orcid":"https://orcid.org/0000-0002-6994-2114"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ren, Xuancheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014400759","display_name":"Kai Dang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dang, Kai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013763116","display_name":"Yichang Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yichang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102545093","display_name":"Xiaohuan Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Xiaohuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100396039","display_name":"Peng Wang","orcid":"https://orcid.org/0000-0002-5397-9115"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Peng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033146482","display_name":"Sinan Tan","orcid":"https://orcid.org/0000-0002-3299-9336"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tan, Sinan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100459627","display_name":"Yang An","orcid":"https://orcid.org/0000-0002-6529-1609"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, An","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063498611","display_name":"Zeyu Cui","orcid":"https://orcid.org/0000-0003-0017-5292"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cui, Zeyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100462721","display_name":"Han Yu","orcid":"https://orcid.org/0000-0003-1936-5328"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Yu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101014470","display_name":"Shuai Bai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bai, Shuai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013425805","display_name":"Wenbin Ge","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ge, Wenbin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100661619","display_name":"Jianxin Ma","orcid":"https://orcid.org/0009-0000-5214-432X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Jianxin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100612233","display_name":"Junyang Lin","orcid":"https://orcid.org/0000-0001-9931-383X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Junyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057864403","display_name":"Jingren Zhou","orcid":"https://orcid.org/0000-0002-4220-2634"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Jingren","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100613561","display_name":"Chang Zhou","orcid":"https://orcid.org/0000-0002-6029-1132"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Chang","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.824796,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":75,"max":78},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9957,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9957,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9941,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.994,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.5284267},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.45459914}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.87045044},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.6482059},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.62515765},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.5284267},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46444705},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.45459914},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.45426837},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41672757},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2212.04408","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2212.04408","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2212.04408","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"display_name":"Quality education","id":"https://metadata.un.org/sdg/4","score":0.59}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W73545470","https://openalex.org/W649759291","https://openalex.org/W4320153225","https://openalex.org/W4307407935","https://openalex.org/W4293261942","https://openalex.org/W4224266612","https://openalex.org/W3125968744","https://openalex.org/W2383394264","https://openalex.org/W2167701463","https://openalex.org/W2110287964"],"abstract_inverted_index":{"Generalist":[0],"models,":[1,189],"which":[2,154],"are":[3,33],"capable":[4],"of":[5,55,68,79,84,111,142,186,194],"performing":[6],"diverse":[7,132],"multi-modal":[8,48,74,86,133,195],"tasks":[9,150],"in":[10,151,180],"a":[11,15,59,69,96,108,136,158],"task-agnostic":[12],"way":[13],"within":[14],"single":[16,109,160,174],"model,":[17,161],"have":[18],"been":[19],"explored":[20],"recently.":[21],"Being,":[22],"hopefully,":[23],"an":[24,36],"alternative":[25],"to":[26],"approaching":[27],"general-purpose":[28],"AI,":[29],"existing":[30],"generalist":[31,60],"models":[32],"still":[34],"at":[35,201],"early":[37],"stage,":[38],"where":[39],"modality":[40],"and":[41,50,124,146,170],"task":[42,71,87,97,117],"coverage":[43],"is":[44,81],"limited.":[45],"To":[46],"empower":[47],"task-scaling":[49,196],"speed":[51],"up":[52],"this":[53],"line":[54,110],"research,":[56],"we":[57,139,155],"release":[58],"model":[61,92,176],"learning":[62],"system,":[63],"OFASys,":[64,95,152],"built":[65],"on":[66],"top":[67],"declarative":[70],"interface":[72],"named":[73],"instruction.":[75],"At":[76],"the":[77,82,90,191],"core":[78],"OFASys":[80],"idea":[83],"decoupling":[85],"representations":[88],"from":[89,119],"underlying":[91],"implementations.":[93],"In":[94],"involving":[98],"multiple":[99],"modalities":[100,145],"can":[101,164],"be":[102],"defined":[103],"declaratively":[104],"even":[105],"with":[106,153,182],"just":[107],"code.":[112],"The":[113,173],"system":[114],"automatically":[115],"generates":[116],"plans":[118],"such":[120],"instructions":[121],"for":[122,131],"training":[123,130],"inference.":[125],"It":[126],"also":[127,156],"facilitates":[128],"multi-task":[129],"workloads.":[134],"As":[135],"starting":[137],"point,":[138],"provide":[140],"presets":[141],"7":[143],"different":[144],"23":[147],"highly-diverse":[148],"example":[149],"develop":[157],"first-in-kind,":[159],"OFA+,":[162],"that":[163],"handle":[165],"text,":[166],"image,":[167],"speech,":[168],"video,":[169],"motion":[171],"data.":[172],"OFA+":[175],"achieves":[177],"95%":[178],"performance":[179,192],"average":[181],"only":[183],"16%":[184],"parameters":[185],"15":[187],"task-finetuned":[188],"showcasing":[190],"reliability":[193],"provided":[197],"by":[198],"OFASys.":[199],"Available":[200],"https://github.com/OFA-Sys/OFASys":[202]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4311001273","counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2}],"updated_date":"2025-04-23T08:03:08.094898","created_date":"2022-12-22"}