{"id":"https://openalex.org/W4296762131","doi":"https://doi.org/10.48550/arxiv.2204.07834","title":"Bridging Cross-Lingual Gaps During Leveraging the Multilingual Sequence-to-Sequence Pretraining for Text Generation and Understanding","display_name":"Bridging Cross-Lingual Gaps During Leveraging the Multilingual Sequence-to-Sequence Pretraining for Text Generation and Understanding","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4296762131","doi":"https://doi.org/10.48550/arxiv.2204.07834"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2204.07834","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2204.07834","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007802059","display_name":"Changtong Zan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zan, Changtong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100456723","display_name":"Liang Ding","orcid":"https://orcid.org/0000-0001-8976-2084"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ding, Liang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100333320","display_name":"Li Shen","orcid":"https://orcid.org/0000-0002-5443-0503"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Li","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100780040","display_name":"Yu Cao","orcid":"https://orcid.org/0009-0006-7562-5680"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Yu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100444161","display_name":"Weifeng Liu","orcid":"https://orcid.org/0000-0002-7798-797X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Weifeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5074103823","display_name":"Dacheng Tao","orcid":"https://orcid.org/0000-0001-7225-5449"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tao, Dacheng","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.60916,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":59,"max":69},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9993,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9993,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9992,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9869,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sequence-labeling","display_name":"Sequence labeling","score":0.48435342}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8352406},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.68708485},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6239772},{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.56149286},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.53877634},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.5015967},{"id":"https://openalex.org/C35639132","wikidata":"https://www.wikidata.org/wiki/Q7452468","display_name":"Sequence labeling","level":3,"score":0.48435342},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.47564244},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.45123088},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.44418472},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.35559723},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2204.07834","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2204.07834","pdf_url":"http://arxiv.org/pdf/2204.07834","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2204.07834","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2204.07834","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"display_name":"Quality education","score":0.82,"id":"https://metadata.un.org/sdg/4"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4389760904","https://openalex.org/W4379251483","https://openalex.org/W4322096459","https://openalex.org/W4284703357","https://openalex.org/W3148229873","https://openalex.org/W3042366391","https://openalex.org/W2366403280","https://openalex.org/W2150160875","https://openalex.org/W2091301346","https://openalex.org/W1495108544"],"abstract_inverted_index":{"For":[0],"multilingual":[1,102],"sequence-to-sequence":[2],"pretrained":[3],"language":[4,39,148],"models":[5],"(multilingual":[6],"Seq2Seq":[7,103],"PLMs),":[8],"e.g.":[9,24,41],"mBART,":[10],"the":[11,30,46,61,68,77,87,91,101,113,118,155,170,179,188],"self-supervised":[12,92],"pretraining":[13,62],"task":[14,58,73,95],"is":[15],"trained":[16],"on":[17,36,120,125],"a":[18,37,97],"wide":[19],"range":[20],"of":[21,173],"monolingual":[22],"languages,":[23],"25":[25],"languages":[26],"from":[27],"CommonCrawl,":[28],"while":[29],"downstream":[31,121],"cross-lingual":[32,53,70,139,146,174],"tasks":[33],"generally":[34],"progress":[35],"bilingual":[38,130],"subset,":[40],"English-German,":[42],"making":[43],"there":[44],"exists":[45],"data":[47,122],"discrepancy,":[48,51,56,59],"namely":[49,57],"domain":[50,71],"and":[52,63,72,137,142,177],"learning":[54],"objective":[55],"between":[60],"finetuning":[64,161],"stages.":[65],"To":[66],"bridge":[67],"above":[69],"gaps,":[74],"we":[75,116],"extend":[76],"vanilla":[78],"pretrain-finetune":[79],"pipeline":[80],"with":[81,159,182],"extra":[82],"code-switching":[83,93],"restore":[84,94],"task.":[85],"Specifically,":[86],"first":[88],"stage":[89],"employs":[90],"as":[96],"pretext":[98],"task,":[99],"allowing":[100],"PLMs":[104],"to":[105],"acquire":[106],"some":[107],"in-domain":[108],"alignment":[109],"information.":[110],"And":[111],"for":[112],"second":[114],"stage,":[115],"fine-tune":[117],"model":[119,153,180],"normally.":[123],"Experiments":[124],"both":[126],"NLG":[127],"evaluation":[128,144],"(12":[129],"translation":[131,135],"tasks,":[132,136],"30":[133],"zero-shot":[134],"2":[138],"summarization":[140],"tasks)":[141,150],"NLU":[143],"(7":[145],"natural":[147],"inference":[149],"show":[151],"our":[152,166],"outperforms":[154],"strong":[156],"baseline":[157],"mBART":[158],"standard":[160],"strategy,":[162],"consistently.":[163],"Analyses":[164],"indicate":[165],"approach":[167],"could":[168],"narrow":[169],"Euclidean":[171],"distance":[172],"sentence":[175],"representations,":[176],"improve":[178],"generalization":[181],"trivial":[183],"computational":[184],"cost.":[185],"We":[186],"release":[187],"code":[189],"at:":[190],"https://github.com/zanchangtong/CSR4mBART.":[191]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4296762131","counts_by_year":[{"year":2023,"cited_by_count":1}],"updated_date":"2025-04-18T14:32:44.348016","created_date":"2022-09-23"}