{"id":"https://openalex.org/W4390051525","doi":"https://doi.org/10.1145/3638248","title":"An Ensemble Strategy with Gradient Conflict for Multi-Domain Neural Machine Translation","display_name":"An Ensemble Strategy with Gradient Conflict for Multi-Domain Neural Machine Translation","publication_year":2023,"publication_date":"2023-12-21","ids":{"openalex":"https://openalex.org/W4390051525","doi":"https://doi.org/10.1145/3638248"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1145/3638248","pdf_url":null,"source":{"id":"https://openalex.org/S4306421405","display_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","issn_l":"2375-4699","issn":["2375-4699","2375-4702"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":"https://doi.org/10.1145/3638248","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044318863","display_name":"Zhibo Man","orcid":"https://orcid.org/0009-0002-3336-5703"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"funder","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhibo Man","raw_affiliation_strings":["School of Computer and Information Technology, Beijing Jiaotong University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Information Technology, Beijing Jiaotong University, China","institution_ids":["https://openalex.org/I21193070"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100412293","display_name":"Yujie Zhang","orcid":"https://orcid.org/0000-0003-1245-0052"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"funder","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yujie Zhang","raw_affiliation_strings":["School of Computer and Information Technology, Beijing Jiaotong University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Information Technology, Beijing Jiaotong University, China","institution_ids":["https://openalex.org/I21193070"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072762520","display_name":"Li Yu","orcid":"https://orcid.org/0000-0002-0569-2267"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"funder","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu Li","raw_affiliation_strings":["School of Computer and Information Technology, Beijing Jiaotong University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Information Technology, Beijing Jiaotong University, China","institution_ids":["https://openalex.org/I21193070"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030215088","display_name":"Yuanmeng Chen","orcid":"https://orcid.org/0000-0003-2572-9300"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"funder","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanmeng Chen","raw_affiliation_strings":["School of Computer and Information Technology, Beijing Jiaotong University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Information Technology, Beijing Jiaotong University, China","institution_ids":["https://openalex.org/I21193070"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100394297","display_name":"Yufeng Chen","orcid":"https://orcid.org/0000-0003-0437-6788"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"funder","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yufeng Chen","raw_affiliation_strings":["School of Computer and Information Technology, Beijing Jiaotong University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Information Technology, Beijing Jiaotong University, China","institution_ids":["https://openalex.org/I21193070"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101698034","display_name":"Jinan Xu","orcid":"https://orcid.org/0000-0003-0170-626X"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"funder","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinan Xu","raw_affiliation_strings":["School of Computer and Information Technology, Beijing Jiaotong University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Information Technology, Beijing Jiaotong University, China","institution_ids":["https://openalex.org/I21193070"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":66},"biblio":{"volume":"23","issue":"2","first_page":"1","last_page":"22"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9856,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.77549875},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.72846955},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.70989096},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.67977834},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.61376184},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5096257},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.50927246},{"id":"https://openalex.org/C164660894","wikidata":"https://www.wikidata.org/wiki/Q2037833","display_name":"Piecewise","level":2,"score":0.48055318},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.41986188},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.39385393},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.33157444},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12902275},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1145/3638248","pdf_url":null,"source":{"id":"https://openalex.org/S4306421405","display_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","issn_l":"2375-4699","issn":["2375-4699","2375-4702"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1145/3638248","pdf_url":null,"source":{"id":"https://openalex.org/S4306421405","display_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","issn_l":"2375-4699","issn":["2375-4699","2375-4702"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"display_name":"Peace, justice, and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.46}],"grants":[{"funder":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China","award_id":"61876198, 61976015, 61976016"}],"datasets":[],"versions":[],"referenced_works_count":50,"referenced_works":["https://openalex.org/W1524281572","https://openalex.org/W2131953535","https://openalex.org/W2187089797","https://openalex.org/W2261339088","https://openalex.org/W2525778437","https://openalex.org/W2567571499","https://openalex.org/W2581863816","https://openalex.org/W2740718109","https://openalex.org/W2740743644","https://openalex.org/W2744813330","https://openalex.org/W2756978580","https://openalex.org/W2759083144","https://openalex.org/W2760452458","https://openalex.org/W2803241009","https://openalex.org/W2892244498","https://openalex.org/W2933138175","https://openalex.org/W2946379889","https://openalex.org/W2954647460","https://openalex.org/W2962784628","https://openalex.org/W2963532001","https://openalex.org/W2963983698","https://openalex.org/W2970286654","https://openalex.org/W2990804422","https://openalex.org/W2997936605","https://openalex.org/W3034112745","https://openalex.org/W3034640977","https://openalex.org/W3034771276","https://openalex.org/W3106539628","https://openalex.org/W3116179216","https://openalex.org/W3170463198","https://openalex.org/W3174805484","https://openalex.org/W3196757209","https://openalex.org/W3199890931","https://openalex.org/W3206604436","https://openalex.org/W3212494843","https://openalex.org/W4225927944","https://openalex.org/W4226203238","https://openalex.org/W4285223438","https://openalex.org/W4285306484","https://openalex.org/W4287213465","https://openalex.org/W4287887789","https://openalex.org/W4287889965","https://openalex.org/W4297782088","https://openalex.org/W4297841743","https://openalex.org/W4297969478","https://openalex.org/W4300695819","https://openalex.org/W4300835687","https://openalex.org/W4307315281","https://openalex.org/W4365799947","https://openalex.org/W4388983924"],"related_works":["https://openalex.org/W4388145910","https://openalex.org/W4248336175","https://openalex.org/W2883671469","https://openalex.org/W2728761353","https://openalex.org/W2391445434","https://openalex.org/W2381570729","https://openalex.org/W2366107444","https://openalex.org/W2348315137","https://openalex.org/W2031260042","https://openalex.org/W1976205134"],"abstract_inverted_index":{"Multi-domain":[0],"neural":[1,9,49],"machine":[2,10,50],"translation":[3,11,51],"aims":[4],"to":[5,13,28,85,105,124,147],"construct":[6],"a":[7,70,101,116],"unified":[8],"model":[12,55,145],"translate":[14],"sentences":[15],"across":[16],"various":[17],"domains.":[18],"Nevertheless,":[19],"previous":[20,148],"studies":[21],"have":[22],"one":[23],"limitation":[24],"is":[25],"the":[26,74,78,121,127,139],"incapacity":[27],"acquire":[29],"both":[30,59],"domain-general":[31],"and":[32,61,83,88,108],"domain-specific":[33,62],"representations":[34],"concurrently.":[35],"To":[36],"this":[37],"end,":[38],"we":[39,94,114],"propose":[40],"an":[41,96],"ensemble":[42,90],"strategy":[43,99],"with":[44],"gradient":[45,110,122],"conflict":[46,123],"for":[47],"multi-domain":[48,136],"that":[52],"automatically":[53],"learns":[54],"parameters":[56,75],"by":[57],"identifying":[58],"domain-shared":[60],"features.":[63],"Specifically,":[64],"our":[65,130,143],"approach":[66],"consists":[67],"of":[68,76,120,129,142],"(1)":[69],"parameter-sharing":[71],"framework,":[72],"where":[73],"all":[77],"layers":[79],"are":[80],"originally":[81],"shared":[82],"equivalent":[84],"each":[86],"domain,":[87],"(2)":[89],"strategy,":[91],"in":[92],"which":[93],"design":[95],"Extra":[97],"Ensemble":[98],"via":[100],"piecewise":[102],"condition":[103],"function":[104],"learn":[106],"direction":[107],"distance-based":[109],"conflict.":[111],"In":[112],"addition,":[113],"give":[115],"detailed":[117],"theoretical":[118],"analysis":[119],"further":[125],"validate":[126],"effectiveness":[128],"approach.":[131],"Experimental":[132],"results":[133],"on":[134],"two":[135],"datasets":[137],"show":[138],"superior":[140],"performance":[141],"proposed":[144],"compared":[146],"work.":[149]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4390051525","counts_by_year":[],"updated_date":"2025-02-28T22:09:50.151425","created_date":"2023-12-22"}