{"id":"https://openalex.org/W3015046447","doi":"https://doi.org/10.1017/s1351324920000182","title":"Investigating translated Chinese and its variants using machine learning","display_name":"Investigating translated Chinese and its variants using machine learning","publication_year":2020,"publication_date":"2020-04-03","ids":{"openalex":"https://openalex.org/W3015046447","doi":"https://doi.org/10.1017/s1351324920000182","mag":"3015046447"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1017/s1351324920000182","pdf_url":null,"source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069337524","display_name":"Hai Hu","orcid":"https://orcid.org/0000-0002-2289-9008"},"institutions":[{"id":"https://openalex.org/I4210119109","display_name":"Indiana University Bloomington","ror":"https://ror.org/02k40bc56","country_code":"US","type":"funder","lineage":["https://openalex.org/I4210119109","https://openalex.org/I4407990318","https://openalex.org/I592451"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Hai Hu","raw_affiliation_strings":["Department of Linguistics, Indiana University, Bloomington, IN, USA"],"affiliations":[{"raw_affiliation_string":"Department of Linguistics, Indiana University, Bloomington, IN, USA","institution_ids":["https://openalex.org/I4210119109"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009027177","display_name":"Sandra K\u00fcbler","orcid":"https://orcid.org/0000-0003-0885-5436"},"institutions":[{"id":"https://openalex.org/I4210119109","display_name":"Indiana University Bloomington","ror":"https://ror.org/02k40bc56","country_code":"US","type":"funder","lineage":["https://openalex.org/I4210119109","https://openalex.org/I4407990318","https://openalex.org/I592451"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sandra K\u00fcbler","raw_affiliation_strings":["Department of Linguistics, Indiana University, Bloomington, IN, USA"],"affiliations":[{"raw_affiliation_string":"Department of Linguistics, Indiana University, Bloomington, IN, USA","institution_ids":["https://openalex.org/I4210119109"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5069337524"],"corresponding_institution_ids":["https://openalex.org/I4210119109"],"apc_list":null,"apc_paid":null,"fwci":0.945,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.890908,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":88,"max":89},"biblio":{"volume":"27","issue":"3","first_page":"339","last_page":"372"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.9976,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.995,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/linguistic-universal","display_name":"Linguistic universal","score":0.67666036},{"id":"https://openalex.org/keywords/problem-of-universals","display_name":"Problem of universals","score":0.48268226}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8435156},{"id":"https://openalex.org/C79078291","wikidata":"https://www.wikidata.org/wiki/Q980142","display_name":"Linguistic universal","level":3,"score":0.67666036},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.63904274},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.61957335},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.61799926},{"id":"https://openalex.org/C9354725","wikidata":"https://www.wikidata.org/wiki/Q286017","display_name":"Operationalization","level":2,"score":0.60166097},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.5357404},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.5053564},{"id":"https://openalex.org/C16592111","wikidata":"https://www.wikidata.org/wiki/Q6092032","display_name":"Problem of universals","level":2,"score":0.48268226},{"id":"https://openalex.org/C153578388","wikidata":"https://www.wikidata.org/wiki/Q351625","display_name":"Theoretical linguistics","level":2,"score":0.17681077},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1017/s1351324920000182","pdf_url":null,"source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.62,"display_name":"Reduced inequalities"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":57,"referenced_works":["https://openalex.org/W10376690","https://openalex.org/W141389376","https://openalex.org/W1511948402","https://openalex.org/W1536870197","https://openalex.org/W1553669113","https://openalex.org/W1563516561","https://openalex.org/W1593045043","https://openalex.org/W1599248181","https://openalex.org/W1779279021","https://openalex.org/W1939136393","https://openalex.org/W1971020201","https://openalex.org/W1982008367","https://openalex.org/W1995875735","https://openalex.org/W2006832571","https://openalex.org/W2010095917","https://openalex.org/W2054151502","https://openalex.org/W2077779631","https://openalex.org/W2096204319","https://openalex.org/W2101440232","https://openalex.org/W2109625801","https://openalex.org/W2123442489","https://openalex.org/W2133990480","https://openalex.org/W2148365102","https://openalex.org/W2148959489","https://openalex.org/W2149545135","https://openalex.org/W2158664237","https://openalex.org/W2164628107","https://openalex.org/W22168010","https://openalex.org/W2252187216","https://openalex.org/W2462678396","https://openalex.org/W2472237015","https://openalex.org/W2486057246","https://openalex.org/W2486683351","https://openalex.org/W2507666215","https://openalex.org/W2512700785","https://openalex.org/W2552620689","https://openalex.org/W2567204716","https://openalex.org/W2608759623","https://openalex.org/W2610814933","https://openalex.org/W2611874649","https://openalex.org/W2615826748","https://openalex.org/W2806632318","https://openalex.org/W2906113790","https://openalex.org/W2944608091","https://openalex.org/W2954684707","https://openalex.org/W2963160607","https://openalex.org/W3137789548","https://openalex.org/W3140453591","https://openalex.org/W3196602046","https://openalex.org/W417454032","https://openalex.org/W4212974578","https://openalex.org/W4230225957","https://openalex.org/W4253149253","https://openalex.org/W4285719527","https://openalex.org/W593337613","https://openalex.org/W625942373","https://openalex.org/W835791623"],"related_works":["https://openalex.org/W4300920224","https://openalex.org/W4205749443","https://openalex.org/W32544657","https://openalex.org/W2356813761","https://openalex.org/W2327302055","https://openalex.org/W2159029267","https://openalex.org/W2156345224","https://openalex.org/W2103507589","https://openalex.org/W1966962243","https://openalex.org/W1537853517"],"abstract_inverted_index":{"Abstract":[0],"Translations":[1],"are":[2,15,41,107,142,314],"generally":[3],"assumed":[4],"to":[5,154,205,235,244],"share":[6],"universal":[7,85],"features":[8],"that":[9,14,26,61,112,252,313,336],"distinguish":[10],"them":[11],"from":[12,92,199,262,274,296],"texts":[13],"originally":[16],"written":[17],"in":[18,149,181,225,282,337],"the":[19,55,70,84,115,121,127,137,143,166,171,178,182,187,208,275,325,330],"same":[20,71],"language.":[21,57,73],"Thus,":[22],"we":[23,59,135,160,193,288],"can":[24,192,258,278],"argue":[25,60],"these":[27,62],"translations":[28,40,68,91,119,130,246,254,295],"constitute":[29,64],"their":[30,45,215,283],"own":[31],"variety":[32],"of":[33,67,87,145,186,210,291,308],"a":[34,256],"language,":[35],"often":[36,279],"called":[37],"translationese.":[38,292],"However,":[39,97],"also":[42,169],"influenced":[43],"by":[44],"source":[46,56,94,156,276,331],"languages":[47,81,95,102,277,299,332],"and":[48,89,120,151,174,190,213,304,329],"thus":[49],"show":[50,251],"different":[51,65,101,155,211],"characteristics":[52,86,144,179,212,222,312],"depending":[53],"on":[54,79,170,177,196,227,266],"Consequently,":[58],"variants":[63],"\u201cdialects\u201d":[66],"into":[69,114,126,247],"target":[72],"Studies":[74],"using":[75],"machine":[76,203],"learning":[77,204],"techniques":[78],"Indo-European":[80],"have":[82,240],"investigated":[83],"translationese":[88],"how":[90],"various":[93],"differ.":[96],"for":[98,217,317,321],"typologically":[99],"very":[100],"such":[103],"as":[104,123,125,255],"Chinese,":[105,322],"there":[106],"only":[108,164,267],"few":[109],"corpus":[110],"studies":[111,226],"tap":[113],"intricate":[116],"relation":[117],"between":[118,327],"originals,":[122],"well":[124,320],"relations":[128],"among":[129],"themselves.":[131],"In":[132,229],"this":[133],"contribution,":[134],"investigate":[136],"following":[138],"questions:":[139],"(1)":[140],"What":[141],"Chinese":[146,219,253,328],"translationese,":[147],"both":[148],"general":[150],"with":[152,221],"respect":[153],"languages?":[157],"(2)":[158],"Can":[159],"find":[161],"differences":[162],"not":[163,315],"at":[165],"lexical":[167],"but":[168],"syntactic":[172,237],"level?":[173],"(3)":[175],"Based":[176],"found":[180,281],"previous":[183],"questions,":[184],"which":[185,239],"proposed":[188],"laws":[189],"universals":[191],"corroborate":[194],"based":[195,265],"our":[197,218,231],"evidence":[198],"Chinese?":[200],"We":[201],"use":[202,307],"operationalize":[206],"determining":[207],"importance":[209,216],"comparing":[214],"dataset":[220],"previously":[223],"reported":[224],"English.":[228],"addition,":[230],"methodology":[232],"allows":[233],"us":[234],"add":[236],"features,":[238],"rarely":[241],"been":[242],"used":[243],"study":[245],"Chinese.":[248],"Our":[249],"results":[250],"whole":[257],"be":[259,280],"reliably":[260],"distinguished":[261],"non-translations,":[263],"even":[264],"five":[268],"features.":[269],"More":[270],"interestingly,":[271],"typological":[272],"traces":[273],"translations,":[284],"therefore":[285],"creating":[286],"what":[287],"call":[289],"dialects":[290],"For":[293],"instance,":[294],"two":[297],"Altaic":[298],"exhibit":[300],"more":[301],"noun":[302],"repetition":[303],"less":[305],"frequent":[306],"pronouns.":[309],"Additionally,":[310],"some":[311],"discriminative":[316],"English":[318,338],"work":[319],"possibly":[323],"because":[324],"distance":[326],"is":[333],"greater":[334],"than":[335],"studies.":[339]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W3015046447","counts_by_year":[{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":4}],"updated_date":"2025-04-08T12:43:22.784124","created_date":"2020-04-10"}