{"id":"https://openalex.org/W4378227416","doi":"https://doi.org/10.1017/s1351324923000190","title":"Morphosyntactic probing of multilingual BERT models","display_name":"Morphosyntactic probing of multilingual BERT models","publication_year":2023,"publication_date":"2023-05-25","ids":{"openalex":"https://openalex.org/W4378227416","doi":"https://doi.org/10.1017/s1351324923000190"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1017/s1351324923000190","pdf_url":"https://www.cambridge.org/core/services/aop-cambridge-core/content/view/8C0D539D3F11FB188AB73228BA7F5805/S1351324923000190a.pdf/div-class-title-morphosyntactic-probing-of-multilingual-bert-models-div.pdf","source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://www.cambridge.org/core/services/aop-cambridge-core/content/view/8C0D539D3F11FB188AB73228BA7F5805/S1351324923000190a.pdf/div-class-title-morphosyntactic-probing-of-multilingual-bert-models-div.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5018650131","display_name":"Judit \u00c1cs","orcid":"https://orcid.org/0000-0003-4918-4333"},"institutions":[{"id":"https://openalex.org/I4210117195","display_name":"Institute for Computer Science and Control","ror":"https://ror.org/0249v7n71","country_code":"HU","type":"facility","lineage":["https://openalex.org/I4210117195","https://openalex.org/I7597260"]},{"id":"https://openalex.org/I29770179","display_name":"Budapest University of Technology and Economics","ror":"https://ror.org/02w42ss30","country_code":"HU","type":"education","lineage":["https://openalex.org/I29770179"]}],"countries":["HU"],"is_corresponding":true,"raw_author_name":"Judit Acs","raw_affiliation_strings":["Department of Automation and Applied Informatics, Faculty of Electrical Engineering and Informatics, Budapest University of Technology and Economics, Budapest, Hungary","Informatics Laboratory, ELKH Institute for Computer Science and Control (SZTAKI), Budapest, Hungary"],"affiliations":[{"raw_affiliation_string":"Informatics Laboratory, ELKH Institute for Computer Science and Control (SZTAKI), Budapest, Hungary","institution_ids":["https://openalex.org/I4210117195"]},{"raw_affiliation_string":"Department of Automation and Applied Informatics, Faculty of Electrical Engineering and Informatics, Budapest University of Technology and Economics, Budapest, Hungary","institution_ids":["https://openalex.org/I29770179"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070578681","display_name":"Endre Hamerlik","orcid":null},"institutions":[{"id":"https://openalex.org/I4210117195","display_name":"Institute for Computer Science and Control","ror":"https://ror.org/0249v7n71","country_code":"HU","type":"facility","lineage":["https://openalex.org/I4210117195","https://openalex.org/I7597260"]},{"id":"https://openalex.org/I74788687","display_name":"Comenius University Bratislava","ror":"https://ror.org/0587ef340","country_code":"SK","type":"education","lineage":["https://openalex.org/I74788687"]}],"countries":["HU","SK"],"is_corresponding":false,"raw_author_name":"Endre Hamerlik","raw_affiliation_strings":["Department of Applied Informatics, Comenius University in Bratislava Faculty of Mathematics Physics and Informatics, Bratislava, Slovakia","Informatics Laboratory, ELKH Institute for Computer Science and Control (SZTAKI), Budapest, Hungary"],"affiliations":[{"raw_affiliation_string":"Informatics Laboratory, ELKH Institute for Computer Science and Control (SZTAKI), Budapest, Hungary","institution_ids":["https://openalex.org/I4210117195"]},{"raw_affiliation_string":"Department of Applied Informatics, Comenius University in Bratislava Faculty of Mathematics Physics and Informatics, Bratislava, Slovakia","institution_ids":["https://openalex.org/I74788687"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007903277","display_name":"Roy Schwartz","orcid":"https://orcid.org/0000-0003-3487-5713"},"institutions":[{"id":"https://openalex.org/I197251160","display_name":"Hebrew University of Jerusalem","ror":"https://ror.org/03qxff017","country_code":"IL","type":"education","lineage":["https://openalex.org/I197251160"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Roy Schwartz","raw_affiliation_strings":["School of Computer Science and Engineering, Hebrew University of Jerusalem, Jerusalem, Israel"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Hebrew University of Jerusalem, Jerusalem, Israel","institution_ids":["https://openalex.org/I197251160"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088517824","display_name":"Noah A. Smith","orcid":"https://orcid.org/0000-0002-2310-6380"},"institutions":[{"id":"https://openalex.org/I4210156221","display_name":"Allen Institute for Artificial Intelligence","ror":"https://ror.org/05w520734","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210156221"]},{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Noah A. Smith","raw_affiliation_strings":["Allen Institute for Artificial Intelligence, Seattle, WA, USA","Paul G. Allen School of Computer Science and Engineering, University of Washington, Seattle, WA, USA"],"affiliations":[{"raw_affiliation_string":"Allen Institute for Artificial Intelligence, Seattle, WA, USA","institution_ids":["https://openalex.org/I4210156221"]},{"raw_affiliation_string":"Paul G. Allen School of Computer Science and Engineering, University of Washington, Seattle, WA, USA","institution_ids":["https://openalex.org/I201448701"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065413313","display_name":"Andr\u00e1s Kornai","orcid":"https://orcid.org/0000-0001-6078-6840"},"institutions":[{"id":"https://openalex.org/I4210117195","display_name":"Institute for Computer Science and Control","ror":"https://ror.org/0249v7n71","country_code":"HU","type":"facility","lineage":["https://openalex.org/I4210117195","https://openalex.org/I7597260"]},{"id":"https://openalex.org/I29770179","display_name":"Budapest University of Technology and Economics","ror":"https://ror.org/02w42ss30","country_code":"HU","type":"education","lineage":["https://openalex.org/I29770179"]}],"countries":["HU"],"is_corresponding":false,"raw_author_name":"Andras Kornai","raw_affiliation_strings":["Department of Algebra, Faculty of Natural Sciences, Budapest University of Technology and Economics","Informatics Laboratory, ELKH Institute for Computer Science and Control (SZTAKI), Budapest, Hungary"],"affiliations":[{"raw_affiliation_string":"Informatics Laboratory, ELKH Institute for Computer Science and Control (SZTAKI), Budapest, Hungary","institution_ids":["https://openalex.org/I4210117195"]},{"raw_affiliation_string":"Department of Algebra, Faculty of Natural Sciences, Budapest University of Technology and Economics","institution_ids":["https://openalex.org/I29770179"]}]}],"institution_assertions":[],"countries_distinct_count":4,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5018650131"],"corresponding_institution_ids":["https://openalex.org/I4210117195","https://openalex.org/I29770179"],"apc_list":null,"apc_paid":null,"fwci":0.352,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":1,"citation_normalized_percentile":{"value":0.606989,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":67,"max":78},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"40"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.993,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.91302097},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6478541},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.64032096},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.6059846},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.60287035},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.60251963},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.51033515},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.47239965},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4429005},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.16128913},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1017/s1351324923000190","pdf_url":"https://www.cambridge.org/core/services/aop-cambridge-core/content/view/8C0D539D3F11FB188AB73228BA7F5805/S1351324923000190a.pdf/div-class-title-morphosyntactic-probing-of-multilingual-bert-models-div.pdf","source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.06205","pdf_url":"http://arxiv.org/pdf/2306.06205","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2306.06205","pdf_url":"https://arxiv.org/pdf/2306.06205","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2306.06205","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1017/s1351324923000190","pdf_url":"https://www.cambridge.org/core/services/aop-cambridge-core/content/view/8C0D539D3F11FB188AB73228BA7F5805/S1351324923000190a.pdf/div-class-title-morphosyntactic-probing-of-multilingual-bert-models-div.pdf","source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"display_name":"Quality education","score":0.79,"id":"https://metadata.un.org/sdg/4"}],"grants":[],"datasets":[],"versions":["https://openalex.org/W4378227416"],"referenced_works_count":62,"referenced_works":["https://openalex.org/W1988865622","https://openalex.org/W2019911971","https://openalex.org/W2024165284","https://openalex.org/W2027889013","https://openalex.org/W2054888858","https://openalex.org/W2099295124","https://openalex.org/W2111460811","https://openalex.org/W2128390429","https://openalex.org/W2250382531","https://openalex.org/W2250539671","https://openalex.org/W2264869955","https://openalex.org/W2292919134","https://openalex.org/W2481240925","https://openalex.org/W2486227503","https://openalex.org/W2492794003","https://openalex.org/W2493916176","https://openalex.org/W2510905642","https://openalex.org/W2511550932","https://openalex.org/W2516090925","https://openalex.org/W2563574619","https://openalex.org/W2572743863","https://openalex.org/W2733687328","https://openalex.org/W2891555348","https://openalex.org/W2892205701","https://openalex.org/W2906152891","https://openalex.org/W2908510526","https://openalex.org/W2914924671","https://openalex.org/W2946417913","https://openalex.org/W2962680795","https://openalex.org/W2962739339","https://openalex.org/W2963250244","https://openalex.org/W2963643701","https://openalex.org/W2963918774","https://openalex.org/W2964204621","https://openalex.org/W2964303116","https://openalex.org/W2970529259","https://openalex.org/W2970862333","https://openalex.org/W2971044268","https://openalex.org/W2990138404","https://openalex.org/W2997900951","https://openalex.org/W3004346089","https://openalex.org/W3013563411","https://openalex.org/W3035137491","https://openalex.org/W3035390927","https://openalex.org/W3088409176","https://openalex.org/W3099668342","https://openalex.org/W3104235057","https://openalex.org/W3155744586","https://openalex.org/W3156886841","https://openalex.org/W3169194986","https://openalex.org/W3173447414","https://openalex.org/W3174770825","https://openalex.org/W3175606037","https://openalex.org/W3176828726","https://openalex.org/W3200130628","https://openalex.org/W3202070718","https://openalex.org/W4205288657","https://openalex.org/W4205945417","https://openalex.org/W4229785665","https://openalex.org/W4298742451","https://openalex.org/W46679369","https://openalex.org/W596964094"],"related_works":["https://openalex.org/W4288365749","https://openalex.org/W4288267738","https://openalex.org/W4287826556","https://openalex.org/W4287598411","https://openalex.org/W3198458223","https://openalex.org/W3098382480","https://openalex.org/W3094871513","https://openalex.org/W3049463507","https://openalex.org/W3013624417","https://openalex.org/W2936497627"],"abstract_inverted_index":{"We":[0,45,63],"introduce":[1],"an":[2],"extensive":[3],"dataset":[4],"for":[5,70,114],"multilingual":[6],"probing":[7,72],"of":[8,24,93,101],"morphological":[9,33],"information":[10,77,121],"in":[11,79],"language":[12],"models":[13,50],"(247":[14],"tasks":[15],"across":[16,60],"42":[17],"languages":[18],"from":[19,40],"10":[20],"families),":[21],"each":[22,71],"consisting":[23],"a":[25,28,32,85,111],"sentence":[26],"with":[27],"target":[29],"word":[30],"and":[31,52],"tag":[34],"as":[35],"the":[36,41,75,80,95,98,115,124,127],"desired":[37],"label,":[38],"derived":[39],"Universal":[42],"Dependencies":[43],"treebanks.":[44],"find":[46],"that":[47,56,89,108],"pre-trained":[48],"Transformer":[49],"(mBERT":[51],"XLM-RoBERTa)":[53],"learn":[54],"features":[55],"attain":[57],"strong":[58,112],"performance":[59],"these":[61],"tasks.":[62],"then":[64],"apply":[65],"two":[66],"methods":[67],"to":[68,118,123],"locate,":[69],"task,":[73],"where":[74],"disambiguating":[76],"resides":[78],"input.":[81],"The":[82,104],"first":[83],"is":[84,97,110],"new":[86],"perturbation":[87],"method":[88,100],"masks":[90],"various":[91],"parts":[92],"context;":[94],"second":[96],"classical":[99],"Shapley":[102],"values.":[103],"most":[105],"intriguing":[106],"finding":[107],"emerges":[109],"tendency":[113],"preceding":[116],"context":[117],"hold":[119],"more":[120],"relevant":[122],"prediction":[125],"than":[126],"following":[128],"context.":[129]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4378227416","counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-01-05T10:15:09.476701","created_date":"2023-05-26"}