{"id":"https://openalex.org/W3113924821","doi":"https://doi.org/10.18653/v1/2020.coling-main.75","title":"Do Word Embeddings Capture Spelling Variation?","display_name":"Do Word Embeddings Capture Spelling Variation?","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3113924821","doi":"https://doi.org/10.18653/v1/2020.coling-main.75","mag":"3113924821"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2020.coling-main.75","pdf_url":"https://www.aclweb.org/anthology/2020.coling-main.75.pdf","source":{"id":"https://openalex.org/S4363608852","display_name":"Proceedings of the 17th international conference on Computational linguistics -","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://www.aclweb.org/anthology/2020.coling-main.75.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004209770","display_name":"Dong Nguyen","orcid":"https://orcid.org/0000-0002-6062-3117"},"institutions":[{"id":"https://openalex.org/I193662353","display_name":"Utrecht University","ror":"https://ror.org/04pp8hn57","country_code":"NL","type":"education","lineage":["https://openalex.org/I193662353"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Dong Nguyen","raw_affiliation_strings":["Department of Information and Computing Sciences, Utrecht University, the Netherlands"],"affiliations":[{"raw_affiliation_string":"Department of Information and Computing Sciences, Utrecht University, the Netherlands","institution_ids":["https://openalex.org/I193662353"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038175231","display_name":"Jack Grieve","orcid":"https://orcid.org/0000-0003-3630-7349"},"institutions":[{"id":"https://openalex.org/I79619799","display_name":"University of Birmingham","ror":"https://ror.org/03angcq70","country_code":"GB","type":"education","lineage":["https://openalex.org/I79619799"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Jack Grieve","raw_affiliation_strings":["Department of English Language and Linguistics, University of Birmingham, UK"],"affiliations":[{"raw_affiliation_string":"Department of English Language and Linguistics, University of Birmingham, UK","institution_ids":["https://openalex.org/I79619799"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.792,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":10,"citation_normalized_percentile":{"value":0.80582,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":86,"max":87},"biblio":{"volume":null,"issue":null,"first_page":"870","last_page":"881"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9993,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9993,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9984,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.9982,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spelling","display_name":"Spelling","score":0.9521766},{"id":"https://openalex.org/keywords/variation","display_name":"Variation (astronomy)","score":0.89305425},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.617961}],"concepts":[{"id":"https://openalex.org/C2777801307","wikidata":"https://www.wikidata.org/wiki/Q2088390","display_name":"Spelling","level":2,"score":0.9521766},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.89305425},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.75227445},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7328104},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.617961},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.58442265},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.5745903},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.50014424},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.41478726},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.41061503},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.08830798},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.07087013},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C44870925","wikidata":"https://www.wikidata.org/wiki/Q37547","display_name":"Astrophysics","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2020.coling-main.75","pdf_url":"https://www.aclweb.org/anthology/2020.coling-main.75.pdf","source":{"id":"https://openalex.org/S4363608852","display_name":"Proceedings of the 17th international conference on Computational linguistics -","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://dspace.library.uu.nl/handle/1874/414733","pdf_url":"https://dspace.library.uu.nl/bitstream/handle/1874/414733/2020.coling_main.75.pdf?sequence=1&isAllowed=y","source":{"id":"https://openalex.org/S4306401843","display_name":"Data Archiving and Networked Services (DANS)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1322597698","host_organization_name":"Royal Netherlands Academy of Arts and Sciences","host_organization_lineage":["https://openalex.org/I1322597698"],"host_organization_lineage_names":["Royal Netherlands Academy of Arts and Sciences"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2020.coling-main.75","pdf_url":"https://www.aclweb.org/anthology/2020.coling-main.75.pdf","source":{"id":"https://openalex.org/S4363608852","display_name":"Proceedings of the 17th international conference on Computational linguistics -","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"score":0.72,"id":"https://metadata.un.org/sdg/4","display_name":"Quality education"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":50,"referenced_works":["https://openalex.org/W1527708454","https://openalex.org/W1529864641","https://openalex.org/W1629416181","https://openalex.org/W166259489","https://openalex.org/W168564468","https://openalex.org/W1796112755","https://openalex.org/W1868971014","https://openalex.org/W1893888233","https://openalex.org/W1901600440","https://openalex.org/W1972093334","https://openalex.org/W2096438711","https://openalex.org/W2101234009","https://openalex.org/W2101761627","https://openalex.org/W2139661915","https://openalex.org/W2141599568","https://openalex.org/W2146867136","https://openalex.org/W2152815769","https://openalex.org/W2153579005","https://openalex.org/W2159397589","https://openalex.org/W2187089797","https://openalex.org/W2250189634","https://openalex.org/W2250307271","https://openalex.org/W2251803266","https://openalex.org/W2252211741","https://openalex.org/W2296076036","https://openalex.org/W2307311961","https://openalex.org/W2460442863","https://openalex.org/W2493916176","https://openalex.org/W2515741950","https://openalex.org/W2548203103","https://openalex.org/W2732821633","https://openalex.org/W2739638526","https://openalex.org/W2769358515","https://openalex.org/W2793993185","https://openalex.org/W2798819017","https://openalex.org/W2799124508","https://openalex.org/W2806391156","https://openalex.org/W2852714836","https://openalex.org/W2896457183","https://openalex.org/W2906152891","https://openalex.org/W2912564276","https://openalex.org/W2945808722","https://openalex.org/W2962739339","https://openalex.org/W2962776659","https://openalex.org/W2963176474","https://openalex.org/W2963341956","https://openalex.org/W2963430224","https://openalex.org/W2964204621","https://openalex.org/W3098124506","https://openalex.org/W4294170691"],"related_works":["https://openalex.org/W611030372","https://openalex.org/W4298186509","https://openalex.org/W2748952813","https://openalex.org/W2556702969","https://openalex.org/W217221262","https://openalex.org/W2161008081","https://openalex.org/W2100947578","https://openalex.org/W2081317458","https://openalex.org/W1974418053","https://openalex.org/W1555832326"],"abstract_inverted_index":{"Analyses":[0],"of":[1,35,71,77,94,123,129],"word":[2,13,36,57,72,88],"embeddings":[3,14,37,58,89,101],"have":[4,15],"primarily":[5],"focused":[6],"on":[7,32,40,60],"semantic":[8],"and":[9,50,62,126],"syntactic":[10],"properties.":[11],"However,":[12],"the":[16,33,104,121,124,127,130],"potential":[17],"to":[18,97,133],"encode":[19,90],"other":[20],"properties":[21],"as":[22],"well.":[23],"In":[24,43],"this":[25],"paper,":[26],"we":[27,55],"propose":[28],"a":[29,118],"new":[30],"perspective":[31],"analysis":[34],"by":[38],"focusing":[39],"spelling":[41,46,78,91,111],"variation.":[42],"social":[44],"media,":[45],"variation":[47,79,92,125],"is":[48],"abundant":[49],"often":[51],"socially":[52],"meaningful.":[53],"Here,":[54],"analyze":[56],"trained":[59,102],"Twitter":[61],"Reddit":[63],"data.":[64],"We":[65],"present":[66],"three":[67],"analyses":[68],"using":[69,103],"pairs":[70],"forms":[73],"covering":[74],"seven":[75],"types":[76,96],"in":[80],"English.":[81],"Taken":[82],"together,":[83],"our":[84],"results":[85,115],"show":[86],"that":[87],"patterns":[93],"various":[95],"some":[98],"extent,":[99],"even":[100],"skipgram":[105],"model":[106],"which":[107],"does":[108],"not":[109],"take":[110],"into":[112],"account.":[113],"Our":[114],"also":[116],"suggest":[117],"link":[119],"between":[120],"intentionality":[122],"distance":[128],"non-conventional":[131],"spellings":[132],"their":[134],"conventional":[135],"spellings.":[136]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W3113924821","counts_by_year":[{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":3}],"updated_date":"2024-12-13T00:04:19.488710","created_date":"2021-01-05"}