{"id":"https://openalex.org/W4283019930","doi":"https://doi.org/10.48550/arxiv.2206.07615","title":"The SIGMORPHON 2022 Shared Task on Morpheme Segmentation","display_name":"The SIGMORPHON 2022 Shared Task on Morpheme Segmentation","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4283019930","doi":"https://doi.org/10.48550/arxiv.2206.07615"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2206.07615","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2206.07615","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064991912","display_name":"Khuyagbaatar Batsuren","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Batsuren, Khuyagbaatar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075478426","display_name":"G\u00e1bor Bella","orcid":"https://orcid.org/0000-0002-3868-1740"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bella, G\u00e1bor","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082261951","display_name":"Aryaman Arora","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Arora, Aryaman","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023177581","display_name":"Viktor Martinovi\u0107","orcid":"https://orcid.org/0000-0003-2095-6192"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Martinovi\u0107, Viktor","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011757745","display_name":"Kyle Gorman","orcid":"https://orcid.org/0000-0002-4233-6595"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gorman, Kyle","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088317432","display_name":"Zden\u011bk \u017dabokrtsk\u00fd","orcid":"https://orcid.org/0000-0001-8149-4054"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"\u017dabokrtsk\u00fd, Zden\u011bk","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062041378","display_name":"Amarsanaa Ganbold","orcid":"https://orcid.org/0000-0003-4335-6608"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ganbold, Amarsanaa","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038334101","display_name":"\u0160\u00e1rka Dohnalov\u00e1","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dohnalov\u00e1, \u0160\u00e1rka","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059544000","display_name":"Magda \u0160ev\u010d\u00ed\u00adkov\u00e1","orcid":"https://orcid.org/0000-0003-4780-7912"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"\u0160ev\u010d\u00edkov\u00e1, Magda","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002397331","display_name":"Kate\u0159ina Pelegrinov\u00e1","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pelegrinov\u00e1, Kate\u0159ina","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001227032","display_name":"Fausto Giunchiglia","orcid":"https://orcid.org/0000-0002-5903-6150"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Giunchiglia, Fausto","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061951606","display_name":"Ryan Cotterell","orcid":"https://orcid.org/0000-0003-4080-1833"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cotterell, Ryan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5055467011","display_name":"Ekaterina Vylomova","orcid":"https://orcid.org/0000-0002-4058-5459"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vylomova, Ekaterina","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":60},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9992,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9941,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/text-segmentation","display_name":"Text segmentation","score":0.48980924},{"id":"https://openalex.org/keywords/lexical-analysis","display_name":"Lexical analysis","score":0.4649787},{"id":"https://openalex.org/keywords/word-formation","display_name":"Word formation","score":0.41445768}],"concepts":[{"id":"https://openalex.org/C165297611","wikidata":"https://www.wikidata.org/wiki/Q43249","display_name":"Morpheme","level":2,"score":0.9589522},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.71627736},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7149424},{"id":"https://openalex.org/C2777842544","wikidata":"https://www.wikidata.org/wiki/Q9056","display_name":"Czech","level":2,"score":0.6438314},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.61174786},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5922947},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.5203578},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.5196306},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.50519735},{"id":"https://openalex.org/C98501671","wikidata":"https://www.wikidata.org/wiki/Q1948408","display_name":"Text segmentation","level":3,"score":0.48980924},{"id":"https://openalex.org/C176982825","wikidata":"https://www.wikidata.org/wiki/Q835922","display_name":"Lexical analysis","level":2,"score":0.4649787},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.45267957},{"id":"https://openalex.org/C2777509023","wikidata":"https://www.wikidata.org/wiki/Q327358","display_name":"Word formation","level":2,"score":0.41445768},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.34055224},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2206.07615","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2206.07615","pdf_url":"http://arxiv.org/pdf/2206.07615","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://hdl.handle.net/20.500.11850/588602","pdf_url":"https://www.research-collection.ethz.ch/bitstream/20.500.11850/588602/2/2022.sigmorphon-1.11.pdf","source":{"id":"https://openalex.org/S4306402302","display_name":"Repository for Publications and Research Data (ETH Zurich)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I35440088","host_organization_name":"ETH Zurich","host_organization_lineage":["https://openalex.org/I35440088"],"host_organization_lineage_names":["ETH Zurich"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2206.07615","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2206.07615","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"display_name":"Quality education","score":0.73,"id":"https://metadata.un.org/sdg/4"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W59105588","https://openalex.org/W4388277500","https://openalex.org/W4280575942","https://openalex.org/W3113616367","https://openalex.org/W2791858227","https://openalex.org/W2466768907","https://openalex.org/W2391986003","https://openalex.org/W2361481624","https://openalex.org/W2101234829","https://openalex.org/W2075530739"],"abstract_inverted_index":{"The":[0],"SIGMORPHON":[1],"2022":[2],"shared":[3],"task":[4],"on":[5],"morpheme":[6,32,78],"segmentation":[7],"challenged":[8],"systems":[9,99],"to":[10,72],"decompose":[11],"a":[12,15],"word":[13],"into":[14],"sequence":[16],"of":[17,23,121],"morphemes":[18],"and":[19,27,50,58,96,117,132],"covered":[20,34,80],"most":[21],"types":[22],"morphology:":[24],"compounds,":[25],"derivations,":[26],"inflections.":[28],"Subtask":[29,75],"1,":[30],"word-level":[31],"segmentation,":[33,79],"5":[35],"million":[36],"words":[37],"in":[38,83],"9":[39],"languages":[40,85],"(Czech,":[41,86],"English,":[42,87],"Spanish,":[43],"Hungarian,":[44],"French,":[45],"Italian,":[46],"Russian,":[47],"Latin,":[48],"Mongolian)":[49],"received":[51,89],"13":[52],"system":[53,61,91,127],"submissions":[54,92],"from":[55,93],"7":[56],"teams":[57],"the":[59,97,129],"best":[60,98],"averaged":[62],"97.29%":[63],"F1":[64],"score":[65],"across":[66],"all":[67,101,126,133],"languages,":[68],"ranging":[69],"English":[70],"(93.84%)":[71],"Latin":[73],"(99.38%).":[74],"2,":[76],"sentence-level":[77],"18,735":[81],"sentences":[82],"3":[84,94],"Mongolian),":[88],"10":[90],"teams,":[95],"outperformed":[100],"three":[102],"state-of-the-art":[103],"subword":[104],"tokenization":[105],"methods":[106],"(BPE,":[107],"ULM,":[108],"Morfessor2)":[109],"by":[110],"30.71%":[111],"absolute.":[112],"To":[113],"facilitate":[114],"error":[115],"analysis":[116],"support":[118],"any":[119],"type":[120],"future":[122],"studies,":[123],"we":[124],"released":[125],"predictions,":[128],"evaluation":[130],"script,":[131],"gold":[134],"standard":[135],"datasets.":[136]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4283019930","counts_by_year":[],"updated_date":"2024-12-15T18:07:22.560942","created_date":"2022-06-18"}