{"id":"https://openalex.org/W2251843872","doi":"https://doi.org/10.3115/v1/w14-3908","title":"Word-level Language Identification using CRF: Code-switching Shared Task Report of MSR India System","display_name":"Word-level Language Identification using CRF: Code-switching Shared Task Report of MSR India System","publication_year":2014,"publication_date":"2014-01-01","ids":{"openalex":"https://openalex.org/W2251843872","doi":"https://doi.org/10.3115/v1/w14-3908","mag":"2251843872"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/w14-3908","pdf_url":"https://aclanthology.org/W14-3908.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://aclanthology.org/W14-3908.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013274923","display_name":"Gokul Chittaranjan","orcid":null},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"funder","lineage":["https://openalex.org/I66946132"]},{"id":"https://openalex.org/I4210124949","display_name":"Microsoft Research (India)","ror":"https://ror.org/02w7f3w92","country_code":"IN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210124949"]}],"countries":["IN","US"],"is_corresponding":false,"raw_author_name":"Gokul Chittaranjan","raw_affiliation_strings":["Microsoft Research India","University of Maryland"],"affiliations":[{"raw_affiliation_string":"University of Maryland","institution_ids":["https://openalex.org/I66946132"]},{"raw_affiliation_string":"Microsoft Research India","institution_ids":["https://openalex.org/I4210124949","https://openalex.org/I4210124949"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008851653","display_name":"Yogarshi Vyas","orcid":null},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"funder","lineage":["https://openalex.org/I66946132"]},{"id":"https://openalex.org/I4210124949","display_name":"Microsoft Research (India)","ror":"https://ror.org/02w7f3w92","country_code":"IN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210124949"]}],"countries":["IN","US"],"is_corresponding":false,"raw_author_name":"Yogarshi Vyas","raw_affiliation_strings":["Microsoft Research India","University of Maryland"],"affiliations":[{"raw_affiliation_string":"University of Maryland","institution_ids":["https://openalex.org/I66946132"]},{"raw_affiliation_string":"Microsoft Research India","institution_ids":["https://openalex.org/I4210124949","https://openalex.org/I4210124949"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013639574","display_name":"Kalika Bali","orcid":"https://orcid.org/0000-0001-9275-742X"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"funder","lineage":["https://openalex.org/I66946132"]},{"id":"https://openalex.org/I4210124949","display_name":"Microsoft Research (India)","ror":"https://ror.org/02w7f3w92","country_code":"IN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210124949"]}],"countries":["IN","US"],"is_corresponding":false,"raw_author_name":"Kalika Bali","raw_affiliation_strings":["Microsoft Research India","University of Maryland"],"affiliations":[{"raw_affiliation_string":"University of Maryland","institution_ids":["https://openalex.org/I66946132"]},{"raw_affiliation_string":"Microsoft Research India","institution_ids":["https://openalex.org/I4210124949","https://openalex.org/I4210124949"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008944385","display_name":"Monojit Choudhury","orcid":"https://orcid.org/0000-0001-7473-7839"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"funder","lineage":["https://openalex.org/I66946132"]},{"id":"https://openalex.org/I4210124949","display_name":"Microsoft Research (India)","ror":"https://ror.org/02w7f3w92","country_code":"IN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210124949"]}],"countries":["IN","US"],"is_corresponding":false,"raw_author_name":"Monojit Choudhury","raw_affiliation_strings":["Microsoft Research India","University of Maryland"],"affiliations":[{"raw_affiliation_string":"University of Maryland","institution_ids":["https://openalex.org/I66946132"]},{"raw_affiliation_string":"Microsoft Research India","institution_ids":["https://openalex.org/I4210124949","https://openalex.org/I4210124949"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.3,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":70,"citation_normalized_percentile":{"value":0.912934,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.9982,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.994,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/identification","display_name":"Identification","score":0.5299754},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.45939538}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.77073514},{"id":"https://openalex.org/C18552078","wikidata":"https://www.wikidata.org/wiki/Q255615","display_name":"Code-switching","level":2,"score":0.724453},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.66263956},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.63872105},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5299754},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.48163858},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.45939538},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.44503722},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3507232},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2746657},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.1688242},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09206161},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/w14-3908","pdf_url":"https://aclanthology.org/W14-3908.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.671.8903","pdf_url":"http://www.aclweb.org/anthology/W/W14/W14-3908.pdf","source":{"id":"https://openalex.org/S4306400349","display_name":"CiteSeer X (The Pennsylvania State University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I130769515","host_organization_name":"Pennsylvania State University","host_organization_lineage":["https://openalex.org/I130769515"],"host_organization_lineage_names":["Pennsylvania State University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/w14-3908","pdf_url":"https://aclanthology.org/W14-3908.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"score":0.67,"id":"https://metadata.un.org/sdg/4","display_name":"Quality education"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":18,"referenced_works":["https://openalex.org/W2013489815","https://openalex.org/W2037615273","https://openalex.org/W2061272101","https://openalex.org/W2068130800","https://openalex.org/W2115616427","https://openalex.org/W2123660869","https://openalex.org/W2132609289","https://openalex.org/W2145867197","https://openalex.org/W2147880316","https://openalex.org/W2251149908","https://openalex.org/W2275309193","https://openalex.org/W2329583173","https://openalex.org/W2477899819","https://openalex.org/W2759478409","https://openalex.org/W4212942762","https://openalex.org/W4251217171","https://openalex.org/W4403817633","https://openalex.org/W941093546"],"related_works":["https://openalex.org/W4389976243","https://openalex.org/W3158134258","https://openalex.org/W3138119129","https://openalex.org/W3002509766","https://openalex.org/W2974240475","https://openalex.org/W2940588741","https://openalex.org/W2771594921","https://openalex.org/W2432897346","https://openalex.org/W2293063924","https://openalex.org/W2181336723"],"abstract_inverted_index":{"We":[0],"describe":[1],"a":[2,68],"CRF":[3],"based":[4],"system":[5],"for":[6,49],"word-level":[7],"language":[8,51,73],"identification":[9],"of":[10],"code-mixed":[11],"text.Our":[12],"method":[13],"uses":[14],"lexical,":[15],"contextual,":[16],"character":[17,21],"n-gram,":[18],"and":[19,23,60],"special":[20],"features,":[22],"therefore,":[24],"can":[25],"easily":[26],"be":[27],"replicated":[28],"across":[29,71],"languages.Its":[30],"performance":[31,70],"is":[32],"benchmarked":[33],"against":[34],"the":[35,40,72],"test":[36],"sets":[37],"provided":[38],"by":[39],"shared":[41],"task":[42],"on":[43],"code-mixing":[44],"(Solorio":[45],"et":[46],"al.,":[47],"2014)":[48],"four":[50],"pairs,":[52],"namely,":[53],"English-Spanish":[54],"(En-Es),":[55],"English-Nepali":[56],"(En-Ne),":[57],"English-Mandarin":[58],"(En-Cn),":[59],"Standard":[61],"Arabic-Arabic":[62],"(Ar-Ar)":[63],"Dialects.The":[64],"experimental":[65],"results":[66],"show":[67],"consistent":[69],"pairs.":[74]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2251843872","counts_by_year":[{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":8},{"year":2019,"cited_by_count":7},{"year":2018,"cited_by_count":13},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":15},{"year":2015,"cited_by_count":5}],"updated_date":"2025-03-21T21:33:12.068050","created_date":"2016-06-24"}