{"id":"https://openalex.org/W3099053576","doi":"https://doi.org/10.18653/v1/2020.emnlp-main.670","title":"META: Metadata-Empowered Weak Supervision for Text Classification","display_name":"META: Metadata-Empowered Weak Supervision for Text Classification","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3099053576","doi":"https://doi.org/10.18653/v1/2020.emnlp-main.670","mag":"3099053576"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2020.emnlp-main.670","pdf_url":"https://www.aclweb.org/anthology/2020.emnlp-main.670.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://www.aclweb.org/anthology/2020.emnlp-main.670.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032931351","display_name":"Dheeraj Mekala","orcid":null},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California, San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"funder","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dheeraj Mekala","raw_affiliation_strings":["Department of Computer Science and Engineering, University of California San Diego, CA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, University of California San Diego, CA, USA","institution_ids":["https://openalex.org/I36258959"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022999126","display_name":"Xinyang Zhang","orcid":"https://orcid.org/0000-0001-6474-682X"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"funder","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xinyang Zhang","raw_affiliation_strings":["Department of Computer Science, University of at Illinois Urbana-Champaign, IL, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of at Illinois Urbana-Champaign, IL, USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039500313","display_name":"Jingbo Shang","orcid":"https://orcid.org/0000-0002-7249-4404"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California, San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"funder","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jingbo Shang","raw_affiliation_strings":["Department of Computer Science and Engineering, University of California San Diego, CA, USA","Hal\u0131c\u0131oglu Data Science Institute, University of California San Diego, CA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, University of California San Diego, CA, USA","institution_ids":["https://openalex.org/I36258959"]},{"raw_affiliation_string":"Hal\u0131c\u0131oglu Data Science Institute, University of California San Diego, CA, USA","institution_ids":["https://openalex.org/I36258959"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.575,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":34,"citation_normalized_percentile":{"value":0.697851,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9995,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9989,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bootstrapping","display_name":"Bootstrapping (finance)","score":0.67353314},{"id":"https://openalex.org/keywords/metadata-modeling","display_name":"Metadata modeling","score":0.43461993}],"concepts":[{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.9715634},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.81886977},{"id":"https://openalex.org/C207609745","wikidata":"https://www.wikidata.org/wiki/Q4944086","display_name":"Bootstrapping (finance)","level":2,"score":0.67353314},{"id":"https://openalex.org/C113954288","wikidata":"https://www.wikidata.org/wiki/Q186885","display_name":"Timestamp","level":2,"score":0.59567606},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5741257},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5613378},{"id":"https://openalex.org/C30872290","wikidata":"https://www.wikidata.org/wiki/Q1172389","display_name":"Data element","level":3,"score":0.48489815},{"id":"https://openalex.org/C110326360","wikidata":"https://www.wikidata.org/wiki/Q17149476","display_name":"Metadata modeling","level":4,"score":0.43461993},{"id":"https://openalex.org/C136976847","wikidata":"https://www.wikidata.org/wiki/Q6822297","display_name":"Meta Data Services","level":4,"score":0.4163368},{"id":"https://openalex.org/C153048206","wikidata":"https://www.wikidata.org/wiki/Q3454922","display_name":"Metadata repository","level":3,"score":0.4162323},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.37298706},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28356105},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C106159729","wikidata":"https://www.wikidata.org/wiki/Q2294553","display_name":"Financial economics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2020.emnlp-main.670","pdf_url":"https://www.aclweb.org/anthology/2020.emnlp-main.670.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2020.emnlp-main.670","pdf_url":"https://www.aclweb.org/anthology/2020.emnlp-main.670.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":40,"referenced_works":["https://openalex.org/W103340358","https://openalex.org/W1654860491","https://openalex.org/W1832693441","https://openalex.org/W2022322548","https://openalex.org/W2098136027","https://openalex.org/W2103931177","https://openalex.org/W2108281845","https://openalex.org/W2140124448","https://openalex.org/W2145658888","https://openalex.org/W2150815390","https://openalex.org/W2153579005","https://openalex.org/W2153624566","https://openalex.org/W2158329013","https://openalex.org/W2251292973","https://openalex.org/W2251939518","https://openalex.org/W2265846598","https://openalex.org/W2285986798","https://openalex.org/W2470673105","https://openalex.org/W2470861207","https://openalex.org/W2546547051","https://openalex.org/W2563010554","https://openalex.org/W2593560537","https://openalex.org/W2743104969","https://openalex.org/W2767878862","https://openalex.org/W2802181385","https://openalex.org/W2890931111","https://openalex.org/W2893359107","https://openalex.org/W2903908313","https://openalex.org/W2949169239","https://openalex.org/W2950894652","https://openalex.org/W2963413667","https://openalex.org/W2963858765","https://openalex.org/W2963921497","https://openalex.org/W3023960840","https://openalex.org/W3034588688","https://openalex.org/W3035055211","https://openalex.org/W3104717349","https://openalex.org/W3212662458","https://openalex.org/W4294170691","https://openalex.org/W4300996741"],"related_works":["https://openalex.org/W92613187","https://openalex.org/W3199469221","https://openalex.org/W3084772717","https://openalex.org/W2981561176","https://openalex.org/W2907247951","https://openalex.org/W2380261968","https://openalex.org/W2374379029","https://openalex.org/W2367786714","https://openalex.org/W2018424284","https://openalex.org/W1729161438"],"abstract_inverted_index":{"Recent":[0],"advances":[1],"in":[2,49],"weakly":[3],"supervised":[4],"learning":[5],"enable":[6],"training":[7],"high-quality":[8],"text":[9,23,123],"classifiers":[10],"by":[11],"only":[12],"providing":[13],"a":[14,99,129,166],"few":[15],"user-provided":[16],"seed":[17,144,176,179],"words.":[18],"Existing":[19],"methods":[20],"mainly":[21,58],"use":[22],"data":[24,124],"alone":[25],"to":[26,60,136,152],"generate":[27],"pseudo-labels":[28],"despite":[29],"the":[30,50,61,106,122,171,175],"fact":[31],"that":[32],"metadata":[33,51,65,78,82,111,126,198],"information":[34],"(e.g.,":[35,84],"author":[36],"and":[37,52,74,109,125,132,148,173,178,184,193],"timestamp)":[38],"is":[39,66,79],"widely":[40],"available":[41],"across":[42],"various":[43],"domains.":[44],"Strong":[45],"label":[46,90],"indicators":[47,91],"exist":[48],"it":[53],"has":[54],"been":[55],"long":[56],"overlooked":[57],"due":[59],"following":[62],"challenges:":[63],"(1)":[64],"multi-typed,":[67],"requiring":[68],"systematic":[69],"modeling":[70],"of":[71,116,140,196],"different":[72],"types":[73],"their":[75],"combinations,":[76],"(2)":[77],"noisy,":[80],"some":[81],"entities":[83],"authors,":[85],"venues)":[86],"are":[87],"more":[88],"compelling":[89],"than":[92],"others.":[93],"In":[94],"this":[95],"paper,":[96],"we":[97,120,146,169],"propose":[98],"novel":[100],"framework,":[101],"META,":[102],"which":[103,160],"goes":[104],"beyond":[105],"existing":[107],"paradigm":[108],"leverages":[110],"as":[112,157,199],"an":[113],"additional":[114,162],"source":[115],"weak":[117,163,200],"supervision.":[118,164,201],"Specifically,":[119],"organize":[121],"together":[127],"into":[128],"text-rich":[130],"network":[131,134],"adopt":[133],"motifs":[135,180],"capture":[137],"appropriate":[138],"combinations":[139],"metadata.":[141],"Based":[142],"on":[143,187],"words,":[145],"rank":[147],"filter":[149],"motif":[150],"instances":[151],"distill":[153],"highly":[154],"label-indicative":[155],"ones":[156],"\u201cseed":[158],"motifs\u201d,":[159],"provide":[161],"Following":[165],"bootstrapping":[167],"manner,":[168],"train":[170],"classifier":[172],"expand":[174],"words":[177],"iteratively.":[181],"Extensive":[182],"experiments":[183],"case":[185],"studies":[186],"real-world":[188],"datasets":[189],"demonstrate":[190],"superior":[191],"performance":[192],"significant":[194],"advantages":[195],"leveraging":[197]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W3099053576","counts_by_year":[{"year":2023,"cited_by_count":10},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":12},{"year":2020,"cited_by_count":4}],"updated_date":"2025-02-23T18:12:34.588991","created_date":"2020-11-23"}