{"id":"https://openalex.org/W3080521392","doi":"https://doi.org/10.1145/3405962.3405968","title":"Topic Modeling of Short Texts Using Anchor Words","display_name":"Topic Modeling of Short Texts Using Anchor Words","publication_year":2020,"publication_date":"2020-06-30","ids":{"openalex":"https://openalex.org/W3080521392","doi":"https://doi.org/10.1145/3405962.3405968","mag":"3080521392"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/3405962.3405968","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039992424","display_name":"Florian Steuber","orcid":"https://orcid.org/0000-0003-1782-7445"},"institutions":[{"id":"https://openalex.org/I40527276","display_name":"Universit\u00e4t der Bundeswehr M\u00fcnchen","ror":"https://ror.org/05kkv3f82","country_code":"DE","type":"education","lineage":["https://openalex.org/I1315109972","https://openalex.org/I40527276","https://openalex.org/I4387152969"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Florian Steuber","raw_affiliation_strings":["Research Institute CODE, Bundeswehr University Munich, Munich, Germany"],"affiliations":[{"raw_affiliation_string":"Research Institute CODE, Bundeswehr University Munich, Munich, Germany","institution_ids":["https://openalex.org/I40527276"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020485279","display_name":"Mirco Schoenfeld","orcid":"https://orcid.org/0000-0002-2843-3137"},"institutions":[{"id":"https://openalex.org/I292141241","display_name":"Munich School of Philosophy","ror":"https://ror.org/02kqy4228","country_code":"DE","type":"education","lineage":["https://openalex.org/I292141241"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Mirco Schoenfeld","raw_affiliation_strings":["Bavarian School of Public Policy, Technical University Munich, Munich, Germany"],"affiliations":[{"raw_affiliation_string":"Bavarian School of Public Policy, Technical University Munich, Munich, Germany","institution_ids":["https://openalex.org/I292141241"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078551681","display_name":"Gabi Dreo Rodosek","orcid":"https://orcid.org/0000-0002-8702-8553"},"institutions":[{"id":"https://openalex.org/I40527276","display_name":"Universit\u00e4t der Bundeswehr M\u00fcnchen","ror":"https://ror.org/05kkv3f82","country_code":"DE","type":"education","lineage":["https://openalex.org/I1315109972","https://openalex.org/I40527276","https://openalex.org/I4387152969"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Gabi Dreo Rodosek","raw_affiliation_strings":["Research Institute CODE, Bundeswehr University Munich, Munich, Germany"],"affiliations":[{"raw_affiliation_string":"Research Institute CODE, Bundeswehr University Munich, Munich, Germany","institution_ids":["https://openalex.org/I40527276"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.398,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.872881,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":82,"max":83},"biblio":{"volume":null,"issue":null,"first_page":"210","last_page":"219"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.9988,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.9988,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9982,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9923,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/archetype","display_name":"Archetype","score":0.5307391},{"id":"https://openalex.org/keywords/latent-semantic-analysis","display_name":"Latent semantic analysis","score":0.42697692}],"concepts":[{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.8978853},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.8017924},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.726403},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.63067},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5967788},{"id":"https://openalex.org/C49848784","wikidata":"https://www.wikidata.org/wiki/Q131714","display_name":"Archetype","level":2,"score":0.5307391},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.51865405},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.49884582},{"id":"https://openalex.org/C112933361","wikidata":"https://www.wikidata.org/wiki/Q2845258","display_name":"Probabilistic latent semantic analysis","level":2,"score":0.45102873},{"id":"https://openalex.org/C206194317","wikidata":"https://www.wikidata.org/wiki/Q1138624","display_name":"Convex hull","level":3,"score":0.43662393},{"id":"https://openalex.org/C170133592","wikidata":"https://www.wikidata.org/wiki/Q1806883","display_name":"Latent semantic analysis","level":2,"score":0.42697692},{"id":"https://openalex.org/C2777946921","wikidata":"https://www.wikidata.org/wiki/Q7449044","display_name":"Semantic analysis (machine learning)","level":2,"score":0.4191106},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3889287},{"id":"https://openalex.org/C112680207","wikidata":"https://www.wikidata.org/wiki/Q714886","display_name":"Regular polygon","level":2,"score":0.19551742},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.18524507},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/3405962.3405968","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality education","id":"https://metadata.un.org/sdg/4","score":0.56}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":26,"referenced_works":["https://openalex.org/W1880262756","https://openalex.org/W1956559956","https://openalex.org/W1968489927","https://openalex.org/W2001082470","https://openalex.org/W2004192095","https://openalex.org/W2041711198","https://openalex.org/W2046677795","https://openalex.org/W2047271471","https://openalex.org/W2063904635","https://openalex.org/W2078058974","https://openalex.org/W2096974619","https://openalex.org/W2098126593","https://openalex.org/W2123549998","https://openalex.org/W2133108446","https://openalex.org/W2144989404","https://openalex.org/W2152311353","https://openalex.org/W2168332560","https://openalex.org/W2171343266","https://openalex.org/W2171836785","https://openalex.org/W2910828880","https://openalex.org/W2914304175","https://openalex.org/W2944859252","https://openalex.org/W2949169239","https://openalex.org/W2998704965","https://openalex.org/W4212774754","https://openalex.org/W4253763636"],"related_works":["https://openalex.org/W4396666968","https://openalex.org/W4291700620","https://openalex.org/W3159709618","https://openalex.org/W2995939990","https://openalex.org/W2921491680","https://openalex.org/W2251863249","https://openalex.org/W2171515436","https://openalex.org/W2132052677","https://openalex.org/W2110027950","https://openalex.org/W1551384396"],"abstract_inverted_index":{"We":[0,58,107,138],"present":[1],"Archetypal":[2],"LDA":[3],"or":[4,22],"short":[5,12],"A-LDA,":[6],"a":[7,19,74],"topic":[8,46],"model":[9],"tailored":[10],"to":[11,35,55,103,124,131,148,169],"texts":[13],"containing":[14],"\"semantic":[15],"anchors\"":[16],"which":[17],"convey":[18],"certain":[20],"meaning":[21],"implicitly":[23],"build":[24],"on":[25],"discussions":[26],"beyond":[27],"their":[28,69],"mere":[29],"presence.":[30],"A-LDA":[31,133],"is":[32],"an":[33],"extension":[34],"Latent":[36],"Dirichlet":[37],"Allocation":[38],"in":[39,143,154],"that":[40,78,84,140],"we":[41],"guide":[42,104],"the":[43,56,65,87,105,109,121,158],"process":[44],"of":[45,111,145],"inference":[47],"by":[48,126],"these":[49,60],"semantic":[50,117],"anchors":[51],"as":[52,98],"seed":[53,61,163],"words":[54,62,119],"LDA.":[57,106],"identify":[59],"unsupervised":[63],"from":[64,167],"documents":[66],"and":[67,101,157],"evaluate":[68],"co-occurrences":[70],"using":[71,114],"archetypal":[72],"analysis,":[73],"geometric":[75],"approximation":[76],"problem":[77],"aims":[79],"for":[80,162],"finding":[81],"k":[82],"points":[83],"best":[85],"approximate":[86],"data":[88],"set's":[89],"convex":[90],"hull.":[91],"These":[92],"so":[93],"called":[94],"archetypes":[95,150],"are":[96,120],"considered":[97],"latent":[99],"topics":[100,142,156],"used":[102],"demonstrate":[108],"effectiveness":[110],"our":[112],"approach":[113],"Twitter,":[115],"where":[116],"anchor":[118],"hashtags":[122,146],"assigned":[123],"tweets":[125],"users.":[127],"In":[128],"direct":[129],"comparison":[130],"LDA,":[132],"achieves":[134],"10-13%":[135],"better":[136],"results.":[137],"find":[139],"representing":[141],"terms":[144],"corresponding":[147],"calculated":[149],"alone":[151],"already":[152],"results":[153],"interpretable":[155],"model's":[159],"performance":[160],"peaks":[161],"confidence":[164],"values":[165],"ranging":[166],"0.7":[168],"0.9.":[170]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W3080521392","counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":1}],"updated_date":"2025-03-22T08:04:42.160089","created_date":"2020-09-01"}