{"id":"https://openalex.org/W4395443857","doi":"https://doi.org/10.48550/arxiv.2404.15238","title":"CultureBank: An Online Community-Driven Knowledge Base Towards\n Culturally Aware Language Technologies","display_name":"CultureBank: An Online Community-Driven Knowledge Base Towards\n Culturally Aware Language Technologies","publication_year":2024,"publication_date":"2024-04-23","ids":{"openalex":"https://openalex.org/W4395443857","doi":"https://doi.org/10.48550/arxiv.2404.15238"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.15238","pdf_url":"http://arxiv.org/pdf/2404.15238","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2404.15238","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101210510","display_name":"Weiyan Shi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Weiyan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108141334","display_name":"Ryan Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Ryan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081146434","display_name":"Yutong Zhang","orcid":"https://orcid.org/0000-0003-0599-4828"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yutong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002621773","display_name":"Caleb Ziems","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ziems, Caleb","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104287355","display_name":"Chunhua yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"yu, Chunhua","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059675637","display_name":"Raya Horesh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Horesh, Raya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046707914","display_name":"Rog\u00e9rio Abreu de Paula","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"de Paula, Rog\u00e9rio Abreu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5089413311","display_name":"Diyi Yang","orcid":"https://orcid.org/0000-0003-1220-3983"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Diyi","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":78},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T12478","display_name":"Wikis in Education and Collaboration","score":0.9354,"subfield":{"id":"https://openalex.org/subfields/3315","display_name":"Communication"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12478","display_name":"Wikis in Education and Collaboration","score":0.9354,"subfield":{"id":"https://openalex.org/subfields/3315","display_name":"Communication"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9289,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.917,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cultural-knowledge","display_name":"Cultural Knowledge","score":0.4540882},{"id":"https://openalex.org/keywords/base","display_name":"Base (topology)","score":0.41405454}],"concepts":[{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.53322256},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.5012808},{"id":"https://openalex.org/C2994055011","wikidata":"https://www.wikidata.org/wiki/Q210272","display_name":"Cultural knowledge","level":2,"score":0.4540882},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.41405454},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.40578097},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.3397444},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.2542335},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.15016764},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.15238","pdf_url":"http://arxiv.org/pdf/2404.15238","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.15238","pdf_url":"http://arxiv.org/pdf/2404.15238","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W4242671254","https://openalex.org/W3142859449","https://openalex.org/W2748952813","https://openalex.org/W2599749361","https://openalex.org/W2385713529","https://openalex.org/W2380472855","https://openalex.org/W2369995614","https://openalex.org/W1986001501","https://openalex.org/W167983404"],"abstract_inverted_index":{"To":[0],"enhance":[1],"language":[2,92,124],"models'":[3],"cultural":[4,13,39,50,58,65,69,81,106],"awareness,":[5,82],"we":[6,27,77,113],"design":[7],"a":[8,21,30,91,109],"generalizable":[9],"pipeline":[10],"to":[11,60,71],"construct":[12,28],"knowledge":[14,31,51],"bases":[15],"from":[16,42,46],"different":[17,79],"online":[18],"communities":[19],"on":[20,57,94,103,117],"massive":[22],"scale.":[23],"With":[24,75],"the":[25],"pipeline,":[26],"CultureBank,":[29,76],"base":[32],"built":[33],"upon":[34],"users'":[35],"self-narratives":[36],"with":[37],"12K":[38],"descriptors":[40,59],"sourced":[41],"TikTok":[43],"and":[44,67,83,134],"11K":[45],"Reddit.":[47],"Unlike":[48],"previous":[49],"resources,":[52],"CultureBank":[53,142],"contains":[54],"diverse":[55],"views":[56],"allow":[61],"flexible":[62],"interpretation":[63],"of":[64],"knowledge,":[66],"contextualized":[68],"scenarios":[70],"help":[72],"grounded":[73],"evaluation.":[74],"evaluate":[78],"LLMs'":[80],"identify":[84],"areas":[85],"for":[86,120],"improvement.":[87],"We":[88],"also":[89],"fine-tune":[90],"model":[93,135],"CultureBank:":[95],"experiments":[96],"show":[97],"that":[98],"it":[99],"achieves":[100],"better":[101],"performances":[102],"two":[104],"downstream":[105],"tasks":[107],"in":[108],"zero-shot":[110],"setting.":[111],"Finally,":[112],"offer":[114],"recommendations":[115],"based":[116],"our":[118],"findings":[119],"future":[121],"culturally":[122],"aware":[123],"technologies.":[125],"The":[126,132,140],"project":[127],"page":[128],"is":[129,136,144],"https://culturebank.github.io":[130],".":[131,139,147],"code":[133],"at":[137,145],"https://github.com/SALT-NLP/CultureBank":[138],"released":[141],"dataset":[143],"https://huggingface.co/datasets/SALT-NLP/CultureBank":[146]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4395443857","counts_by_year":[],"updated_date":"2025-04-11T20:27:33.037098","created_date":"2024-04-26"}