{"id":"https://openalex.org/W4400702916","doi":"https://doi.org/10.48550/arxiv.2407.09823","title":"NativQA: Multilingual Culturally-Aligned Natural Query for LLMs","display_name":"NativQA: Multilingual Culturally-Aligned Natural Query for LLMs","publication_year":2024,"publication_date":"2024-07-13","ids":{"openalex":"https://openalex.org/W4400702916","doi":"https://doi.org/10.48550/arxiv.2407.09823"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.09823","pdf_url":"http://arxiv.org/pdf/2407.09823","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2407.09823","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5021570815","display_name":"Md. Arid Hasan","orcid":"https://orcid.org/0000-0001-7916-614X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hasan, Md. Arid","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035521035","display_name":"Maram Hasanain","orcid":"https://orcid.org/0000-0002-7466-178X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hasanain, Maram","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113392245","display_name":"Fatema Ahmad","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ahmad, Fatema","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104621313","display_name":"Sahinur Rahman Laskar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Laskar, Sahinur Rahman","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103198708","display_name":"S. Upadhyay","orcid":"https://orcid.org/0000-0002-8715-6977"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Upadhyay, Sunaya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059299971","display_name":"Vrunda N. Sukhadia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sukhadia, Vrunda N","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086826049","display_name":"M\u00fccahid Kutlu","orcid":"https://orcid.org/0000-0002-5660-4992"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kutlu, Mucahid","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022279488","display_name":"Shammur Absar Chowdhury","orcid":"https://orcid.org/0000-0002-1331-2543"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chowdhury, Shammur Absar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5053436179","display_name":"Firoj Alam","orcid":"https://orcid.org/0000-0001-7172-1997"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alam, Firoj","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":78},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9901,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.987,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.606136},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.3252861},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.32488978},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.09823","pdf_url":"http://arxiv.org/pdf/2407.09823","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.09823","pdf_url":"http://arxiv.org/pdf/2407.09823","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W48866389","https://openalex.org/W4391375266","https://openalex.org/W4283262748","https://openalex.org/W4252362398","https://openalex.org/W3112533414","https://openalex.org/W2748952813","https://openalex.org/W2502773048","https://openalex.org/W2490481324","https://openalex.org/W2117651364","https://openalex.org/W1979668694"],"abstract_inverted_index":{"Natural":[0],"Question":[1],"Answering":[2],"(QA)":[3],"datasets":[4,31,43,82],"play":[5],"a":[6,38,70,102],"crucial":[7],"role":[8],"in":[9,24,48,83,113],"developing":[10],"and":[11,62,78,89,139,148],"evaluating":[12],"the":[13,28,55,94,97,134,145,154],"capabilities":[14],"of":[15,41,58,96,109],"large":[16],"language":[17],"models":[18],"(LLMs),":[19],"ensuring":[20],"their":[21,49],"effective":[22,56],"usage":[23],"real-world":[25],"applications.":[26],"Despite":[27],"numerous":[29],"QA":[30,81,105,111],"that":[32],"have":[33],"been":[34],"developed,":[35],"there":[36],"is":[37],"notable":[39],"lack":[40],"region-specific":[42],"generated":[44],"by":[45],"native":[46,84,127],"users":[47],"own":[50],"languages.":[51],"This":[52],"gap":[53],"hinders":[54],"benchmarking":[57],"LLMs":[59],"for":[60,86,153],"regional":[61],"cultural":[63],"specificities.":[64],"In":[65],"this":[66],"study,":[67],"we":[68,100],"propose":[69],"scalable":[71],"framework,":[72,99],"NativQA,":[73],"to":[74,92,119],"seamlessly":[75],"construct":[76],"culturally":[77],"regionally":[79],"aligned":[80],"languages,":[85,115],"LLM":[87],"evaluation":[88],"tuning.":[90],"Moreover,":[91],"demonstrate":[93],"efficacy":[95],"proposed":[98],"designed":[101],"multilingual":[103],"natural":[104],"dataset,":[106],"MultiNativQA,":[107],"consisting":[108],"~72K":[110],"pairs":[112],"seven":[114],"ranging":[116],"from":[117,126],"high":[118],"extremely":[120],"low":[121],"resource,":[122],"based":[123],"on":[124],"queries":[125],"speakers":[128],"covering":[129],"18":[130],"topics.":[131],"We":[132,142],"benchmark":[133],"MultiNativQA":[135,149],"dataset":[136,150],"with":[137],"open-":[138],"closed-source":[140],"LLMs.":[141],"made":[143],"both":[144],"framework":[146],"NativQA":[147],"publicly":[151],"available":[152],"community.":[155],"(https://nativqa.gitlab.io)":[156]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4400702916","counts_by_year":[],"updated_date":"2025-04-04T00:32:06.818811","created_date":"2024-07-17"}