{"id":"https://openalex.org/W4400600739","doi":"https://doi.org/10.48550/arxiv.2407.07321","title":"RAG vs. Long Context: Examining Frontier Large Language Models for\n Environmental Review Document Comprehension","display_name":"RAG vs. Long Context: Examining Frontier Large Language Models for\n Environmental Review Document Comprehension","publication_year":2024,"publication_date":"2024-07-09","ids":{"openalex":"https://openalex.org/W4400600739","doi":"https://doi.org/10.48550/arxiv.2407.07321"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.07321","pdf_url":"http://arxiv.org/pdf/2407.07321","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2407.07321","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024298908","display_name":"Hung Phan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Phan, Hung","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103415600","display_name":"Anurag Acharya","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Acharya, Anurag","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109746310","display_name":"Sarthak Chaturvedi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chaturvedi, Sarthak","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005446354","display_name":"Shivam Sharma","orcid":"https://orcid.org/0000-0003-2770-0966"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sharma, Shivam","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102306075","display_name":"Mike Parker","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Parker, Mike","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104431148","display_name":"Dan Nally","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nally, Dan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079359777","display_name":"Ali Jannesari","orcid":"https://orcid.org/0000-0001-8672-5317"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jannesari, Ali","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041535920","display_name":"Karl Pazdernik","orcid":"https://orcid.org/0000-0003-1410-4006"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pazdernik, Karl","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075175819","display_name":"Mahantesh Halappanavar","orcid":"https://orcid.org/0000-0002-2323-4753"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Halappanavar, Mahantesh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050892907","display_name":"Sai Munikoti","orcid":"https://orcid.org/0000-0002-1205-7405"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Munikoti, Sai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5087089195","display_name":"Sameera Horawalavithana","orcid":"https://orcid.org/0000-0002-0327-3819"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Horawalavithana, Sameera","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":83},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.7619,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.7619,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.7191,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.7062,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/frontier","display_name":"Frontier","score":0.86973846}],"concepts":[{"id":"https://openalex.org/C2778571376","wikidata":"https://www.wikidata.org/wiki/Q1355821","display_name":"Frontier","level":2,"score":0.86973846},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.6598364},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6202717},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.38076973},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.36599362},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.36135507},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.22560069},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.06757665},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.054492176}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.07321","pdf_url":"http://arxiv.org/pdf/2407.07321","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.07321","pdf_url":"http://arxiv.org/pdf/2407.07321","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W579144800","https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2347401120","https://openalex.org/W2334292868","https://openalex.org/W2310010941","https://openalex.org/W2147233680","https://openalex.org/W2069525434","https://openalex.org/W2041961361","https://openalex.org/W1988132375"],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"have":[4],"been":[5,39,64],"applied":[6],"to":[7,26,82,127,176],"many":[8,233],"research":[9],"problems":[10],"across":[11],"various":[12],"domains.":[13],"One":[14],"of":[15,18,33,86,125,131,185,198,221,224],"the":[16,79,84,114,123,129,149,168,178,183,186,212,217,222,225],"applications":[17],"LLMs":[19,89,126,166,189],"is":[20],"providing":[21,156],"question-answering":[22,35],"systems":[23,36],"that":[24,69,206,232],"cater":[25],"users":[27,46],"from":[28,101],"different":[29,142,196],"fields.":[30],"The":[31],"effectiveness":[32],"LLM-based":[34],"has":[37,61],"already":[38],"established":[40,65],"at":[41],"an":[42],"acceptable":[43],"level":[44],"for":[45],"posing":[47],"questions":[48,99,157,199,239],"in":[49,66,111,138,141,172,194,216],"popular":[50],"and":[51,57,94,134,190,242],"public":[52],"domains":[53,68],"such":[54],"as":[55,161,163],"trivia":[56],"literature.":[58],"However,":[59],"it":[60],"not":[62],"often":[63],"niche":[67],"traditionally":[70],"require":[71],"specialized":[72],"expertise.":[73],"To":[74],"this":[75],"end,":[76],"we":[77,147],"construct":[78],"NEPAQuAD1.0":[80],"benchmark":[81],"evaluate":[83],"performance":[85,184],"three":[87],"frontier":[88,226],"--":[90,96],"Claude":[91],"Sonnet,":[92],"Gemini,":[93],"GPT-4":[95],"when":[97],"answering":[98,237],"originating":[100],"Environmental":[102,116,117],"Impact":[103],"Statements":[104],"prepared":[105],"by":[106,155],"U.S.":[107],"federal":[108],"government":[109],"agencies":[110],"accordance":[112],"with":[113],"National":[115],"Act":[118],"(NEPA).":[119],"We":[120,181],"specifically":[121],"measure":[122],"ability":[124],"understand":[128],"nuances":[130],"legal,":[132],"technical,":[133],"compliance-related":[135],"information":[136,170],"present":[137,171],"NEPA":[139,153,174],"documents":[140,175],"contextual":[143,169],"scenarios.":[144],"For":[145],"example,":[146],"test":[148],"LLMs'":[150],"internal":[151],"prior":[152],"knowledge":[154],"without":[158],"any":[159],"context,":[160],"well":[162],"assess":[164],"how":[165],"synthesize":[167],"long":[173,187,213],"facilitate":[177],"question/answering":[179],"task.":[180],"compare":[182],"context":[188,214],"RAG":[191,207],"powered":[192,208],"models":[193,209,215,234],"handling":[195],"types":[197],"(e.g.,":[200],"problem-solving,":[201],"divergent).":[202],"Our":[203,228],"results":[204],"suggest":[205],"significantly":[210],"outperform":[211],"answer":[218],"accuracy":[219],"regardless":[220],"choice":[223],"LLM.":[227],"further":[229],"analysis":[230],"reveals":[231],"perform":[235],"better":[236],"closed":[238],"than":[240],"divergent":[241],"problem-solving":[243],"questions.":[244]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4400600739","counts_by_year":[],"updated_date":"2025-01-20T23:39:49.877034","created_date":"2024-07-13"}