{"id":"https://openalex.org/W4281250694","doi":"https://doi.org/10.48550/arxiv.2205.09712","title":"Selection-Inference: Exploiting Large Language Models for Interpretable Logical Reasoning","display_name":"Selection-Inference: Exploiting Large Language Models for Interpretable Logical Reasoning","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4281250694","doi":"https://doi.org/10.48550/arxiv.2205.09712"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2205.09712","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2205.09712","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009239144","display_name":"Antonia Creswell","orcid":"https://orcid.org/0000-0003-1037-9395"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Creswell, Antonia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072322524","display_name":"Murray Shanahan","orcid":"https://orcid.org/0000-0001-5984-2964"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shanahan, Murray","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5018830387","display_name":"Irina Higgins","orcid":"https://orcid.org/0000-0002-1890-2091"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Higgins, Irina","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":91,"citation_normalized_percentile":{"value":0.999939,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9985,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9985,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9952,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.967,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/logical-reasoning","display_name":"Logical reasoning","score":0.55583483},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.5204316},{"id":"https://openalex.org/keywords/opportunistic-reasoning","display_name":"Opportunistic reasoning","score":0.46311963},{"id":"https://openalex.org/keywords/non-monotonic-logic","display_name":"Non-monotonic logic","score":0.46279076},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.44939688},{"id":"https://openalex.org/keywords/trace","display_name":"TRACE (psycholinguistics)","score":0.44622958}],"concepts":[{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.72425395},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6776515},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.60509557},{"id":"https://openalex.org/C43971567","wikidata":"https://www.wikidata.org/wiki/Q3142865","display_name":"Logical reasoning","level":2,"score":0.55583483},{"id":"https://openalex.org/C134752490","wikidata":"https://www.wikidata.org/wiki/Q374182","display_name":"Logical consequence","level":2,"score":0.5396009},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.522822},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.5204316},{"id":"https://openalex.org/C79581498","wikidata":"https://www.wikidata.org/wiki/Q1367530","display_name":"Suite","level":2,"score":0.5159131},{"id":"https://openalex.org/C97364631","wikidata":"https://www.wikidata.org/wiki/Q484284","display_name":"Deductive reasoning","level":2,"score":0.48270226},{"id":"https://openalex.org/C86827895","wikidata":"https://www.wikidata.org/wiki/Q7098582","display_name":"Opportunistic reasoning","level":4,"score":0.46311963},{"id":"https://openalex.org/C159032336","wikidata":"https://www.wikidata.org/wiki/Q2488768","display_name":"Non-monotonic logic","level":2,"score":0.46279076},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.44939688},{"id":"https://openalex.org/C75291252","wikidata":"https://www.wikidata.org/wiki/Q1315756","display_name":"TRACE (psycholinguistics)","level":2,"score":0.44622958},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.4221112},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.42108122},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.40352416},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.36840725},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.12742826},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11439556},{"id":"https://openalex.org/C161301231","wikidata":"https://www.wikidata.org/wiki/Q3478658","display_name":"Knowledge representation and reasoning","level":2,"score":0.08579543},{"id":"https://openalex.org/C111368507","wikidata":"https://www.wikidata.org/wiki/Q43518","display_name":"Oceanography","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2205.09712","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2205.09712","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2205.09712","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"display_name":"Peace, justice, and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.58}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2567893123","https://openalex.org/W2399112294","https://openalex.org/W2355314240","https://openalex.org/W2182693335","https://openalex.org/W2106247677","https://openalex.org/W2077137711","https://openalex.org/W1974525301","https://openalex.org/W1945364905","https://openalex.org/W190590315","https://openalex.org/W1540734423"],"abstract_inverted_index":{"Large":[0],"language":[1,51],"models":[2,52],"(LLMs)":[3],"have":[4],"been":[5],"shown":[6],"to":[7,14,21,54,67,73,102,112,144],"be":[8],"capable":[9],"of":[10,36,45,80,106,140,152,176,202],"impressive":[11],"few-shot":[12],"generalisation":[13,131],"new":[15],"tasks.":[16,156,177],"However,":[17],"they":[18],"still":[19],"tend":[20,53],"perform":[22,55],"poorly":[23],"on":[24,38,149,172],"multi-step":[25],"logical":[26,46,154],"reasoning":[27,71,109,155,191],"problems.":[28,77],"Here":[29],"we":[30,82],"carry":[31],"out":[32],"a":[33,84,104,119,129,137,150,166,188],"comprehensive":[34],"evaluation":[35],"LLMs":[37,91],"50":[39],"tasks":[40],"that":[41,50,88,118],"probe":[42],"different":[43],"aspects":[44],"reasoning.":[47],"We":[48,116],"show":[49,117],"fairly":[56],"well":[57],"at":[58],"single":[59],"step":[60],"inference":[61,101],"or":[62],"entailment":[63],"tasks,":[64],"but":[65],"struggle":[66],"chain":[68],"together":[69],"multiple":[70],"steps":[72,110],"solve":[74],"more":[75],"complex":[76],"In":[78],"light":[79],"this,":[81],"propose":[83],"Selection-Inference":[85],"(SI)":[86],"framework":[87,127,184],"exploits":[89],"pre-trained":[90],"as":[92],"general":[93],"processing":[94],"modules,":[95],"and":[96,100,200],"alternates":[97],"between":[98],"selection":[99],"generate":[103],"series":[105],"interpretable,":[107],"casual":[108],"leading":[111],"the":[113,125,161,173,182,198,203],"final":[114],"answer.":[115],"7B":[120],"parameter":[121,170],"LLM":[122],"used":[123],"within":[124],"SI":[126,183],"in":[128,160],"5-shot":[130],"setting,":[132],"with":[133],"no":[134],"fine-tuning,":[135],"yields":[136],"performance":[138],"improvement":[139],"over":[141],"100%":[142],"compared":[143],"an":[145],"equivalent":[146],"vanilla":[147],"baseline":[148,171],"suite":[151,175],"10":[153],"The":[157],"same":[158,162,174],"model":[159],"setting":[163],"even":[164],"outperforms":[165],"significantly":[167],"larger":[168],"280B":[169],"Moreover,":[178],"answers":[179],"produced":[180],"by":[181,187],"are":[185],"accompanied":[186],"causal":[189],"natural-language-based":[190],"trace,":[192],"which":[193],"has":[194],"important":[195],"implications":[196],"for":[197],"safety":[199],"trustworthiness":[201],"system.":[204]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4281250694","counts_by_year":[{"year":2024,"cited_by_count":36},{"year":2023,"cited_by_count":53},{"year":2022,"cited_by_count":2}],"updated_date":"2025-01-08T20:28:38.904976","created_date":"2022-05-23"}