{"id":"https://openalex.org/W4394591183","doi":"https://doi.org/10.48550/arxiv.2404.03753","title":"A Reinforcement Learning based Reset Policy for CDCL SAT Solvers","display_name":"A Reinforcement Learning based Reset Policy for CDCL SAT Solvers","publication_year":2024,"publication_date":"2024-04-04","ids":{"openalex":"https://openalex.org/W4394591183","doi":"https://doi.org/10.48550/arxiv.2404.03753"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2404.03753","pdf_url":"https://arxiv.org/pdf/2404.03753","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2404.03753","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100459278","display_name":"Chunxiao Li","orcid":"https://orcid.org/0000-0003-0996-9742"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Chunxiao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059096757","display_name":"Charlie Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Charlie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020799779","display_name":"C.Y. Chung","orcid":"https://orcid.org/0000-0003-3639-5852"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chung, Jonathan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025747129","display_name":"Zhengyang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhengyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110336671","display_name":"L\u00fc","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017735998","display_name":"Piyush Jha","orcid":"https://orcid.org/0000-0003-1590-593X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jha, Piyush","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5052292970","display_name":"Vijay Ganesh","orcid":"https://orcid.org/0000-0002-6029-2047"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ganesh, Vijay","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":77},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10551","display_name":"Scheduling and Optimization Algorithms","score":0.9655,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10551","display_name":"Scheduling and Optimization Algorithms","score":0.9655,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11182","display_name":"Auction Theory and Applications","score":0.9249,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reset","display_name":"Reset (finance)","score":0.79951084}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.81995434},{"id":"https://openalex.org/C2779795794","wikidata":"https://www.wikidata.org/wiki/Q7315343","display_name":"Reset (finance)","level":2,"score":0.79951084},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6161492},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.5400797},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25548533},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.20643187},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.10895255},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.08189663},{"id":"https://openalex.org/C106159729","wikidata":"https://www.wikidata.org/wiki/Q2294553","display_name":"Financial economics","level":1,"score":0.053034157}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2404.03753","pdf_url":"https://arxiv.org/pdf/2404.03753","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2404.03753","pdf_url":"https://arxiv.org/pdf/2404.03753","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W96259911","https://openalex.org/W4391375266","https://openalex.org/W4385608460","https://openalex.org/W350273603","https://openalex.org/W2748952813","https://openalex.org/W2393495588","https://openalex.org/W2370772865","https://openalex.org/W2168225754","https://openalex.org/W2000034628","https://openalex.org/W1528611913"],"abstract_inverted_index":{"Restart":[0],"policy":[1,233],"is":[2,279],"an":[3,280],"important":[4],"technique":[5],"used":[6],"in":[7,43,188],"modern":[8],"Conflict-Driven":[9],"Clause":[10],"Learning":[11],"(CDCL)":[12],"solvers,":[13,34],"wherein":[14],"some":[15],"parts":[16,48,73],"of":[17,29,49,74,82,86,101,104,117,128,253,263],"the":[18,27,30,50,58,67,75,80,92,98,102,105,118,126,150,163,180,196,199,217,225,240,251],"solver":[19,68],"state":[20],"are":[21,37,54,266],"erased":[22],"at":[23,258],"certain":[24],"intervals":[25],"during":[26,179],"run":[28],"solver.":[31],"In":[32,121],"most":[33],"variable":[35,264],"activities":[36,265],"preserved":[38],"across":[39,268],"restart":[40],"boundaries,":[41],"resulting":[42],"solvers":[44,193,220],"continuing":[45],"to":[46,62,69,130,235],"search":[47,70,119],"assignment":[51,76,93],"tree":[52],"that":[53,212,230,277],"not":[55,89],"far":[56],"from":[57],"one":[59],"immediately":[60],"prior":[61],"a":[63,84,113,134,254,260],"restart.":[64],"To":[65],"enable":[66],"possibly":[71],"\"distant\"":[72],"tree,":[77],"we":[78,124,275],"study":[79],"effect":[81],"resets,":[83],"variant":[85],"restarts":[87],"which":[88],"only":[90],"erases":[91],"trail,":[94],"but":[95],"also":[96,249],"randomizes":[97],"activity":[99],"scores":[100],"variables":[103],"input":[106,246],"formula":[107],"after":[108],"reset,":[109,256],"thus":[110],"potentially":[111],"enabling":[112],"better":[114],"global":[115],"exploration":[116],"space.":[120],"this":[122],"paper,":[123],"model":[125],"problem":[127],"whether":[129],"trigger":[131],"reset":[132,147,186,200,214,241,269],"as":[133],"multi-armed":[135],"bandit":[136],"(MAB)":[137],"problem,":[138],"and":[139,155,194,205,224,237],"propose":[140],"two":[141,160],"reinforcement":[142],"learning":[143],"(RL)":[144],"based":[145,174],"adaptive":[146],"policies":[148,187],"using":[149],"Upper":[151],"Confidence":[152],"Bound":[153],"(UCB)":[154],"Thompson":[156],"sampling":[157],"algorithms.":[158],"These":[159],"algorithms":[161],"balance":[162],"exploration-exploitation":[164],"tradeoff":[165],"by":[166],"adaptively":[167],"choosing":[168],"arms":[169],"(reset":[170],"vs.":[171,285],"no":[172],"reset)":[173],"on":[175,202,221,272],"their":[176],"estimated":[177],"rewards":[178],"solver's":[181],"run.":[182],"We":[183,248],"implement":[184],"our":[185,231],"four":[189],"baseline":[190,219],"SOTA":[191],"CDCL":[192],"compare":[195],"baselines":[197],"against":[198],"versions":[201,215],"Satcoin":[203,223],"benchmarks":[204],"SAT":[206,226],"Competition":[207],"instances.":[208],"Our":[209],"results":[210],"show":[211,276],"RL-based":[213],"outperform":[216],"corresponding":[218],"both":[222],"competition":[227],"instances,":[228],"suggesting":[229],"RL":[232],"helps":[234],"dynamically":[236],"profitably":[238],"adapt":[239],"frequency":[242],"for":[243],"any":[244],"given":[245],"instance.":[247],"introduce":[250],"concept":[252],"partial":[255,287],"where":[257],"least":[259],"constant":[261],"number":[262],"retained":[267],"boundaries.":[270],"Building":[271],"previous":[273],"results,":[274],"there":[278],"exponential":[281],"separation":[282],"between":[283],"O(1)":[284],"$\\Omega(n)$-length":[286],"resets.":[288]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4394591183","counts_by_year":[],"updated_date":"2025-04-23T21:09:29.440140","created_date":"2024-04-09"}