{"id":"https://openalex.org/W2946832132","doi":"https://doi.org/10.1145/3316781.3317748","title":"A Memory-Efficient Markov Decision Process Computation Framework Using BDD-based Sampling Representation","display_name":"A Memory-Efficient Markov Decision Process Computation Framework Using BDD-based Sampling Representation","publication_year":2019,"publication_date":"2019-05-23","ids":{"openalex":"https://openalex.org/W2946832132","doi":"https://doi.org/10.1145/3316781.3317748","mag":"2946832132"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/3316781.3317748","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026633836","display_name":"Zhou He","orcid":"https://orcid.org/0000-0002-8923-9493"},"institutions":[{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"funder","lineage":["https://openalex.org/I91045830"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"He Zhou","raw_affiliation_strings":["Department of Electrical & Computer Engineering Texas A&M University"],"affiliations":[{"raw_affiliation_string":"Department of Electrical & Computer Engineering Texas A&M University","institution_ids":["https://openalex.org/I91045830"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021685706","display_name":"Sunil P. Khatri","orcid":"https://orcid.org/0000-0001-7134-9929"},"institutions":[{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"funder","lineage":["https://openalex.org/I91045830"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sunil P. Khatri","raw_affiliation_strings":["Department of Electrical & Computer Engineering Texas A&M University"],"affiliations":[{"raw_affiliation_string":"Department of Electrical & Computer Engineering Texas A&M University","institution_ids":["https://openalex.org/I91045830"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103246390","display_name":"Jiang Hu","orcid":"https://orcid.org/0000-0003-1157-7799"},"institutions":[{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"funder","lineage":["https://openalex.org/I91045830"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiang Hu","raw_affiliation_strings":["Department of Electrical & Computer Engineering Texas A&M University"],"affiliations":[{"raw_affiliation_string":"Department of Electrical & Computer Engineering Texas A&M University","institution_ids":["https://openalex.org/I91045830"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5006587869","display_name":"Frank Liu","orcid":"https://orcid.org/0000-0001-6615-0739"},"institutions":[{"id":"https://openalex.org/I4210156936","display_name":"IBM Research - Austin","ror":"https://ror.org/05gjbbg60","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115","https://openalex.org/I4210156936"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Frank Liu","raw_affiliation_strings":["IBM Research, Austin"],"affiliations":[{"raw_affiliation_string":"IBM Research, Austin","institution_ids":["https://openalex.org/I4210156936"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":61},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10142","display_name":"Formal Methods in Verification","score":0.9963,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10639","display_name":"Advanced Software Engineering Methodologies","score":0.9935,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/binary-decision-diagram","display_name":"Binary decision diagram","score":0.49026635}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7573947},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.6621864},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.5273134},{"id":"https://openalex.org/C3309909","wikidata":"https://www.wikidata.org/wiki/Q864155","display_name":"Binary decision diagram","level":2,"score":0.49026635},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.46208665},{"id":"https://openalex.org/C20837028","wikidata":"https://www.wikidata.org/wiki/Q623966","display_name":"Influence diagram","level":3,"score":0.4581683},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.44969377},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.43478984},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34222004},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.326501},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15256503},{"id":"https://openalex.org/C84525736","wikidata":"https://www.wikidata.org/wiki/Q831366","display_name":"Decision tree","level":2,"score":0.12217063},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/3316781.3317748","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.79,"display_name":"Peace, justice, and strong institutions","id":"https://metadata.un.org/sdg/16"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":25,"referenced_works":["https://openalex.org/W1522512418","https://openalex.org/W1530444831","https://openalex.org/W1591803298","https://openalex.org/W1991513691","https://openalex.org/W1994143452","https://openalex.org/W2030224590","https://openalex.org/W2076337359","https://openalex.org/W2080267935","https://openalex.org/W2088413745","https://openalex.org/W2106237563","https://openalex.org/W2119380192","https://openalex.org/W2119567691","https://openalex.org/W2120406836","https://openalex.org/W2140190779","https://openalex.org/W2145805610","https://openalex.org/W2147471137","https://openalex.org/W2345031381","https://openalex.org/W2587460705","https://openalex.org/W2741634092","https://openalex.org/W2746414954","https://openalex.org/W2795693315","https://openalex.org/W2913838200","https://openalex.org/W3148740559","https://openalex.org/W4298023569","https://openalex.org/W657718082"],"related_works":["https://openalex.org/W4300616421","https://openalex.org/W2952096052","https://openalex.org/W2205783098","https://openalex.org/W2163801945","https://openalex.org/W2122917767","https://openalex.org/W2120406836","https://openalex.org/W2108122578","https://openalex.org/W2103286150","https://openalex.org/W2089210394","https://openalex.org/W1596417907"],"abstract_inverted_index":{"Although":[0],"Markov":[1],"Decision":[2,67],"Process":[3],"(MDP)":[4],"has":[5],"wide":[6],"applications":[7],"in":[8,15],"autonomous":[9],"systems":[10],"as":[11],"a":[12,18,58,74,80],"core":[13],"model":[14],"Reinforcement":[16],"Learning,":[17],"key":[19],"bottleneck":[20],"is":[21,33],"the":[22,27],"large":[23],"memory":[24,89],"utilization":[25],"of":[26,49,95],"state":[28],"transition":[29],"probability":[30,63],"matrices.":[31,51],"This":[32],"particularly":[34],"problematic":[35],"for":[36,43,62,97],"computational":[37],"platforms":[38],"with":[39],"limited":[40],"memory,":[41],"or":[42],"Bayesian":[44],"MDP,":[45,99],"which":[46],"requires":[47],"dozens":[48],"such":[50],"To":[52],"mitigate":[53],"this":[54],"difficulty,":[55],"we":[56],"propose":[57],"highly":[59],"memory-efficient":[60],"representation":[61],"matrices":[64],"using":[65],"Binary":[66],"Diagram":[68],"(BDD)":[69],"based":[70],"sampling,":[71],"and":[72,92],"develop":[73],"corresponding":[75],"(Bayesian/classical)":[76],"MDP":[77],"solver":[78],"on":[79],"CPU-GPU":[81],"platform.":[82],"Simulation":[83],"results":[84],"indicate":[85],"our":[86],"approach":[87],"reduces":[88],"by":[90],"one":[91],"two":[93],"orders":[94],"magnitude":[96],"Bayesian/classical":[98],"respectively.":[100]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2946832132","counts_by_year":[],"updated_date":"2025-01-25T17:45:19.492672","created_date":"2019-05-29"}