{"id":"https://openalex.org/W309675244","doi":"https://doi.org/10.1613/jair.4623","title":"Optimally Solving Dec-POMDPs as Continuous-State MDPs","display_name":"Optimally Solving Dec-POMDPs as Continuous-State MDPs","publication_year":2016,"publication_date":"2016-02-24","ids":{"openalex":"https://openalex.org/W309675244","doi":"https://doi.org/10.1613/jair.4623","mag":"309675244"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1613/jair.4623","pdf_url":"https://jair.org/index.php/jair/article/download/10986/26136","source":{"id":"https://openalex.org/S139930977","display_name":"Journal of Artificial Intelligence Research","issn_l":"1076-9757","issn":["1076-9757","1943-5037"],"is_oa":true,"is_in_doaj":true,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310315760","host_organization_name":"AI Access Foundation","host_organization_lineage":["https://openalex.org/P4310315760"],"host_organization_lineage_names":["AI Access Foundation"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://jair.org/index.php/jair/article/download/10986/26136","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032392204","display_name":"Jilles Dibangoye","orcid":"https://orcid.org/0000-0001-8826-4438"},"institutions":[{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"funder","lineage":["https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Jilles Steeve Dibangoye","raw_affiliation_strings":["Inria, Universit\u00e9 de Lorraine, Nancy, France#TAB#"],"affiliations":[{"raw_affiliation_string":"Inria, Universit\u00e9 de Lorraine, Nancy, France#TAB#","institution_ids":["https://openalex.org/I90183372"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033129735","display_name":"Christopher Amato","orcid":"https://orcid.org/0000-0002-6786-7384"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"funder","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Christopher Amato","raw_affiliation_strings":["CSAIL, MIT Cambridge, MA#TAB#"],"affiliations":[{"raw_affiliation_string":"CSAIL, MIT Cambridge, MA#TAB#","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022343068","display_name":"Olivier Buffet","orcid":"https://orcid.org/0000-0002-5072-5857"},"institutions":[{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"funder","lineage":["https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Olivier Buffet","raw_affiliation_strings":["Inria, Universit\u00e9 de Lorraine, Nancy, France#TAB#"],"affiliations":[{"raw_affiliation_string":"Inria, Universit\u00e9 de Lorraine, Nancy, France#TAB#","institution_ids":["https://openalex.org/I90183372"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051052976","display_name":"Fran\u00e7ois Charpillet","orcid":"https://orcid.org/0000-0001-8260-1536"},"institutions":[{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"funder","lineage":["https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Fran\u00e7ois Charpillet","raw_affiliation_strings":["Inria, Universit\u00e9 de Lorraine, Nancy, France#TAB#"],"affiliations":[{"raw_affiliation_string":"Inria, Universit\u00e9 de Lorraine, Nancy, France#TAB#","institution_ids":["https://openalex.org/I90183372"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":0,"currency":"USD","value_usd":0},"apc_paid":null,"fwci":7.214,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":74,"citation_normalized_percentile":{"value":0.955208,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":"55","issue":null,"first_page":"443","last_page":"497"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.998,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.998,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9946,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11010","display_name":"Logic, Reasoning, and Knowledge","score":0.987,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C17098449","wikidata":"https://www.wikidata.org/wiki/Q176814","display_name":"Partially observable Markov decision process","level":4,"score":0.86237335},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.74442196},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.72276247},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.6850269},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6761794},{"id":"https://openalex.org/C14646407","wikidata":"https://www.wikidata.org/wiki/Q1430750","display_name":"Bellman equation","level":2,"score":0.6289742},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.5493082},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5097143},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.43944803},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.31445724},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25255647},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.22418052},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.19170803},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.18744567},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.17612031},{"id":"https://openalex.org/C163836022","wikidata":"https://www.wikidata.org/wiki/Q6771326","display_name":"Markov model","level":3,"score":0.14775214},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0}],"mesh":[],"locations_count":9,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1613/jair.4623","pdf_url":"https://jair.org/index.php/jair/article/download/10986/26136","source":{"id":"https://openalex.org/S139930977","display_name":"Journal of Artificial Intelligence Research","issn_l":"1076-9757","issn":["1076-9757","1943-5037"],"is_oa":true,"is_in_doaj":true,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310315760","host_organization_name":"AI Access Foundation","host_organization_lineage":["https://openalex.org/P4310315760"],"host_organization_lineage_names":["AI Access Foundation"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://hal.inria.fr/hal-00907338","pdf_url":"https://inria.hal.science/hal-00907338/document","source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":["Centre National de la Recherche Scientifique"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"https://hal.inria.fr/hal-01279444","pdf_url":"https://inria.hal.science/hal-01279444/document","source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":["Centre National de la Recherche Scientifique"],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":false,"landing_page_url":"https://inria.hal.science/hal-01279444","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"https://hal.inria.fr/hal-01279444/file/dibangoye16a.pdf","pdf_url":"https://hal.inria.fr/hal-01279444/file/dibangoye16a.pdf","source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":["Centre National de la Recherche Scientifique"],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://hal.inria.fr/hal-01279444/document","pdf_url":"https://hal.inria.fr/hal-01279444/document","source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":["Centre National de la Recherche Scientifique"],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://hal.inria.fr/hal-00907338/file/ijcai13b.pdf","pdf_url":"https://hal.inria.fr/hal-00907338/file/ijcai13b.pdf","source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":["Centre National de la Recherche Scientifique"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"https://hal.inria.fr/hal-00907338/document","pdf_url":"https://hal.inria.fr/hal-00907338/document","source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":["Centre National de la Recherche Scientifique"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.638.9102","pdf_url":"http://people.csail.mit.edu/camato/publications/DABC-IJCAI13.pdf","source":{"id":"https://openalex.org/S4306400349","display_name":"CiteSeer X (The Pennsylvania State University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I130769515","host_organization_name":"Pennsylvania State University","host_organization_lineage":["https://openalex.org/I130769515"],"host_organization_lineage_names":["Pennsylvania State University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1613/jair.4623","pdf_url":"https://jair.org/index.php/jair/article/download/10986/26136","source":{"id":"https://openalex.org/S139930977","display_name":"Journal of Artificial Intelligence Research","issn_l":"1076-9757","issn":["1076-9757","1943-5037"],"is_oa":true,"is_in_doaj":true,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310315760","host_organization_name":"AI Access Foundation","host_organization_lineage":["https://openalex.org/P4310315760"],"host_organization_lineage_names":["AI Access Foundation"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.82,"display_name":"Peace, justice, and strong institutions"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":77,"referenced_works":["https://openalex.org/W100327610","https://openalex.org/W110618639","https://openalex.org/W118921981","https://openalex.org/W124331494","https://openalex.org/W1513089816","https://openalex.org/W1554448638","https://openalex.org/W1560489415","https://openalex.org/W156814138","https://openalex.org/W1575232410","https://openalex.org/W1576060340","https://openalex.org/W1588304026","https://openalex.org/W1589131899","https://openalex.org/W1670739992","https://openalex.org/W1710391264","https://openalex.org/W1745373831","https://openalex.org/W1798373787","https://openalex.org/W1805286982","https://openalex.org/W1908253641","https://openalex.org/W1930803870","https://openalex.org/W1969483458","https://openalex.org/W1972774725","https://openalex.org/W1976195538","https://openalex.org/W1988975763","https://openalex.org/W2009533501","https://openalex.org/W2021061679","https://openalex.org/W2024780670","https://openalex.org/W2028145673","https://openalex.org/W2034725503","https://openalex.org/W2039403346","https://openalex.org/W2055921164","https://openalex.org/W2087992130","https://openalex.org/W2088956500","https://openalex.org/W2101450289","https://openalex.org/W2102764452","https://openalex.org/W2103215206","https://openalex.org/W2103541323","https://openalex.org/W2105757562","https://openalex.org/W2108005621","https://openalex.org/W2110962519","https://openalex.org/W2116753650","https://openalex.org/W2119567691","https://openalex.org/W2121754545","https://openalex.org/W2121943493","https://openalex.org/W2122905566","https://openalex.org/W2124520701","https://openalex.org/W2124951610","https://openalex.org/W2128371572","https://openalex.org/W2131747355","https://openalex.org/W2134802714","https://openalex.org/W2153601367","https://openalex.org/W2153821047","https://openalex.org/W2162635261","https://openalex.org/W2162735718","https://openalex.org/W2163827199","https://openalex.org/W2163944731","https://openalex.org/W2165421048","https://openalex.org/W2168359464","https://openalex.org/W2169294731","https://openalex.org/W2169982856","https://openalex.org/W2196890647","https://openalex.org/W2287282975","https://openalex.org/W2294192315","https://openalex.org/W2321292752","https://openalex.org/W2341171179","https://openalex.org/W24098402","https://openalex.org/W241919466","https://openalex.org/W2545350044","https://openalex.org/W2963493419","https://openalex.org/W309675244","https://openalex.org/W3104860527","https://openalex.org/W4199186","https://openalex.org/W4232967792","https://openalex.org/W4236849587","https://openalex.org/W4285719527","https://openalex.org/W4298023569","https://openalex.org/W4299414914","https://openalex.org/W85998123"],"related_works":["https://openalex.org/W52153049","https://openalex.org/W4323315247","https://openalex.org/W4321379664","https://openalex.org/W3169161914","https://openalex.org/W2294884454","https://openalex.org/W2211790881","https://openalex.org/W2096013579","https://openalex.org/W1760611253","https://openalex.org/W1589140671","https://openalex.org/W1515117609"],"abstract_inverted_index":{"Decentralized":[0],"partially":[1],"observable":[2],"Markov":[3],"decision":[4],"processes":[5],"(Dec-POMDPs)":[6],"provide":[7,101],"a":[8,26,39,42,47,66,136],"general":[9],"model":[10],"for":[11,96],"decision-making":[12],"under":[13],"uncertainty":[14],"in":[15,65,119,163],"decentralized":[16],"settings,":[17],"but":[18],"are":[19],"difficult":[20],"to":[21,93,126,128,189],"solve":[22],"optimally":[23],"(NEXP-Complete).":[24],"As":[25],"new":[27,77],"way":[28],"of":[29,37,57,192],"solving":[30],"these":[31],"problems,":[32],"we":[33,81,103,134],"introduce":[34,135],"the":[35,58,97,116,124,190,193],"idea":[36],"transforming":[38],"Dec-POMDP":[40,78],"into":[41],"continuous-state":[43,90],"deterministic":[44],"MDP":[45,91],"with":[46,166],"piecewise-linear":[48],"and":[49,89,111,152],"convex":[50],"value":[51,140],"function.":[52],"This":[53,76],"approach":[54,106,183],"makes":[55],"use":[56],"fact":[59],"that":[60,114,144,160,181],"planning":[61],"can":[62,72],"be":[63,74,94],"accomplished":[64],"centralized":[67],"offline":[68],"manner,":[69],"while":[70],"execution":[71],"still":[73],"decentralized.":[75],"formulation,":[79],"which":[80],"call":[82],"an":[83,129,167,172],"occupancy":[84],"MDP,":[85],"allows":[86],"powerful":[87],"POMDP":[88],"methods":[92],"used":[95],"first":[98],"time.":[99],"To":[100],"scalability,":[102],"refine":[104],"this":[105],"by":[107],"combining":[108],"heuristic":[109,138],"search":[110,139],"compact":[112,148],"representations":[113],"exploit":[115],"structure":[117],"present":[118],"multi-agent":[120],"domains,":[121],"without":[122],"losing":[123],"ability":[125],"converge":[127],"optimal":[130,168],"solution.":[131,169],"In":[132],"particular,":[133],"feature-based":[137,147],"iteration":[141],"(FB-HSVI)":[142],"algorithm":[143],"relies":[145],"on":[146],"representations,":[149],"point-based":[150],"updates":[151],"efficient":[153],"action":[154],"selection.":[155],"A":[156],"theoretical":[157],"analysis":[158,175],"demonstrates":[159],"FB-HSVI":[161],"terminates":[162],"finite":[164],"time":[165],"We":[170],"include":[171],"extensive":[173],"empirical":[174],"using":[176],"well-known":[177],"benchmarks,":[178],"thereby":[179],"demonstrating":[180],"our":[182],"provides":[184],"significant":[185],"scalability":[186],"improvements":[187],"compared":[188],"state":[191],"art.":[194]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W309675244","counts_by_year":[{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":11},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":5},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":9},{"year":2015,"cited_by_count":6},{"year":2014,"cited_by_count":6},{"year":2013,"cited_by_count":4}],"updated_date":"2025-04-22T05:07:06.222291","created_date":"2016-06-24"}