{"id":"https://openalex.org/W3150158988","doi":"https://doi.org/10.1017/s0021900200012560","title":"First Passage Optimality and Variance Minimisation of Markov Decision Processes with Varying Discount Factors","display_name":"First Passage Optimality and Variance Minimisation of Markov Decision Processes with Varying Discount Factors","publication_year":2015,"publication_date":"2015-06-01","ids":{"openalex":"https://openalex.org/W3150158988","doi":"https://doi.org/10.1017/s0021900200012560","mag":"3150158988"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1017/s0021900200012560","pdf_url":null,"source":{"id":"https://openalex.org/S160779208","display_name":"Journal of Applied Probability","issn_l":"0021-9002","issn":["0021-9002","1475-6072"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020038593","display_name":"X. G. Wu","orcid":"https://orcid.org/0000-0002-0903-8852"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao Wu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5101505539","display_name":"Xianping Guo","orcid":"https://orcid.org/0000-0001-6954-5947"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xianping Guo","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.141,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":8,"citation_normalized_percentile":{"value":0.800892,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":84,"max":85},"biblio":{"volume":"52","issue":"02","first_page":"441","last_page":"456"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":0.997,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":0.997,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10768","display_name":"Electric Vehicles and Infrastructure","score":0.9957,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9887,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/minimisation","display_name":"Minimisation (clinical trials)","score":0.8243355}],"concepts":[{"id":"https://openalex.org/C86941820","wikidata":"https://www.wikidata.org/wiki/Q6865391","display_name":"Minimisation (clinical trials)","level":2,"score":0.8243355},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.7785026},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.6421176},{"id":"https://openalex.org/C6177178","wikidata":"https://www.wikidata.org/wiki/Q10998070","display_name":"Discounting","level":2,"score":0.6081635},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.57130516},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5698985},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.51090497},{"id":"https://openalex.org/C144237770","wikidata":"https://www.wikidata.org/wiki/Q747534","display_name":"Mathematical economics","level":1,"score":0.4672622},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.34402645},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.3343861},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.18321255},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.1743409},{"id":"https://openalex.org/C121955636","wikidata":"https://www.wikidata.org/wiki/Q4116214","display_name":"Accounting","level":1,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1017/s0021900200012560","pdf_url":null,"source":{"id":"https://openalex.org/S160779208","display_name":"Journal of Applied Probability","issn_l":"0021-9002","issn":["0021-9002","1475-6072"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, justice, and strong institutions","score":0.65}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":14,"referenced_works":["https://openalex.org/W1977158480","https://openalex.org/W1991478799","https://openalex.org/W1992668155","https://openalex.org/W2006115861","https://openalex.org/W2010559195","https://openalex.org/W2014323878","https://openalex.org/W2024265320","https://openalex.org/W2035033056","https://openalex.org/W2060110534","https://openalex.org/W2065365821","https://openalex.org/W2083635875","https://openalex.org/W2083738358","https://openalex.org/W2156049124","https://openalex.org/W2313791856"],"related_works":["https://openalex.org/W4255368532","https://openalex.org/W2413828414","https://openalex.org/W2379651310","https://openalex.org/W2367222340","https://openalex.org/W2162286586","https://openalex.org/W2113019827","https://openalex.org/W2077098439","https://openalex.org/W2011109452","https://openalex.org/W187740018","https://openalex.org/W1541249122"],"abstract_inverted_index":{"This":[0],"paper":[1],"deals":[2],"with":[3,18],"the":[4,34,38,46,51,61,67,88,96,99,123,126,132,139],"first":[5,52,79,103,127],"passage":[6,53,80,104,128],"optimality":[7,81,129,135],"and":[8,22,48,119,131],"variance":[9,68,97],"minimisation":[10,69],"problems":[11],"of":[12,50,83,90,101,136],"discrete-time":[13],"Markov":[14],"decision":[15],"processes":[16],"(MDPs)":[17],"varying":[19],"discount":[20,134],"factors":[21],"unbounded":[23],"rewards/costs.":[24],"First,":[25],"under":[26],"suitable":[27],"conditions":[28],"slightly":[29],"weaker":[30],"than":[31],"those":[32],"in":[33,138],"previous":[35,140],"literature":[36],"on":[37],"standard":[39,133],"(infinite":[40],"horizon)":[41],"discounted":[42],"MDPs,":[43,84],"we":[44,65,109],"establish":[45],"existence":[47,89],"characterisation":[49],"expected-optimal":[54,62,105],"stationary":[55,63,106],"policies.":[56,107],"Second,":[57],"to":[58,76,114,121],"further":[59],"distinguish":[60],"policies,":[64],"introduce":[66],"problem,":[70],"prove":[71],"that":[72,94],"it":[73],"is":[74],"equivalent":[75],"a":[77,91,111],"new":[78],"problem":[82],"and,":[85],"thus,":[86],"show":[87,122],"variance-optimal":[92],"policy":[93],"minimises":[95],"over":[98],"set":[100],"all":[102],"Finally,":[108],"use":[110],"computable":[112],"example":[113],"illustrate":[115],"our":[116],"main":[117],"results":[118],"also":[120],"difference":[124],"between":[125],"here":[130],"MDPs":[137],"literature.":[141]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W3150158988","counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":3}],"updated_date":"2025-04-17T21:18:13.128299","created_date":"2021-04-13"}