{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,6]],"date-time":"2024-09-06T12:12:20Z","timestamp":1725624740348},"reference-count":19,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2012,3]]},"DOI":"10.1109\/icassp.2012.6289040","type":"proceedings-article","created":{"date-parts":[[2012,9,7]],"date-time":"2012-09-07T19:58:06Z","timestamp":1347047886000},"page":"4989-4992","source":"Crossref","is-referenced-by-count":7,"title":["Off-policy learning in large-scale POMDP-based dialogue systems"],"prefix":"10.1109","author":[{"given":"Lucie","family":"Daubigney","sequence":"first","affiliation":[]},{"given":"Matthieu","family":"Geist","sequence":"additional","affiliation":[]},{"given":"Olivier","family":"Pietquin","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"19","doi-asserted-by":"publisher","DOI":"10.1145\/1102351.1102377"},{"key":"17","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2011-434","article-title":"Uncertainty management for on-line optimisation of a POMDP-based large-scale spoken dialogue system","author":"daubigney","year":"2011","journal-title":"Proc of Interspeech 2011"},{"key":"18","doi-asserted-by":"publisher","DOI":"10.1145\/1553374.1553441"},{"key":"15","doi-asserted-by":"publisher","DOI":"10.3115\/1614108.1614146"},{"key":"16","article-title":"Managing Uncertainty within the KTD Framework","author":"geist","year":"0","journal-title":"Proc of the AL&E Workshop 2011"},{"key":"13","article-title":"Sample Efficient Online Learning of Optimal Dialogue Policies with Kalman Temporal Differences","author":"pietquin","year":"2011","journal-title":"Proc IJCAI 2011"},{"key":"14","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2006.06.008"},{"key":"11","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2005.1566498"},{"key":"12","doi-asserted-by":"publisher","DOI":"10.1109\/ADPRL.2009.4927543"},{"key":"3","doi-asserted-by":"publisher","DOI":"10.1109\/89.817450"},{"key":"2","article-title":"Reinforcement learning for spoken dialogue systems","author":"singh","year":"0","journal-title":"Proc NIPS'99 1999"},{"journal-title":"Reinforcement Learning An Introduction","year":"1998","author":"sutton","key":"1"},{"key":"10","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2010-41","article-title":"Natural Belief-Critic: A reinforcement algorithm for parameter estimation in statistical spoken dialogue systems","author":"jurcicek","year":"2010","journal-title":"InterSpeech '11"},{"key":"7","doi-asserted-by":"crossref","DOI":"10.1017\/S0269888906000944","article-title":"A survey of statistical user simulation techniques for rl of dialogue management strategies","author":"schatzmann","year":"2006","journal-title":"The Knowledge Engineering Review"},{"key":"6","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.1997.658991"},{"key":"5","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2009.04.001"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1109\/TSA.2005.855836"},{"key":"9","article-title":"Gaussian processes for fast policy optimisation of POMDPbased dialogue managers","author":"gas?ic?","year":"0","journal-title":"Proc of SigDial 2010"},{"key":"8","article-title":"Effects of the user model on simulation-based learning of dialogue strategies","author":"schatzmann","year":"0","journal-title":"Proc of ASRU'05 2005"}],"event":{"name":"ICASSP 2012 - 2012 IEEE International Conference on Acoustics, Speech and Signal Processing","start":{"date-parts":[[2012,3,25]]},"location":"Kyoto, Japan","end":{"date-parts":[[2012,3,30]]}},"container-title":["2012 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/6268628\/6287775\/06289040.pdf?arnumber=6289040","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,28]],"date-time":"2022-01-28T13:28:30Z","timestamp":1643376510000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/6289040\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,3]]},"references-count":19,"URL":"https:\/\/doi.org\/10.1109\/icassp.2012.6289040","relation":{},"subject":[],"published":{"date-parts":[[2012,3]]}}}