{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,20]],"date-time":"2024-09-20T16:37:50Z","timestamp":1726850270670},"reference-count":252,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Annual Reviews in Control"],"published-print":{"date-parts":[[2020]]},"DOI":"10.1016\/j.arcontrol.2020.06.001","type":"journal-article","created":{"date-parts":[[2020,6,26]],"date-time":"2020-06-26T09:50:01Z","timestamp":1593165001000},"page":"119-138","update-policy":"http:\/\/dx.doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":58,"special_numbering":"C","title":["From inverse optimal control to inverse reinforcement learning: A historical review"],"prefix":"10.1016","volume":"50","author":[{"given":"Nematollah","family":"Ab Azar","sequence":"first","affiliation":[]},{"given":"Aref","family":"Shahmansoorian","sequence":"additional","affiliation":[]},{"given":"Mohsen","family":"Davoudi","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/j.arcontrol.2020.06.001_bib254","doi-asserted-by":"crossref","first-page":"1608","DOI":"10.1177\/0278364910371999","article-title":"Autonomous helicopter aerobatics through apprenticeship learning","volume":"29(13)","author":"Abbeel","year":"2010","journal-title":"The International Journal of Robotics Research"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0001","series-title":"Proceedings of the twenty-first international conference on machine learning","first-page":"1","article-title":"Apprenticeship learning via inverse reinforcement learning","author":"Abbeel","year":"2004"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0002","series-title":"Inverse optimal control for differentially flat systems with application to lower-limb prosthetic devices","author":"Aghasadeghi","year":"2015"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0003","series-title":"2011 IEEE\/RSJ international conference on intelligent robots and systems","first-page":"1561","article-title":"Maximum entropy inverse reinforcement learning in continuous state spaces with path integrals","author":"Aghasadeghi","year":"2011"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0004","series-title":"2012 IEEE international conference on robotics and automation","first-page":"4962","article-title":"Inverse optimal control for a hybrid dynamical system with impacts","author":"Aghasadeghi","year":"2012"},{"issue":"5","key":"10.1016\/j.arcontrol.2020.06.001_bib0005","doi-asserted-by":"crossref","first-page":"771","DOI":"10.1287\/opre.49.5.771.10607","article-title":"Inverse optimization","volume":"49","author":"Ahuja","year":"2001","journal-title":"Operations Research"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0006","series-title":"The calculus of variations","author":"Akhiezer","year":"1962"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0007","series-title":"2015 12th international conference on informatics in control, automation and robotics (ICINCO)","first-page":"275","article-title":"A new inverse optimal control method for discrete-time systems","volume":"1","author":"Almobaied","year":"2015"},{"issue":"1","key":"10.1016\/j.arcontrol.2020.06.001_bib0008","doi-asserted-by":"crossref","first-page":"19","DOI":"10.1002\/oca.2331","article-title":"Inverse optimal controller based on extended Kalman filter for discrete\u2010time nonlinear systems","volume":"39","author":"Almobaied","year":"2018","journal-title":"Optimal Control Applications and Methods"},{"issue":"4","key":"10.1016\/j.arcontrol.2020.06.001_bib0009","doi-asserted-by":"crossref","first-page":"943","DOI":"10.1109\/TSMCB.2008.926614","article-title":"Discrete-time nonlinear HJB solution using approximate dynamic programming: Convergence proof","volume":"38","author":"Al-Tamimi","year":"2008","journal-title":"IEEE Transactions on Systems, Man, and Cybernetics, Part B (Cybernetics)"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0010","series-title":"THE inverse problem of optimal control (No. TR-6560-3)","author":"Anderson","year":"1966"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0011","series-title":"Optimal control: Linear quadratic methods","author":"Anderson","year":"2007"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib252","series-title":"Optimal Control: Linear Quadratic Methods","author":"Anderson","year":"1989"},{"issue":"5","key":"10.1016\/j.arcontrol.2020.06.001_bib0012","doi-asserted-by":"crossref","first-page":"480","DOI":"10.2514\/3.19750","article-title":"Robust colocated control for large flexible space structures","volume":"4","author":"Arbel","year":"1981","journal-title":"Journal of Guidance and Control"},{"issue":"1","key":"10.1016\/j.arcontrol.2020.06.001_bib0013","doi-asserted-by":"crossref","first-page":"5","DOI":"10.1109\/TRO.2008.915449","article-title":"An optimality principle governing human walking","volume":"24","author":"Arechavaleta","year":"2008","journal-title":"IEEE Transactions on Robotics"},{"issue":"3\u20134","key":"10.1016\/j.arcontrol.2020.06.001_bib0014","doi-asserted-by":"crossref","first-page":"243","DOI":"10.1016\/j.robot.2010.11.004","article-title":"Teacher feedback to scaffold and refine demonstrated motion primitives on a mobile robot","volume":"59","author":"Argall","year":"2011","journal-title":"Robotics and Autonomous Systems"},{"issue":"5","key":"10.1016\/j.arcontrol.2020.06.001_bib0015","doi-asserted-by":"crossref","first-page":"469","DOI":"10.1016\/j.robot.2008.10.024","article-title":"A survey of robot learning from demonstration","volume":"57","author":"Argall","year":"2009","journal-title":"Robotics and autonomous systems"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0016","unstructured":"Arora, S., & Doshi, P. (2018). A survey of inverse reinforcement learning: Challenges, methods and progress. arXiv preprint arXiv:1806.06877."},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0017","doi-asserted-by":"crossref","first-page":"1163","DOI":"10.1016\/0362-546X(83)90049-4","article-title":"Stabilization with relaxed controls","volume":"7","author":"Artstein","year":"1983","journal-title":"Nonlinear Anal. TMA"},{"issue":"6","key":"10.1016\/j.arcontrol.2020.06.001_bib0018","doi-asserted-by":"crossref","first-page":"26","DOI":"10.1109\/MSP.2017.2743240","article-title":"Deep reinforcement learning: A brief survey","volume":"34","author":"Arulkumaran","year":"2017","journal-title":"IEEE Signal Processing Magazine"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0019","series-title":"Twenty-fourth international joint conference on artificial intelligence","article-title":"Maximum entropy semi-supervised inverse reinforcement learning","author":"Audiffren","year":"2015"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0020","series-title":"Proceedings of the 28th International conference on machine learning (ICML-11)","first-page":"897","article-title":"Apprenticeship learning about multiple intentions","author":"Babes","year":"2011"},{"issue":"6","key":"10.1016\/j.arcontrol.2020.06.001_bib0021","doi-asserted-by":"crossref","first-page":"571","DOI":"10.1177\/0142331208095427","article-title":"From Artstein-Sontag theorem to the min-projection strategy","volume":"32","author":"Bacciotti","year":"2010","journal-title":"Transactions of the Institute of Measurement and Control"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0022","series-title":"Advances in neural information processing systems","first-page":"1153","article-title":"Boosting structured prediction for imitation learning","author":"Bagnell","year":"2007"},{"issue":"15","key":"10.1016\/j.arcontrol.2020.06.001_bib0023","first-page":"103","article-title":"A framework for behavioural claning","volume":"15","author":"Bain","year":"1999","journal-title":"Machine Intelligence"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0024","series-title":"AISB96 workshop on learning in robots and animals","first-page":"3","article-title":"Robot see, robot do: An overview of robot imitation","author":"Bakker","year":"1996"},{"issue":"01","key":"10.1016\/j.arcontrol.2020.06.001_bib0025","doi-asserted-by":"crossref","DOI":"10.1142\/S0219843612500065","article-title":"A survey of vision-based architectures for robot learning by imitation","volume":"9","author":"Bandera","year":"2012","journal-title":"International Journal of Humanoid Robotics"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0026","first-page":"679","article-title":"A Markovian decision process","author":"Bellman","year":"1957","journal-title":"Journal of Mathematics and Mechanics"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0027","doi-asserted-by":"crossref","first-page":"424","DOI":"10.1016\/0022-247X(70)90090-9","article-title":"Dynamic programming and inverse optimal problems in mathematical economics","volume":"29","author":"Bellman","year":"1970","journal-title":"Journal of Mathematical Analysis and Applications"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0028","series-title":"Mathematical tables and other aids to computation","first-page":"247","article-title":"Functional approximations and dynamic programming","author":"Bellman","year":"1959"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0029","series-title":"An inverse problem in dynamic programming and automatic control","author":"Bellman","year":"1963"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0030","series-title":"Proceedings of 1995 34th IEEE conference on decision and control","first-page":"560","article-title":"Neuro-dynamic programming: An overview","volume":"1","author":"Bertsekas","year":"1995"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0031","series-title":"Neuro-dynamic programming","author":"Bertsekas","year":"1996"},{"issue":"12","key":"10.1016\/j.arcontrol.2020.06.001_bib0032","doi-asserted-by":"crossref","first-page":"3824","DOI":"10.4249\/scholarpedia.3824","article-title":"Robot learning by demonstration","volume":"8","author":"Billard","year":"2013","journal-title":"Scholarpedia"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0033","series-title":"Proceedings of the fourth international conference on autonomous agents","first-page":"373","article-title":"A biologically inspired robotic model for learning by imitation","author":"Billard","year":"2000"},{"issue":"2\u20133","key":"10.1016\/j.arcontrol.2020.06.001_bib0034","doi-asserted-by":"crossref","first-page":"145","DOI":"10.1016\/S0921-8890(01)00155-5","article-title":"Learning human arm movements by imitation:: Evaluation of a biologically inspired connectionist architecture","volume":"37","author":"Billard","year":"2001","journal-title":"Robotics and Autonomous Systems"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0035","series-title":"Pattern recognition and machine learning","author":"Bishop","year":"2006"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0036","doi-asserted-by":"crossref","first-page":"103","DOI":"10.3846\/16483840.2002.10414022","article-title":"The inverse simulation study of aircraft flight path reconstruction","volume":"17","author":"Blajer","year":"2002","journal-title":"Transport"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0037","unstructured":"Bliss, G.A. (1946). Lectures on the Calculus of Variations."},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0038","series-title":"Workshops at the twenty-ninth AAAI conference on artificial intelligence","article-title":"Deep apprenticeship learning for playing video games","author":"Bogdanovic","year":"2015"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0039","series-title":"Vorlesungen \u00fcber variationsrechnung","author":"Bolza","year":"1909"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0040","series-title":"Proceedings of the fourteenth international conference on artificial intelligence and statistics","first-page":"182","article-title":"Relative entropy inverse reinforcement learning","author":"Boularias","year":"2011"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0041","volume":"Vol. 15","author":"Boyd","year":"1994"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0042","unstructured":"Brown, D.S., Goo, W., Nagarajan, P., & Niekum, S. (2019). Extrapolating beyond suboptimal demonstrations via inverse reinforcement learning from observations. arXiv preprint arXiv:1904.06387."},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0043","doi-asserted-by":"crossref","first-page":"26","DOI":"10.1109\/37.506395","article-title":"Optimal control-1950 to 1985","volume":"16","author":"Bryson","year":"1996","journal-title":"IEEE Control Systems Magazine"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0044","doi-asserted-by":"crossref","first-page":"263","DOI":"10.1017\/S0956792505006182","article-title":"A survey on level set methods for inverse problems and optimal design","volume":"16","author":"Burger","year":"2005","journal-title":"European Journal of Applied Mathematics"},{"issue":"1\u20133","key":"10.1016\/j.arcontrol.2020.06.001_bib0045","doi-asserted-by":"crossref","first-page":"45","DOI":"10.1007\/BF01585693","article-title":"On an instance of the inverse shortest paths problem","volume":"53","author":"Burton","year":"1992","journal-title":"Mathematical Programming"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0046","doi-asserted-by":"crossref","first-page":"243","DOI":"10.1016\/S0045-7949(96)00340-9","article-title":"Optimal regularization of an inverse dynamics problem","volume":"63","author":"Busby","year":"1997","journal-title":"Computers & Structures"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0047","series-title":"NIPS workshop on autonomous learning robots","article-title":"Layered hybrid inverse optimal control for learning robot manipulation from demonstration","author":"Byravan","year":"2014"},{"issue":"5","key":"10.1016\/j.arcontrol.2020.06.001_bib0048","doi-asserted-by":"crossref","first-page":"667","DOI":"10.1017\/S0140525X98001745","article-title":"Learning by imitation: A hierarchical approach","volume":"21","author":"Byrne","year":"1998","journal-title":"Behavioral and Brain Sciences"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0049","doi-asserted-by":"crossref","first-page":"441","DOI":"10.1075\/is.8.3.08cal","article-title":"What is the teacher's role in robot programming by demonstration?: Toward benchmarks for improved learning","volume":"8","author":"Calinon","year":"2007","journal-title":"Interaction Studies"},{"issue":"4","key":"10.1016\/j.arcontrol.2020.06.001_bib0051","doi-asserted-by":"crossref","first-page":"491","DOI":"10.1007\/BF00934036","article-title":"On the general inverse problem of optimal control theory","volume":"32","author":"Casti","year":"1980","journal-title":"Journal of Optimization Theory and Applications"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0052","unstructured":"Casti, J.L. (1974). A Note on the General Inverse Problem of Optimal Control Theory."},{"issue":"1","key":"10.1016\/j.arcontrol.2020.06.001_bib0053","doi-asserted-by":"crossref","first-page":"147","DOI":"10.2307\/1911845","article-title":"The inverse optimal problem: A dynamic programming approach","volume":"56","author":"Chang","year":"1988","journal-title":"Econometrica"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0054","doi-asserted-by":"crossref","first-page":"349","DOI":"10.1016\/0005-1098(82)90096-6","article-title":"On receding horizon feedback control","volume":"18","author":"Chen","year":"1982","journal-title":"Automatica"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0055","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1613\/jair.2584","article-title":"Interactive policy learning through confidence-based autonomy","volume":"34","author":"Chernova","year":"2009","journal-title":"Journal of Artificial Intelligence Research"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0056","first-page":"691","article-title":"Inverse reinforcement learning in partially observable environments","volume":"12","author":"Choi","year":"2011","journal-title":"Journal of Machine Learning Research"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0057","series-title":"Twenty-third international joint conference on artificial intelligence","article-title":"Bayesian nonparametric feature construction for inverse reinforcement learning","author":"Choi","year":"2013"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0058","doi-asserted-by":"crossref","first-page":"564","DOI":"10.1109\/TRO.2019.2891173","article-title":"Robust learning from demonstrations with mixed qualities using leveraged gaussian processes","volume":"35","author":"Choi","year":"2019","journal-title":"IEEE Transactions on Robotics"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0059","series-title":"53rd IEEE conference on decision and control","first-page":"6677","article-title":"Reconstructing trajectories from the moments of occupation measures","author":"Claeys","year":"2014"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0060","series-title":"Robotics: Science and systems","article-title":"An inverse optimal control approach for the transfer of human walking motions in constrained environment to humanoid robots","author":"Clever","year":"2016"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0061","series-title":"A generalization of Sontag's formula for high-performance CLF-based control","author":"Curtis III","year":"2002"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0062","series-title":"International symposium on experimental robotics","first-page":"3","article-title":"Learning transferable policies for monocular reactive mav control","author":"Daftry","year":"2016"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0063","doi-asserted-by":"crossref","first-page":"597","DOI":"10.1287\/moor.1060.0208","article-title":"A cost-shaping linear program for average-cost approximate dynamic programming with performance guarantees","volume":"31","author":"De Farias","year":"2006","journal-title":"Mathematics of Operations Research"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0064","first-page":"30","article-title":"Robot programming by human demonstration: Adaptation and inconsistency in constrained motion","volume":"1","author":"Delson","year":"1996"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0065","doi-asserted-by":"crossref","first-page":"151","DOI":"10.1016\/S0167-6911(97)00067-4","article-title":"Stochastic nonlinear stabilization\u2014II: Inverse optimality","volume":"32","author":"Deng","year":"1997","journal-title":"Systems & Control Letters"},{"issue":"5","key":"10.1016\/j.arcontrol.2020.06.001_bib0066","doi-asserted-by":"crossref","first-page":"2581","DOI":"10.1109\/TMECH.2015.2510165","article-title":"Learning compliant movement primitives through demonstration and statistical generalization","volume":"21","author":"Deni\u0161a","year":"2015","journal-title":"IEEE\/ASME Transactions on Mechatronics"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0067","article-title":"Direct loss minimization inverse optimal control","author":"Doerr","year":"2015","journal-title":"Robotics: Science and Systems"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0068","series-title":"Advances in neural information processing systems","first-page":"1087","article-title":"One-shot imitation learning","author":"Duan","year":"2017"},{"issue":"6","key":"10.1016\/j.arcontrol.2020.06.001_bib0069","doi-asserted-by":"crossref","first-page":"270","DOI":"10.1115\/1.3151899","article-title":"Inverse design and active control concepts in strong unsteady heat conduction","volume":"41","author":"Dulikravich","year":"1988","journal-title":"Applied Mechanics Reviews"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0070","series-title":"Proceedings of the 27th international conference on machine learning (ICML-10)","first-page":"335","article-title":"Inverse optimal control with linearly-solvable MDPs","author":"Dvijotham","year":"2010"},{"issue":"5","key":"10.1016\/j.arcontrol.2020.06.001_bib0071","doi-asserted-by":"crossref","first-page":"388","DOI":"10.1177\/1059712313491614","article-title":"Probabilistic model-based imitation learning","volume":"21","author":"Englert","year":"2013","journal-title":"Adaptive Behavior"},{"issue":"13\u201314","key":"10.1016\/j.arcontrol.2020.06.001_bib0072","doi-asserted-by":"crossref","first-page":"1474","DOI":"10.1177\/0278364917745980","article-title":"Inverse KKT: Learning cost functions of manipulation tasks from demonstrations","volume":"36","author":"Englert","year":"2017","journal-title":"The International Journal of Robotics Research"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0073","doi-asserted-by":"crossref","first-page":"293","DOI":"10.1093\/nsr\/nwt032","article-title":"Challenges of big data analysis","volume":"1","author":"Fan","year":"2014","journal-title":"National Science Review"},{"issue":"1","key":"10.1016\/j.arcontrol.2020.06.001_bib0074","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1002\/(SICI)1099-1115(200002)14:1<1::AID-ACS595>3.0.CO;2-B","article-title":"Inverse optimal adaptive control for non-linear uncertain systems with exogenous disturbances","volume":"14","author":"Fausz","year":"2000","journal-title":"International Journal of Adaptive Control and Signal Processing"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0075","unstructured":"Finn, C., Christiano, P., Abbeel, P., & Levine, S. (2016). A connection between generative adversarial networks, inverse reinforcement learning, and energy-based models. arXiv preprint arXiv:1611.03852.2016b."},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0076","series-title":"International conference on machine learning","first-page":"49","article-title":"Guided cost learning: Deep inverse optimal control via policy optimization","author":"Finn","year":"2016"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0077","unstructured":"Finn, C., Yu, T., Zhang, T., Abbeel, P., & Levine, S. (2017). One-shot visual imitation learning via meta-learning. arXiv preprint arXiv:1709.04905."},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0078","series-title":"Robust nonlinear control design: State-space and lyapunov techniques","author":"Freeman","year":"2008"},{"issue":"4","key":"10.1016\/j.arcontrol.2020.06.001_bib0079","doi-asserted-by":"crossref","first-page":"1365","DOI":"10.1137\/S0363012993258732","article-title":"Inverse optimality in robust stabilization","volume":"34","author":"Freeman","year":"1996","journal-title":"SIAM Journal on Control and Optimization"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0080","series-title":"Proceedings of 35th IEEE conference on decision and control","first-page":"3926","article-title":"Control Lyapunov functions: New ideas from an old source","volume":"4","author":"Freeman","year":"1996"},{"issue":"11","key":"10.1016\/j.arcontrol.2020.06.001_bib0081","doi-asserted-by":"crossref","first-page":"995","DOI":"10.1109\/TAC.1987.1104479","article-title":"A new approach to the LQ design from the viewpoint of the inverse regulator problem","volume":"32","author":"Fujii","year":"1987","journal-title":"IEEE Transactions on Automatic Control"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0082","series-title":"Proceedings of the 27th IEEE conference on decision and control","first-page":"26","article-title":"Inverse problems in H\/sub infinity\/control theory and linear-quadratic differential games","author":"Fujii","year":"1988"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0083","doi-asserted-by":"crossref","first-page":"327","DOI":"10.1137\/0322022","article-title":"A complete optimality condition in the inverse problem of optimal control","volume":"22","author":"Fujii","year":"1984","journal-title":"SIAM journal on Control and Optimization"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0247","doi-asserted-by":"crossref","first-page":"293","DOI":"10.1108\/17563781211255862","article-title":"A survey of inverse reinforcement learning techniques","volume":"5","author":"Gao","year":"2012","journal-title":"International Journal of Intelligent Computing and Cybernetics"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0084","series-title":"Proceedings of the 18th international conference on autonomous agents and multiagent systems","first-page":"1368","article-title":"Discriminatively learning inverse optimal control models for predicting human intentions","author":"Gaurav","year":"2019"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0085","series-title":"2015 IEEE international conference on robotics and automation (ICRA)","article-title":"An incremental approach to learning generalizable robot tasks from human demonstration","author":"Ghalamzan","year":"2015"},{"issue":"5\u20136","key":"10.1016\/j.arcontrol.2020.06.001_bib0086","doi-asserted-by":"crossref","first-page":"359","DOI":"10.1561\/2200000049","article-title":"Bayesian reinforcement learning: A survey","volume":"8","author":"Ghavamzadeh","year":"2015","journal-title":"Foundations and Trends\u00ae in Machine Learning"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0087","doi-asserted-by":"crossref","first-page":"339","DOI":"10.1016\/j.orl.2018.03.007","article-title":"Robust inverse optimization","volume":"46","author":"Ghobadi","year":"2018","journal-title":"Operations Research Letters"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0088","series-title":"Advances in neural information processing systems","first-page":"2672","article-title":"Generative adversarial nets","author":"Goodfellow","year":"2014"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0089","series-title":"Advances in neural information processing systems","first-page":"3909","article-title":"Cooperative inverse reinforcement learning","author":"Hadfield-Menell","year":"2016"},{"issue":"2\u20133","key":"10.1016\/j.arcontrol.2020.06.001_bib0090","doi-asserted-by":"crossref","first-page":"615","DOI":"10.1080\/02331934.2018.1495205","article-title":"Optimality conditions for a class of inverse optimal control problems with partial differential equations","volume":"68","author":"Harder","year":"2019","journal-title":"Optimization"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0091","series-title":"A robot controller using learning by imitation","author":"Hayes","year":"1994"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0092","series-title":"Thirty-Second AAAI conference on artificial intelligence","article-title":"Optiongan: Learning joint reward-policy options using generative adversarial inverse reinforcement learning","author":"Henderson","year":"2018"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0093","series-title":"Thirty-second AAAI conference on artificial intelligence","article-title":"Rainbow: Combining improvements in deep reinforcement learning","author":"Hessel","year":"2018"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0094","doi-asserted-by":"crossref","first-page":"329","DOI":"10.1023\/B:JOCO.0000038914.26975.9b","article-title":"Inverse combinatorial optimization: A survey on problems, methods, and results","volume":"8","author":"Heuberger","year":"2004","journal-title":"Journal of Combinatorial Optimization"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0095","series-title":"Advances in neural information processing systems","first-page":"4565","article-title":"Generative adversarial imitation learning","author":"Ho","year":"2016"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0096","unstructured":"Huang, B., Ma, X., & Vaidya, U. (2019). Data-driven nonlinear stabilization using koopman operator. arXiv preprint arXiv:1901.07678."},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0097","doi-asserted-by":"crossref","first-page":"21","DOI":"10.1145\/3054912","article-title":"Imitation learning: A survey of learning methods","volume":"50","author":"Hussein","year":"2017","journal-title":"ACM Computing Surveys (CSUR)"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0098","series-title":"Advances in neural information processing systems","first-page":"1547","article-title":"Learning attractor landscapes for learning motor primitives","author":"Ijspeert","year":"2003"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib253","doi-asserted-by":"crossref","first-page":"328","DOI":"10.1162\/NECO_a_00393","article-title":"Dynamical movement primitives: learning attractor models for motor behaviors","volume":"25(2)","author":"Ijspeert","year":"2013","journal-title":"Neural computation"},{"issue":"1","key":"10.1016\/j.arcontrol.2020.06.001_bib0099","first-page":"25","article-title":"Inverse dynamic programming. Memoirs of the Faculty of Science, Kyushu University","volume":"30","author":"Iwamoto","year":"1976","journal-title":"Series A, Mathematics"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0100","doi-asserted-by":"crossref","first-page":"319","DOI":"10.1016\/j.orl.2004.04.007","article-title":"Inverse conic programming with applications","volume":"33","author":"Iyengar","year":"2005","journal-title":"Operations Research Letters"},{"issue":"3\u20134","key":"10.1016\/j.arcontrol.2020.06.001_bib0101","doi-asserted-by":"crossref","first-page":"142","DOI":"10.1561\/2200000058","article-title":"Non-convex optimization for machine learning","volume":"10","author":"Jain","year":"2017","journal-title":"Foundations and Trends\u00ae in Machine Learning"},{"issue":"1","key":"10.1016\/j.arcontrol.2020.06.001_bib0102","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1137\/0311001","article-title":"Inverse problem of linear optimal control","volume":"11","author":"Jameson","year":"1973","journal-title":"SIAM Journal on Control"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0103","doi-asserted-by":"crossref","first-page":"288","DOI":"10.1109\/87.826800","article-title":"Constructive Lyapunov control design for turbocharged diesel engines","volume":"8","author":"Jankovic","year":"2000","journal-title":"IEEE Transactions on Control Systems Technology"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0104","unstructured":"Jin, M., Damianou, A., Abbeel, P., & Spanos, C. (2015). Inverse reinforcement learning via deep gaussian process. arXiv preprint arXiv:1512.08065."},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0105","series-title":"52nd IEEE conference on decision and control","first-page":"2906","article-title":"Inverse optimal control for deterministic continuous-time nonlinear systems","author":"Johnson","year":"2013"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0106","series-title":"2013 IEEE international conference on robotics and automation","first-page":"1331","article-title":"Learning objective functions for manipulation","author":"Kalakrishnan","year":"2013"},{"issue":"1","key":"10.1016\/j.arcontrol.2020.06.001_bib0107","doi-asserted-by":"crossref","first-page":"51","DOI":"10.1115\/1.3653115","article-title":"When is a linear control system optimal?","volume":"86","author":"Kalman","year":"1964","journal-title":"Journal of Basic Engineering"},{"issue":"5","key":"10.1016\/j.arcontrol.2020.06.001_bib0108","doi-asserted-by":"crossref","first-page":"557","DOI":"10.1016\/0005-1098(83)90011-0","article-title":"Determining quadratic weighting matrices to locate poles in a specified region","volume":"19","author":"Kawasaki","year":"1983","journal-title":"Automatica"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0109","series-title":"International conference on artificial neural networks","first-page":"601","article-title":"Teaching by showing in kendama based on optimization principle","author":"Kawato","year":"1994"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0110","series-title":"2011 IEEE international symposium on intelligent control","first-page":"613","article-title":"Imputing a convex objective function","author":"Keshavarz","year":"2011"},{"issue":"5","key":"10.1016\/j.arcontrol.2020.06.001_bib0111","doi-asserted-by":"crossref","first-page":"943","DOI":"10.1109\/TRO.2011.2159412","article-title":"Learning stable nonlinear dynamical systems with gaussian mixture models","volume":"27","author":"Khansari-Zadeh","year":"2011","journal-title":"IEEE Transactions on Robotics"},{"issue":"6","key":"10.1016\/j.arcontrol.2020.06.001_bib0112","doi-asserted-by":"crossref","first-page":"752","DOI":"10.1016\/j.robot.2014.03.001","article-title":"Learning control Lyapunov function to ensure stability of dynamical system-based robot reaching motions","volume":"62","author":"Khansari-Zadeh","year":"2014","journal-title":"Robotics and Autonomous Systems"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0113","series-title":"Advances in neural information processing systems","first-page":"2859","article-title":"Learning from limited demonstrations","author":"Kim","year":"2013"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0114","series-title":"Advances in neural information processing systems","first-page":"1007","article-title":"Inverse reinforcement learning through structured classification","author":"Klein","year":"2012"},{"issue":"6","key":"10.1016\/j.arcontrol.2020.06.001_bib0115","doi-asserted-by":"crossref","first-page":"1437","DOI":"10.1080\/002071797223109","article-title":"A local approach to solving the inverse minimax control problem for discrete-time systems","volume":"68","author":"Kogan","year":"1997","journal-title":"International Journal of Control"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0116","series-title":"Advances in neural information processing systems","first-page":"769","article-title":"Hierarchical apprenticeship learning with application to quadruped locomotion","author":"Kolter","year":"2008"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0117","doi-asserted-by":"crossref","first-page":"185","DOI":"10.1049\/ip-cta:20010375","article-title":"Inverse control of systems with hysteresis and creep","volume":"148","author":"Krejci","year":"2001","journal-title":"IEE Proceedings-Control Theory and Applications"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0118","series-title":"Proceedings of the 1998 American control conference. ACC (IEEE Cat. No. 98CH36207)","first-page":"1648","article-title":"Stability margins in inverse optimal input-to-state stabilization","volume":"3","author":"Krstic","year":"1998"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0119","unstructured":"Krstic, M., Kanellakopoulos, I., & Kokotovic, P.V. (1995). Nonlinear and adaptive control design."},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0120","doi-asserted-by":"crossref","first-page":"336","DOI":"10.1109\/9.661589","article-title":"Inverse optimal design of input-to-state stabilizing nonlinear controllers","volume":"43","author":"Krstic","year":"1998","journal-title":"IEEE Transactions on Automatic Control"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0121","series-title":"Proceedings of the 1997 American control conference (Cat. No. 97CH36041)","first-page":"1884","article-title":"Inverse optimality results for the attitude motion of a rigid spacecraft","volume":"3","author":"Krstic","year":"1997"},{"issue":"5","key":"10.1016\/j.arcontrol.2020.06.001_bib0122","doi-asserted-by":"crossref","first-page":"1042","DOI":"10.1109\/9.763225","article-title":"Inverse optimal stabilization of a rigid spacecraft","volume":"44","author":"Krstic","year":"1999","journal-title":"IEEE Transactions on Automatic Control"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0123","series-title":"1999 European control conference (ECC)","first-page":"791","article-title":"Adaptive inverse control of piezoelectric actuators with hysteresis operators","author":"Kuhnen","year":"1999"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0124","series-title":"Mathematical systems theory and economics i\/ii","first-page":"189","article-title":"On the inverse optimal problem","author":"Kurz","year":"1969"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0125","doi-asserted-by":"crossref","first-page":"796","DOI":"10.1137\/S1052623400366802","article-title":"Global optimization with polynomials and the problem of moments","volume":"11","author":"Lasserre","year":"2001","journal-title":"SIAM Journal on Optimization"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0126","series-title":"Proceedings of international conference on neural networks (ICNN'97)","first-page":"712","article-title":"Training strategies for critic and action neural networks in dual heuristic programming method","volume":"2","author":"Lendaris","year":"1997"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0127","first-page":"661","article-title":"Analytical design of controllers","volume":"21","author":"Letov","year":"1960","journal-title":"I. Avtom. Telemekh"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0128","unstructured":"Levine, S., & Koltun, V. (2012). Continuous inverse optimal control with locally optimal examples. arXiv preprint arXiv:1206.4617."},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0129","series-title":"Advances in neural information processing systems","first-page":"1342","article-title":"Feature construction for inverse reinforcement learning","author":"Levine","year":"2010"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0130","series-title":"Advances in neural information processing systems","first-page":"19","article-title":"Nonlinear inverse reinforcement learning with gaussian processes","author":"Levine","year":"2011"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0131","volume":"17","year":"2013"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0132","doi-asserted-by":"crossref","first-page":"7776","DOI":"10.1109\/ACCESS.2017.2696365","article-title":"Machine learning with big data: Challenges and approaches","volume":"5","author":"L'heureux","year":"2017","journal-title":"IEEE Access"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0133","series-title":"IFAC proceedings volumes","first-page":"9662","article-title":"Inverse optimality design for biological movement systems","volume":"44","author":"Li","year":"2011"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0134","unstructured":"Li, Y., Yao, Y., & Hu, X. (2018). Continuous-Time Inverse Quadratic Optimal Control Problem. arXiv preprint arXiv:1811.00129."},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0135","series-title":"Proceedings of the 1999 American control conference (Cat. No. 99CH36251)","first-page":"1598","article-title":"On integral-input-to-state stabilization","volume":"3","author":"Liberzon","year":"1999"},{"issue":"6","key":"10.1016\/j.arcontrol.2020.06.001_bib0136","doi-asserted-by":"crossref","first-page":"393","DOI":"10.1016\/0167-6911(91)90111-Q","article-title":"A universal formula for stabilization with bounded controls","volume":"16","author":"Lin","year":"1991","journal-title":"Systems & Control Letters"},{"issue":"11","key":"10.1016\/j.arcontrol.2020.06.001_bib0137","doi-asserted-by":"crossref","first-page":"1639","DOI":"10.1109\/TAC.2005.858694","article-title":"Inverse optimal adaptive control for attitude tracking of spacecraft","volume":"50","author":"Luo","year":"2005","journal-title":"IEEE Transactions on Automatic Control"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0138","series-title":"1991 American control conference","first-page":"1879","article-title":"Inverse trajectory control and zero dynamics sensitivity of an elastic manipulator","author":"Madhavan","year":"1991"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0139","doi-asserted-by":"crossref","first-page":"593","DOI":"10.1007\/s10514-016-9556-2","article-title":"Probabilistic movement primitives for coordination of multiple human\u2013robot collaborative tasks","volume":"41","author":"Maeda","year":"2017","journal-title":"Autonomous Robots"},{"issue":"4","key":"10.1016\/j.arcontrol.2020.06.001_bib0140","doi-asserted-by":"crossref","first-page":"241","DOI":"10.1016\/S0167-6911(97)00079-0","article-title":"Stability margins of nonlinear receding-horizon control via inverse optimality","volume":"32","author":"Magni","year":"1997","journal-title":"Systems & Control Letters"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0141","series-title":"Deep apprenticeship learning for playing games (Doctoral dissertation","author":"Markovikj","year":"2014"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0142","series-title":"1999 European control conference (ECC)","first-page":"2413","article-title":"Inverse optimal H\u221e disturbance attenuation of robotic manipulators","author":"Maruyama","year":"1999"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0143","series-title":"Inverse optimal control: Theoretical study (Doctoral dissertation","author":"Maslovskaya","year":"2018"},{"issue":"4","key":"10.1016\/j.arcontrol.2020.06.001_bib0144","doi-asserted-by":"crossref","first-page":"809","DOI":"10.2307\/2371626","article-title":"On multipliers for Lagrange problems","volume":"61","author":"McShane","year":"1939","journal-title":"American Journal of Mathematics"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0145","doi-asserted-by":"crossref","first-page":"205","DOI":"10.1002\/oca.4660150305","article-title":"Discrete-time LQ design from the viewpoint of the inverse optimal regulator","volume":"15","author":"Mehdi","year":"1994","journal-title":"Optimal Control Applications and Methods"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0146","unstructured":"Menner, M., Worsnop, P., & Zeilinger, M.N. (2018). Predictive modeling by infinite-horizon constrained inverse optimal control with application to a human manipulation task. arXiv preprint arXiv:1812.11600."},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0147","doi-asserted-by":"crossref","DOI":"10.1109\/TCST.2019.2955663","article-title":"Constrained inverse optimal control with application to a human manipulation task","author":"Menner","year":"2019","journal-title":"IEEE Transactions on Control Systems Technology"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0148","series-title":"Markov decision processes in practice","first-page":"63","article-title":"Approximate dynamic programming by practical examples","author":"Mes","year":"2017"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0149","series-title":"Advances in neural information processing systems","first-page":"2050","article-title":"Compatible reward inverse reinforcement learning","author":"Metelli","year":"2017"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0150","doi-asserted-by":"crossref","first-page":"369","DOI":"10.1109\/TRO.2015.2405593","article-title":"Bayesian nonparametric reward learning from demonstration","volume":"31","author":"Michini","year":"2015","journal-title":"IEEE Transactions on Robotics"},{"issue":"5","key":"10.1016\/j.arcontrol.2020.06.001_bib0151","doi-asserted-by":"crossref","first-page":"454","DOI":"10.1109\/TAC.1973.1100364","article-title":"The stable regulator problem and its inverse","volume":"18","author":"Molinari","year":"1973","journal-title":"IEEE Transactions on Automatic Control"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0152","doi-asserted-by":"crossref","first-page":"369","DOI":"10.1007\/s10514-009-9170-7","article-title":"From human to humanoid locomotion\u2014An inverse optimal control approach","volume":"28","author":"Mombaur","year":"2010","journal-title":"Autonomous robots"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0153","series-title":"Learning helicopter control through teaching by showing","author":"Montgomery","year":"1999"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0155","doi-asserted-by":"crossref","unstructured":"Moylan, P.J., & Anderson, B.D. (1973). Nonlinear regulator theory and an inverse optimal control problem.","DOI":"10.1109\/TAC.1973.1100365"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0156","doi-asserted-by":"crossref","first-page":"140","DOI":"10.1109\/TSMCC.2002.801727","article-title":"Adaptive dynamic programming","volume":"32","author":"Murray","year":"2002","journal-title":"IEEE Transactions on Systems, Man, and Cybernetics, Part C (Applications and Reviews)"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0157","series-title":"Inverse problems and optimal design in electricity and magnetism (No. 35)","author":"Neittaanm\u00e4ki","year":"1996"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0158","series-title":"Proceedings of the twenty-third conference on uncertainty in artificial intelligence","first-page":"295","article-title":"Apprenticeship learning using inverse reinforcement learning and gradient methods","author":"Neu","year":"2007"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0159","first-page":"2","article-title":"Algorithms for inverse reinforcement learning","volume":"1","author":"Ng","year":"2000","journal-title":"Icml"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0160","series-title":"Advances in neural information processing systems","first-page":"1747","article-title":"Inverse reinforcement learning with locally consistent reward functions","author":"Nguyen","year":"2015"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0161","series-title":"On the inverse optimal control problem in manual control systems","volume":"Vol. 208","author":"Obermayer","year":"1965"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0162","series-title":"49th IEEE conference on decision and control (CDC)","first-page":"4813","article-title":"Discrete-time inverse optimal control for nonlinear systems trajectory tracking","author":"Ornelas","year":"2010"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0163","series-title":"1990 American control conference","first-page":"67","article-title":"Adaptive stabilization of non-linearizable systems under a matching assumption","author":"Ortega","year":"1990"},{"issue":"1\u20132","key":"10.1016\/j.arcontrol.2020.06.001_bib0164","first-page":"1","article-title":"An algorithmic perspective on imitation learning","volume":"7","author":"Osa","year":"2018","journal-title":"Foundations and Trends\u00ae in Robotics"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0165","series-title":"Robotics: Science and systems","first-page":"1","article-title":"Online trajectory planning in dynamic environments for surgical task automation","author":"Osa","year":"2014"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0166","series-title":"Proceedings of the 1997 American control conference (Cat. No. 97CH36041)","first-page":"1889","article-title":"Achieving good performance in global attitude stabilization","volume":"3","author":"Osipchuk","year":"1997"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0167","series-title":"Advances in neural information processing systems","first-page":"2616","article-title":"Probabilistic movement primitives","author":"Paraschos","year":"2013"},{"issue":"6","key":"10.1016\/j.arcontrol.2020.06.001_bib0168","doi-asserted-by":"crossref","first-page":"847","DOI":"10.1109\/70.897796","article-title":"Analytic nonlinear H\/sub\/spl infin\/\/inverse-optimal control for Euler-Lagrange system","volume":"16","author":"Park","year":"2000","journal-title":"IEEE Transactions on Robotics and Automation"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0169","series-title":"An inverse optimal control problem and its application to the choice of performance index for economic stabilization policy","first-page":"64","volume":"1","author":"Park","year":"1975"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0170","series-title":"Robotics science and systems workshop on inverse optimal control and robotic learning from demonstration","article-title":"Inverse optimal control for humanoid locomotion","author":"Park","year":"2013"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0171","series-title":"Proceedings of the IEEE conference on computer vision and pattern recognition workshops","first-page":"2050","article-title":"Zero-shot visual imitation","author":"Pathak","year":"2018"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0172","series-title":"53rd IEEE conference on decision and control","first-page":"5581","article-title":"Inverse optimal control with polynomial optimization","author":"Pauwels","year":"2014"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0173","doi-asserted-by":"crossref","first-page":"1798","DOI":"10.1137\/14099454X","article-title":"Linear conic optimization for inverse optimal control","volume":"54","author":"Pauwels","year":"2016","journal-title":"SIAM Journal on Control and Optimization"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0174","series-title":"Thirtieth AAAI conference on artificial intelligence","article-title":"Inverse reinforcement learning through policy gradient minimization","author":"Pirotta","year":"2016"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0175","doi-asserted-by":"crossref","first-page":"360","DOI":"10.1109\/TNN.2003.809412","article-title":"Adaptive inverse control of linear and nonlinear systems using dynamic neural networks","volume":"14","author":"Plett","year":"2003","journal-title":"IEEE Transactions on Neural Networks"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0176","unstructured":"Pontryagin, L.S., Boltyanskii, V.G., Gamkrelidze, R.V., & Mishchenko, E.F. (1961). Mathematical Theory of Optimal Processes{in Russian}."},{"issue":"713","key":"10.1016\/j.arcontrol.2020.06.001_bib0177","doi-asserted-by":"crossref","first-page":"390","DOI":"10.1017\/S0001924000047801","article-title":"Synthesis of an aircraft roll-stabilisation system: an application of invERSE OPTIMAL CONTROL THEORY","volume":"74","author":"Porter","year":"1970","journal-title":"The Aeronautical Journal"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0178","series-title":"2008 winter simulation conference","first-page":"205","article-title":"Approximate dynamic programming: Lessons from the field","author":"Powell","year":"2008"},{"issue":"9","key":"10.1016\/j.arcontrol.2020.06.001_bib0179","doi-asserted-by":"crossref","first-page":"2637","DOI":"10.1177\/0142331218806338","article-title":"Inverse optimal control of a class of affine nonlinear systems","volume":"41","author":"Prasanna","year":"2019","journal-title":"Transactions of the Institute of Measurement and Control"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0180","doi-asserted-by":"crossref","first-page":"770","DOI":"10.1109\/TCST.2014.2343935","article-title":"Solutions to the inverse lqr problem with application to biological systems analysis","volume":"23","author":"Priess","year":"2014","journal-title":"IEEE Transactions on Control Systems Technology"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0181","series-title":"2012 IEEE international conference on robotics and automation","first-page":"531","article-title":"A convex approach to inverse optimal control and its application to modeling human locomotion","author":"Puydupin-Jamin","year":"2012"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0182","series-title":"Analysis and optimization of systems","first-page":"227","article-title":"On inverse problem of nonlinear system dynamics","author":"Radoslav","year":"1988"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0183","first-page":"2586","volume":"7","author":"Ramachandran","year":"2007"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0184","series-title":"Proceedings of the 19th international conference on neural information processing systems","first-page":"1153","article-title":"Boosting structured prediction for imitation learning","author":"Ratliff","year":"2006"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0185","series-title":"Maximum margin planning. In Proceedings of the 23rd international conference on machine learning","first-page":"729","author":"Ratliff","year":"2006"},{"issue":"1","key":"10.1016\/j.arcontrol.2020.06.001_bib0186","doi-asserted-by":"crossref","first-page":"25","DOI":"10.1007\/s10514-009-9121-3","article-title":"Learning to search: Functional gradient techniques for imitation learning","volume":"27","author":"Ratliff","year":"2009","journal-title":"Autonomous Robots"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0187","doi-asserted-by":"crossref","first-page":"275","DOI":"10.1007\/s10514-018-9791-9","article-title":"Learning control Lyapunov functions from counterexamples and demonstrations","volume":"43","author":"Ravanbakhsh","year":"2019","journal-title":"Autonomous Robots"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0188","unstructured":"Ravi, S., & Larochelle, H. (2016). Optimization as a model for few-shot learning."},{"issue":"4","key":"10.1016\/j.arcontrol.2020.06.001_bib0189","doi-asserted-by":"crossref","first-page":"370","DOI":"10.1109\/TAC.1964.1105746","article-title":"On an inverse problem in optimal control","volume":"9","author":"Rekasius","year":"1964","journal-title":"IEEE Transactions on Automatic Control"},{"issue":"11","key":"10.1016\/j.arcontrol.2020.06.001_bib0190","doi-asserted-by":"crossref","first-page":"286","DOI":"10.1016\/j.ifacol.2015.09.199","article-title":"Approximate optimal control by inverse CLF approach","volume":"48","author":"Rohrweck","year":"2015","journal-title":"IFAC-PapersOnLine"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0191","series-title":"Proceedings of the thirteenth international conference on artificial intelligence and statistics","first-page":"661","article-title":"Efficient reductions for imitation learning","author":"Ross","year":"2010"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0192","series-title":"Proceedings of the fourteenth international conference on artificial intelligence and statistics","first-page":"627","article-title":"A reduction of imitation learning and structured prediction to no-regret online learning","author":"Ross","year":"2011"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0193","series-title":"2017 IEEE 56th annual conference on decision and control (CDC)","first-page":"721","article-title":"On inverse optimal control via polynomial optimization","author":"Rouot","year":"2017"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0194","doi-asserted-by":"crossref","first-page":"101","DOI":"10.1145\/279943.279964","article-title":"Learning agents for uncertain environments","volume":"98","author":"Russell","year":"1998","journal-title":"COLT"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0195","series-title":"Proceedings of international conference on neural networks (ICNN'97)","first-page":"2273","article-title":"Asymptotic dynamic programming: Preliminary concepts and results","volume":"4","author":"Saeks","year":"1997"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0196","series-title":"Discrete-time inverse optimal control for nonlinear systems","author":"Sanchez","year":"2017"},{"issue":"1","key":"10.1016\/j.arcontrol.2020.06.001_bib0197","first-page":"111","article-title":"Chaos stabilization: An inverse optimal control approach","volume":"32","author":"Sanchez","year":"2002","journal-title":"Latin American Applied Research"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0198","series-title":"Advances in neural information processing systems","first-page":"1040","article-title":"Learning from demonstration","author":"Schaal","year":"1997"},{"issue":"6","key":"10.1016\/j.arcontrol.2020.06.001_bib0199","doi-asserted-by":"crossref","first-page":"233","DOI":"10.1016\/S1364-6613(99)01327-3","article-title":"Is imitation learning the route to humanoid robots?","volume":"3","author":"Schaal","year":"1999","journal-title":"Trends in Cognitive Sciences"},{"issue":"1431","key":"10.1016\/j.arcontrol.2020.06.001_bib0200","doi-asserted-by":"crossref","first-page":"537","DOI":"10.1098\/rstb.2002.1258","article-title":"Computational approaches to motor learning by imitation","volume":"358","author":"Schaal","year":"2003","journal-title":"Philosophical Transactions of the Royal Society of London. Series B: Biological Sciences"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0201","series-title":"International conference on machine learning","first-page":"1889","article-title":"Trust region policy optimization","author":"Schulman","year":"2015"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0202","unstructured":"Schulman, J., Wolski, F., Dhariwal, P., Radford, A., & Klimov, O. (2017). Proximal policy optimization algorithms. arXiv preprint arXiv:1707.06347."},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0203","doi-asserted-by":"crossref","first-page":"568","DOI":"10.1016\/0022-247X(85)90317-8","article-title":"Generalized polynomial approximations in Markovian decision processes","volume":"110","author":"Schweitzer","year":"1985","journal-title":"Journal of Mathematical Analysis and Applications"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0204","doi-asserted-by":"crossref","unstructured":"Sepulchre, R., Jankovic, M., & Kokotovic, P. (1997). Constructive Nonlinear Control.","DOI":"10.1007\/978-1-4471-0967-9"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0205","series-title":"Constructive nonlinear control","author":"Sepulchre","year":"2012"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0206","doi-asserted-by":"crossref","first-page":"297","DOI":"10.1007\/s10958-009-9553-5","article-title":"Inverse optimal control and construction of control Lyapunov functions","volume":"161","author":"Shahmansoorian","year":"2009","journal-title":"Journal of Mathematical Sciences"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0207","series-title":"Proceedings of the 2016 international conference on autonomous agents & multiagent systems","first-page":"1060","article-title":"Inverse reinforcement learning from failure","author":"Shiarlis","year":"2016"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0208","volume":"2","year":"2004"},{"issue":"12","key":"10.1016\/j.arcontrol.2020.06.001_bib0209","doi-asserted-by":"crossref","first-page":"1565","DOI":"10.1177\/0278364910369715","article-title":"Learning from demonstration for autonomous navigation in complex unstructured terrain","volume":"29","author":"Silver","year":"2010","journal-title":"The International Journal of Robotics Research"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0210","doi-asserted-by":"crossref","first-page":"117","DOI":"10.1016\/0167-6911(89)90028-5","article-title":"A universal construction of Artstein's theorem on nonlinear stabilization","volume":"13","author":"Sontag","year":"1989","journal-title":"Systems & control letters"},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0211","doi-asserted-by":"crossref","first-page":"462","DOI":"10.1137\/0321028","article-title":"A Lyapunov-like characterization of asymptotic controllability","volume":"21","author":"Sontag","year":"1983","journal-title":"SIAM Journal on Control and Optimization"},{"issue":"1","key":"10.1016\/j.arcontrol.2020.06.001_bib0212","doi-asserted-by":"crossref","first-page":"92","DOI":"10.1109\/9.45152","article-title":"On adaptive inverse dynamics control of rigid robots","volume":"35","author":"Spong","year":"1990","journal-title":"IEEE Transactions on Automatic Control"},{"issue":"5","key":"10.1016\/j.arcontrol.2020.06.001_bib0213","doi-asserted-by":"crossref","first-page":"706","DOI":"10.1109\/9.668841","article-title":"Partial pole placement by LQ regulators: An inverse problem approach","volume":"43","author":"Sugimoto","year":"1998","journal-title":"IEEE Transactions on Automatic Control"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0214","unstructured":"Sun, M., & Ma, X. (2019). Adversarial Imitation Learning from Incomplete Demonstrations. arXiv preprint arXiv:1905.12310."},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0215","doi-asserted-by":"crossref","first-page":"32","DOI":"10.1109\/37.588098","article-title":"300 years of optimal control: From the brachystochrone to the maximum principle","volume":"17","author":"Sussmann","year":"1997","journal-title":"IEEE Control Systems Magazine"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0216","series-title":"Reinforcement learning: An introduction","author":"Sutton","year":"1998"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0217","series-title":"Proceedings of the 25th international conference on machine learning","first-page":"1032","article-title":"Apprenticeship learning using linear programming","author":"Syed","year":"2008"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0218","series-title":"Advances in neural information processing systems","first-page":"1449","article-title":"A game-theoretic approach to apprenticeship learning","author":"Syed","year":"2008"},{"issue":"10","key":"10.1016\/j.arcontrol.2020.06.001_bib0219","doi-asserted-by":"crossref","first-page":"1314","DOI":"10.1177\/0278364915587923","article-title":"Statistical mutual conversion between whole body motion primitives and linguistic sentences for human motions","volume":"34","author":"Takano","year":"2015","journal-title":"The International Journal of Robotics Research"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0220","series-title":"Proceedings of the 22nd international conference on machine learning","first-page":"896","article-title":"Learning structured prediction models: A large margin approach","author":"Taskar","year":"2005"},{"issue":"6","key":"10.1016\/j.arcontrol.2020.06.001_bib0221","doi-asserted-by":"crossref","first-page":"674","DOI":"10.1109\/TAC.1967.1098741","article-title":"On the inverse optimum control problem for a class of nonlinear autonomous systems","volume":"12","author":"Thau","year":"1967","journal-title":"IEEE Transactions on Automatic Control"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0222","unstructured":"Torabi, F., Warnell, G., & Stone, P. (2018). Behavioral cloning from observation. arXiv preprint arXiv:1805.01954."},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0223","unstructured":"Tucker, A., Gleave, A., & Russell, S. (2018). Inverse reinforcement learning for video games. arXiv preprint arXiv:1810.10593."},{"issue":"3","key":"10.1016\/j.arcontrol.2020.06.001_bib0224","doi-asserted-by":"crossref","first-page":"891","DOI":"10.1007\/s11063-017-9702-7","article-title":"Model-free deep inverse reinforcement learning by logistic regression","volume":"47","author":"Uchibe","year":"2018","journal-title":"Neural Processing Letters"},{"issue":"2\u20133","key":"10.1016\/j.arcontrol.2020.06.001_bib0225","doi-asserted-by":"crossref","first-page":"93","DOI":"10.1016\/j.robot.2004.03.004","article-title":"Programming full-body movements for humanoid robots by observation","volume":"47","author":"Ude","year":"2004","journal-title":"Robotics and autonomous systems"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0226","series-title":"Machine learning and statistical classification","article-title":"Learning to control dynamic systems","author":"Urbancic","year":"1993"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0227","series-title":"2010 IEEE international conference on robotics and automation","first-page":"2074","article-title":"Superhuman performance of surgical tasks by robots using iterative learning from human-guided demonstrations","author":"Van Den Berg","year":"2010"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0228","series-title":"2014 IEEE international autumn meeting on power, electronics and computing (ROPEC)","first-page":"1","article-title":"Inverse optimal control on electric power conversion","author":"Vega","year":"2014"},{"issue":"May","key":"10.1016\/j.arcontrol.2020.06.001_bib0229","first-page":"883","article-title":"Learning from examples as an inverse problem","volume":"6","author":"Vito","year":"2005","journal-title":"Journal of Machine Learning Research"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0230","doi-asserted-by":"crossref","first-page":"39","DOI":"10.1109\/MCI.2009.932261","article-title":"Adaptive dynamic programming: An introduction","volume":"4","author":"Wang","year":"2009","journal-title":"IEEE computational intelligence magazine"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0231","series-title":"Proceedings of the institution of electrical engineers","first-page":"449","article-title":"Synthesis of optimal block controllers for multivariable control systems and its inverse optimal-control problem","volume":"126","author":"Wei","year":"1979"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0232","series-title":"Advanced forecasting methods for global crisis warning and models of intelligence","first-page":"25","author":"Werbos","year":"1977"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0233","series-title":"Handbook of intelligent control: Neural, fuzzy and adaptive approaches","article-title":"Approximate dynamic programming for real-time control and neural modeling","author":"Werbos","year":"1992"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0234","series-title":"Adaptive systems in control and signal processing 1986","first-page":"1","article-title":"Adaptive inverse control","author":"Widrow","year":"1987"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0235","series-title":"Proceedings of international workshop on neural networks for identification, control, robotics and signal\/image processing","first-page":"30","article-title":"Adaptive inverse control based on linear and nonlinear adaptive filtering","author":"Widrow","year":"1996"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0236","series-title":"Adaptive inverse control, reissue edition: A signal processing approach","author":"Widrow","year":"2008"},{"issue":"17","key":"10.1016\/j.arcontrol.2020.06.001_bib0237","doi-asserted-by":"crossref","first-page":"493","DOI":"10.1049\/el:19770361","article-title":"Inverse optimal control problem for linear discrete-time systems","volume":"13","author":"Willems","year":"1977","journal-title":"Electronics Letters"},{"issue":"7\u20138","key":"10.1016\/j.arcontrol.2020.06.001_bib0238","doi-asserted-by":"crossref","first-page":"1317","DOI":"10.1016\/S0893-6080(98)00066-5","article-title":"Multiple paired forward and inverse models for motor control","volume":"11","author":"Wolpert","year":"1998","journal-title":"Neural Networks"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0239","unstructured":"Wulfmeier, M., Ondruska, P., & Posner, I. (2015). Maximum entropy deep inverse reinforcement learning. arXiv preprint arXiv:1507.04888."},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0240","series-title":"Predictive control: Fundamentals and developments","author":"Xi","year":"2019"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0241","series-title":"Mathematical problems in engineering","article-title":"A survey on inverse problems for applied sciences","author":"Yaman","year":"2013"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0242","doi-asserted-by":"crossref","first-page":"95","DOI":"10.1029\/WR022i002p00095","article-title":"Review of parameter identification procedures in groundwater hydrology: The inverse problem","volume":"22","author":"Yeh","year":"1986","journal-title":"Water Resources Research"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0243","unstructured":"Yu, T., Finn, C., Xie, A., Dasari, S., Zhang, T., Abbeel, P. et\u00a0al. (2018). One-shot imitation from observing humans via domain-adaptive meta-learning. arXiv preprint arXiv:1802.01557."},{"issue":"10","key":"10.1016\/j.arcontrol.2020.06.001_bib0244","doi-asserted-by":"crossref","first-page":"3505","DOI":"10.1142\/S0218127404011442","article-title":"Chaotifying fuzzy hyperbolic model using adaptive inverse optimal control approach","volume":"14","author":"Zhang","year":"2004","journal-title":"International Journal of Bifurcation and Chaos"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0245","series-title":"Twenty-eighth AAAI conference on artificial intelligence","article-title":"Robust bayesian inverse reinforcement learning with sparse behavior noise","author":"Zheng","year":"2014"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0246","series-title":"2012 IEEE congress on evolutionary computation","first-page":"1","article-title":"A review of inverse reinforcement learning theory and recent advances","author":"Zhifei","year":"2012"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0248","doi-asserted-by":"crossref","first-page":"17","DOI":"10.3390\/robotics7020017","article-title":"Robot learning from demonstration in robotic assembly: A survey","volume":"7","author":"Zhu","year":"2018","journal-title":"Robotics"},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0249","unstructured":"Ziebart, B.D. (2010). Modeling purposeful adaptive behavior with the principle of maximum causal entropy (Doctoral dissertation, figshare)."},{"key":"10.1016\/j.arcontrol.2020.06.001_bib0250","first-page":"1433","article-title":"Maximum entropy inverse reinforcement learning","volume":"8","author":"Ziebart","year":"2008","journal-title":"Aaai"},{"issue":"2","key":"10.1016\/j.arcontrol.2020.06.001_bib0251","doi-asserted-by":"crossref","first-page":"175","DOI":"10.1177\/0278364910392608","article-title":"Optimization and learning for rough terrain legged locomotion","volume":"30","author":"Zucker","year":"2011","journal-title":"The International Journal of Robotics Research"}],"container-title":["Annual Reviews in Control"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1367578820300511?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1367578820300511?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2022,10,30]],"date-time":"2022-10-30T09:46:59Z","timestamp":1667123219000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S1367578820300511"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020]]},"references-count":252,"alternative-id":["S1367578820300511"],"URL":"https:\/\/doi.org\/10.1016\/j.arcontrol.2020.06.001","relation":{},"ISSN":["1367-5788"],"issn-type":[{"value":"1367-5788","type":"print"}],"subject":[],"published":{"date-parts":[[2020]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"From inverse optimal control to inverse reinforcement learning: A historical review","name":"articletitle","label":"Article Title"},{"value":"Annual Reviews in Control","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.arcontrol.2020.06.001","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2020 Elsevier Ltd. All rights reserved.","name":"copyright","label":"Copyright"}]}}