{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,22]],"date-time":"2024-10-22T19:46:22Z","timestamp":1729626382922,"version":"3.28.0"},"reference-count":38,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,5,30]]},"DOI":"10.1109\/icra48506.2021.9560895","type":"proceedings-article","created":{"date-parts":[[2021,10,20]],"date-time":"2021-10-20T00:28:35Z","timestamp":1634689715000},"page":"11196-11202","source":"Crossref","is-referenced-by-count":13,"title":["Spatial Reasoning from Natural Language Instructions for Robot Manipulation"],"prefix":"10.1109","author":[{"given":"Sagar Gubbi","family":"Venkatesh","sequence":"first","affiliation":[]},{"given":"Anirban","family":"Biswas","sequence":"additional","affiliation":[]},{"given":"Raviteja","family":"Upadrashta","sequence":"additional","affiliation":[]},{"given":"Vikram","family":"Srinivasan","sequence":"additional","affiliation":[]},{"given":"Partha","family":"Talukdar","sequence":"additional","affiliation":[]},{"given":"Bharadwaj","family":"Amrutur","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref38","first-page":"21","article-title":"Ssd: Single shot multibox detector","author":"liu","year":"2016","journal-title":"European Conference on Computer Vision"},{"article-title":"Enabling robots to understand incomplete natural language instructions using commonsense reasoning","year":"2019","author":"chen","key":"ref33"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8794287"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2018.XIV.028"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D15-1138"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.215"},{"key":"ref36","doi-asserted-by":"crossref","DOI":"10.1609\/aaai.v32i1.12026","article-title":"Learning interpretable spatial operations in a rich 3d blocks world","volume":"32","author":"bisk","year":"2018","journal-title":"Proceedings of the AAAI Conference on Artificial Intelligence"},{"article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","year":"2018","author":"devlin","key":"ref35"},{"article-title":"Learning to generate unambiguous spatial referring expressions for real-world environments","year":"2019","author":"do?an","key":"ref34"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2016.XII.037"},{"key":"ref11","doi-asserted-by":"crossref","DOI":"10.1609\/aaai.v25i1.7979","article-title":"Understanding natural language commands for robotic navigation and mobile manipulation","author":"tellex","year":"2011","journal-title":"Twenty-Fifth AAAI Conference on Artificial Intelligence"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2017.XIII.056"},{"key":"ref13","doi-asserted-by":"crossref","first-page":"44","DOI":"10.18653\/v1\/W17-2806","article-title":"Communication with robots using multi-layer recurrent networks","author":"pi\u0161l","year":"2017","journal-title":"Proceedings of the First Workshop on Language Grounding for Robotics"},{"key":"ref14","article-title":"Neural machine translation by jointly learning to align and translate","author":"bahdanau","year":"2015","journal-title":"ICLRE"},{"article-title":"Reinforcement learning with augmented data","year":"2020","author":"laskin","key":"ref15"},{"key":"ref16","first-page":"719","article-title":"Human-robot communication and machine learning","volume":"11","author":"klingspor","year":"1997","journal-title":"Applied Artificial Intelligence"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1016\/j.robot.2014.09.031"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.2009.5152776"},{"key":"ref19","first-page":"806","article-title":"Learning to follow navigational directions","author":"vogel","year":"2010","journal-title":"Proceedings of the 48th Annual Meeting of the Association for Computational Linguistics"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00209"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00387"},{"key":"ref27","doi-asserted-by":"crossref","DOI":"10.1609\/aaai.v30i1.10364","article-title":"Listen, attend, and walk: Neural mapping of navigational instructions to action sequences","author":"mei","year":"2016","journal-title":"THIRTIETH AAAI Conference on Artificial Intelligence"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D17-1106"},{"key":"ref6","first-page":"3314","article-title":"Speaker-follower models for vision-and-language navigation","author":"fried","year":"2018","journal-title":"Advances in neural information processing systems"},{"key":"ref29","article-title":"Walk the talk: Connecting language, knowledge, and action in route instructions","author":"macmahon","year":"2006","journal-title":"Association for the Advancement of Artificial Intelligence (AAAI)"},{"key":"ref5","first-page":"37","article-title":"Look before you leap: Bridging model-free and model-based reinforcement learning for planned-ahead vision-and-language navigation","author":"wang","year":"2018","journal-title":"Proceedings of the European Conference on Computer Vision (ECCV)"},{"article-title":"Few-shot object grounding and mapping for natural language robot instruction following","year":"2020","author":"blukis","key":"ref8"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D18-1287"},{"key":"ref2","article-title":"Towards a dataset for human computer communication via grounded language acquisition","author":"bisk","year":"2016","journal-title":"Work-shops at the Thirtieth AAAI Conference on Artificial Intelligence"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ROMAN.2017.8172349"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N16-1089"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.3115\/1687878.1687892"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00754"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.493"},{"key":"ref24","first-page":"2054","article-title":"Embodied question answering","author":"das","year":"2018","journal-title":"Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition Workshops"},{"key":"ref23","first-page":"4971","article-title":"Don’t just assume; look and answer: Overcoming priors for visual question answering","author":"agrawal","year":"2018","journal-title":"Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition"},{"key":"ref26","article-title":"Self-monitoring navigation agent via auxiliary progress estimation","author":"ma","year":"2019","journal-title":"ICLRE"},{"article-title":"Chasing ghosts: Instruction following as bayesian state tracking","year":"2019","author":"anderson","key":"ref25"}],"event":{"name":"2021 IEEE International Conference on Robotics and Automation (ICRA)","start":{"date-parts":[[2021,5,30]]},"location":"Xi'an, China","end":{"date-parts":[[2021,6,5]]}},"container-title":["2021 IEEE International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9560720\/9560666\/09560895.pdf?arnumber=9560895","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,12]],"date-time":"2023-01-12T22:33:23Z","timestamp":1673562803000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9560895\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,5,30]]},"references-count":38,"URL":"https:\/\/doi.org\/10.1109\/icra48506.2021.9560895","relation":{},"subject":[],"published":{"date-parts":[[2021,5,30]]}}}