{"id":"https://openalex.org/W4390494915","doi":"https://doi.org/10.1177/02783649231224053","title":"Rapid locomotion via reinforcement learning","display_name":"Rapid locomotion via reinforcement learning","publication_year":2024,"publication_date":"2024-01-02","ids":{"openalex":"https://openalex.org/W4390494915","doi":"https://doi.org/10.1177/02783649231224053"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1177/02783649231224053","pdf_url":null,"source":{"id":"https://openalex.org/S73484101","display_name":"The International Journal of Robotics Research","issn_l":"0278-3649","issn":["0278-3649","1741-3176"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.1177/02783649231224053","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014707090","display_name":"Gabriel B. Margolis","orcid":"https://orcid.org/0000-0001-8191-4813"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"funder","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Gabriel B. Margolis","raw_affiliation_strings":["Department of Electrical Engineering and Computer Science, Massachusetts Institute of Technology, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering and Computer Science, Massachusetts Institute of Technology, Cambridge, MA, USA","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100631685","display_name":"Ge Yang","orcid":"https://orcid.org/0000-0003-0918-7329"},"institutions":[{"id":"https://openalex.org/I4210160315","display_name":"The NSF AI Institute for Artificial Intelligence and Fundamental Interactions","ror":"https://ror.org/04pvzz946","country_code":"US","type":"facility","lineage":["https://openalex.org/I121934306","https://openalex.org/I12912129","https://openalex.org/I136199984","https://openalex.org/I4210160315","https://openalex.org/I63966007"]},{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"funder","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ge Yang","raw_affiliation_strings":["Department of Electrical Engineering and Computer Science, Massachusetts Institute of Technology, Cambridge, MA, USA","NSF AI Institute for Artificial Intelligence and Fundamental Interactions, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"NSF AI Institute for Artificial Intelligence and Fundamental Interactions, Cambridge, MA, USA","institution_ids":["https://openalex.org/I4210160315"]},{"raw_affiliation_string":"Department of Electrical Engineering and Computer Science, Massachusetts Institute of Technology, Cambridge, MA, USA","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061581198","display_name":"Kartik Paigwar","orcid":null},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"funder","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kartik Paigwar","raw_affiliation_strings":["Department of Electrical Engineering and Computer Science, Massachusetts Institute of Technology, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering and Computer Science, Massachusetts Institute of Technology, Cambridge, MA, USA","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100357784","display_name":"Tao Chen","orcid":"https://orcid.org/0000-0003-0190-3853"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"funder","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tao Chen","raw_affiliation_strings":["Department of Electrical Engineering and Computer Science, Massachusetts Institute of Technology, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering and Computer Science, Massachusetts Institute of Technology, Cambridge, MA, USA","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5089793278","display_name":"Pulkit Agrawal","orcid":"https://orcid.org/0000-0001-8463-9917"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"funder","lineage":["https://openalex.org/I63966007"]},{"id":"https://openalex.org/I4210160315","display_name":"The NSF AI Institute for Artificial Intelligence and Fundamental Interactions","ror":"https://ror.org/04pvzz946","country_code":"US","type":"facility","lineage":["https://openalex.org/I121934306","https://openalex.org/I12912129","https://openalex.org/I136199984","https://openalex.org/I4210160315","https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Pulkit Agrawal","raw_affiliation_strings":["Department of Electrical Engineering and Computer Science, Massachusetts Institute of Technology, Cambridge, MA, USA","NSF AI Institute for Artificial Intelligence and Fundamental Interactions, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering and Computer Science, Massachusetts Institute of Technology, Cambridge, MA, USA","institution_ids":["https://openalex.org/I63966007"]},{"raw_affiliation_string":"NSF AI Institute for Artificial Intelligence and Fundamental Interactions, Cambridge, MA, USA","institution_ids":["https://openalex.org/I4210160315"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5014707090"],"corresponding_institution_ids":["https://openalex.org/I63966007"],"apc_list":null,"apc_paid":null,"fwci":7.662,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.999978,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"43","issue":"4","first_page":"572","last_page":"587"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11023","display_name":"Prosthetics and Rehabilitation Robotics","score":0.9841,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.977,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.78980064},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.58744603},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.58018273},{"id":"https://openalex.org/C161840515","wikidata":"https://www.wikidata.org/wiki/Q186131","display_name":"Terrain","level":2,"score":0.57174253},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5595796},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.49429035},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.48774153},{"id":"https://openalex.org/C14185376","wikidata":"https://www.wikidata.org/wiki/Q30232","display_name":"Agile software development","level":2,"score":0.45397568},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4375247},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.41735685},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.4170637},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.35123697},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.3240338},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.0},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1177/02783649231224053","pdf_url":null,"source":{"id":"https://openalex.org/S73484101","display_name":"The International Journal of Robotics Research","issn_l":"0278-3649","issn":["0278-3649","1741-3176"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2205.02824","pdf_url":"https://arxiv.org/pdf/2205.02824","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1177/02783649231224053","pdf_url":null,"source":{"id":"https://openalex.org/S73484101","display_name":"The International Journal of Robotics Research","issn_l":"0278-3649","issn":["0278-3649","1741-3176"],"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":true,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[],"grants":[{"funder":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation","award_id":"PHY-2019786"},{"funder":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency","award_id":"HR001119S0005"},{"funder":"https://openalex.org/F4320338294","funder_display_name":"Air Force Research Laboratory","award_id":null}],"datasets":[],"versions":[],"referenced_works_count":45,"referenced_works":["https://openalex.org/W1945123189","https://openalex.org/W1975230295","https://openalex.org/W1991692529","https://openalex.org/W1997576152","https://openalex.org/W2061983716","https://openalex.org/W2086853455","https://openalex.org/W2133859362","https://openalex.org/W2161427949","https://openalex.org/W2296073425","https://openalex.org/W2411824964","https://openalex.org/W2593412525","https://openalex.org/W2605102758","https://openalex.org/W2736601468","https://openalex.org/W2891076394","https://openalex.org/W2911087563","https://openalex.org/W2924656332","https://openalex.org/W2962957031","https://openalex.org/W2963184939","https://openalex.org/W2963614114","https://openalex.org/W2968213087","https://openalex.org/W2969111820","https://openalex.org/W2972758308","https://openalex.org/W2972810470","https://openalex.org/W2981030070","https://openalex.org/W3000354568","https://openalex.org/W3089482831","https://openalex.org/W3090207068","https://openalex.org/W3103568523","https://openalex.org/W3104876774","https://openalex.org/W3108412994","https://openalex.org/W3204973825","https://openalex.org/W3206363598","https://openalex.org/W3209211683","https://openalex.org/W3213974477","https://openalex.org/W4205430897","https://openalex.org/W4226143977","https://openalex.org/W4226340130","https://openalex.org/W4286963241","https://openalex.org/W4287082128","https://openalex.org/W4287180395","https://openalex.org/W4301431487","https://openalex.org/W4309442087","https://openalex.org/W4311486620","https://openalex.org/W4317987839","https://openalex.org/W4383108493"],"related_works":["https://openalex.org/W4310083477","https://openalex.org/W3032871857","https://openalex.org/W2920061524","https://openalex.org/W2328553770","https://openalex.org/W2145821588","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2038908348","https://openalex.org/W1992962589","https://openalex.org/W1977959518"],"abstract_inverted_index":{"Agile":[0],"maneuvers":[1],"such":[2],"as":[3],"sprinting":[4],"and":[5,40,49,51,68,86],"high-speed":[6],"turning":[7],"in":[8,63],"the":[9,27,71,98],"wild":[10],"are":[11,78,101],"challenging":[12],"for":[13,26,93],"legged":[14],"robots.":[15],"We":[16],"present":[17],"an":[18,80,88],"end-to-end":[19],"learned":[20],"controller":[21,57],"that":[22],"achieves":[23],"record":[24],"agility":[25],"MIT":[28],"Mini":[29],"Cheetah,":[30],"sustaining":[31],"speeds":[32],"up":[33],"to":[34,54,70],"3.9":[35],"m/s.":[36],"This":[37],"system":[38,90],"runs":[39],"turns":[41],"fast":[42],"on":[43,83],"natural":[44],"terrains":[45],"like":[46],"grass,":[47],"ice,":[48],"gravel":[50],"responds":[52],"robustly":[53],"disturbances.":[55],"Our":[56],"is":[58],"a":[59],"neural":[60],"network":[61],"trained":[62],"simulation":[64],"via":[65],"reinforcement":[66],"learning":[67],"transferred":[69],"real":[72],"world.":[73],"The":[74],"two":[75],"key":[76],"components":[77],"(i)":[79],"adaptive":[81],"curriculum":[82],"velocity":[84],"commands":[85],"(ii)":[87],"online":[89],"identification":[91],"strategy":[92],"sim-to-real":[94],"transfer.":[95],"Videos":[96],"of":[97],"robot\u2019s":[99],"behaviors":[100],"available":[102],"at":[103],"https://agility.csail.mit.edu/":[104],".":[105]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4390494915","counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":10}],"updated_date":"2025-04-14T22:45:40.065394","created_date":"2024-01-03"}