{"id":"https://openalex.org/W4364383075","doi":"https://doi.org/10.48550/arxiv.2304.04150","title":"RoboPianist: Dexterous Piano Playing with Deep Reinforcement Learning","display_name":"RoboPianist: Dexterous Piano Playing with Deep Reinforcement Learning","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4364383075","doi":"https://doi.org/10.48550/arxiv.2304.04150"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2304.04150","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2304.04150","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023707892","display_name":"Kevin Zakka","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zakka, Kevin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106821653","display_name":"Laura Smith","orcid":"https://orcid.org/0000-0002-7890-497X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Smith, Laura","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006600962","display_name":"Nimrod Gileadi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gileadi, Nimrod","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076676581","display_name":"Taylor A. Howell","orcid":"https://orcid.org/0000-0001-5144-5702"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Howell, Taylor","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103151044","display_name":"Xue Bin Peng","orcid":"https://orcid.org/0009-0000-0875-5334"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Peng, Xue Bin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103710224","display_name":"Sumeet Singh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Singh, Sumeet","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008259889","display_name":"Yuval Tassa","orcid":"https://orcid.org/0000-0002-1197-288X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tassa, Yuval","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021289514","display_name":"Pete Florence","orcid":"https://orcid.org/0000-0002-7148-5645"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Florence, Pete","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005577303","display_name":"Andy Zeng","orcid":"https://orcid.org/0000-0002-4319-2159"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zeng, Andy","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5049349154","display_name":"Pieter Abbeel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abbeel, Pieter","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.99995,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":84,"max":87},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9957,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9957,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9744,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9565,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7474322},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5276757},{"id":"https://openalex.org/keywords/bridge","display_name":"Bridge (graph theory)","score":0.45187163}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.80517393},{"id":"https://openalex.org/C124086623","wikidata":"https://www.wikidata.org/wiki/Q5994","display_name":"Piano","level":2,"score":0.8002864},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7474322},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.69055176},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.64214104},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.5727043},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.55701005},{"id":"https://openalex.org/C2778473898","wikidata":"https://www.wikidata.org/wiki/Q2145110","display_name":"Repertoire","level":2,"score":0.53992385},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5276757},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.49421242},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.45187163},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.4392681},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37468165},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.080723286},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.064893514},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C126322002","wikidata":"https://www.wikidata.org/wiki/Q11180","display_name":"Internal medicine","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.0},{"id":"https://openalex.org/C52119013","wikidata":"https://www.wikidata.org/wiki/Q50637","display_name":"Art history","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2304.04150","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2304.04150","pdf_url":"http://arxiv.org/pdf/2304.04150","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2304.04150","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2304.04150","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"score":0.5,"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W629160228","https://openalex.org/W607893370","https://openalex.org/W587444722","https://openalex.org/W584653787","https://openalex.org/W4362512397","https://openalex.org/W4255048859","https://openalex.org/W3120300186","https://openalex.org/W2357375963","https://openalex.org/W2316271602","https://openalex.org/W2084831119"],"abstract_inverted_index":{"Replicating":[0],"human-like":[1],"dexterity":[2,47],"in":[3,13,26],"robot":[4],"hands":[5,100],"represents":[6],"one":[7],"of":[8,34,46,68,106,122],"the":[9,27,32,65],"largest":[10],"open":[11,128],"problems":[12,35],"robotics.":[14],"Reinforcement":[15],"learning":[16],"is":[17,140],"a":[18,42,60,71,94],"promising":[19],"approach":[20],"that":[21,62,96],"has":[22,37],"achieved":[23],"impressive":[24],"progress":[25],"last":[28],"few":[29],"years;":[30],"however,":[31],"class":[33],"it":[36],"typically":[38],"addressed":[39],"corresponds":[40],"to":[41,50,73,101],"rather":[43],"narrow":[44],"definition":[45],"as":[48,70],"compared":[49],"human":[51,66],"capabilities.":[52],"To":[53],"address":[54],"this":[55],"gap,":[56],"we":[57],"investigate":[58],"piano-playing,":[59],"skill":[61],"challenges":[63,129],"even":[64],"limits":[67],"dexterity,":[69],"means":[72],"test":[74],"high-dimensional":[75],"control,":[76],"and":[77,82,85,89,127,138],"which":[78],"requires":[79],"high":[80],"spatial":[81],"temporal":[83],"precision,":[84],"complex":[86],"finger":[87],"coordination":[88],"planning.":[90],"We":[91,115],"introduce":[92,117],"RoboPianist,":[93],"system":[95],"enables":[97],"simulated":[98],"anthropomorphic":[99],"learn":[102],"an":[103,118],"extensive":[104],"repertoire":[105],"150":[107],"piano":[108],"pieces":[109],"where":[110],"traditional":[111],"model-based":[112],"optimization":[113],"struggles.":[114],"additionally":[116],"open-sourced":[119],"environment,":[120],"benchmark":[121],"tasks,":[123],"interpretable":[124],"evaluation":[125],"metrics,":[126],"for":[130],"future":[131],"study.":[132],"Our":[133],"website":[134],"featuring":[135],"videos,":[136],"code,":[137],"datasets":[139],"available":[141],"at":[142],"https://kzakka.com/robopianist/":[143]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4364383075","counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2025-01-15T02:01:55.728564","created_date":"2023-04-12"}