{"id":"https://openalex.org/W4384614004","doi":"https://doi.org/10.48550/arxiv.2307.07091","title":"Robotic Manipulation Datasets for Offline Compositional Reinforcement Learning","display_name":"Robotic Manipulation Datasets for Offline Compositional Reinforcement Learning","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4384614004","doi":"https://doi.org/10.48550/arxiv.2307.07091"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2307.07091","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2307.07091","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5090201614","display_name":"Marcel Hussing","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hussing, Marcel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077848901","display_name":"Jorge A. Mendez","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mendez, Jorge A.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092489701","display_name":"Anisha Singrodia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Singrodia, Anisha","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030081726","display_name":"David Kent","orcid":"https://orcid.org/0000-0002-5418-3602"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kent, Cassandra","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5020691490","display_name":"Eric Eaton","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Eaton, Eric","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.712026,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":67,"max":78},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9964,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9964,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9805,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9664,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.75839317}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8261409},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.82240844},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.75839317},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.7485173},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.63551563},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.57881325},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2307.07091","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2307.07091","pdf_url":"http://arxiv.org/pdf/2307.07091","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2307.07091","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2307.07091","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4386462264","https://openalex.org/W4364306694","https://openalex.org/W4312192474","https://openalex.org/W4306674287","https://openalex.org/W4283697347","https://openalex.org/W4210805261","https://openalex.org/W3170094116","https://openalex.org/W3107602296","https://openalex.org/W3046775127","https://openalex.org/W2961085424"],"abstract_inverted_index":{"Offline":[0],"reinforcement":[1],"learning":[2],"(RL)":[3],"is":[4,29,37,107],"a":[5,78,113,186],"promising":[6],"direction":[7],"that":[8,147,161],"allows":[9],"RL":[10,36,88,150],"agents":[11,62],"to":[12,31,63,135,157,174,180,182],"pre-train":[13],"on":[14,143],"large":[15,43],"datasets,":[16,44],"avoiding":[17],"the":[18,26,56,74,96,154,176],"recurrence":[19],"of":[20,80,116,120],"expensive":[21],"data":[22],"collection.":[23],"To":[24],"advance":[25],"field,":[27],"it":[28,47],"crucial":[30],"generate":[32],"large-scale":[33],"datasets.":[34],"Compositional":[35],"particularly":[38],"appealing":[39],"for":[40,90,130,188],"generating":[41],"such":[42],"since":[45],"1)":[46],"permits":[48],"creating":[49],"many":[50],"tasks":[51,66,98,156],"from":[52,99,109],"few":[53],"components,":[54,71],"2)":[55],"task":[57,81,138],"structure":[58,179],"may":[59],"enable":[60],"trained":[61],"solve":[64],"new":[65],"by":[67],"combining":[68],"relevant":[69],"learned":[70],"and":[72,118,127,160],"3)":[73],"compositional":[75,137,162,178,193],"dimensions":[76],"provide":[77,125],"notion":[79],"relatedness.":[82],"This":[83],"paper":[84],"provides":[85],"four":[86],"offline":[87,149,192],"datasets":[89],"simulated":[91],"robotic":[92],"manipulation":[93],"created":[94],"using":[95],"256":[97,121],"CompoSuite":[100],"[Mendez":[101],"et":[102],"al.,":[103],"2022a].":[104],"Each":[105],"dataset":[106],"collected":[108],"an":[110,132],"agent":[111],"with":[112],"different":[114],"degree":[115],"performance,":[117],"consists":[119],"million":[122],"transitions.":[123],"We":[124],"training":[126,155],"evaluation":[128],"settings":[129],"assessing":[131],"agent's":[133],"ability":[134],"learn":[136,153],"policies.":[139],"Our":[140],"benchmarking":[141],"experiments":[142],"each":[144],"setting":[145],"show":[146],"current":[148,169],"methods":[151,163,170],"can":[152],"some":[158],"extent":[159],"significantly":[164],"outperform":[165],"non-compositional":[166],"methods.":[167],"However,":[168],"are":[171],"still":[172],"unable":[173],"extract":[175],"tasks'":[177],"generalize":[181],"unseen":[183],"tasks,":[184],"showing":[185],"need":[187],"further":[189],"research":[190],"in":[191],"RL.":[194]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4384614004","counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-01-21T06:26:54.938593","created_date":"2023-07-18"}