{"id":"https://openalex.org/W4399657744","doi":"https://doi.org/10.48550/arxiv.2406.08406","title":"RRLS : Robust Reinforcement Learning Suite","display_name":"RRLS : Robust Reinforcement Learning Suite","publication_year":2024,"publication_date":"2024-06-12","ids":{"openalex":"https://openalex.org/W4399657744","doi":"https://doi.org/10.48550/arxiv.2406.08406"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2406.08406","pdf_url":"https://arxiv.org/pdf/2406.08406","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2406.08406","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019608057","display_name":"Adil Zouitine","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zouitine, Adil","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036340153","display_name":"David Bertoin","orcid":"https://orcid.org/0000-0003-3858-3881"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bertoin, David","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113950734","display_name":"Pierre J. Clavier","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Clavier, Pierre","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110482875","display_name":"Matthieu Geist","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Geist, Matthieu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5049708660","display_name":"Emmanuel Rachelson","orcid":"https://orcid.org/0000-0002-8559-1617"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rachelson, Emmanuel","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":84},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.837,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.837,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.836,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.8243,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C79581498","wikidata":"https://www.wikidata.org/wiki/Q1367530","display_name":"Suite","level":2,"score":0.87305003},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8287746},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.6201881},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5733698},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4761555},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.20888063},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.09784299},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.07253933},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2406.08406","pdf_url":"https://arxiv.org/pdf/2406.08406","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2406.08406","pdf_url":"https://arxiv.org/pdf/2406.08406","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W4379115841","https://openalex.org/W4310083477","https://openalex.org/W4231704780","https://openalex.org/W352609212","https://openalex.org/W2920061524","https://openalex.org/W2748952813","https://openalex.org/W2328553770","https://openalex.org/W2083794993","https://openalex.org/W1511772879"],"abstract_inverted_index":{"Robust":[0,63],"reinforcement":[1,97],"learning":[2,7,98],"is":[3,22,121,134],"the":[4,45,62,116],"problem":[5],"of":[6,18,42,51,84,118],"control":[8,79],"policies":[9],"that":[10],"provide":[11],"optimal":[12],"worst-case":[13],"performance":[14],"against":[15],"a":[16,23,39,48,68],"span":[17],"adversarial":[19],"environments.":[20,74,130],"It":[21,120],"crucial":[24],"ingredient":[25],"for":[26,87,112],"deploying":[27],"algorithms":[28],"in":[29,44,105],"real-world":[30],"scenarios":[31],"with":[32,81],"prevalent":[33],"environmental":[34],"uncertainties":[35],"and":[36,89,102],"has":[37],"been":[38],"long-standing":[40],"object":[41],"attention":[43],"community,":[46],"without":[47],"standardized":[49],"set":[50],"benchmarks.":[52],"This":[53],"contribution":[54],"endeavors":[55],"to":[56,94,124,128],"fill":[57],"this":[58],"gap.":[59],"We":[60],"introduce":[61],"Reinforcement":[64],"Learning":[65],"Suite":[66],"(RRLS),":[67],"benchmark":[69,92],"suite":[70],"based":[71],"on":[72],"Mujoco":[73],"RRLS":[75],"provides":[76],"six":[77],"continuous":[78],"tasks":[80],"two":[82],"types":[83],"uncertainty":[85],"sets":[86],"training":[88],"evaluation.":[90],"Our":[91],"aims":[93],"standardize":[95],"robust":[96],"tasks,":[99],"facilitating":[100],"reproducible":[101],"comparable":[103],"experiments,":[104],"particular":[106],"those":[107],"from":[108],"recent":[109],"state-of-the-art":[110],"contributions,":[111],"which":[113],"we":[114],"demonstrate":[115],"use":[117],"RRLS.":[119],"also":[122],"designed":[123],"be":[125],"easily":[126],"expandable":[127],"new":[129],"The":[131],"source":[132],"code":[133],"available":[135],"at":[136],"\\href{https://github.com/SuReLI/RRLS}{https://github.com/SuReLI/RRLS}.":[137]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4399657744","counts_by_year":[],"updated_date":"2024-12-15T08:45:57.008644","created_date":"2024-06-14"}