{"id":"https://openalex.org/W4221152718","doi":"https://doi.org/10.48550/arxiv.2203.07454","title":"L2Explorer: A Lifelong Reinforcement Learning Assessment Environment","display_name":"L2Explorer: A Lifelong Reinforcement Learning Assessment Environment","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4221152718","doi":"https://doi.org/10.48550/arxiv.2203.07454"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2203.07454","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2203.07454","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037437190","display_name":"Erik C. Johnson","orcid":"https://orcid.org/0000-0002-7397-8531"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Johnson, Erik C.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029274378","display_name":"Eric Q. Nguyen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nguyen, Eric Q.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010949000","display_name":"Blake A. Schreurs","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schreurs, Blake","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078223421","display_name":"Chigozie S. Ewulum","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ewulum, Chigozie S.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028530447","display_name":"Chace Ashcraft","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ashcraft, Chace","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002942175","display_name":"Neil M. Fendley","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fendley, Neil M.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080508216","display_name":"Megan M. Baker","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Baker, Megan M.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035926574","display_name":"Alexander New","orcid":"https://orcid.org/0000-0001-8369-1473"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"New, Alexander","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5030439130","display_name":"Gautam K. Vallabha","orcid":"https://orcid.org/0000-0001-6856-7968"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vallabha, Gautam K.","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.901037,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":76,"max":80},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10731","display_name":"Educational Games and Gamification","score":0.8856,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10731","display_name":"Educational Games and Gamification","score":0.8856,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.8469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.7938,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.4278967}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.76437616},{"id":"https://openalex.org/C108771440","wikidata":"https://www.wikidata.org/wiki/Q368475","display_name":"Lifelong learning","level":2,"score":0.76233745},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6514449},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5882141},{"id":"https://openalex.org/C47177190","wikidata":"https://www.wikidata.org/wiki/Q207137","display_name":"Curriculum","level":2,"score":0.5336284},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47100535},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.4278967},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.36281312},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3279398},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.14470282},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.09017557},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.07722145},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2203.07454","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2203.07454","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2203.07454","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","score":0.43,"display_name":"Industry, innovation and infrastructure"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4372778609","https://openalex.org/W422428167","https://openalex.org/W2499777278","https://openalex.org/W2391851613","https://openalex.org/W2384383462","https://openalex.org/W2380954666","https://openalex.org/W2364105709","https://openalex.org/W2037025106","https://openalex.org/W1981922029","https://openalex.org/W1485190762"],"abstract_inverted_index":{"Despite":[0],"groundbreaking":[1],"progress":[2],"in":[3,16,27,55,149,181],"reinforcement":[4,18],"learning":[5,19,32,57,65],"for":[6,71,92,176],"robotics,":[7],"gameplay,":[8],"and":[9,77,96,121,127,162,170,184],"other":[10],"complex":[11,126],"domains,":[12],"major":[13],"challenges":[14],"remain":[15],"applying":[17],"to":[20,35,40,79,115,133,146,151,157,188],"the":[21,45,85,167],"evolving,":[22],"open-world":[23,182],"problems":[24],"often":[25],"found":[26],"critical":[28],"application":[29],"spaces.":[30],"Reinforcement":[31],"solutions":[33],"tend":[34],"generalize":[36],"poorly":[37],"when":[38],"exposed":[39],"new":[41],"tasks":[42,120],"outside":[43],"of":[44,119],"data":[46,163],"distribution":[47],"they":[48],"are":[49],"trained":[50],"on,":[51],"prompting":[52],"an":[53],"interest":[54],"continual":[56,64,93],"algorithms.":[58],"In":[59,131],"tandem":[60],"with":[61,137,154],"research":[62,81],"on":[63],"algorithms,":[66],"there":[67],"is":[68],"a":[69,90,103,117,143,174],"need":[70,87],"challenge":[72],"environments,":[73],"carefully":[74],"designed":[75],"experiments,":[76],"metrics":[78,156],"assess":[80,158],"progress.":[82],"We":[83],"address":[84],"latter":[86],"by":[88],"introducing":[89],"framework":[91,175],"reinforcement-learning":[94],"development":[95],"assessment":[97],"using":[98],"Lifelong":[99],"Learning":[100],"Explorer":[101],"(L2Explorer),":[102],"new,":[104],"Unity-based,":[105],"first-person":[106],"3D":[107],"exploration":[108],"environment":[109,169],"that":[110],"can":[111],"be":[112],"continuously":[113],"reconfigured":[114],"generate":[116],"range":[118],"task":[122],"variants":[123],"structured":[124],"into":[125],"evolving":[128],"evaluation":[129,171,179],"curricula.":[130],"contrast":[132],"procedurally":[134],"generated":[135],"worlds":[136],"randomized":[138],"components,":[139],"we":[140],"have":[141],"developed":[142],"systematic":[144],"approach":[145,172],"defining":[147],"curricula":[148],"response":[150],"controlled":[152],"changes":[153],"accompanying":[155],"transfer,":[159],"performance":[160],"recovery,":[161],"efficiency.":[164],"Taken":[165],"together,":[166],"L2Explorer":[168],"provides":[173],"developing":[177],"future":[178],"methodologies":[180],"settings":[183],"rigorously":[185],"evaluating":[186],"approaches":[187],"lifelong":[189],"learning.":[190]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4221152718","counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2}],"updated_date":"2025-01-04T15:09:15.236030","created_date":"2022-04-03"}