{"id":"https://openalex.org/W4205803553","doi":"https://doi.org/10.1111/tops.12595","title":"A Critical Period for Robust Curriculum\u2010Based Deep Reinforcement Learning of Sequential Action in a Robot Arm","display_name":"A Critical Period for Robust Curriculum\u2010Based Deep Reinforcement Learning of Sequential Action in a Robot Arm","publication_year":2022,"publication_date":"2022-01-10","ids":{"openalex":"https://openalex.org/W4205803553","doi":"https://doi.org/10.1111/tops.12595","pmid":"https://pubmed.ncbi.nlm.nih.gov/35005844"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1111/tops.12595","pdf_url":"https://onlinelibrary.wiley.com/doi/pdfdirect/10.1111/tops.12595","source":{"id":"https://openalex.org/S22283869","display_name":"Topics in Cognitive Science","issn_l":"1756-8757","issn":["1756-8757","1756-8765"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://onlinelibrary.wiley.com/doi/pdfdirect/10.1111/tops.12595","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007949246","display_name":"Roy de Kleijn","orcid":"https://orcid.org/0000-0002-1759-3960"},"institutions":[{"id":"https://openalex.org/I121797337","display_name":"Leiden University","ror":"https://ror.org/027bh9e22","country_code":"NL","type":"education","lineage":["https://openalex.org/I121797337"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Roy de Kleijn","raw_affiliation_strings":["Leiden Institute for Brain and Cognition, Leiden University"],"affiliations":[{"raw_affiliation_string":"Leiden Institute for Brain and Cognition, Leiden University","institution_ids":["https://openalex.org/I121797337"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047433939","display_name":"Deniz Sen","orcid":"https://orcid.org/0000-0001-9104-6204"},"institutions":[{"id":"https://openalex.org/I4210120676","display_name":"Mathematical Institute of the Slovak Academy of Sciences","ror":"https://ror.org/02fhy7464","country_code":"SK","type":"facility","lineage":["https://openalex.org/I207624831","https://openalex.org/I4210120676"]},{"id":"https://openalex.org/I121797337","display_name":"Leiden University","ror":"https://ror.org/027bh9e22","country_code":"NL","type":"education","lineage":["https://openalex.org/I121797337"]}],"countries":["NL","SK"],"is_corresponding":false,"raw_author_name":"Deniz Sen","raw_affiliation_strings":["Mathematical Institute, Leiden University"],"affiliations":[{"raw_affiliation_string":"Mathematical Institute, Leiden University","institution_ids":["https://openalex.org/I4210120676","https://openalex.org/I121797337"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052387922","display_name":"George Kachergis","orcid":"https://orcid.org/0000-0003-4153-4167"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"George Kachergis","raw_affiliation_strings":["Language & Cognition Lab Stanford University"],"affiliations":[{"raw_affiliation_string":"Language & Cognition Lab Stanford University","institution_ids":["https://openalex.org/I97018004"]}]}],"institution_assertions":[],"countries_distinct_count":3,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5007949246"],"corresponding_institution_ids":["https://openalex.org/I121797337"],"apc_list":{"value":3140,"currency":"USD","value_usd":3140,"provenance":"doaj"},"apc_paid":{"value":3140,"currency":"USD","value_usd":3140,"provenance":"doaj"},"fwci":1.767,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":5,"citation_normalized_percentile":{"value":0.999897,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":83,"max":85},"biblio":{"volume":"14","issue":"2","first_page":"311","last_page":"326"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10656","display_name":"Child and Animal Learning Development","score":0.9981,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10656","display_name":"Child and Animal Learning Development","score":0.9981,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11431","display_name":"Action Observation and Synchronization","score":0.9963,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11883","display_name":"Embodied and Extended Cognition","score":0.9946,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6356402},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.56043917},{"id":"https://openalex.org/C150415221","wikidata":"https://www.wikidata.org/wiki/Q40687","display_name":"Robotic arm","level":2,"score":0.5501191},{"id":"https://openalex.org/C2781291010","wikidata":"https://www.wikidata.org/wiki/Q178580","display_name":"Period (music)","level":2,"score":0.541532},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.50256395},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.46166426},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.38230133},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.07575229},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D012371","descriptor_name":"Robotics","qualifier_ui":"","qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D003479","descriptor_name":"Curriculum","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009068","descriptor_name":"Movement","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011930","descriptor_name":"Reaction Time","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012054","descriptor_name":"Reinforcement, Psychology","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012371","descriptor_name":"Robotics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false}],"locations_count":4,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1111/tops.12595","pdf_url":"https://onlinelibrary.wiley.com/doi/pdfdirect/10.1111/tops.12595","source":{"id":"https://openalex.org/S22283869","display_name":"Topics in Cognitive Science","issn_l":"1756-8757","issn":["1756-8757","1756-8765"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"http://hdl.handle.net/1887/3443845","pdf_url":"https://scholarlypublications.universiteitleiden.nl/access/item%3A3443846/view","source":{"id":"https://openalex.org/S4306401843","display_name":"Data Archiving and Networked Services (DANS)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1322597698","host_organization_name":"Royal Netherlands Academy of Arts and Sciences","host_organization_lineage":["https://openalex.org/I1322597698"],"host_organization_lineage_names":["Royal Netherlands Academy of Arts and Sciences"],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/PMC9303318","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/35005844","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1111/tops.12595","pdf_url":"https://onlinelibrary.wiley.com/doi/pdfdirect/10.1111/tops.12595","source":{"id":"https://openalex.org/S22283869","display_name":"Topics in Cognitive Science","issn_l":"1756-8757","issn":["1756-8757","1756-8765"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.43,"display_name":"Quality education"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":32,"referenced_works":["https://openalex.org/W1491843047","https://openalex.org/W1980862600","https://openalex.org/W1993411524","https://openalex.org/W1994530392","https://openalex.org/W1997508571","https://openalex.org/W1997649014","https://openalex.org/W2003191899","https://openalex.org/W2004303440","https://openalex.org/W2019237106","https://openalex.org/W2028418738","https://openalex.org/W2035477615","https://openalex.org/W2076231167","https://openalex.org/W2083871567","https://openalex.org/W2103660272","https://openalex.org/W2121863487","https://openalex.org/W2141497885","https://openalex.org/W2151495024","https://openalex.org/W2151834591","https://openalex.org/W2166302491","https://openalex.org/W2296073425","https://openalex.org/W2541673242","https://openalex.org/W2734648945","https://openalex.org/W2736660860","https://openalex.org/W2790065565","https://openalex.org/W2790096445","https://openalex.org/W2964319760","https://openalex.org/W4234438384","https://openalex.org/W4244412329","https://openalex.org/W4247455532","https://openalex.org/W4256152819","https://openalex.org/W4256259208","https://openalex.org/W4301385536"],"related_works":["https://openalex.org/W4380318855","https://openalex.org/W4362501864","https://openalex.org/W4306904969","https://openalex.org/W3049728571","https://openalex.org/W2590211375","https://openalex.org/W2586732548","https://openalex.org/W2138720691","https://openalex.org/W20361778","https://openalex.org/W2031695474","https://openalex.org/W2024136090"],"abstract_inverted_index":{"Abstract":[0],"Many":[1],"everyday":[2],"activities":[3],"are":[4,31,302],"sequential":[5,27,72,135,322],"in":[6,33,68,115,137,231,241,286],"nature.":[7],"That":[8],"is,":[9],"they":[10,267],"can":[11,250],"be":[12,283],"seen":[13],"as":[14,261,280],"a":[15,56,109,138,147,164,202,224],"sequence":[16],"of":[17,26,40,64,71,83,88,99,118,226,234,321],"subactions":[18,36,42],"and":[19,309,318],"sometimes":[20],"subgoals.":[21],"In":[22,129,190],"the":[23,38,69,74,95,116,130,208,220,258],"motor":[24],"execution":[25,39],"action,":[28,73],"context":[29,81],"effects":[30,82],"observed":[32],"which":[34,84,266,289],"later":[35,253],"modulate":[37],"earlier":[41],"(e.g.,":[43],"reaching":[44,198],"for":[45,159,197,204,314],"an":[46,65],"overturned":[47],"mug,":[48],"people":[49],"will":[50],"optimize":[51],"their":[52,103,269,304],"grasp":[53],"to":[54,94,101,108,112,125,157,163,170,179,184,218,223,245,296],"achieve":[55],"comfortable":[57],"end":[58],"state).":[59],"A":[60],"trajectory":[61],"(movement)":[62],"adaptation":[63],"often\u2010used":[66],"paradigm":[67],"study":[70],"serial":[75,165],"response":[76,166],"time":[77,124,167],"task,":[78],"showed":[79],"several":[80],"centering":[85,181],"behavior":[86,92,182],"is":[87],"special":[89],"interest.":[90],"Centering":[91],"refers":[93],"tendency":[96],"(or":[97],"strategy)":[98],"subjects":[100,186],"move":[102],"arm":[104],"or":[105],"mouse":[106],"cursor":[107],"position":[110],"equidistant":[111],"all":[113,126],"stimuli":[114],"absence":[117],"predictive":[119],"information,":[120],"thereby":[121],"reducing":[122],"movement":[123],"possible":[127],"targets.":[128],"current":[131],"study,":[132],"we":[133,193],"investigated":[134],"action":[136,227],"virtual":[139,242],"robotic":[140],"agent":[141,154],"trained":[142,156],"using":[143],"proximal":[144],"policy":[145],"optimization,":[146],"state\u2010of\u2010the\u2010art":[148],"deep":[149],"reinforcement":[150],"learning":[151,264,308,320],"algorithm.":[152],"The":[153],"was":[155,210],"reach":[158],"appearing":[160],"targets,":[161],"similar":[162,183,244],"task":[168,221],"given":[169],"humans.":[171],"We":[172],"found":[173],"that":[174,240],"agents":[175,196,216,290],"were":[176],"more":[177],"likely":[178],"develop":[180],"human":[185,317],"after":[187,288],"curricularized":[188],"learning.":[189,254],"our":[191],"curriculum,":[192,214],"first":[194],"rewarded":[195],"targets":[199],"before":[200],"introducing":[201,273],"penalty":[203,209],"energy":[205],"expenditure.":[206],"When":[207],"applied":[211],"with":[212],"no":[213],"many":[215],"failed":[217],"learn":[219,295],"due":[222],"lack":[225],"space":[228],"exploration,":[229],"resulting":[230],"high":[232],"variability":[233],"agents'":[235],"performance.":[236],"Our":[237],"findings":[238],"suggest":[239],"agents,":[243],"infants,":[246],"early":[247],"energetic":[248],"exploration":[249],"promote":[251],"robust":[252],"This":[255],"may":[256,282],"have":[257],"same":[259],"effect":[260],"infants'":[262],"curiosity\u2010based":[263],"by":[265],"shape":[268],"own":[270],"curriculum.":[271],"However,":[272],"new":[274,298,312],"goals":[275],"cannot":[276,293],"wait":[277],"too":[278],"long,":[279],"there":[281],"critical":[284],"periods":[285],"development":[287],"(as":[291],"humans)":[292],"flexibly":[294],"incorporate":[297],"objectives.":[299],"These":[300],"lessons":[301],"making":[303],"way":[305],"into":[306],"machine":[307,319],"offer":[310],"exciting":[311],"avenues":[313],"studying":[315],"both":[316],"action.":[323]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4205803553","counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2}],"updated_date":"2024-12-09T12:28:08.148906","created_date":"2022-01-26"}