{"id":"https://openalex.org/W2797655438","doi":"https://doi.org/10.1162/neco_a_01079","title":"A Reinforcement Learning Neural Network for Robotic Manipulator Control","display_name":"A Reinforcement Learning Neural Network for Robotic Manipulator Control","publication_year":2018,"publication_date":"2018-04-13","ids":{"openalex":"https://openalex.org/W2797655438","doi":"https://doi.org/10.1162/neco_a_01079","mag":"2797655438","pmid":"https://pubmed.ncbi.nlm.nih.gov/29652591"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1162/neco_a_01079","pdf_url":null,"source":{"id":"https://openalex.org/S207023548","display_name":"Neural Computation","issn_l":"0899-7667","issn":["0899-7667","1530-888X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310315718","host_organization_name":"The MIT Press","host_organization_lineage":["https://openalex.org/P4310315718"],"host_organization_lineage_names":["The MIT Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://doi.org/10.1162/neco_a_01079","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103000208","display_name":"Yazhou Hu","orcid":null},"institutions":[{"id":"https://openalex.org/I142078773","display_name":"Shenyang Institute of Automation","ror":"https://ror.org/00ft6nj33","country_code":"CN","type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yazhou Hu","raw_affiliation_strings":["State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang 110016, P.R.C., and University of Chinese Academy of Sciences, Beijing 100049, P.R.C."],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang 110016, P.R.C., and University of Chinese Academy of Sciences, Beijing 100049, P.R.C.","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043933382","display_name":"Bailu Si","orcid":"https://orcid.org/0000-0002-0260-3433"},"institutions":[{"id":"https://openalex.org/I142078773","display_name":"Shenyang Institute of Automation","ror":"https://ror.org/00ft6nj33","country_code":"CN","type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Bailu Si","raw_affiliation_strings":["State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang 110016, Shenyang, P.R.C."],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang 110016, Shenyang, P.R.C.","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5103000208","https://openalex.org/A5043933382"],"corresponding_institution_ids":["https://openalex.org/I142078773","https://openalex.org/I4210165038","https://openalex.org/I142078773","https://openalex.org/I19820366"],"apc_list":null,"apc_paid":null,"fwci":2.244,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":32,"citation_normalized_percentile":{"value":0.881998,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":95},"biblio":{"volume":"30","issue":"7","first_page":"1983","last_page":"2004"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9997,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9997,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9938,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12047","display_name":"Viral Infections and Vectors","score":0.9634,"subfield":{"id":"https://openalex.org/subfields/2725","display_name":"Infectious Diseases"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robot-manipulator","display_name":"Robot manipulator","score":0.54350835}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8702593},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.7266922},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6286846},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.59495974},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.5904887},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.554634},{"id":"https://openalex.org/C2985527887","wikidata":"https://www.wikidata.org/wiki/Q1587588","display_name":"Robot manipulator","level":3,"score":0.54350835},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.45577314},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.44921142},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.36640245},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.35415447},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.34231234},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32314062},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.25062987},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":"","qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012371","descriptor_name":"Robotics","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017711","descriptor_name":"Nonlinear Dynamics","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012054","descriptor_name":"Reinforcement, Psychology","qualifier_ui":"","qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012371","descriptor_name":"Robotics","qualifier_ui":"","qualifier_name":null,"is_major_topic":false}],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1162/neco_a_01079","pdf_url":null,"source":{"id":"https://openalex.org/S207023548","display_name":"Neural Computation","issn_l":"0899-7667","issn":["0899-7667","1530-888X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310315718","host_organization_name":"The MIT Press","host_organization_lineage":["https://openalex.org/P4310315718"],"host_organization_lineage_names":["The MIT Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/29652591","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1162/neco_a_01079","pdf_url":null,"source":{"id":"https://openalex.org/S207023548","display_name":"Neural Computation","issn_l":"0899-7667","issn":["0899-7667","1530-888X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310315718","host_organization_name":"The MIT Press","host_organization_lineage":["https://openalex.org/P4310315718"],"host_organization_lineage_names":["The MIT Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[{"score":0.69,"display_name":"Peace, justice, and strong institutions","id":"https://metadata.un.org/sdg/16"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":64,"referenced_works":["https://openalex.org/W141093380","https://openalex.org/W1493190793","https://openalex.org/W1534175819","https://openalex.org/W1542301858","https://openalex.org/W1655556108","https://openalex.org/W1854776945","https://openalex.org/W1919998456","https://openalex.org/W1938776391","https://openalex.org/W1962665893","https://openalex.org/W1964665855","https://openalex.org/W1988182293","https://openalex.org/W1990026397","https://openalex.org/W1991926214","https://openalex.org/W2002260889","https://openalex.org/W2007640554","https://openalex.org/W2010193406","https://openalex.org/W2016840647","https://openalex.org/W2024928738","https://openalex.org/W2035780363","https://openalex.org/W2037949549","https://openalex.org/W2050838777","https://openalex.org/W2056850155","https://openalex.org/W2071447329","https://openalex.org/W2073923906","https://openalex.org/W2074379389","https://openalex.org/W2075439079","https://openalex.org/W2076063813","https://openalex.org/W2078736691","https://openalex.org/W2089904313","https://openalex.org/W2096156956","https://openalex.org/W2098732944","https://openalex.org/W2104733512","https://openalex.org/W2106071123","https://openalex.org/W2108931365","https://openalex.org/W2121863487","https://openalex.org/W2133594302","https://openalex.org/W2136064843","https://openalex.org/W2156246393","https://openalex.org/W2156492453","https://openalex.org/W2164136313","https://openalex.org/W2166778519","https://openalex.org/W2167038379","https://openalex.org/W2176016037","https://openalex.org/W2182044576","https://openalex.org/W2214957967","https://openalex.org/W2253274025","https://openalex.org/W2302808317","https://openalex.org/W2330240534","https://openalex.org/W238867305","https://openalex.org/W2404552068","https://openalex.org/W2484646121","https://openalex.org/W2489526136","https://openalex.org/W2529658650","https://openalex.org/W2539937352","https://openalex.org/W2546883040","https://openalex.org/W2567443749","https://openalex.org/W2570494446","https://openalex.org/W2575705757","https://openalex.org/W2602429550","https://openalex.org/W2618598701","https://openalex.org/W2953326790","https://openalex.org/W4211221179","https://openalex.org/W4252673275","https://openalex.org/W4390809112"],"related_works":["https://openalex.org/W4380318855","https://openalex.org/W4362501864","https://openalex.org/W4306904969","https://openalex.org/W3049728571","https://openalex.org/W2964765435","https://openalex.org/W2586732548","https://openalex.org/W2138720691","https://openalex.org/W20361778","https://openalex.org/W2031695474","https://openalex.org/W2024136090"],"abstract_inverted_index":{"We":[0],"propose":[1],"a":[2,11,62,96],"neural":[3],"network":[4,38],"model":[5,21,94],"for":[6],"reinforcement":[7,78],"learning":[8,79,86],"to":[9,70],"control":[10,80],"robotic":[12,31,99],"manipulator":[13,32,100],"with":[14],"unknown":[15],"parameters":[16],"and":[17,51,104],"dead":[18],"zones.":[19],"The":[20,27,65,82],"is":[22,33,45,59,88],"composed":[23],"of":[24,29,39,55,84,91,107],"three":[25,66],"networks.":[26],"state":[28,37],"the":[30,36,40,42,48,52,56,72,77,85,92,102,105,108],"predicted":[34],"by":[35,47,61],"model,":[41],"action":[43,49,57],"policy":[44,58],"learned":[46],"network,":[50],"performance":[53,73],"index":[54,74],"estimated":[60],"critic":[63],"network.":[64],"networks":[67],"work":[68],"together":[69],"optimize":[71],"based":[75],"on":[76,95],"scheme.":[81],"convergence":[83],"methods":[87],"analyzed.":[89],"Application":[90],"proposed":[93],"simulated":[97],"two-link":[98],"demonstrates":[101],"effectiveness":[103],"stability":[106],"model.":[109]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2797655438","counts_by_year":[{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":3}],"updated_date":"2025-01-03T13:05:40.062099","created_date":"2018-04-24"}