{"id":"https://openalex.org/W4382049667","doi":"https://doi.org/10.1177/02783649231179499","title":"Composable energy policies for reactive motion generation and reinforcement learning","display_name":"Composable energy policies for reactive motion generation and reinforcement learning","publication_year":2023,"publication_date":"2023-06-26","ids":{"openalex":"https://openalex.org/W4382049667","doi":"https://doi.org/10.1177/02783649231179499"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1177/02783649231179499","pdf_url":null,"source":{"id":"https://openalex.org/S73484101","display_name":"The International Journal of Robotics Research","issn_l":"0278-3649","issn":["0278-3649","1741-3176"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://zenodo.org/records/5336918/files/CR_2021_COMPOSABLE_URAIN%20(1).pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067156748","display_name":"Julen Urain","orcid":"https://orcid.org/0000-0003-1135-6654"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Julen Urain","raw_affiliation_strings":["Computer Science Department, Institute for Intelligent Autonomous Systems, TU Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Institute for Intelligent Autonomous Systems, TU Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100402747","display_name":"Anqi Li","orcid":"https://orcid.org/0000-0001-8580-4750"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anqi Li","raw_affiliation_strings":["Robot Learning Lab, University of Washington, Seattle, WA, USA"],"affiliations":[{"raw_affiliation_string":"Robot Learning Lab, University of Washington, Seattle, WA, USA","institution_ids":["https://openalex.org/I201448701"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036597033","display_name":"Puze Liu","orcid":"https://orcid.org/0000-0001-6887-7704"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Puze Liu","raw_affiliation_strings":["Computer Science Department, Institute for Intelligent Autonomous Systems, TU Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Institute for Intelligent Autonomous Systems, TU Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063752250","display_name":"Carlo D\u2019Eramo","orcid":"https://orcid.org/0000-0003-2712-118X"},"institutions":[{"id":"https://openalex.org/I4392021234","display_name":"Hessian Center for Artificial Intelligence","ror":"https://ror.org/014ybqb54","country_code":null,"type":"facility","lineage":["https://openalex.org/I31512782","https://openalex.org/I4392021234"]}],"countries":[],"is_corresponding":false,"raw_author_name":"Carlo D\u2019Eramo","raw_affiliation_strings":["Hessian.AI, The Hessian Center for Artificial Intelligence, Germany"],"affiliations":[{"raw_affiliation_string":"Hessian.AI, The Hessian Center for Artificial Intelligence, Germany","institution_ids":["https://openalex.org/I4392021234","https://openalex.org/I4392021234"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5071367253","display_name":"Jan Peters","orcid":"https://orcid.org/0000-0002-5266-8091"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]},{"id":"https://openalex.org/I33256026","display_name":"German Research Centre for Artificial Intelligence","ror":"https://ror.org/01ayc5b57","country_code":"DE","type":"nonprofit","lineage":["https://openalex.org/I33256026"]},{"id":"https://openalex.org/I4392021234","display_name":"Hessian Center for Artificial Intelligence","ror":"https://ror.org/014ybqb54","country_code":null,"type":"facility","lineage":["https://openalex.org/I31512782","https://openalex.org/I4392021234"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Jan Peters","raw_affiliation_strings":["Centre for Cognitive Science, Darmstadt, Germany","Computer Science Department, Institute for Intelligent Autonomous Systems, TU Darmstadt, Germany","Hessian.AI, The Hessian Center for Artificial Intelligence, Germany","Research Department: Systems AI for Robot LearningGerman Research Center for AI (DFKI), Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Institute for Intelligent Autonomous Systems, TU Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]},{"raw_affiliation_string":"Research Department: Systems AI for Robot LearningGerman Research Center for AI (DFKI), Darmstadt, Germany","institution_ids":["https://openalex.org/I33256026"]},{"raw_affiliation_string":"Centre for Cognitive Science, Darmstadt, Germany","institution_ids":[]},{"raw_affiliation_string":"Hessian.AI, The Hessian Center for Artificial Intelligence, Germany","institution_ids":["https://openalex.org/I4392021234"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5067156748"],"corresponding_institution_ids":["https://openalex.org/I31512782"],"apc_list":null,"apc_paid":null,"fwci":0.421,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.620722,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":67,"max":78},"biblio":{"volume":"42","issue":"10","first_page":"827","last_page":"858"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9995,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9995,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9994,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9978,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.52076715}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8749844},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6911624},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.54542094},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5381976},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.52076715},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.519059},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.51786137},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4872214},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.46402484},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.46360147},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.4541128},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.43261763},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14730608},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.14122751},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12512249},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1177/02783649231179499","pdf_url":null,"source":{"id":"https://openalex.org/S73484101","display_name":"The International Journal of Robotics Research","issn_l":"0278-3649","issn":["0278-3649","1741-3176"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"https://zenodo.org/record/5336918","pdf_url":"https://zenodo.org/records/5336918/files/CR_2021_COMPOSABLE_URAIN%20(1).pdf","source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":["European Organization for Nuclear Research"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2105.04962","pdf_url":"http://arxiv.org/pdf/2105.04962","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://zenodo.org/record/5336918","pdf_url":"https://zenodo.org/records/5336918/files/CR_2021_COMPOSABLE_URAIN%20(1).pdf","source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":["European Organization for Nuclear Research"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"score":0.88,"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":45,"referenced_works":["https://openalex.org/W1424654272","https://openalex.org/W1608481154","https://openalex.org/W192919555","https://openalex.org/W1971315778","https://openalex.org/W1999502602","https://openalex.org/W2003132288","https://openalex.org/W2012204020","https://openalex.org/W2016211524","https://openalex.org/W2019965290","https://openalex.org/W2032558547","https://openalex.org/W2070683816","https://openalex.org/W2073787051","https://openalex.org/W2078639473","https://openalex.org/W2099893201","https://openalex.org/W2106130932","https://openalex.org/W2107464055","https://openalex.org/W2109169869","https://openalex.org/W2109910161","https://openalex.org/W2112474089","https://openalex.org/W2116064496","https://openalex.org/W2117211893","https://openalex.org/W2128990851","https://openalex.org/W2132083787","https://openalex.org/W2135639338","https://openalex.org/W2142224528","https://openalex.org/W2177274602","https://openalex.org/W2529800952","https://openalex.org/W2584986912","https://openalex.org/W2597289420","https://openalex.org/W2604698059","https://openalex.org/W2906487027","https://openalex.org/W2911426134","https://openalex.org/W2963403593","https://openalex.org/W2963627347","https://openalex.org/W2967727187","https://openalex.org/W2968095426","https://openalex.org/W3040063093","https://openalex.org/W3102334304","https://openalex.org/W3132689247","https://openalex.org/W3174273518","https://openalex.org/W3194622054","https://openalex.org/W3204951990","https://openalex.org/W3207620687","https://openalex.org/W3207939773","https://openalex.org/W4212774754"],"related_works":["https://openalex.org/W4284974072","https://openalex.org/W4225269853","https://openalex.org/W3096874164","https://openalex.org/W2937181779","https://openalex.org/W2386410636","https://openalex.org/W2357975469","https://openalex.org/W2341346307","https://openalex.org/W2145363145","https://openalex.org/W1985560493","https://openalex.org/W1626977535"],"abstract_inverted_index":{"In":[0,179,261],"this":[1],"work,":[2,263],"we":[3,56,153,191,264,291],"introduce":[4],"composable":[5],"energy":[6],"policies":[7,35,151,202],"(CEP),":[8],"a":[9,26,31,45,52,107,160,185,188,235,275],"novel":[10],"framework":[11,75],"for":[12,167,278],"multi-objective":[13,98],"motion":[14,80,89,99,176,215,272],"generation.":[15],"We":[16,29],"frame":[17],"the":[18,48,60,63,70,77,95,104,132,149,173,218,241,248,282,288,294],"problem":[19,96],"of":[20,33,47,79,97,106,109,220,237],"composing":[21],"multiple":[22],"policy":[23,43,71,123,158,162,226,277],"components":[24,124],"from":[25,82,212],"probabilistic":[27],"view.":[28],"consider":[30],"set":[32,108,236],"stochastic":[34,114,161],"represented":[36],"in":[37,62,136,170,187,240],"arbitrary":[38],"task":[39],"spaces,":[40],"where":[41,121],"each":[42,157,168],"represents":[44],"distribution":[46],"actions":[49],"to":[50,58,129,147,200,233,267],"solve":[51,148],"particular":[53],"task.":[54],"Then,":[55],"aim":[57],"find":[59],"action":[61],"configuration":[64],"space":[65],"that":[66,155,194,203,210],"optimally":[67],"satisfies":[68],"all":[69],"components.":[72],"The":[73],"presented":[74],"allows":[76,163,198,231],"fusion":[78],"generators":[81,216],"different":[83,122],"sources:":[84],"optimal":[85],"control,":[86],"data-driven":[87],"policies,":[88,111],"planning,":[90],"and":[91,297],"handcrafted":[92],"policies.":[93,115],"Classically,":[94],"generation":[100,177],"is":[101,143,217],"solved":[102],"by":[103],"composition":[105],"deterministic":[110],"rather":[112],"than":[113],"However,":[116],"there":[117],"are":[118],"common":[119],"situations":[120],"have":[125],"conflicting":[126,150,206],"behaviors,":[127],"leading":[128],"oscillations":[130],"or":[131,255],"robot":[133,221],"getting":[134],"stuck":[135],"an":[137],"undesirable":[138],"state.":[139],"While":[140],"our":[141,262,269],"approach":[142],"not":[144],"directly":[145],"able":[146],"problem,":[152],"claim":[154],"modeling":[156],"as":[159,183,274],"more":[164],"expressive":[165],"representations":[166],"component":[169],"contrast":[171],"with":[172,228,287],"classical":[174],"reactive":[175,214,271],"approaches.":[178],"some":[180],"tasks,":[181],"such":[182],"reaching":[184],"target":[186],"cluttered":[189],"environment,":[190],"show":[192,265],"experimentally":[193],"CEP":[195],"additional":[196],"expressivity":[197],"us":[199,232],"model":[201],"reduce":[204],"these":[205,213,225],"behaviors.":[207],"A":[208],"field":[209],"benefits":[211],"one":[219],"reinforcement":[222,229,249,279,283],"learning.":[223,280],"Integrating":[224],"architectures":[227],"learning":[230,242,250,284,295],"include":[234],"inductive":[238,245],"biases":[239,246],"problem.":[243],"These":[244],"guide":[247],"agent":[251,285],"towards":[252],"informative":[253],"regions":[254],"improve":[256,293],"collision":[257],"safety":[258],"while":[259],"exploring.":[260],"how":[266],"integrate":[268],"proposed":[270],"generator":[273],"structured":[276],"Combining":[281],"exploration":[286],"prior-based":[289],"CEP,":[290],"can":[292],"performance":[296],"explore":[298],"safer.":[299]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4382049667","counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-01-04T06:08:23.461174","created_date":"2023-06-27"}