{"id":"https://openalex.org/W4403788137","doi":"https://doi.org/10.48550/arxiv.2409.16208","title":"Context-Based Meta Reinforcement Learning for Robust and Adaptable\n Peg-in-Hole Assembly Tasks","display_name":"Context-Based Meta Reinforcement Learning for Robust and Adaptable\n Peg-in-Hole Assembly Tasks","publication_year":2024,"publication_date":"2024-09-24","ids":{"openalex":"https://openalex.org/W4403788137","doi":"https://doi.org/10.48550/arxiv.2409.16208"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.16208","pdf_url":"http://arxiv.org/pdf/2409.16208","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2409.16208","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059109200","display_name":"Ahmed Shokry","orcid":"https://orcid.org/0000-0002-0453-2923"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shokry, Ahmed","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066618929","display_name":"Walid Gomaa","orcid":"https://orcid.org/0000-0002-8518-8908"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gomaa, Walid","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035238211","display_name":"Tobias Zaenker","orcid":"https://orcid.org/0000-0002-8485-2192"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zaenker, Tobias","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069650777","display_name":"Murad Dawood","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dawood, Murad","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054286317","display_name":"Shady A. Maged","orcid":"https://orcid.org/0000-0001-8641-9985"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Maged, Shady A.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069985186","display_name":"Mohammed I. Awad","orcid":"https://orcid.org/0000-0002-0367-0187"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Awad, Mohammed I.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5103231515","display_name":"Maren Bennewitz","orcid":"https://orcid.org/0000-0003-4343-3028"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bennewitz, Maren","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":84},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11159","display_name":"Manufacturing Process and Optimization","score":0.9968,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11159","display_name":"Manufacturing Process and Optimization","score":0.9968,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9856,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10551","display_name":"Scheduling and Optimization Algorithms","score":0.9694,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7656647},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.64431864},{"id":"https://openalex.org/C54400483","wikidata":"https://www.wikidata.org/wiki/Q1793202","display_name":"PEG ratio","level":2,"score":0.59597784},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.59011316},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.52664876},{"id":"https://openalex.org/C2781002164","wikidata":"https://www.wikidata.org/wiki/Q6822311","display_name":"Meta learning (computer science)","level":3,"score":0.46549428},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34276596},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2202191},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.13698485},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.08191326},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.08124724},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.06477982},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.16208","pdf_url":"http://arxiv.org/pdf/2409.16208","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2409.16208","pdf_url":"http://arxiv.org/pdf/2409.16208","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4383109125","https://openalex.org/W4310083477","https://openalex.org/W4294873804","https://openalex.org/W2920061524","https://openalex.org/W2891227010","https://openalex.org/W2328553770","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2038908348","https://openalex.org/W1977959518"],"abstract_inverted_index":{"Peg-in-hole":[0],"assembly":[1],"in":[2,16,20,71,95,183,207,240],"unknown":[3,210],"environments":[4],"is":[5],"a":[6,61,115,127,136,152,193],"challenging":[7],"task":[8,21,70],"due":[9],"to":[10,38,46,49,67,111,122,144,179,225],"onboard":[11],"sensor":[12],"errors,":[13],"which":[14],"result":[15],"uncertainty":[17],"and":[18,28,86,141,172,175,189,200,217,222],"variations":[19],"parameters":[22,148],"such":[23],"as":[24,42],"the":[25,69,72,78,82,96,107,120,124,157,164,170,177,219,226,241],"hole":[26,187,211],"position":[27],"orientation.":[29],"Meta":[30,83,108],"Reinforcement":[31],"Learning":[32],"(Meta":[33],"RL)":[34],"has":[35],"been":[36],"proposed":[37,165,233],"mitigate":[39],"this":[40],"problem":[41],"it":[43],"learns":[44],"how":[45],"quickly":[47],"adapt":[48,106],"new":[50],"tasks":[51,146,184,208],"with":[52,100,147,185,209,229],"different":[53,186],"parameters.":[54],"However,":[55],"previous":[56,227],"approaches":[57],"either":[58],"depend":[59],"on":[60,192],"sample-inefficient":[62,230],"procedure":[63],"or":[64],"human":[65],"demonstrations":[66],"perform":[68,123],"real":[73,97,194],"world.":[74],"Our":[75,160],"work":[76,228],"modifies":[77],"data":[79,113,166],"used":[80],"by":[81,151],"RL":[84,109],"agent":[85,110,178],"uses":[87],"simple":[88],"features":[89],"that":[90,139,149,163,197],"can":[91],"be":[92],"easily":[93],"measured":[94],"world":[98],"even":[99],"an":[101],"uncalibrated":[102],"camera.":[103],"We":[104],"further":[105],"use":[112],"from":[114,156],"force/torque":[116,201],"sensor,":[117],"instead":[118],"of":[119,130,154],"camera,":[121],"assembly,":[125],"using":[126],"small":[128],"amount":[129],"training":[131,158,171],"data.":[132],"Finally,":[133],"we":[134],"propose":[135],"fine-tuning":[137],"method":[138],"consistently":[140],"safely":[142],"adapts":[143],"out-of-distribution":[145],"differ":[150],"factor":[153],"10":[155,236],"tasks.":[159,243],"results":[161],"demonstrate":[162],"modification":[167],"significantly":[168],"enhances":[169],"adaptation":[173],"efficiency":[174],"enables":[176],"achieve":[180,204],"100%":[181,205],"success":[182,206],"positions":[188],"orientations.":[190],"Experiments":[191],"robot":[195],"confirm":[196],"both":[198],"camera-":[199],"sensor-equipped":[202],"agents":[203],"positions,":[212],"matching":[213],"their":[214],"simulation":[215],"performance":[216],"validating":[218],"approach's":[220],"robustness":[221],"applicability.":[223],"Compared":[224],"adaptation,":[231],"our":[232],"methods":[234],"are":[235],"times":[237],"more":[238],"sample-efficient":[239],"real-world":[242]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4403788137","counts_by_year":[],"updated_date":"2024-12-11T06:01:27.178043","created_date":"2024-10-26"}