{"id":"https://openalex.org/W2790734939","doi":"https://doi.org/10.1145/3171221.3171289","title":"Deep Reinforcement Learning of Abstract Reasoning from Demonstrations","display_name":"Deep Reinforcement Learning of Abstract Reasoning from Demonstrations","publication_year":2018,"publication_date":"2018-02-26","ids":{"openalex":"https://openalex.org/W2790734939","doi":"https://doi.org/10.1145/3171221.3171289","mag":"2790734939"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/3171221.3171289","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043286307","display_name":"Madison Clark-Turner","orcid":null},"institutions":[{"id":"https://openalex.org/I161057412","display_name":"University of New Hampshire","ror":"https://ror.org/01rmh9n78","country_code":"US","type":"education","lineage":["https://openalex.org/I161057412"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Madison Clark-Turner","raw_affiliation_strings":["University of New Hampshire, Durham, NH, USA"],"affiliations":[{"raw_affiliation_string":"University of New Hampshire, Durham, NH, USA","institution_ids":["https://openalex.org/I161057412"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5035462171","display_name":"Momotaz Begum","orcid":"https://orcid.org/0000-0002-1073-2008"},"institutions":[{"id":"https://openalex.org/I161057412","display_name":"University of New Hampshire","ror":"https://ror.org/01rmh9n78","country_code":"US","type":"education","lineage":["https://openalex.org/I161057412"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Momotaz Begum","raw_affiliation_strings":["University of New Hampshire, Durham, NH, USA"],"affiliations":[{"raw_affiliation_string":"University of New Hampshire, Durham, NH, USA","institution_ids":["https://openalex.org/I161057412"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.614,"has_fulltext":true,"fulltext_origin":"ngrams","cited_by_count":15,"citation_normalized_percentile":{"value":0.857952,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":88,"max":89},"biblio":{"volume":null,"issue":null,"first_page":"160","last_page":"168"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9993,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9993,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9902,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.9898,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/milestone","display_name":"Milestone","score":0.54373693}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7102655},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6940903},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.63925254},{"id":"https://openalex.org/C2779182362","wikidata":"https://www.wikidata.org/wiki/Q17126187","display_name":"Session (web analytics)","level":2,"score":0.6331066},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.60478806},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6038766},{"id":"https://openalex.org/C120060458","wikidata":"https://www.wikidata.org/wiki/Q10145","display_name":"Milestone","level":2,"score":0.54373693},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5249096},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.43356758},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.42558426},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.41019413},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.387263},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.32494187},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.09761226},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1145/3171221.3171289","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.72,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"grants":[{"funder":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation","award_id":"1664554"}],"datasets":[],"versions":[],"referenced_works_count":38,"referenced_works":["https://openalex.org/W1533651650","https://openalex.org/W1684361744","https://openalex.org/W1754243990","https://openalex.org/W1923404803","https://openalex.org/W1947481528","https://openalex.org/W1983705368","https://openalex.org/W1986014385","https://openalex.org/W1989819438","https://openalex.org/W2016053056","https://openalex.org/W2025521298","https://openalex.org/W2053910308","https://openalex.org/W2063471043","https://openalex.org/W2073395107","https://openalex.org/W2107019937","https://openalex.org/W2121249629","https://openalex.org/W2138739434","https://openalex.org/W2145339207","https://openalex.org/W2156303437","https://openalex.org/W2165698076","https://openalex.org/W2301093073","https://openalex.org/W2402268235","https://openalex.org/W2461621749","https://openalex.org/W2522489477","https://openalex.org/W2523246573","https://openalex.org/W2549733625","https://openalex.org/W2560573001","https://openalex.org/W2569614323","https://openalex.org/W2583137229","https://openalex.org/W2591643707","https://openalex.org/W2592076308","https://openalex.org/W2772837506","https://openalex.org/W2919115771","https://openalex.org/W2962747693","https://openalex.org/W2962938178","https://openalex.org/W2963165299","https://openalex.org/W2964350391","https://openalex.org/W3110909889","https://openalex.org/W4211008118"],"related_works":["https://openalex.org/W4387878404","https://openalex.org/W3140574787","https://openalex.org/W3133583653","https://openalex.org/W2990251955","https://openalex.org/W2955244041","https://openalex.org/W2584040191","https://openalex.org/W2561695978","https://openalex.org/W2490667451","https://openalex.org/W2064167013","https://openalex.org/W1950486549"],"abstract_inverted_index":{"Extracting":[0],"a":[1,21,30,65,96,135,141],"set":[2,136],"of":[3,10,26,64,86,114,119,137,151,154,162],"generalizable":[4],"rules":[5,88,118,138],"that":[6,61,139],"govern":[7,140],"the":[8,34,51,76,84,112,155,160],"dynamics":[9],"complex,":[11],"high-level":[12,22,117],"interactions":[13,121],"between":[14,145],"humans":[15],"based":[16,148],"only":[17],"on":[18,149],"observations":[19,150],"is":[20,49],"cognitive":[23],"ability.":[24],"Mastery":[25],"this":[27],"skill":[28],"marks":[29],"significant":[31],"milestone":[32],"in":[33,41,46,58,83,111,168],"human":[35,120,166],"developmental":[36],"process.":[37],"A":[38],"key":[39],"challenge":[40],"designing":[42],"such":[43],"an":[44,102],"ability":[45],"autonomous":[47],"robots":[48],"discovering":[50,75],"relationships":[52,77],"among":[53,80],"discriminatory":[54],"features.":[55],"Identifying":[56],"features":[57,82],"natural":[59],"scenes":[60],"are":[62,89],"representative":[63],"particular":[66],"event":[67],"or":[68],"interaction":[69],"(i.e.":[70],"\u00bbdiscriminatory":[71],"features\u00bb)":[72],"and":[73],"then":[74],"(e.g.,":[78],"temporal/spatial/spatio-temporal/causal)":[79],"those":[81],"form":[85],"generalized":[87],"non-trivial":[90],"problems.":[91],"They":[92],"often":[93],"appear":[94],"as":[95],"\u00bbchicken-and-egg\u00bb":[97],"dilemma.":[98],"This":[99],"paper":[100],"proposes":[101],"end-to-end":[103],"learning":[104,115,131],"framework":[105,132,164],"to":[106,133],"tackle":[107],"these":[108],"two":[109,146],"problems":[110],"context":[113],"generalized,":[116],"from":[122],"structured":[123],"demonstrations.":[124],"We":[125,157],"employed":[126],"our":[127,163],"proposed":[128],"deep":[129],"reinforcement":[130],"learn":[134],"behavioral":[142],"intervention":[143],"session":[144],"agents":[147],"several":[152],"instances":[153],"session.":[156],"also":[158],"tested":[159],"accuracy":[161],"with":[165],"subjects":[167],"diverse":[169],"situations.":[170]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W2790734939","counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":2}],"updated_date":"2024-12-12T10:20:00.383322","created_date":"2018-03-29"}