{"id":"https://openalex.org/W4389666497","doi":"https://doi.org/10.1109/iros55552.2023.10341801","title":"Learning Constraints on Autonomous Behavior from Proactive Feedback","display_name":"Learning Constraints on Autonomous Behavior from Proactive Feedback","publication_year":2023,"publication_date":"2023-10-01","ids":{"openalex":"https://openalex.org/W4389666497","doi":"https://doi.org/10.1109/iros55552.2023.10341801"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros55552.2023.10341801","pdf_url":null,"source":{"id":"https://openalex.org/S4363607734","display_name":"2021 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047063533","display_name":"Connor Basich","orcid":"https://orcid.org/0000-0001-9522-5277"},"institutions":[{"id":"https://openalex.org/I177605424","display_name":"Amherst College","ror":"https://ror.org/028vqfs63","country_code":"US","type":"funder","lineage":["https://openalex.org/I177605424"]},{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"funder","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Connor Basich","raw_affiliation_strings":["University of Massachusetts Amherst, Manning College of Information and Computer Sciences, Amherst, MA, USA"],"affiliations":[{"raw_affiliation_string":"University of Massachusetts Amherst, Manning College of Information and Computer Sciences, Amherst, MA, USA","institution_ids":["https://openalex.org/I177605424","https://openalex.org/I24603500"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056120915","display_name":"Saaduddin Mahmud","orcid":null},"institutions":[{"id":"https://openalex.org/I177605424","display_name":"Amherst College","ror":"https://ror.org/028vqfs63","country_code":"US","type":"funder","lineage":["https://openalex.org/I177605424"]},{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"funder","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Saaduddin Mahmud","raw_affiliation_strings":["University of Massachusetts Amherst, Manning College of Information and Computer Sciences, Amherst, MA, USA"],"affiliations":[{"raw_affiliation_string":"University of Massachusetts Amherst, Manning College of Information and Computer Sciences, Amherst, MA, USA","institution_ids":["https://openalex.org/I177605424","https://openalex.org/I24603500"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5027224308","display_name":"Shlomo Zilberstein","orcid":"https://orcid.org/0000-0001-9817-7848"},"institutions":[{"id":"https://openalex.org/I177605424","display_name":"Amherst College","ror":"https://ror.org/028vqfs63","country_code":"US","type":"funder","lineage":["https://openalex.org/I177605424"]},{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"funder","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shlomo Zilberstein","raw_affiliation_strings":["University of Massachusetts Amherst, Manning College of Information and Computer Sciences, Amherst, MA, USA"],"affiliations":[{"raw_affiliation_string":"University of Massachusetts Amherst, Manning College of Information and Computer Sciences, Amherst, MA, USA","institution_ids":["https://openalex.org/I177605424","https://openalex.org/I24603500"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.345,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.431761,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":65,"max":76},"biblio":{"volume":null,"issue":null,"first_page":"3680","last_page":"3687"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9965,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9965,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.993,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9799,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.8744619},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.79360235},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.78523767},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.67651594},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.61699235},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.55122244},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4461754},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41221285},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.32500464},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10769799},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros55552.2023.10341801","pdf_url":null,"source":{"id":"https://openalex.org/S4363607734","display_name":"2021 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[{"funder":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation","award_id":"1954782"}],"datasets":[],"versions":[],"referenced_works_count":31,"referenced_works":["https://openalex.org/W1854776945","https://openalex.org/W1964535365","https://openalex.org/W2092898161","https://openalex.org/W2098441518","https://openalex.org/W2102660061","https://openalex.org/W2151074445","https://openalex.org/W2154018708","https://openalex.org/W2166468218","https://openalex.org/W2215828449","https://openalex.org/W2502094132","https://openalex.org/W2763152536","https://openalex.org/W2789758093","https://openalex.org/W2792089292","https://openalex.org/W2889990052","https://openalex.org/W2903994599","https://openalex.org/W2966994213","https://openalex.org/W3130163632","https://openalex.org/W3138984732","https://openalex.org/W3196243818","https://openalex.org/W3207713159","https://openalex.org/W398859631","https://openalex.org/W4200298307","https://openalex.org/W4210909794","https://openalex.org/W4280606444","https://openalex.org/W4287083725","https://openalex.org/W4312461184","https://openalex.org/W4312772252","https://openalex.org/W4313325089","https://openalex.org/W4382239602","https://openalex.org/W4385431139","https://openalex.org/W569478347"],"related_works":["https://openalex.org/W5922282","https://openalex.org/W563589758","https://openalex.org/W4388311650","https://openalex.org/W4299447939","https://openalex.org/W4245343541","https://openalex.org/W2954004777","https://openalex.org/W2951102138","https://openalex.org/W2949638731","https://openalex.org/W2386077341","https://openalex.org/W1974056099"],"abstract_inverted_index":{"Learning":[0],"from":[1,52],"feedback":[2,146],"is":[3,11],"a":[4,15,25,46,71,125,138],"common":[5],"paradigm":[6],"to":[7,13,41,80,123,134],"acquire":[8],"information":[9],"that":[10,30,43,117,131,142,152],"hard":[12],"specify":[14],"priori.":[16],"In":[17],"this":[18],"work,":[19],"we":[20,76,94],"consider":[21,144],"an":[22,121,148],"agent":[23,38,122],"with":[24,128],"known":[26],"nominal":[27],"reward":[28],"model":[29],"captures":[31],"its":[32],"high-level":[33],"task":[34],"objective.":[35],"Furthermore,":[36],"the":[37,91,100],"operates":[39],"subject":[40],"constraints":[42],"are":[44],"unknown":[45],"priori":[47],"and":[48,93,109],"must":[49],"be":[50,87],"inferred":[51],"human":[53],"interventions.":[54],"Unlike":[55],"existing":[56],"methods,":[57],"our":[58,113,118],"approach":[59],"does":[60,153],"not":[61,154],"rely":[62],"on":[63,107],"full":[64],"or":[65,69],"partial":[66],"demonstration":[67],"trajectories":[68],"assume":[70,77],"fully":[72],"reactive":[73,145],"human.":[74,101],"Instead,":[75],"access":[78],"only":[79,95,143],"sparse":[81],"interventions,":[82],"which":[83],"may":[84],"in":[85,162],"fact":[86],"generated":[88],"proactively":[89],"by":[90],"human,":[92],"make":[96],"minimal":[97],"assumptions":[98],"about":[99],"We":[102,115],"provide":[103],"both":[104],"theoretical":[105],"bounds":[106],"performance":[108],"empirical":[110],"validations":[111],"of":[112],"method.":[114],"show":[116],"method":[119],"enables":[120],"learn":[124,147],"constraint":[126,150,158],"set":[127,151],"high":[129],"accuracy":[130],"generalizes":[132],"well":[133],"new":[135,163],"environments":[136],"within":[137],"domain,":[139],"whereas":[140],"methods":[141],"incorrect":[149],"generalize":[155],"well,":[156],"making":[157],"violations":[159],"more":[160],"likely":[161],"environments.":[164]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4389666497","counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-04-17T16:11:59.488167","created_date":"2023-12-14"}