{"id":"https://openalex.org/W4389363342","doi":"https://doi.org/10.48550/arxiv.2312.01097","title":"Planning as In-Painting: A Diffusion-Based Embodied Task Planning Framework for Environments under Uncertainty","display_name":"Planning as In-Painting: A Diffusion-Based Embodied Task Planning Framework for Environments under Uncertainty","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4389363342","doi":"https://doi.org/10.48550/arxiv.2312.01097"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2312.01097","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2312.01097","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103056761","display_name":"Cheng-Fu Yang","orcid":"https://orcid.org/0000-0002-6916-2142"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Cheng-Fu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101565189","display_name":"Haoyang Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Haoyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102433365","display_name":"Te-Lin Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Te-Lin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023073132","display_name":"Xiaofeng Gao","orcid":"https://orcid.org/0000-0003-3331-9846"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Xiaofeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087096372","display_name":"Kai-Wei Chang","orcid":"https://orcid.org/0000-0001-5365-0072"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chang, Kai-Wei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5101697250","display_name":"Feng Gao","orcid":"https://orcid.org/0000-0003-3835-6929"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Feng","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.762268,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":68,"max":79},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.894,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.894,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.8769,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.8746,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.48546368}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.78766},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5066122},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4992137},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.48546368},{"id":"https://openalex.org/C2776505523","wikidata":"https://www.wikidata.org/wiki/Q4785468","display_name":"Plan (archaeology)","level":2,"score":0.42981568},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.35680336},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33898515},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.09609595},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2312.01097","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2312.01097","pdf_url":"http://arxiv.org/pdf/2312.01097","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2312.01097","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2312.01097","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","score":0.65,"id":"https://metadata.un.org/sdg/11"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4381280689","https://openalex.org/W3196817267","https://openalex.org/W3128025644","https://openalex.org/W3033859939","https://openalex.org/W2847365777","https://openalex.org/W2787993192","https://openalex.org/W2375707231","https://openalex.org/W2158269427","https://openalex.org/W2072180474","https://openalex.org/W1960052459"],"abstract_inverted_index":{"Task":[0],"planning":[1,46,140,166],"for":[2,68,131],"embodied":[3,156],"AI":[4,157],"has":[5],"been":[6],"one":[7],"of":[8,23,39,109],"the":[9,14,88,91,107,110,114,128,145],"most":[10],"challenging":[11],"problems":[12],"where":[13],"community":[15],"does":[16],"not":[17],"meet":[18],"a":[19,35,45,51,63,132,168],"consensus":[20],"in":[21,154,167],"terms":[22],"formulation.":[24],"In":[25,58],"this":[26,32,59],"paper,":[27],"we":[28,49,61,136],"aim":[29],"to":[30,87,105,142],"tackle":[31],"problem":[33],"with":[34,144],"unified":[36],"framework":[37,150],"consisting":[38],"an":[40,138],"end-to-end":[41],"trainable":[42],"method":[43,53,96],"and":[44,76,102,164],"algorithm.":[47],"Particularly,":[48],"propose":[50,137],"task-agnostic":[52],"named":[54],"'planning":[55],"as":[56],"in-painting'.":[57],"method,":[60],"use":[62],"Denoising":[64],"Diffusion":[65],"Model":[66],"(DDM)":[67],"plan":[69,129],"generation,":[70],"conditioned":[71],"on":[72],"both":[73,99],"language":[74],"instructions":[75],"perceptual":[77],"inputs":[78],"under":[79],"partially":[80],"observable":[81],"environments.":[82],"Partial":[83],"observation":[84],"often":[85],"leads":[86],"model":[89],"hallucinating":[90],"planning.":[92],"Therefore,":[93],"our":[94],"diffusion-based":[95,146],"jointly":[97],"models":[98],"state":[100],"trajectory":[101],"goal":[103],"estimation":[104],"improve":[106],"reliability":[108],"generated":[111],"plan,":[112],"given":[113],"limited":[115],"available":[116,175],"information":[117,126],"at":[118],"each":[119],"step.":[120],"To":[121],"better":[122],"leverage":[123],"newly":[124],"discovered":[125],"along":[127],"execution":[130],"higher":[133],"success":[134],"rate,":[135],"on-the-fly":[139],"algorithm":[141],"collaborate":[143],"planner.":[147],"The":[148,172],"proposed":[149],"achieves":[151],"promising":[152],"performances":[153],"various":[155],"tasks,":[158],"including":[159],"vision-language":[160],"navigation,":[161],"object":[162],"manipulation,":[163],"task":[165],"photorealistic":[169],"virtual":[170],"environment.":[171],"code":[173],"is":[174],"at:":[176],"https://github.com/joeyy5588/planning-as-inpainting.":[177]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4389363342","counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2024-12-30T18:54:39.237127","created_date":"2023-12-06"}