{"id":"https://openalex.org/W4386942247","doi":"https://doi.org/10.48550/arxiv.2309.11281","title":"Language-driven Object Fusion into Neural Radiance Fields with Pose-Conditioned Dataset Updates","display_name":"Language-driven Object Fusion into Neural Radiance Fields with Pose-Conditioned Dataset Updates","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4386942247","doi":"https://doi.org/10.48550/arxiv.2309.11281"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2309.11281","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2309.11281","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5092506210","display_name":"Ka Chun Shum","orcid":"https://orcid.org/0000-0001-6398-5693"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shum, Ka Chun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015194203","display_name":"Jenny J. Kim","orcid":"https://orcid.org/0000-0002-0432-6847"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Jaeyeon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028533837","display_name":"Binh\u2010Son Hua","orcid":"https://orcid.org/0000-0002-5706-8634"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hua, Binh-Son","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024634557","display_name":"Duc Thanh Nguyen","orcid":"https://orcid.org/0000-0002-2285-2066"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nguyen, Duc Thanh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5027689970","display_name":"Sai-Kit Yeung","orcid":"https://orcid.org/0000-0001-7974-0607"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yeung, Sai-Kit","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.700164,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":65,"max":76},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9979,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9979,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.994,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.9936,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/representation","display_name":"Representation","score":0.42909315}],"concepts":[{"id":"https://openalex.org/C23690007","wikidata":"https://www.wikidata.org/wiki/Q1411145","display_name":"Radiance","level":2,"score":0.9447924},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7814194},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.73229223},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.71040136},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6947049},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.51644087},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4545554},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.42909315},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.4241553},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4166286},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.34216124},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.22276023},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.20924157},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.11924988},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07761818},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2309.11281","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2309.11281","pdf_url":"http://arxiv.org/pdf/2309.11281","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2309.11281","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2309.11281","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4321518006","https://openalex.org/W4319309705","https://openalex.org/W4292830139","https://openalex.org/W2896728493","https://openalex.org/W2392142157","https://openalex.org/W2331836163","https://openalex.org/W2043512367","https://openalex.org/W2005276308","https://openalex.org/W1994657804","https://openalex.org/W1834370135"],"abstract_inverted_index":{"Neural":[0],"radiance":[1,24,53,75,111,139,208],"field":[2,112,140,209],"is":[3],"an":[4],"emerging":[5],"rendering":[6],"method":[7,172,191],"that":[8,89,114,137,160,189],"generates":[9,192],"high-quality":[10],"multi-view":[11,70],"consistent":[12],"images":[13,71,88,103,119,194],"from":[14,178],"a":[15,44,61,67,73,79,133],"neural":[16,23,52,207],"scene":[17,30],"representation":[18],"and":[19,85,124,199,206],"volume":[20],"rendering.":[21],"Although":[22],"field-based":[25],"techniques":[26],"are":[27,104],"robust":[28],"for":[29,48,107,173],"reconstruction,":[31],"their":[32],"ability":[33],"to":[34,59,83,146,151,155],"add":[35],"or":[36],"remove":[37],"objects":[38],"remains":[39],"limited.":[40],"This":[41],"paper":[42],"proposes":[43],"new":[45,62],"language-driven":[46],"approach":[47],"object":[49,64,92,123,174,184],"manipulation":[50],"with":[51,142],"fields":[54],"through":[55],"dataset":[56,134,164],"updates.":[57],"Specifically,":[58],"insert":[60],"foreground":[63],"represented":[65],"by":[66],"set":[68],"of":[69,93,195],"into":[72,95],"background":[74,98,110],"field,":[76],"we":[77,115,131,167],"use":[78],"text-to-image":[80],"diffusion":[81],"model":[82],"learn":[84],"generate":[86],"combined":[87,102],"fuse":[90],"the":[91,96,109,122,125,147,153,162,196],"interest":[94],"given":[97],"across":[99],"views.":[100,157],"These":[101],"then":[105],"used":[106],"refining":[108],"so":[113],"can":[116,168],"render":[117],"view-consistent":[118],"containing":[120],"both":[121],"background.":[126],"To":[127],"ensure":[128],"view":[129],"consistency,":[130],"propose":[132],"updates":[135,165],"strategy":[136],"prioritizes":[138],"training":[141,154],"camera":[143],"views":[144,149],"close":[145],"already-trained":[148],"prior":[150],"propagating":[152],"remaining":[156],"We":[158],"show":[159,188],"under":[161],"same":[163],"strategy,":[166],"easily":[169],"adapt":[170],"our":[171,190],"insertion":[175],"using":[176],"data":[177],"text-to-3D":[179],"models":[180],"as":[181,183],"well":[182],"removal.":[185],"Experimental":[186],"results":[187],"photorealistic":[193],"edited":[197],"scenes,":[198],"outperforms":[200],"state-of-the-art":[201],"methods":[202],"in":[203],"3D":[204],"reconstruction":[205],"blending.":[210]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4386942247","counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-04-20T11:15:52.486575","created_date":"2023-09-22"}