{"id":"https://openalex.org/W4392222072","doi":"https://doi.org/10.48550/arxiv.2402.16174","title":"GenNBV: Generalizable Next-Best-View Policy for Active 3D Reconstruction","display_name":"GenNBV: Generalizable Next-Best-View Policy for Active 3D Reconstruction","publication_year":2024,"publication_date":"2024-02-25","ids":{"openalex":"https://openalex.org/W4392222072","doi":"https://doi.org/10.48550/arxiv.2402.16174"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.16174","pdf_url":"http://arxiv.org/pdf/2402.16174","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2402.16174","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5094018452","display_name":"Xiao Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Xiao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5094018453","display_name":"Quanyi Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Quanyi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5094018454","display_name":"Tai Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Tai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5094018455","display_name":"Tianfan Xue","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xue, Tianfan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5020672335","display_name":"Jiangmiao Pang","orcid":"https://orcid.org/0000-0002-6711-9319"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pang, Jiangmiao","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":84},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.9559,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.9559,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9543,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10522","display_name":"Medical Imaging Techniques and Applications","score":0.9262,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/3d-reconstruction","display_name":"3D Reconstruction","score":0.570676},{"id":"https://openalex.org/keywords/deformable-image-registration","display_name":"Deformable Image Registration","score":0.515828},{"id":"https://openalex.org/keywords/imaging","display_name":"Imaging","score":0.511467},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image Segmentation","score":0.510248}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.48920965}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.16174","pdf_url":"http://arxiv.org/pdf/2402.16174","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.16174","pdf_url":"http://arxiv.org/pdf/2402.16174","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391913857","https://openalex.org/W2748952813","https://openalex.org/W2530322880","https://openalex.org/W2478288626","https://openalex.org/W2390279801","https://openalex.org/W2382290278","https://openalex.org/W2376932109","https://openalex.org/W2358668433","https://openalex.org/W2350741829","https://openalex.org/W2001405890"],"abstract_inverted_index":{"While":[0],"recent":[1],"advances":[2],"in":[3],"neural":[4],"radiance":[5],"field":[6],"enable":[7],"realistic":[8],"digitization":[9],"for":[10,33],"large-scale":[11],"scenes,":[12],"the":[13,29,38,109,131,136],"image-capturing":[14],"process":[15,27],"is":[16],"still":[17],"time-consuming":[18],"and":[19,79,99,123,138,154],"labor-intensive.":[20],"Previous":[21],"works":[22],"attempt":[23],"to":[24,85,94,141],"automate":[25],"this":[26,143],"using":[28,130],"Next-Best-View":[30],"(NBV)":[31],"policy":[32,72,150],"active":[34],"3D":[35],"reconstruction.":[36],"However,":[37],"existing":[39],"NBV":[40,69,144],"policies":[41],"heavily":[42],"rely":[43],"on":[44,158],"hand-crafted":[45],"criteria,":[46],"limited":[47,82],"action":[48,83,124],"space,":[49],"or":[50],"per-scene":[51],"optimized":[52],"representations.":[53,125],"These":[54],"constraints":[55],"limit":[56],"their":[57],"cross-dataset":[58,110],"generalizability.":[59],"To":[60,107],"overcome":[61],"them,":[62],"we":[63,112],"propose":[64,114],"GenNBV,":[65],"an":[66],"end-to-end":[67],"generalizable":[68],"policy.":[70,145],"Our":[71],"adopts":[73],"a":[74,115,128,152],"reinforcement":[75],"learning":[76],"(RL)-based":[77],"framework":[78],"extends":[80],"typical":[81],"space":[84],"5D":[86],"free":[87],"space.":[88],"It":[89],"empowers":[90],"our":[91,149],"agent":[92],"drone":[93],"scan":[95],"from":[96,162],"any":[97],"viewpoint,":[98],"even":[100],"interact":[101],"with":[102,135],"unseen":[103,159],"geometries":[104],"during":[105],"training.":[106],"boost":[108],"generalizability,":[111],"also":[113],"novel":[116],"multi-source":[117],"state":[118],"embedding,":[119],"including":[120],"geometric,":[121],"semantic,":[122],"We":[126],"establish":[127],"benchmark":[129],"Isaac":[132],"Gym":[133],"simulator":[134],"Houses3K":[137],"OmniObject3D":[139],"datasets":[140],"evaluate":[142],"Experiments":[146],"demonstrate":[147],"that":[148],"achieves":[151],"98.26%":[153],"97.12%":[155],"coverage":[156],"ratio":[157],"building-scale":[160],"objects":[161],"these":[163],"datasets,":[164],"respectively,":[165],"outperforming":[166],"prior":[167],"solutions.":[168]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4392222072","counts_by_year":[],"updated_date":"2024-12-05T18:01:25.860305","created_date":"2024-02-28"}