{"id":"https://openalex.org/W3118341329","doi":"https://doi.org/10.1609/aaai.v35i2.16207","title":"Voxel R-CNN: Towards High Performance Voxel-based 3D Object Detection","display_name":"Voxel R-CNN: Towards High Performance Voxel-based 3D Object Detection","publication_year":2021,"publication_date":"2021-05-18","ids":{"openalex":"https://openalex.org/W3118341329","doi":"https://doi.org/10.1609/aaai.v35i2.16207","mag":"3118341329"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v35i2.16207","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/16207/16014","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/16207/16014","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5089561793","display_name":"Jiajun Deng","orcid":"https://orcid.org/0000-0001-9624-7451"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiajun Deng","raw_affiliation_strings":["CAS Key Laboratory of GIPAS, EEIS Department, University of Science and Technology of China"],"affiliations":[{"raw_affiliation_string":"CAS Key Laboratory of GIPAS, EEIS Department, University of Science and Technology of China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083443210","display_name":"Shaoshuai Shi","orcid":"https://orcid.org/0000-0003-2558-181X"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shaoshuai Shi","raw_affiliation_strings":["Multimedia Laboratory, The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"Multimedia Laboratory, The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018494554","display_name":"Peiwei Li","orcid":"https://orcid.org/0000-0002-2144-2022"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peiwei Li","raw_affiliation_strings":["CAS Key Laboratory of GIPAS, EEIS Department, University of Science and Technology of China"],"affiliations":[{"raw_affiliation_string":"CAS Key Laboratory of GIPAS, EEIS Department, University of Science and Technology of China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046805800","display_name":"Wengang Zhou","orcid":"https://orcid.org/0000-0003-1690-9836"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wengang Zhou","raw_affiliation_strings":["CAS Key Laboratory of GIPAS, EEIS Department, University of Science and Technology of China\nInstitute of Artificial Intelligence, Hefei Comprehensive National Science Center"],"affiliations":[{"raw_affiliation_string":"CAS Key Laboratory of GIPAS, EEIS Department, University of Science and Technology of China\nInstitute of Artificial Intelligence, Hefei Comprehensive National Science Center","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053344541","display_name":"Yanyong Zhang","orcid":"https://orcid.org/0000-0001-6520-255X"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanyong Zhang","raw_affiliation_strings":["Department of Computer Science, University of Science and Technology of China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Science and Technology of China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078141810","display_name":"Houqiang Li","orcid":"https://orcid.org/0000-0003-2188-3028"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Houqiang Li","raw_affiliation_strings":["CAS Key Laboratory of GIPAS, EEIS Department, University of Science and Technology of China\nInstitute of Artificial Intelligence, Hefei Comprehensive National Science Center"],"affiliations":[{"raw_affiliation_string":"CAS Key Laboratory of GIPAS, EEIS Department, University of Science and Technology of China\nInstitute of Artificial Intelligence, Hefei Comprehensive National Science Center","institution_ids":["https://openalex.org/I126520041"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":34.501,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":540,"citation_normalized_percentile":{"value":0.999868,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"35","issue":"2","first_page":"1201","last_page":"1209"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Deep Learning in Computer Vision and Image Recognition","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Deep Learning in Computer Vision and Image Recognition","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Simultaneous Localization and Mapping","score":0.9994,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11211","display_name":"3D Geospatial Modelling Techniques","score":0.9982,"subfield":{"id":"https://openalex.org/subfields/1907","display_name":"Geology"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/object-detection","display_name":"Object Detection","score":0.611484},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.5486532},{"id":"https://openalex.org/keywords/3d-mapping","display_name":"3D Mapping","score":0.543998},{"id":"https://openalex.org/keywords/visual-odometry","display_name":"Visual Odometry","score":0.524909},{"id":"https://openalex.org/keywords/3d-reconstruction","display_name":"3D Reconstruction","score":0.519065},{"id":"https://openalex.org/keywords/structure-from-motion","display_name":"Structure from Motion","score":0.502713},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.46425703}],"concepts":[{"id":"https://openalex.org/C54170458","wikidata":"https://www.wikidata.org/wiki/Q663554","display_name":"Voxel","level":2,"score":0.93225336},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8268062},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7502059},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5874613},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.57512337},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.5486532},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5423809},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.47994712},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.46425703},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4298194},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.42957613},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.14020354},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1128158},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v35i2.16207","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/16207/16014","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2012.15712","pdf_url":"https://arxiv.org/pdf/2012.15712","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v35i2.16207","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/16207/16014","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":46,"referenced_works":["https://openalex.org/W1536680647","https://openalex.org/W2555618208","https://openalex.org/W2560609797","https://openalex.org/W2570343428","https://openalex.org/W2613718673","https://openalex.org/W2769571673","https://openalex.org/W2798965597","https://openalex.org/W2886904239","https://openalex.org/W2897529137","https://openalex.org/W2914821954","https://openalex.org/W2924050502","https://openalex.org/W2949708697","https://openalex.org/W2951517617","https://openalex.org/W2953106684","https://openalex.org/W2963121255","https://openalex.org/W2963351448","https://openalex.org/W2963400571","https://openalex.org/W2963727135","https://openalex.org/W2964062501","https://openalex.org/W2964166085","https://openalex.org/W2964350391","https://openalex.org/W2968296999","https://openalex.org/W2980072470","https://openalex.org/W2981949127","https://openalex.org/W2995681297","https://openalex.org/W2997188997","https://openalex.org/W2997814983","https://openalex.org/W3008105217","https://openalex.org/W3012494314","https://openalex.org/W3031752193","https://openalex.org/W3034236957","https://openalex.org/W3034314779","https://openalex.org/W3034602892","https://openalex.org/W3035172746","https://openalex.org/W3035346742","https://openalex.org/W3035574168","https://openalex.org/W3036853234","https://openalex.org/W3039666984","https://openalex.org/W3042259089","https://openalex.org/W3099930232","https://openalex.org/W3106250896","https://openalex.org/W3107212734","https://openalex.org/W3109646990","https://openalex.org/W4288093950","https://openalex.org/W4300939921","https://openalex.org/W4302979690"],"related_works":["https://openalex.org/W803346624","https://openalex.org/W4287804464","https://openalex.org/W3108539254","https://openalex.org/W3103989898","https://openalex.org/W3022252430","https://openalex.org/W2953234277","https://openalex.org/W2900413183","https://openalex.org/W2626256601","https://openalex.org/W2152352598","https://openalex.org/W147410782"],"abstract_inverted_index":{"Recent":[0],"advances":[1],"on":[2,8,197,240],"3D":[3,11,24,97,162],"object":[4,98],"detection":[5,99,110,143,224],"heavily":[6],"rely":[7],"how":[9],"the":[10,51,66,102,154,198,204],"data":[12,68],"are":[13,26,69,195],"represented,":[14],"i.e.,":[15,233],"voxel-based":[16,52,123,217],"or":[17],"point-based":[18,27,147],"representation.":[19],"Many":[20],"existing":[21,216],"high":[22,42,95],"performance":[23,96],"detectors":[25],"because":[28,65],"this":[29,74,113],"structure":[30,53],"can":[31,106],"better":[32,55],"retain":[33],"precise":[34,86],"point":[35],"positions.":[36],"Nevertheless,":[37],"point-level":[38],"features":[39,134,185,189],"lead":[40],"to":[41,46,182,215],"computation":[43,155],"overheads":[44],"due":[45],"unordered":[47],"storage.":[48],"In":[49,73],"contrast,":[50],"is":[54,91,180,249],"suited":[56],"for":[57,94,190],"feature":[58],"extraction":[59],"but":[60,121,149],"often":[61],"yields":[62],"lower":[63],"accuracy":[64,144,225],"input":[67],"divided":[70],"into":[71],"grids.":[72],"paper,":[75],"we":[76,83,117],"take":[77],"a":[78,119,136,151,161,165,173,222,228,235],"slightly":[79],"different":[80],"viewpoint":[81],"---":[82],"find":[84],"that":[85,101,213],"positioning":[87],"of":[88,132,153,160,237],"raw":[89],"points":[90],"not":[92],"essential":[93],"and":[100,172,203],"coarse":[103],"voxel":[104,133,177,188],"granularity":[105],"also":[107],"offer":[108],"sufficient":[109],"accuracy.":[111],"Bearing":[112],"view":[114],"in":[115,135],"mind,":[116],"devise":[118],"simple":[120],"effective":[122],"framework,":[124],"named":[125],"Voxel":[126,157,219],"R-CNN.":[127],"By":[128],"taking":[129],"full":[130],"advantage":[131],"two-stage":[137],"approach,":[138],"our":[139],"method":[140],"achieves":[141],"comparable":[142],"with":[145],"state-of-the-art":[146],"models,":[148],"at":[150,234,251],"fraction":[152],"cost.":[156],"R-CNN":[158,220],"consists":[159],"backbone":[163],"network,":[164],"2D":[166],"bird-eye-view":[167],"(BEV)":[168],"Region":[169],"Proposal":[170],"Network,":[171],"detect":[174],"head.":[175],"A":[176],"RoI":[178,184],"pooling":[179],"devised":[181],"extract":[183],"directly":[186],"from":[187],"further":[191],"refinement.":[192],"Extensive":[193],"experiments":[194],"conducted":[196],"widely":[199],"used":[200],"KITTI":[201],"Dataset":[202],"more":[205],"recent":[206],"Waymo":[207],"Open":[208],"Dataset.":[209],"Our":[210],"results":[211],"show":[212],"compared":[214],"methods,":[218],"delivers":[221],"higher":[223],"while":[226],"maintaining":[227],"real-time":[229],"frame":[230],"processing":[231],"rate,":[232],"speed":[236],"25":[238],"FPS":[239],"an":[241],"NVIDIA":[242],"RTX":[243],"2080":[244],"Ti":[245],"GPU.":[246],"The":[247],"code":[248],"available":[250],"https://github.com/djiajunustc/Voxel-R-CNN.":[252]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W3118341329","counts_by_year":[{"year":2024,"cited_by_count":143},{"year":2023,"cited_by_count":242},{"year":2022,"cited_by_count":101},{"year":2021,"cited_by_count":27}],"updated_date":"2024-11-28T13:24:55.522773","created_date":"2021-01-18"}