{"id":"https://openalex.org/W4387560259","doi":"https://doi.org/10.48550/arxiv.2310.05666","title":"Anchor-Intermediate Detector: Decoupling and Coupling Bounding Boxes for Accurate Object Detection","display_name":"Anchor-Intermediate Detector: Decoupling and Coupling Bounding Boxes for Accurate Object Detection","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4387560259","doi":"https://doi.org/10.48550/arxiv.2310.05666"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2310.05666","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2310.05666","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001189481","display_name":"Yilong Lv","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lv, Yilong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101816655","display_name":"Min Li","orcid":"https://orcid.org/0000-0003-0128-5143"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Min","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062694900","display_name":"Yujie He","orcid":"https://orcid.org/0000-0002-2299-4945"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Yujie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100737906","display_name":"Shaopeng Li","orcid":"https://orcid.org/0000-0001-7560-9951"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Shaopeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087413884","display_name":"Zhuzhen He","orcid":"https://orcid.org/0009-0008-8056-0863"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Zhuzhen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5084958010","display_name":"Aitao Yang","orcid":"https://orcid.org/0000-0003-2535-2371"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Aitao","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.700164,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":65,"max":76},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9989,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9989,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9828,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9758,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.78632975},{"id":"https://openalex.org/keywords/decoupling","display_name":"Decoupling (probability)","score":0.70133966},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.66085476},{"id":"https://openalex.org/keywords/corner-detection","display_name":"Corner detection","score":0.42735028}],"concepts":[{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.78632975},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.7278997},{"id":"https://openalex.org/C205606062","wikidata":"https://www.wikidata.org/wiki/Q5249645","display_name":"Decoupling (probability)","level":2,"score":0.70133966},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.66085476},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.61625224},{"id":"https://openalex.org/C175291020","wikidata":"https://www.wikidata.org/wiki/Q1156822","display_name":"Offset (computer science)","level":2,"score":0.59928936},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.56212956},{"id":"https://openalex.org/C39499422","wikidata":"https://www.wikidata.org/wiki/Q697320","display_name":"Corner detection","level":3,"score":0.42735028},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.41785342},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.41682377},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4027045},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37981433},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.32107323},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.29018468},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.21893165},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.19935867},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.14122635},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.08046931},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2310.05666","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2310.05666","pdf_url":"http://arxiv.org/pdf/2310.05666","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2310.05666","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2310.05666","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4390524233","https://openalex.org/W4287027631","https://openalex.org/W4237171675","https://openalex.org/W3209723314","https://openalex.org/W3205398323","https://openalex.org/W3192357901","https://openalex.org/W3036286480","https://openalex.org/W2952736415","https://openalex.org/W2883297582","https://openalex.org/W2387360586"],"abstract_inverted_index":{"Anchor-based":[0],"detectors":[1],"have":[2],"been":[3],"continuously":[4],"developed":[5],"for":[6],"object":[7],"detection.":[8],"However,":[9],"the":[10,19,49,54,60,65,79,84,91,102,126,134,146,164],"individual":[11],"anchor":[12],"box":[13,28,131],"makes":[14],"it":[15],"difficult":[16],"to":[17,39,73,82,124,132],"predict":[18],"boundary's":[20],"offset":[21],"accurately.":[22],"Instead":[23],"of":[24,68,128],"taking":[25],"each":[26,74,129],"bounding":[27,130],"as":[29],"a":[30,94],"closed":[31],"individual,":[32],"we":[33,77],"consider":[34],"using":[35],"multiple":[36],"boxes":[37],"together":[38],"get":[40],"prediction":[41],"boxes.":[42,70],"To":[43,89],"this":[44,46],"end,":[45],"paper":[47],"proposes":[48],"\\textbf{Box":[50],"Decouple-Couple(BDC)":[51],"strategy}":[52],"in":[53],"inference,":[55],"which":[56,105],"no":[57],"longer":[58],"discards":[59],"overlapping":[61],"boxes,":[62],"but":[63,96],"decouples":[64],"corner":[66,80,87,137],"points":[67,81],"these":[69],"Then,":[71],"according":[72],"corner's":[75],"score,":[76],"couple":[78],"select":[83],"most":[85],"accurate":[86],"pairs.":[88],"meet":[90],"BDC":[92],"strategy,":[93],"simple":[95],"novel":[97],"model":[98],"is":[99,122,175],"designed":[100],"named":[101],"\\textbf{Anchor-Intermediate":[103],"Detector(AID)},":[104],"contains":[106],"two":[107],"head":[108,113,121],"networks,":[109],"i.e.,":[110],"an":[111,115],"anchor-based":[112],"and":[114,155,160,172],"anchor-free":[116],"\\textbf{Corner-aware":[117],"head}.":[118],"The":[119],"corner-aware":[120],"able":[123],"score":[125],"corners":[127],"facilitate":[133],"coupling":[135],"between":[136],"points.":[138],"Extensive":[139],"experiments":[140],"on":[141,163],"MS":[142,165],"COCO":[143,166],"show":[144],"that":[145],"proposed":[147],"anchor-intermediate":[148],"detector":[149],"respectively":[150],"outperforms":[151],"their":[152],"baseline":[153],"RetinaNet":[154],"GFL":[156],"method":[157],"by":[158],"$\\sim$2.4":[159],"$\\sim$1.2":[161],"AP":[162],"test-dev":[167],"dataset":[168],"without":[169],"any":[170],"bells":[171],"whistles.":[173],"Code":[174],"available":[176],"at:":[177],"https://github.com/YilongLv/AID.":[178]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4387560259","counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-04-21T22:41:41.710324","created_date":"2023-10-12"}