{"id":"https://openalex.org/W4387623711","doi":"https://doi.org/10.1109/tpami.2023.3324021","title":"Towards Codebook-Free Deep Probabilistic Quantization for Image Retrieval","display_name":"Towards Codebook-Free Deep Probabilistic Quantization for Image Retrieval","publication_year":2023,"publication_date":"2023-10-13","ids":{"openalex":"https://openalex.org/W4387623711","doi":"https://doi.org/10.1109/tpami.2023.3324021","pmid":"https://pubmed.ncbi.nlm.nih.gov/37831563"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2023.3324021","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100340979","display_name":"Min Wang","orcid":"https://orcid.org/0000-0003-3048-6980"},"institutions":[],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Min Wang","raw_affiliation_strings":["Institute of Artificial Intelligence, Hefei Comprehensive National Science Center, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Hefei Comprehensive National Science Center, Hefei, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046805800","display_name":"Wengang Zhou","orcid":"https://orcid.org/0000-0003-1690-9836"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wengang Zhou","raw_affiliation_strings":["Department of Electronic Engineering and Information Science, CAS Key Laboratory of Technology in Geo-spatial Information Processing and Application System, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Department of Electronic Engineering and Information Science, CAS Key Laboratory of Technology in Geo-spatial Information Processing and Application System, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103015022","display_name":"Yao Xin","orcid":"https://orcid.org/0000-0002-2166-9315"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Yao","raw_affiliation_strings":["Department of Electronic Engineering and Information Science, CAS Key Laboratory of Technology in Geo-spatial Information Processing and Application System, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Department of Electronic Engineering and Information Science, CAS Key Laboratory of Technology in Geo-spatial Information Processing and Application System, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100393506","display_name":"Qi Tian","orcid":"https://orcid.org/0000-0002-7252-5047"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Tian","raw_affiliation_strings":["Artificial Intelligence, Cloud BU, Huawei, China"],"affiliations":[{"raw_affiliation_string":"Artificial Intelligence, Cloud BU, Huawei, China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078141810","display_name":"Houqiang Li","orcid":"https://orcid.org/0000-0003-2188-3028"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Houqiang Li","raw_affiliation_strings":["Department of Electronic Engineering and Information Science, CAS Key Laboratory of Technology in Geo-spatial Information Processing and Application System, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Department of Electronic Engineering and Information Science, CAS Key Laboratory of Technology in Geo-spatial Information Processing and Application System, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.325,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.588886,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":69,"max":80},"biblio":{"volume":"46","issue":"1","first_page":"626","last_page":"640"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Image Feature Retrieval and Recognition Techniques","score":0.9997,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Image Feature Retrieval and Recognition Techniques","score":0.9997,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Shape Matching and Object Recognition","score":0.9988,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Advances in Transfer Learning and Domain Adaptation","score":0.9804,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image Retrieval","score":0.549084},{"id":"https://openalex.org/keywords/content-based-image-retrieval","display_name":"Content-Based Image Retrieval","score":0.545266},{"id":"https://openalex.org/keywords/visual-recognition","display_name":"Visual Recognition","score":0.529202},{"id":"https://openalex.org/keywords/representation-learning","display_name":"Representation Learning","score":0.525199},{"id":"https://openalex.org/keywords/feature-matching","display_name":"Feature Matching","score":0.521918},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.50445473},{"id":"https://openalex.org/keywords/centroid","display_name":"Centroid","score":0.46578494},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.42578197}],"concepts":[{"id":"https://openalex.org/C127759330","wikidata":"https://www.wikidata.org/wiki/Q637416","display_name":"Codebook","level":2,"score":0.7192094},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6808585},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6580781},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.629079},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.6110087},{"id":"https://openalex.org/C199833920","wikidata":"https://www.wikidata.org/wiki/Q612536","display_name":"Vector quantization","level":2,"score":0.59418523},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.5897346},{"id":"https://openalex.org/C24881265","wikidata":"https://www.wikidata.org/wiki/Q757267","display_name":"Voronoi diagram","level":2,"score":0.5848432},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.50445473},{"id":"https://openalex.org/C189391414","wikidata":"https://www.wikidata.org/wiki/Q7936579","display_name":"Visual Word","level":4,"score":0.47711352},{"id":"https://openalex.org/C146599234","wikidata":"https://www.wikidata.org/wiki/Q511093","display_name":"Centroid","level":2,"score":0.46578494},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.43299574},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.42578197},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.41173717},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3016336},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2667645},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.18785155},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2023.3324021","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/37831563","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":["National Institutes of Health"],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.76,"display_name":"Reduced inequalities"}],"grants":[{"funder":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China","award_id":"61836011"},{"funder":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China","award_id":"62102128"},{"funder":"https://openalex.org/F4320325599","funder_display_name":"University of Science and Technology of China","award_id":null}],"datasets":[],"versions":[],"referenced_works_count":40,"referenced_works":["https://openalex.org/W1566135517","https://openalex.org/W1861492603","https://openalex.org/W1910300841","https://openalex.org/W1974647172","https://openalex.org/W1992371516","https://openalex.org/W2007972815","https://openalex.org/W2108598243","https://openalex.org/W2117539524","https://openalex.org/W2119717200","https://openalex.org/W2124386111","https://openalex.org/W2124509324","https://openalex.org/W2148554573","https://openalex.org/W2194775991","https://openalex.org/W2293824885","https://openalex.org/W2473499128","https://openalex.org/W2508837377","https://openalex.org/W2538995153","https://openalex.org/W2562322388","https://openalex.org/W2738649458","https://openalex.org/W2765323189","https://openalex.org/W2781821509","https://openalex.org/W2798834175","https://openalex.org/W2799245683","https://openalex.org/W2889024947","https://openalex.org/W2889119508","https://openalex.org/W2962849264","https://openalex.org/W2964280870","https://openalex.org/W2966153044","https://openalex.org/W2966196493","https://openalex.org/W2974986023","https://openalex.org/W2982512683","https://openalex.org/W2997729898","https://openalex.org/W3003460937","https://openalex.org/W3034239448","https://openalex.org/W3035732386","https://openalex.org/W3093826451","https://openalex.org/W3114063012","https://openalex.org/W3170038038","https://openalex.org/W3176085205","https://openalex.org/W4313153605"],"related_works":["https://openalex.org/W2391875658","https://openalex.org/W2387054321","https://openalex.org/W2352648934","https://openalex.org/W2148772884","https://openalex.org/W2100120615","https://openalex.org/W2062765737","https://openalex.org/W2017514583","https://openalex.org/W2017401491","https://openalex.org/W2012827167","https://openalex.org/W1929869830"],"abstract_inverted_index":{"As":[0],"a":[1,77,174],"classical":[2],"feature":[3,22,29,61],"compression":[4],"technique,":[5],"quantization":[6,18,81,182],"is":[7,44,169],"usually":[8],"coupled":[9],"with":[10,129,160],"inverted":[11,88,115,127,158],"indices":[12,89],"for":[13,51],"scalable":[14],"image":[15,53,103,124,188,199],"retrieval.":[16,54,200],"Most":[17],"methods":[19],"explicitly":[20],"divide":[21],"space":[23,49,62,178],"into":[24,34,113,125],"Voronoi":[25,42,70],"cells,":[26],"and":[27,106,135],"quantize":[28,122],"vectors":[30],"in":[31],"each":[32,114,123,140],"cell":[33],"the":[35,97,126,130,137,148,154,157,166,191],"centroids":[36],"learned":[37],"from":[38],"data":[39],"distribution.":[40],"However,":[41],"decomposition":[43],"difficult":[45],"to":[46,152,173],"achieve":[47],"discriminative":[48,177],"partition":[50,63,179],"semantic":[52,198],"In":[55,94,163],"this":[56,73,164],"paper,":[57],"we":[58,75,120],"explore":[59],"semantic-aware":[60],"by":[64],"deep":[65,79,98,149],"neural":[66,99,150],"network":[67,100,151],"instead":[68],"of":[69,110,139,156,193],"cells.":[71],"To":[72],"end,":[74],"propose":[76],"new":[78],"probabilistic":[80],"method,":[82,96],"abbreviated":[83],"as":[84,104],"DeepIndex,":[85],"which":[86],"constructs":[87],"without":[90],"explicit":[91],"centroid":[92],"learning.":[93],"our":[95,194],"takes":[101],"an":[102],"input":[105],"outputs":[107],"its":[108],"probability":[109,155],"being":[111],"put":[112],"index":[116],"list.":[117],"During":[118],"training,":[119],"progressively":[121],"lists":[128],"top-":[131],"T":[132],"maximal":[133,161],"probabilities,":[134],"calculate":[136],"reward":[138],"trial":[141],"based":[142],"on":[143,186,197],"retrieval":[144,167],"accuracy.":[145],"We":[146],"optimize":[147],"maximize":[153],"list":[159],"reward.":[162],"way,":[165],"performance":[168],"directly":[170],"optimized,":[171],"leading":[172],"more":[175],"semantically":[176],"than":[180],"other":[181],"methods.":[183],"The":[184],"experiments":[185],"public":[187],"datasets":[189],"demonstrate":[190],"effectiveness":[192],"DeepIndex":[195],"method":[196]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4387623711","counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2024-12-01T00:48:12.141320","created_date":"2023-10-14"}