{"id":"https://openalex.org/W4386076111","doi":"https://doi.org/10.1109/cvpr52729.2023.02220","title":"Where We Are and What We're Looking At: Query Based Worldwide Image Geo-localization Using Hierarchies and Scenes","display_name":"Where We Are and What We're Looking At: Query Based Worldwide Image Geo-localization Using Hierarchies and Scenes","publication_year":2023,"publication_date":"2023-06-01","ids":{"openalex":"https://openalex.org/W4386076111","doi":"https://doi.org/10.1109/cvpr52729.2023.02220"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr52729.2023.02220","pdf_url":null,"source":{"id":"https://openalex.org/S4363607701","display_name":"2022 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2303.04249","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110331713","display_name":"Brandon Clark","orcid":null},"institutions":[{"id":"https://openalex.org/I106165777","display_name":"University of Central Florida","ror":"https://ror.org/036nfer12","country_code":"US","type":"education","lineage":["https://openalex.org/I106165777"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Brandon Clark","raw_affiliation_strings":["Center for Research in Computer, Vision University of Central Florida, Orlando, USA"],"affiliations":[{"raw_affiliation_string":"Center for Research in Computer, Vision University of Central Florida, Orlando, USA","institution_ids":["https://openalex.org/I106165777"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026216387","display_name":"Alec Kerrigan","orcid":null},"institutions":[{"id":"https://openalex.org/I106165777","display_name":"University of Central Florida","ror":"https://ror.org/036nfer12","country_code":"US","type":"education","lineage":["https://openalex.org/I106165777"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alec Kerrigan","raw_affiliation_strings":["Center for Research in Computer, Vision University of Central Florida, Orlando, USA"],"affiliations":[{"raw_affiliation_string":"Center for Research in Computer, Vision University of Central Florida, Orlando, USA","institution_ids":["https://openalex.org/I106165777"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062715029","display_name":"Parth Parag Kulkarni","orcid":null},"institutions":[{"id":"https://openalex.org/I106165777","display_name":"University of Central Florida","ror":"https://ror.org/036nfer12","country_code":"US","type":"education","lineage":["https://openalex.org/I106165777"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Parth Parag Kulkarni","raw_affiliation_strings":["Center for Research in Computer, Vision University of Central Florida, Orlando, USA"],"affiliations":[{"raw_affiliation_string":"Center for Research in Computer, Vision University of Central Florida, Orlando, USA","institution_ids":["https://openalex.org/I106165777"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007754816","display_name":"Vicente Vivanco Cepeda","orcid":null},"institutions":[{"id":"https://openalex.org/I106165777","display_name":"University of Central Florida","ror":"https://ror.org/036nfer12","country_code":"US","type":"education","lineage":["https://openalex.org/I106165777"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vicente Vivanco Cepeda","raw_affiliation_strings":["Center for Research in Computer, Vision University of Central Florida, Orlando, USA"],"affiliations":[{"raw_affiliation_string":"Center for Research in Computer, Vision University of Central Florida, Orlando, USA","institution_ids":["https://openalex.org/I106165777"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5080823547","display_name":"Mubarak Shah","orcid":"https://orcid.org/0000-0001-6172-5572"},"institutions":[{"id":"https://openalex.org/I106165777","display_name":"University of Central Florida","ror":"https://ror.org/036nfer12","country_code":"US","type":"education","lineage":["https://openalex.org/I106165777"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mubarak Shah","raw_affiliation_strings":["Center for Research in Computer, Vision University of Central Florida, Orlando, USA"],"affiliations":[{"raw_affiliation_string":"Center for Research in Computer, Vision University of Central Florida, Orlando, USA","institution_ids":["https://openalex.org/I106165777"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.069,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.42393,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":95},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9981,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.9968,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/geographic-coordinate-system","display_name":"Geographic coordinate system","score":0.61722493},{"id":"https://openalex.org/keywords/granularity","display_name":"Granularity","score":0.4599378},{"id":"https://openalex.org/keywords/representation","display_name":"Representation","score":0.45425797},{"id":"https://openalex.org/keywords/geotagging","display_name":"Geotagging","score":0.42480925}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.80678797},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.7322849},{"id":"https://openalex.org/C123046963","wikidata":"https://www.wikidata.org/wiki/Q22664","display_name":"Geographic coordinate system","level":2,"score":0.61722493},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.59632295},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.46965116},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.4599378},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4552199},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.45425797},{"id":"https://openalex.org/C53605480","wikidata":"https://www.wikidata.org/wiki/Q852595","display_name":"Geotagging","level":2,"score":0.42480925},{"id":"https://openalex.org/C31170391","wikidata":"https://www.wikidata.org/wiki/Q188619","display_name":"Hierarchy","level":2,"score":0.41449678},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3434938},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3237859},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.19381768},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.13886476},{"id":"https://openalex.org/C34447519","wikidata":"https://www.wikidata.org/wiki/Q179522","display_name":"Market economy","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr52729.2023.02220","pdf_url":null,"source":{"id":"https://openalex.org/S4363607701","display_name":"2022 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2303.04249","pdf_url":"https://arxiv.org/pdf/2303.04249","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2303.04249","pdf_url":"https://arxiv.org/pdf/2303.04249","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"score":0.82,"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":23,"referenced_works":["https://openalex.org/W2103163130","https://openalex.org/W2250384498","https://openalex.org/W2284646714","https://openalex.org/W2587639398","https://openalex.org/W2732026016","https://openalex.org/W2886604692","https://openalex.org/W2895392434","https://openalex.org/W2964213180","https://openalex.org/W2971132234","https://openalex.org/W2981670313","https://openalex.org/W3023735075","https://openalex.org/W3030520226","https://openalex.org/W3035158519","https://openalex.org/W3094502228","https://openalex.org/W3138516171","https://openalex.org/W3160331414","https://openalex.org/W3169064633","https://openalex.org/W3174800995","https://openalex.org/W3179267034","https://openalex.org/W4212816667","https://openalex.org/W4312478462","https://openalex.org/W4312703192","https://openalex.org/W4320013936"],"related_works":["https://openalex.org/W4367046659","https://openalex.org/W4289559977","https://openalex.org/W2997512100","https://openalex.org/W2950265648","https://openalex.org/W2909382770","https://openalex.org/W2461263520","https://openalex.org/W2393933887","https://openalex.org/W2331043530","https://openalex.org/W2087332570","https://openalex.org/W1594844924"],"abstract_inverted_index":{"Determining":[0],"the":[1,24,59,71,88,101,140,155,192,212,245,252],"exact":[2],"latitude":[3],"and":[4,14,74,100,123,167,184,248],"longitude":[5],"that":[6,63,86],"a":[7,12,117,129,214,231],"photo":[8],"was":[9],"taken":[10,206,240],"is":[11],"useful":[13],"widely":[15],"applicable":[16],"task,":[17,217],"yet":[18],"it":[19,220],"remains":[20],"exceptionally":[21],"difficult":[22],"despite":[23],"accelerated":[25],"progress":[26],"of":[27,41,51,154,201,238,251],"other":[28],"computer":[29],"vision":[30],"tasks.":[31],"Most":[32],"previous":[33,193,196],"approaches":[34,55],"have":[35],"opted":[36],"to":[37,57,66,97],"learn":[38,128],"single":[39],"representations":[40,179],"query":[42,118],"images,":[43],"which":[44,186,210],"are":[45,143],"then":[46],"classified":[47],"at":[48,260],"different":[49,60,67,91,133,137,148,178,181],"levels":[50,93],"geographic":[52,92,121],"granularity.":[53],"These":[54],"fail":[56],"exploit":[58],"visual":[61,103,149,182],"cues":[62],"give":[64],"context":[65],"hierarchies,":[68],"such":[69],"as":[70,98,136,169,171],"country,":[72],"state,":[73],"city":[75],"level.":[76],"To":[77,225],"this":[78,114,227],"end,":[79],"we":[80,95,127,229],"introduce":[81,230],"an":[82,107],"end-to-end":[83],"transformer-based":[84],"architecture":[85],"exploits":[87],"relationship":[89],"between":[90],"(which":[94],"refer":[96],"hierarchies)":[99],"corresponding":[102],"scene":[104,124],"information":[105],"in":[106,139,191],"image":[108],"through":[109],"hierarchical":[110],"cross-attention.":[111],"We":[112,151],"achieve":[113,152],"by":[115,146],"learning":[116],"for":[119,132,180],"each":[120],"hierarchy":[122],"type.":[125],"Furthermore,":[126],"separate":[130],"representation":[131],"environmental":[134],"scenes,":[135,185],"scenes":[138],"same":[141],"location":[142],"often":[144],"defined":[145],"completely":[147],"features.":[150],"state":[153,250],"art":[156,253],"accuracy":[157],"on":[158],"4":[159],"standard":[160],"geo-localization":[161],"datasets":[162,198],":":[163],"Im2GPS,":[164],"Im2GPS3k,":[165],"YFCC4k,":[166],"YFCC26k,":[168],"well":[170],"qualitatively":[172],"demonstrate":[173],"how":[174],"our":[175],"method":[176],"learns":[177],"hierarchies":[183],"has":[187],"not":[188],"been":[189],"demonstrated":[190],"methods.":[194],"Above":[195],"testing":[197,234],"mostly":[199],"consist":[200],"iconic":[202],"landmarks":[203],"or":[204,218],"images":[205,239],"from":[207,241],"social":[208],"media,":[209],"makes":[211,219],"dataset":[213],"simple":[215],"memory":[216],"biased":[221],"towards":[222],"certain":[223],"places.":[224],"address":[226],"issue":[228],"much":[232],"harder":[233],"dataset,":[235],"Google-World-Streets-15k,":[236],"comprised":[237],"Google":[242],"Streetview":[243],"covering":[244],"whole":[246],"planet":[247],"present":[249],"results.":[254],"Our":[255],"code":[256],"can":[257],"be":[258],"found":[259],"https://github.com/AHKerrigan/GeoGuessNet.":[261]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4386076111","counts_by_year":[{"year":2024,"cited_by_count":8}],"updated_date":"2025-01-21T06:06:58.266301","created_date":"2023-08-23"}