{"id":"https://openalex.org/W4386083094","doi":"https://doi.org/10.1109/cvpr52729.2023.02205","title":"Query - Dependent Video Representation for Moment Retrieval and Highlight Detection","display_name":"Query - Dependent Video Representation for Moment Retrieval and Highlight Detection","publication_year":2023,"publication_date":"2023-06-01","ids":{"openalex":"https://openalex.org/W4386083094","doi":"https://doi.org/10.1109/cvpr52729.2023.02205"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr52729.2023.02205","pdf_url":null,"source":{"id":"https://openalex.org/S4363607701","display_name":"2022 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2303.13874","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001141317","display_name":"WonJun Moon","orcid":"https://orcid.org/0000-0003-2805-0926"},"institutions":[{"id":"https://openalex.org/I848706","display_name":"Sungkyunkwan University","ror":"https://ror.org/04q78tk20","country_code":"KR","type":"education","lineage":["https://openalex.org/I848706"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"WonJun Moon","raw_affiliation_strings":["Sungkyunkwan University"],"affiliations":[{"raw_affiliation_string":"Sungkyunkwan University","institution_ids":["https://openalex.org/I848706"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057187648","display_name":"Sangeek Hyun","orcid":"https://orcid.org/0000-0002-4050-6896"},"institutions":[{"id":"https://openalex.org/I848706","display_name":"Sungkyunkwan University","ror":"https://ror.org/04q78tk20","country_code":"KR","type":"education","lineage":["https://openalex.org/I848706"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Sangeek Hyun","raw_affiliation_strings":["Sungkyunkwan University"],"affiliations":[{"raw_affiliation_string":"Sungkyunkwan University","institution_ids":["https://openalex.org/I848706"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112985513","display_name":"SangUk Park","orcid":null},"institutions":[{"id":"https://openalex.org/I4210106348","display_name":"Teylers Museum","ror":"https://ror.org/01f0ym620","country_code":"NL","type":"archive","lineage":["https://openalex.org/I4210106348"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"SangUk Park","raw_affiliation_strings":["Pyler"],"affiliations":[{"raw_affiliation_string":"Pyler","institution_ids":["https://openalex.org/I4210106348"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066171177","display_name":"Dongchan Park","orcid":"https://orcid.org/0000-0002-6098-0210"},"institutions":[{"id":"https://openalex.org/I4210106348","display_name":"Teylers Museum","ror":"https://ror.org/01f0ym620","country_code":"NL","type":"archive","lineage":["https://openalex.org/I4210106348"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Dongchan Park","raw_affiliation_strings":["Pyler"],"affiliations":[{"raw_affiliation_string":"Pyler","institution_ids":["https://openalex.org/I4210106348"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5029469141","display_name":"Jae\u2010Pil Heo","orcid":"https://orcid.org/0000-0001-9684-7641"},"institutions":[{"id":"https://openalex.org/I848706","display_name":"Sungkyunkwan University","ror":"https://ror.org/04q78tk20","country_code":"KR","type":"education","lineage":["https://openalex.org/I848706"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jae-Pil Heo","raw_affiliation_strings":["Sungkyunkwan University"],"affiliations":[{"raw_affiliation_string":"Sungkyunkwan University","institution_ids":["https://openalex.org/I848706"]}]}],"institution_assertions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":11.236,"has_fulltext":false,"cited_by_count":43,"citation_normalized_percentile":{"value":0.999956,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"23023","last_page":"23033"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.63440686},{"id":"https://openalex.org/keywords/video-retrieval","display_name":"Video retrieval","score":0.43674967}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.760391},{"id":"https://openalex.org/C99016210","wikidata":"https://www.wikidata.org/wiki/Q5488129","display_name":"Query expansion","level":2,"score":0.6440673},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.63440686},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5926293},{"id":"https://openalex.org/C157692150","wikidata":"https://www.wikidata.org/wiki/Q2919848","display_name":"Query optimization","level":2,"score":0.5612693},{"id":"https://openalex.org/C192939062","wikidata":"https://www.wikidata.org/wiki/Q104840822","display_name":"Sargable","level":4,"score":0.49411824},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.44182116},{"id":"https://openalex.org/C2983174267","wikidata":"https://www.wikidata.org/wiki/Q3775098","display_name":"Video retrieval","level":2,"score":0.43674967},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4311891},{"id":"https://openalex.org/C118689300","wikidata":"https://www.wikidata.org/wiki/Q7978614","display_name":"Web query classification","level":4,"score":0.4223683},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.37316817},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.310233},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.16585708},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr52729.2023.02205","pdf_url":null,"source":{"id":"https://openalex.org/S4363607701","display_name":"2022 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2303.13874","pdf_url":"http://arxiv.org/pdf/2303.13874","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2303.13874","pdf_url":"http://arxiv.org/pdf/2303.13874","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[{"score":0.51,"id":"https://metadata.un.org/sdg/4","display_name":"Quality education"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":59,"referenced_works":["https://openalex.org/W1924343884","https://openalex.org/W1958932515","https://openalex.org/W2103908291","https://openalex.org/W2194775991","https://openalex.org/W2467794422","https://openalex.org/W2512435841","https://openalex.org/W2737677090","https://openalex.org/W2776277180","https://openalex.org/W2798354744","https://openalex.org/W2897091983","https://openalex.org/W2904824998","https://openalex.org/W2919974746","https://openalex.org/W2962766617","https://openalex.org/W2962869524","https://openalex.org/W2963017553","https://openalex.org/W2963095467","https://openalex.org/W2963351448","https://openalex.org/W2963729528","https://openalex.org/W2963919999","https://openalex.org/W2964089981","https://openalex.org/W2964158702","https://openalex.org/W2964232540","https://openalex.org/W2966848258","https://openalex.org/W2970401629","https://openalex.org/W2970898753","https://openalex.org/W2996108195","https://openalex.org/W2997429269","https://openalex.org/W2998495542","https://openalex.org/W3034743747","https://openalex.org/W3092462694","https://openalex.org/W3096609285","https://openalex.org/W3100255860","https://openalex.org/W3104862079","https://openalex.org/W3106775073","https://openalex.org/W3109316002","https://openalex.org/W3159619744","https://openalex.org/W3170874841","https://openalex.org/W3196253003","https://openalex.org/W3201832684","https://openalex.org/W3202168743","https://openalex.org/W3203003533","https://openalex.org/W3210314917","https://openalex.org/W3213165621","https://openalex.org/W3214448253","https://openalex.org/W329267344","https://openalex.org/W4214582399","https://openalex.org/W4214627427","https://openalex.org/W4221166385","https://openalex.org/W4226013992","https://openalex.org/W4283819318","https://openalex.org/W4312312588","https://openalex.org/W4312447943","https://openalex.org/W4312544061","https://openalex.org/W4312680331","https://openalex.org/W4312693115","https://openalex.org/W4312713480","https://openalex.org/W4312815172","https://openalex.org/W4385245566","https://openalex.org/W4390873008"],"related_works":["https://openalex.org/W2901901036","https://openalex.org/W2572349046","https://openalex.org/W2538384344","https://openalex.org/W2124814993","https://openalex.org/W2096359267","https://openalex.org/W2093300859","https://openalex.org/W2026738364","https://openalex.org/W2013069866","https://openalex.org/W1793997780","https://openalex.org/W1560919561"],"abstract_inverted_index":{"Recently,":[0],"video":[1,15,74,130],"moment":[2,29,82],"retrieval":[3],"and":[4,30,73,83,218],"highlight":[5],"detection":[6,96],"(MR/HD)":[7],"are":[8,157,222],"being":[9],"spotlighted":[10],"as":[11],"the":[12,28,39,44,60,68,81,104,124,135,140,145,168,187,193,201,205],"demand":[13],"for":[14,99,192,208],"understanding":[16],"is":[17,25,76],"drastically":[18],"increased.":[19],"The":[20],"key":[21],"objective":[22],"of":[23,62,107,126,138,189,203],"MR/HD":[24],"to":[26,38,121,133,148,159,170],"localize":[27],"estimate":[31,171],"clip-wise":[32],"accordance":[33,173],"level,":[34],"i.e.,":[35],"saliency":[36,162,182,190],"score,":[37],"given":[40,64,109,194],"text":[41,71,127],"query.":[42,65],"Although":[43],"recent":[45],"transformer-based":[46],"models":[47],"brought":[48],"some":[49],"advances,":[50],"we":[51,90,102,143,178],"found":[52],"that":[53],"these":[54],"methods":[55,214],"do":[56],"not":[57],"fully":[58],"exploit":[59],"information":[61],"a":[63,95,108],"For":[66],"example,":[67],"relevance":[69],"between":[70,174],"query":[72,110,128,141],"contents":[75],"sometimes":[77],"neglected":[78],"when":[79],"predicting":[80],"its":[84],"saliency.":[85],"To":[86],"tackle":[87],"this":[88],"issue,":[89],"introduce":[91],"Query-Dependent":[92],"DETR":[93],"(QD-DETR),":[94],"transformer":[97,112],"tailored":[98],"MR/HD.":[100,209],"As":[101],"observe":[103],"insignificant":[105],"role":[106],"in":[111,165],"architectures,":[113],"our":[114],"encoding":[115],"module":[116],"starts":[117],"with":[118],"cross-attention":[119],"layers":[120],"explicitly":[122],"inject":[123],"context":[125],"into":[129],"representation.":[131],"Then,":[132],"enhance":[134],"model's":[136],"capability":[137],"exploiting":[139],"information,":[142],"manipulate":[144],"video-query":[146,155,195],"pairs":[147,156],"produce":[149],"irrelevant":[150],"pairs.":[151,176,196],"Such":[152],"negative":[153],"(irrelevant)":[154],"trained":[158],"yield":[160],"low":[161],"scores,":[163],"which":[164,184],"turn,":[166],"encourages":[167],"model":[169],"precise":[172],"query-video":[175],"Lastly,":[177],"present":[179],"an":[180],"input-adaptive":[181],"predictor":[183],"adaptively":[185],"defines":[186],"criterion":[188],"scores":[191],"Our":[197],"extensive":[198],"studies":[199],"verify":[200],"importance":[202],"building":[204],"query-dependent":[206],"representation":[207],"Specifically,":[210],"QD-DETR":[211],"outperforms":[212],"state-of-the-art":[213],"on":[215],"QVHighlights,":[216],"TVSum,":[217],"Charades-STA":[219],"datasets.":[220],"Codes":[221],"available":[223],"at":[224],"github.com/wjun0830IQD-DETR.":[225]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4386083094","counts_by_year":[{"year":2024,"cited_by_count":31},{"year":2023,"cited_by_count":6}],"updated_date":"2024-12-26T14:50:46.708157","created_date":"2023-08-23"}