{"id":"https://openalex.org/W4399838053","doi":"https://doi.org/10.48550/arxiv.2406.12831","title":"VIA: A Spatiotemporal Video Adaptation Framework for Global and Local\n Video Editing","display_name":"VIA: A Spatiotemporal Video Adaptation Framework for Global and Local\n Video Editing","publication_year":2024,"publication_date":"2024-06-18","ids":{"openalex":"https://openalex.org/W4399838053","doi":"https://doi.org/10.48550/arxiv.2406.12831"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.12831","pdf_url":"http://arxiv.org/pdf/2406.12831","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2406.12831","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100370035","display_name":"Jing Gu","orcid":"https://orcid.org/0000-0002-4035-9072"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gu, Jing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102952667","display_name":"Yuwei Fang","orcid":"https://orcid.org/0000-0002-8684-089X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fang, Yuwei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028188014","display_name":"Ivan Skorokhodov","orcid":"https://orcid.org/0000-0002-7611-9310"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Skorokhodov, Ivan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076768552","display_name":"Peter Wonka","orcid":"https://orcid.org/0000-0003-0627-9746"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wonka, Peter","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101382802","display_name":"Xinya Du","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Du, Xinya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058028206","display_name":"Sergey Tulyakov","orcid":"https://orcid.org/0000-0003-3465-1592"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tulyakov, Sergey","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100328100","display_name":"Xin Wang","orcid":"https://orcid.org/0000-0003-2605-5504"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Xin Eric","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":77},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9685,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9685,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9387,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/video-editing","display_name":"Video editing","score":0.5096445}],"concepts":[{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.6680991},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.65302795},{"id":"https://openalex.org/C2780310081","wikidata":"https://www.wikidata.org/wiki/Q1154312","display_name":"Video editing","level":2,"score":0.5096445},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.39469346},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.092068136},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.12831","pdf_url":"http://arxiv.org/pdf/2406.12831","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.12831","pdf_url":"http://arxiv.org/pdf/2406.12831","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4396701345","https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2388962967","https://openalex.org/W2376932109","https://openalex.org/W2368355376","https://openalex.org/W2365286546","https://openalex.org/W2358668433","https://openalex.org/W2001405890"],"abstract_inverted_index":{"Video":[0],"editing":[1,68,87,95,102,149,195,204],"stands":[2],"as":[3],"a":[4,51,84,92],"cornerstone":[5],"of":[6,23,66,81],"digital":[7],"media,":[8],"from":[9],"entertainment":[10],"and":[11,28,34,59,104,108,138,178],"education":[12],"to":[13,32,72,118,146,156,168],"professional":[14],"communication.":[15],"However,":[16],"previous":[17],"methods":[18],"often":[19],"overlook":[20],"the":[21,38,64,79,105,123,143,148,169,175,199],"necessity":[22],"comprehensively":[24],"understanding":[25],"both":[26],"global":[27,58,120],"local":[29,60,74,115,182],"contexts,":[30],"leading":[31],"inaccurate":[33],"inconsistency":[35],"edits":[36,163],"in":[37,135,174,181,196],"spatiotemporal":[39,53,128,176],"dimension,":[40],"especially":[41],"for":[42,57,97,113,201],"long":[43,193,207],"videos.":[44,70],"In":[45],"this":[46],"paper,":[47],"we":[48,126,186],"introduce":[49,127],"VIA,":[50],"unified":[52],"VIdeo":[54],"Adaptation":[55],"framework":[56],"video":[61,124,194,203,208],"editing,":[62],"pushing":[63],"limits":[65],"consistently":[67],"minute-long":[69],"First,":[71],"ensure":[73],"consistency":[75,99,121],"within":[76],"individual":[77],"frames,":[78],"foundation":[80],"VIA":[82,160,189],"is":[83],"novel":[85],"test-time":[86],"adaptation":[88,129],"method,":[89],"which":[90],"adapts":[91,109,131],"pre-trained":[93],"image":[94],"model":[96],"improving":[98],"between":[100],"potential":[101],"directions":[103],"text":[106],"instruction,":[107],"masked":[110],"latent":[111],"variables":[112,134],"precise":[114,180],"control.":[116,183],"Furthermore,":[117],"maintain":[119],"over":[122,206],"sequence,":[125],"that":[130,164,188],"consistent":[132,192],"attention":[133],"key":[136],"frames":[137],"strategically":[139],"applies":[140],"them":[141],"across":[142],"whole":[144],"sequence":[145],"realize":[147],"effects.":[150],"Extensive":[151],"experiments":[152],"demonstrate":[153],"that,":[154],"compared":[155],"baseline":[157],"methods,":[158],"our":[159],"approach":[161],"produces":[162],"are":[165],"more":[166,172,179],"faithful":[167],"source":[170],"videos,":[171],"coherent":[173],"context,":[177],"More":[184],"importantly,":[185],"show":[187],"can":[190],"achieve":[191],"minutes,":[197],"unlocking":[198],"potentials":[200],"advanced":[202],"tasks":[205],"sequences.":[209]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4399838053","counts_by_year":[],"updated_date":"2025-04-19T04:52:49.183335","created_date":"2024-06-20"}