{"id":"https://openalex.org/W4402699833","doi":"https://doi.org/10.48550/arxiv.2408.13239","title":"CustomCrafter: Customized Video Generation with Preserving Motion and\n Concept Composition Abilities","display_name":"CustomCrafter: Customized Video Generation with Preserving Motion and\n Concept Composition Abilities","publication_year":2024,"publication_date":"2024-08-23","ids":{"openalex":"https://openalex.org/W4402699833","doi":"https://doi.org/10.48550/arxiv.2408.13239"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.13239","pdf_url":"http://arxiv.org/pdf/2408.13239","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2408.13239","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101576189","display_name":"Tao Wu","orcid":"https://orcid.org/0000-0002-6925-109X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Tao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100419716","display_name":"Yong Zhang","orcid":"https://orcid.org/0000-0001-6577-5235"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101538534","display_name":"Xintao Wang","orcid":"https://orcid.org/0000-0001-6585-8604"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Xintao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039357854","display_name":"Xianpan Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Xianpan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088316957","display_name":"Guangcong Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Guangcong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101500719","display_name":"Zhongang Qi","orcid":"https://orcid.org/0000-0001-8298-4063"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qi, Zhongang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102004349","display_name":"Ying Shan","orcid":"https://orcid.org/0000-0001-7673-8325"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shan, Ying","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5111337285","display_name":"Xi Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Xi","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":83},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9915,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9915,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9903,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.9634,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[],"concepts":[{"id":"https://openalex.org/C40231798","wikidata":"https://www.wikidata.org/wiki/Q1333743","display_name":"Composition (language)","level":2,"score":0.68678683},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.63928884},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.550542},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.40249762},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36672354},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.096114576},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.13239","pdf_url":"http://arxiv.org/pdf/2408.13239","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.13239","pdf_url":"http://arxiv.org/pdf/2408.13239","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3116076068","https://openalex.org/W2951359407","https://openalex.org/W2775347418","https://openalex.org/W2772917594","https://openalex.org/W2755342338","https://openalex.org/W2229312674","https://openalex.org/W2166024367","https://openalex.org/W2079911747","https://openalex.org/W2058170566","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Customized":[0],"video":[1,34,52,107,159],"generation":[2,100,203],"aims":[3],"to":[4,38,54,57,110,122,132,154,213,228,256],"generate":[5,42,214],"high-quality":[6],"videos":[7,69],"guided":[8],"by":[9],"text":[10],"prompts":[11],"and":[12,41,70,101,108,137],"subject's":[13,243],"reference":[14],"images.":[15],"However,":[16],"since":[17],"it":[18],"is":[19,81],"only":[20],"trained":[21],"on":[22,168,201],"static":[23],"images,":[24],"the":[25,55,61,74,97,129,134,138,156,161,169,175,187,196,205,211,219,230,234,239,242],"fine-tuning":[26,109],"process":[27],"of":[28,33,67,73,140,158,164,171,189,198,208,216,222,233,241],"subject":[29,172,191],"learning":[30,192],"disrupts":[31],"abilities":[32,104],"diffusion":[35],"models":[36],"(VDMs)":[37],"combine":[39],"concepts":[40],"motions.":[43],"To":[44],"restore":[45,155,225],"these":[46],"abilities,":[47],"some":[48],"methods":[49],"use":[50],"additional":[51,106],"similar":[53],"prompt":[56],"fine-tune":[58],"or":[59],"guide":[60],"model.":[62],"This":[63],"requires":[64],"frequent":[65],"changes":[66],"guiding":[68],"even":[71],"re-tuning":[72],"model":[75],"when":[76],"generating":[77],"different":[78],"motions,":[79],"which":[80],"very":[82],"inconvenient":[83],"for":[84,143],"users.":[85],"In":[86,218],"this":[87,199,226],"paper,":[88],"we":[89,117,149,179,194,224],"propose":[90,180],"CustomCrafter,":[91],"a":[92,119,252],"novel":[93],"framework":[94],"that":[95,151,248],"preserves":[96],"model's":[98,130],"motion":[99,147,157,202,215],"conceptual":[102,114],"combination":[103,115],"without":[105],"recovery.":[111],"For":[112,146],"preserving":[113,210],"ability,":[116],"design":[118],"plug-and-play":[120],"module":[121,200,227],"update":[123],"few":[124],"parameters":[125],"in":[126,160,174,204],"VDMs,":[127],"enhancing":[128],"ability":[131,139,212],"capture":[133],"appearance":[135,231],"details":[136,173,232],"concept":[141],"combinations":[142],"new":[144],"subjects.":[145],"generation,":[148],"observed":[150],"VDMs":[152],"tend":[153],"early":[162,206],"stage":[163,207,221],"denoising,":[165,209,223],"while":[166],"focusing":[167],"recovery":[170],"later":[176,220],"stage.":[177],"Therefore,":[178],"Dynamic":[181],"Weighted":[182],"Video":[183],"Sampling":[184],"Strategy.":[185],"Using":[186],"pluggability":[188],"our":[190,249],"modules,":[193],"reduce":[195],"impact":[197],"VDMs.":[217],"repair":[229],"specified":[235],"subject,":[236],"thereby":[237],"ensuring":[238],"fidelity":[240],"appearance.":[244],"Experimental":[245],"results":[246],"show":[247],"method":[250],"has":[251],"significant":[253],"improvement":[254],"compared":[255],"previous":[257],"methods.":[258]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4402699833","counts_by_year":[],"updated_date":"2025-01-08T21:25:21.272811","created_date":"2024-09-21"}