{"id":"https://openalex.org/W4403619157","doi":"https://doi.org/10.48550/arxiv.2407.14505","title":"T2V-CompBench: A Comprehensive Benchmark for Compositional Text-to-video\n Generation","display_name":"T2V-CompBench: A Comprehensive Benchmark for Compositional Text-to-video\n Generation","publication_year":2024,"publication_date":"2024-07-19","ids":{"openalex":"https://openalex.org/W4403619157","doi":"https://doi.org/10.48550/arxiv.2407.14505"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.14505","pdf_url":"http://arxiv.org/pdf/2407.14505","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://arxiv.org/pdf/2407.14505","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101853880","display_name":"Kaiyue Sun","orcid":"https://orcid.org/0000-0003-1401-4051"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Kaiyue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080404996","display_name":"Kaiyi Huang","orcid":"https://orcid.org/0000-0003-4884-4387"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Kaiyi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008814691","display_name":"Liu Xian","orcid":"https://orcid.org/0000-0001-8835-9904"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101983893","display_name":"Yue Wu","orcid":"https://orcid.org/0000-0002-2248-4566"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Yue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101623273","display_name":"Zihan Xu","orcid":"https://orcid.org/0009-0008-9669-476X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Zihan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103196797","display_name":"Zhenguo Li","orcid":"https://orcid.org/0000-0002-8492-3069"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Zhenguo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5027234036","display_name":"Xihui Liu","orcid":"https://orcid.org/0000-0002-1791-8745"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xihui","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":77},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9864,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9864,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9472,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9123,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.84376323}],"concepts":[{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.84376323},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.55273634},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.33244482},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.15613908},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.11659327}],"mesh":[],"locations_count":1,"locations":[{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.14505","pdf_url":"http://arxiv.org/pdf/2407.14505","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.14505","pdf_url":"http://arxiv.org/pdf/2407.14505","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_indexed_in_scopus":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W4321353415","https://openalex.org/W4246352526","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2745001401","https://openalex.org/W2378211422","https://openalex.org/W2130974462","https://openalex.org/W2086519370","https://openalex.org/W2028665553"],"abstract_inverted_index":{"Text-to-video":[0],"(T2V)":[1],"generation":[2,102,148],"models":[3,131,138],"have":[4],"advanced":[5],"significantly,":[6],"yet":[7],"their":[8],"ability":[9,30],"to":[10],"compose":[11],"different":[12,137,140],"objects,":[13],"attributes,":[14],"actions,":[15],"and":[16,78,92,132,139,155],"motions":[17],"into":[18],"a":[19],"video":[20],"remains":[21],"unexplored.":[22],"Previous":[23],"text-to-video":[24,44,55,101,129,147],"benchmarks":[25],"also":[26,126],"neglect":[27],"this":[28,34,168],"important":[29],"for":[31,53,152],"evaluation.":[32],"In":[33],"work,":[35],"we":[36,156],"conduct":[37,133],"the":[38,49,99,115],"first":[39,50],"systematic":[40],"study":[41],"on":[42,164],"compositional":[43,54,100,141,146],"generation.":[45,56],"We":[46,81,125,143],"propose":[47],"T2V-CompBench,":[48],"benchmark":[51,127],"tailored":[52],"T2V-CompBench":[57],"encompasses":[58],"diverse":[59],"aspects":[60],"of":[61,87,104,114],"compositionality,":[62],"including":[63],"consistent":[64],"attribute":[65,68],"binding,":[66,69,73,75],"dynamic":[67],"spatial":[70],"relationships,":[71],"motion":[72],"action":[74],"object":[76],"interactions,":[77],"generative":[79,130],"numeracy.":[80],"further":[82],"carefully":[83],"design":[84],"evaluation":[85],"metrics":[86,117],"MLLM-based":[88],"metrics,":[89,91,94],"detection-based":[90],"tracking-based":[93],"which":[95],"can":[96],"better":[97],"reflect":[98],"quality":[103],"seven":[105],"proposed":[106,116],"categories":[107],"with":[108,122],"700":[109],"text":[110],"prompts.":[111],"The":[112],"effectiveness":[113],"is":[118,149],"verified":[119],"by":[120],"correlation":[121],"human":[123],"evaluations.":[124],"various":[128],"in-depth":[134],"analysis":[135],"across":[136],"categories.":[142],"find":[144],"that":[145,158],"highly":[150],"challenging":[151],"current":[153],"models,":[154],"hope":[157],"our":[159],"attempt":[160],"will":[161],"shed":[162],"light":[163],"future":[165],"research":[166],"in":[167],"direction.":[169]},"abstract_inverted_index_v3":null,"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4403619157","counts_by_year":[],"updated_date":"2025-04-15T20:27:45.305294","created_date":"2024-10-22"}