{"id":"https://openalex.org/W4367177429","doi":"https://doi.org/10.48550/arxiv.2304.12561","title":"TCR: Short Video Title Generation and Cover Selection with Attention Refinement","display_name":"TCR: Short Video Title Generation and Cover Selection with Attention Refinement","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4367177429","doi":"https://doi.org/10.48550/arxiv.2304.12561"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2304.12561","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2304.12561","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040824128","display_name":"Yakun Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Yakun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028346805","display_name":"Jiuding Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Jiuding","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038898235","display_name":"Weidong Guo","orcid":"https://orcid.org/0000-0003-0299-6393"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Weidong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100387509","display_name":"Hui Liu","orcid":"https://orcid.org/0000-0001-6654-4965"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Hui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100606304","display_name":"Yu Xu","orcid":"https://orcid.org/0009-0000-1297-1312"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Yu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5032424832","display_name":"Di Niu","orcid":"https://orcid.org/0000-0002-5250-7327"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Niu, Di","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":67},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9947,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9947,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9943,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9836,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.85801405},{"id":"https://openalex.org/keywords/popularity","display_name":"Popularity","score":0.5831092}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.85801405},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8135748},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.7719221},{"id":"https://openalex.org/C2780428219","wikidata":"https://www.wikidata.org/wiki/Q16952335","display_name":"Cover (algebra)","level":2,"score":0.68076295},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6094758},{"id":"https://openalex.org/C2780586970","wikidata":"https://www.wikidata.org/wiki/Q1357284","display_name":"Popularity","level":2,"score":0.5831092},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.47757867},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.46445322},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.41614217},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.39965993},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.33721358},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3278982},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.115323424},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2304.12561","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2304.12561","pdf_url":"http://arxiv.org/pdf/2304.12561","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2304.12561","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2304.12561","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4388893791","https://openalex.org/W4290852288","https://openalex.org/W4283207562","https://openalex.org/W4210416330","https://openalex.org/W3088136942","https://openalex.org/W2963177403","https://openalex.org/W2949522393","https://openalex.org/W2949362007","https://openalex.org/W2775506363","https://openalex.org/W2330246314"],"abstract_inverted_index":{"With":[0],"the":[1,75,83,98,106],"widespread":[2],"popularity":[3],"of":[4,47,86],"user-generated":[5],"short":[6,29,87,198],"videos,":[7],"it":[8],"becomes":[9],"increasingly":[10],"challenging":[11],"for":[12,28,57,63,77,100,147,195],"content":[13,18],"creators":[14],"to":[15,19,53,80,104,166,179,191],"promote":[16],"their":[17],"potential":[20],"viewers.":[21],"Automatically":[22],"generating":[23,44,186],"appealing":[24,129],"titles":[25,55,130,187],"and":[26,91,114,131,139,156,160,188],"covers":[27,194],"videos":[30,127],"can":[31],"help":[32],"grab":[33],"viewers'":[34],"attention.":[35,60],"Existing":[36],"studies":[37],"on":[38,43,67],"video":[39,54,88,182],"captioning":[40,183],"mostly":[41],"focus":[42],"factual":[45],"descriptions":[46],"actions,":[48],"which":[49],"do":[50],"not":[51],"conform":[52],"intended":[56],"catching":[58],"viewer":[59],"Furthermore,":[61],"research":[62],"cover":[64,92],"selection":[65,93,141],"based":[66],"multimodal":[68],"information":[69],"is":[70,177,189],"sparse.":[71],"These":[72],"problems":[73],"motivate":[74],"need":[76],"tailored":[78],"methods":[79,184],"specifically":[81],"support":[82,105],"joint":[84],"task":[85],"title":[89],"generation":[90,138],"(TG-CS)":[94],"as":[95,97],"well":[96],"demand":[99],"creating":[101],"corresponding":[102],"datasets":[103],"studies.":[107],"In":[108],"this":[109],"paper,":[110],"we":[111],"first":[112],"collect":[113],"present":[115],"a":[116,136],"real-world":[117,197],"dataset":[118],"named":[119],"Short":[120],"Video":[121],"Title":[122,137],"Generation":[123],"(SVTG)":[124],"that":[125,173],"contains":[126],"with":[128,142],"covers.":[132],"We":[133],"then":[134],"propose":[135],"Cover":[140],"attention":[143],"Refinement":[144],"(TCR)":[145],"method":[146,176],"TG-CS.":[148],"The":[149],"refinement":[150],"procedure":[151],"progressively":[152],"selects":[153],"high-quality":[154],"samples":[155],"highly":[157],"relevant":[158],"frames":[159],"text":[161],"tokens":[162],"within":[163],"each":[164],"sample":[165],"refine":[167],"model":[168],"training.":[169],"Extensive":[170],"experiments":[171],"show":[172],"our":[174],"TCR":[175],"superior":[178],"various":[180],"existing":[181],"in":[185],"able":[190],"select":[192],"better":[193],"noisy":[196],"videos.":[199]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4367177429","counts_by_year":[],"updated_date":"2025-01-08T22:06:42.978934","created_date":"2023-04-28"}