{"id":"https://openalex.org/W4362653498","doi":"https://doi.org/10.1109/tmm.2023.3264847","title":"Energy-Based Temporal Summarized Attentive Network for Zero-Shot Action Recognition","display_name":"Energy-Based Temporal Summarized Attentive Network for Zero-Shot Action Recognition","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4362653498","doi":"https://doi.org/10.1109/tmm.2023.3264847"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2023.3264847","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"journal-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034290568","display_name":"Cheng Qi","orcid":"https://orcid.org/0000-0001-6888-287X"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cheng Qi","raw_affiliation_strings":["College of Intelligence and Computing, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100736532","display_name":"Zhiyong Feng","orcid":"https://orcid.org/0000-0001-8158-7453"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiyong Feng","raw_affiliation_strings":["College of Intelligence and Computing, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100673909","display_name":"Meng Xing","orcid":"https://orcid.org/0000-0001-6082-4675"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Meng Xing","raw_affiliation_strings":["College of Intelligence and Computing, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043830283","display_name":"Yong Su","orcid":"https://orcid.org/0000-0002-6851-4142"},"institutions":[{"id":"https://openalex.org/I15062923","display_name":"Tianjin Normal University","ror":"https://ror.org/05x2td559","country_code":"CN","type":"education","lineage":["https://openalex.org/I15062923"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Su","raw_affiliation_strings":["Tianjin Key Laboratory of Wireless Mobile Communications and Power Transmission, Tianjin Normal University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Tianjin Key Laboratory of Wireless Mobile Communications and Power Transmission, Tianjin Normal University, Tianjin, China","institution_ids":["https://openalex.org/I15062923"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080383203","display_name":"Jinqing Zheng","orcid":"https://orcid.org/0000-0002-1772-0085"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinqing Zheng","raw_affiliation_strings":["College of Intelligence and Computing, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100395366","display_name":"Yiming Zhang","orcid":"https://orcid.org/0000-0002-5780-0709"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yiming Zhang","raw_affiliation_strings":["College of Intelligence and Computing, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.811,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.771113,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":93,"max":94},"biblio":{"volume":"25","issue":null,"first_page":"1940","last_page":"1953"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.997,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9965,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.65241444}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8584441},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.65241444},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.61281145},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5384554},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5199431}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2023.3264847","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"grants":[],"datasets":[],"versions":[],"referenced_works_count":60,"referenced_works":["https://openalex.org/W1498368596","https://openalex.org/W1522734439","https://openalex.org/W1595717062","https://openalex.org/W1787683252","https://openalex.org/W1927052826","https://openalex.org/W1966385142","https://openalex.org/W2016053056","https://openalex.org/W2044913453","https://openalex.org/W2064675550","https://openalex.org/W2064851185","https://openalex.org/W2068611653","https://openalex.org/W2100771357","https://openalex.org/W2100916003","https://openalex.org/W2105101328","https://openalex.org/W2108598243","https://openalex.org/W2126579184","https://openalex.org/W2128532956","https://openalex.org/W2156303437","https://openalex.org/W2157331557","https://openalex.org/W2161914416","https://openalex.org/W2161969291","https://openalex.org/W2194775991","https://openalex.org/W2283717164","https://openalex.org/W24089286","https://openalex.org/W2463762378","https://openalex.org/W2520613337","https://openalex.org/W2619947201","https://openalex.org/W2737677090","https://openalex.org/W2740825418","https://openalex.org/W2748618181","https://openalex.org/W2750023899","https://openalex.org/W2781922022","https://openalex.org/W2887051120","https://openalex.org/W2904378456","https://openalex.org/W2951528484","https://openalex.org/W2962709777","https://openalex.org/W2963315828","https://openalex.org/W2963524571","https://openalex.org/W2963689837","https://openalex.org/W2964105864","https://openalex.org/W2965373098","https://openalex.org/W2970607325","https://openalex.org/W3021778166","https://openalex.org/W3035254087","https://openalex.org/W3048275157","https://openalex.org/W3069380482","https://openalex.org/W3092527263","https://openalex.org/W3124887724","https://openalex.org/W3142341292","https://openalex.org/W3170414130","https://openalex.org/W3173621652","https://openalex.org/W3209038819","https://openalex.org/W4214746887","https://openalex.org/W4287997702","https://openalex.org/W4294170691","https://openalex.org/W4295312788","https://openalex.org/W4312254032","https://openalex.org/W4312584871","https://openalex.org/W4320013936","https://openalex.org/W652269744"],"related_works":["https://openalex.org/W4387297750","https://openalex.org/W4386462264","https://openalex.org/W4312192474","https://openalex.org/W4306674287","https://openalex.org/W4210805261","https://openalex.org/W3209574120","https://openalex.org/W3170094116","https://openalex.org/W3107602296","https://openalex.org/W3046775127","https://openalex.org/W2961085424"],"abstract_inverted_index":{"Recently,":[0],"Action":[1,29],"Recognition":[2,30],"(AR)":[3],"is":[4,19,32,89,210,319],"facing":[5],"the":[6,15,39,58,63,71,79,97,112,116,122,134,153,162,184,192,214,220,225,239,261,268,272,278,285,295,303,306,310],"scalability":[7],"problem,":[8],"since":[9],"collecting":[10],"and":[11,21,35,76,167,172,175,199,247,280],"annotating":[12],"data":[13],"for":[14,96],"ever-growing":[16],"action":[17],"categories":[18,52],"exhausting":[20],"inappropriate.":[22],"As":[23],"an":[24,140,231],"alternative":[25],"to":[26,49,69,92,103,120,147,151,160,190,212,224,237],"AR,":[27],"Zero-Shot":[28],"(ZSAR)":[31],"getting":[33],"more":[34,36],"attention":[37],"in":[38,308],"community,":[40],"as":[41,83,85],"they":[42],"could":[43],"utilize":[44],"a":[45,204],"shared":[46],"semantic/attribute":[47],"space":[48],"recognize":[50],"novel":[51],"without":[53],"annotated":[54],"data.":[55],"Different":[56],"from":[57],"AR":[59],"focuses":[60],"on":[61,128,170,277,294],"learning":[62],"correlation":[64,72,193,215],"between":[65,244],"actions,":[66],"ZSAR":[67,101,126],"needs":[68,159],"consider":[70],"of":[73,100,114,125,136,155,164,194,216,260,271,299,305,313],"action-action,":[74],"label-label":[75,217],"action-label":[77,274],"at":[78,321],"same":[80],"time.":[81],"However,":[82],"far":[84],"we":[86,110,138,181,229],"know,":[87],"there":[88],"no":[90],"work":[91],"provide":[93],"structural":[94],"guidance":[95,135],"framework":[98,123,255,311],"design":[99,124,183,312],"according":[102,223],"its":[104],"task":[105],"characteristics.":[106],"In":[107,315],"this":[108,179],"paper,":[109],"demonstrate":[111],"rationality":[113],"using":[115],"Energy-Based":[117],"Model":[118],"(EBM)":[119],"guide":[121],"based":[127,169,293],"their":[129],"inference":[130],"mechanism.":[131],"Furthermore,":[132],"under":[133],"EBM,":[137],"propose":[139],"Energy-based":[141],"Temporal":[142,185],"Summarized":[143,186],"Attentive":[144,187],"Network":[145],"(ETSAN)":[146],"achieve":[148],"ZSAR.":[149,314],"Specifically,":[150],"ensure":[152],"effectiveness":[154],"cross-modal":[156],"matching,":[157],"EBM":[158,307],"capture":[161,191,257],"correlations":[163,262],"input-input,":[165],"output-output":[166],"input-output,":[168],"discriminative":[171,198],"focused":[173,200],"input":[174,201],"output":[176],"space.":[177,202],"To":[178],"end,":[180],"first":[182],"Mechanism":[188,208,235],"(TSAM)":[189],"action-action":[195],"by":[196,218,266],"constructing":[197],"Then,":[203],"Label":[205],"Semantic":[206],"Adaptive":[207],"(LSAM)":[209],"proposed":[211,286],"learn":[213],"adjusting":[219],"semantic":[221,249],"structure":[222],"target":[226],"task.":[227],"Finally,":[228],"devise":[230],"Energy":[232],"Score":[233],"Estimation":[234],"(ESEM)":[236],"measure":[238],"compatibility":[240],"(i.e.":[241],"energy":[242,269],"score)":[243],"video":[245],"representation":[246],"label":[248],"embedding.":[250],"With":[251],"end-to-end":[252],"training,":[253],"our":[254,317],"can":[256],"all":[258],"three":[259],"mentioned":[263],"above":[264],"simultaneously":[265],"minimizing":[267],"score":[270],"correct":[273],"pair.":[275],"Experiments":[276],"HMDB51":[279],"UCF101":[281],"datasets":[282],"show":[283],"that":[284],"architecture":[287],"achieves":[288],"comparable":[289],"results":[290],"among":[291],"methods":[292],"spatial-temporal":[296],"visual":[297],"feature":[298],"sequence-level,":[300],"which":[301],"demonstrates":[302],"efficiency":[304],"guiding":[309],"addition,":[316],"code":[318],"available":[320],"https://github.com/oOHCIOo/ETSAN":[324],".":[325]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4362653498","counts_by_year":[{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":3}],"updated_date":"2025-01-19T01:35:56.901687","created_date":"2023-04-07"}