{"id":"https://openalex.org/W4383501701","doi":"https://doi.org/10.1109/aicas57966.2023.10168610","title":"Temporal Similarity-Based Computation Reduction for Video Transformers in Edge Camera Nodes","display_name":"Temporal Similarity-Based Computation Reduction for Video Transformers in Edge Camera Nodes","publication_year":2023,"publication_date":"2023-06-11","ids":{"openalex":"https://openalex.org/W4383501701","doi":"https://doi.org/10.1109/aicas57966.2023.10168610"},"language":"en","primary_location":{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/aicas57966.2023.10168610","pdf_url":null,"source":{"id":"https://openalex.org/S4363608281","display_name":"2022 IEEE 4th International Conference on Artificial Intelligence Circuits and Systems (AICAS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false},"type":"article","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037314795","display_name":"Udari De Alwis","orcid":"https://orcid.org/0000-0002-0824-7724"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Udari De Alwis","raw_affiliation_strings":["ECE Dept., National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"ECE Dept., National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114064890","display_name":"Zhongheng Xie","orcid":null},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Zhongheng Xie","raw_affiliation_strings":["ECE Dept., National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"ECE Dept., National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052037141","display_name":"Massimo Alioto","orcid":"https://orcid.org/0000-0002-4127-8258"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Massimo Alioto","raw_affiliation_strings":["ECE Dept., National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"ECE Dept., National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]}],"institution_assertions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":68},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9979,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9971,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/action-recognition","display_name":"Action Recognition","score":0.539381},{"id":"https://openalex.org/keywords/visual-tracking","display_name":"Visual Tracking","score":0.53824},{"id":"https://openalex.org/keywords/motion-detection","display_name":"Motion Detection","score":0.526476},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer Vision","score":0.521515},{"id":"https://openalex.org/keywords/real-time-tracking","display_name":"Real-time Tracking","score":0.514124}],"concepts":[{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.8737927},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.7686445},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7226071},{"id":"https://openalex.org/C2987834672","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Action recognition","level":3,"score":0.5776124},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5021982},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.38359532},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.3530772},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.20314687},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12647697},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.11436978},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.087555915},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"is_oa":false,"landing_page_url":"https://doi.org/10.1109/aicas57966.2023.10168610","pdf_url":null,"source":{"id":"https://openalex.org/S4363608281","display_name":"2022 IEEE 4th International Conference on Artificial Intelligence Circuits and Systems (AICAS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false}],"best_oa_location":null,"sustainable_development_goals":[],"grants":[{"funder":"https://openalex.org/F4320320671","funder_display_name":"National Research Foundation","award_id":null}],"datasets":[],"versions":[],"referenced_works_count":15,"referenced_works":["https://openalex.org/W24089286","https://openalex.org/W2619947201","https://openalex.org/W2908510526","https://openalex.org/W3012362498","https://openalex.org/W3094502228","https://openalex.org/W3113370935","https://openalex.org/W3174402370","https://openalex.org/W4214612132","https://openalex.org/W4214614183","https://openalex.org/W4226407477","https://openalex.org/W4295855159","https://openalex.org/W4311224395","https://openalex.org/W4312340826","https://openalex.org/W4312769131","https://openalex.org/W4360831786"],"related_works":["https://openalex.org/W4361193049","https://openalex.org/W4283332100","https://openalex.org/W4231775656","https://openalex.org/W3134658850","https://openalex.org/W2981757109","https://openalex.org/W2383646825","https://openalex.org/W2371018915","https://openalex.org/W2354191502","https://openalex.org/W2046435967","https://openalex.org/W1972225038"],"abstract_inverted_index":{"Recognizing":[0],"human":[1],"actions":[2],"in":[3,11,50,68,72,130],"video":[4,12,69,79],"sequences":[5],"has":[6],"become":[7],"an":[8,77,124],"essential":[9],"task":[10],"surveillance":[13],"applications.":[14],"In":[15,53],"such":[16],"applications,":[17],"transformer":[18,70,80],"models":[19],"have":[20],"rapidly":[21],"gained":[22],"wide":[23],"interest":[24],"thanks":[25],"to":[26,47,62],"their":[27,30],"performance.":[28],"However,":[29],"advantages":[31],"come":[32],"at":[33],"the":[34,64,91,103,108,114],"cost":[35],"of":[36,127],"a":[37],"high":[38],"computational":[39],"and":[40,133],"memory":[41],"cost,":[42],"especially":[43],"when":[44],"they":[45],"need":[46],"be":[48],"incorporated":[49],"edge":[51],"devices.":[52],"this":[54],"work,":[55],"temporal":[56,86],"similarity":[57],"tunnel":[58],"insertion":[59],"is":[60,82],"utilized":[61],"reduce":[63],"overall":[65],"computation":[66,92,100,119],"burden":[67],"networks":[71],"action":[73],"recognition":[74],"tasks.":[75],"Furthermore,":[76],"edge-friendly":[78],"model":[81],"proposed":[83],"based":[84],"on":[85],"similarity,":[87],"which":[88],"substantially":[89],"reduces":[90,118],"cost.":[93],"Its":[94],"smaller":[95],"variant":[96,116],"EMViT":[97],"achieves":[98],"38%":[99],"reduction":[101],"under":[102],"UCF101":[104],"dataset,":[105],"while":[106],"keeping":[107],"accuracy":[109,125],"degradation":[110,126],"insignificant":[111],"(<0.02%).":[112],"Also,":[113],"larger":[115],"CMViT":[117],"by":[120],"14%":[121],"(13%)":[122],"with":[123],"2%":[128],"(3%)":[129],"scaled":[131],"Kinetic400":[132],"Jester":[134],"datasets.":[135]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4383501701","counts_by_year":[],"updated_date":"2024-12-05T05:47:06.280651","created_date":"2023-07-08"}