{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,29]],"date-time":"2024-10-29T21:34:22Z","timestamp":1730237662603,"version":"3.28.0"},"reference-count":43,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,10,1]],"date-time":"2023-10-01T00:00:00Z","timestamp":1696118400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,10,1]],"date-time":"2023-10-01T00:00:00Z","timestamp":1696118400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100003452","name":"Innovation and Technology Commission","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100003452","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,10,1]]},"DOI":"10.1109\/iccv51070.2023.01482","type":"proceedings-article","created":{"date-parts":[[2024,1,15]],"date-time":"2024-01-15T20:55:59Z","timestamp":1705352159000},"page":"16130-16140","source":"Crossref","is-referenced-by-count":1,"title":["SparseMAE: Sparse Training Meets Masked Autoencoders"],"prefix":"10.1109","author":[{"given":"Aojun","family":"Zhou","sequence":"first","affiliation":[{"name":"The Chinese University of Hong Kong"}]},{"given":"Yang","family":"Li","sequence":"additional","affiliation":[{"name":"SenseTime Research"}]},{"given":"Zipeng","family":"Qin","sequence":"additional","affiliation":[{"name":"The Chinese University of Hong Kong"}]},{"given":"Jianbo","family":"Liu","sequence":"additional","affiliation":[{"name":"The Chinese University of Hong Kong"}]},{"given":"Junting","family":"Pan","sequence":"additional","affiliation":[{"name":"The Chinese University of Hong Kong"}]},{"given":"Renrui","family":"Zhang","sequence":"additional","affiliation":[{"name":"The Chinese University of Hong Kong"}]},{"given":"Rui","family":"Zhao","sequence":"additional","affiliation":[{"name":"SenseTime Research"}]},{"given":"Peng","family":"Gao","sequence":"additional","affiliation":[{"name":"Shanghai AI Lab"}]},{"given":"Hongsheng","family":"Li","sequence":"additional","affiliation":[{"name":"The Chinese University of Hong Kong"}]}],"member":"263","reference":[{"key":"ref1","first-page":"1298","article-title":"Data2vec: A general framework for self-supervised learning in speech, vision and language","volume-title":"International Conference on Machine Learning","author":"Baevski"},{"article-title":"Beit: Bert pre-training of image transformers","year":"2021","author":"Bao","key":"ref2"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00951"},{"key":"ref4","first-page":"19974","article-title":"Chasing sparsity in vision transformers: An end-to-end exploration","volume":"34","author":"Chen","year":"2021","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-023-01852-4"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00950"},{"article-title":"Flashattention: Fast and memory-efficient exact attention with io-awareness","year":"2022","author":"Dao","key":"ref7"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"ref9","first-page":"2943","article-title":"Rigging the lottery: Making all tickets winners","volume-title":"International Conference on Machine Learning","author":"Evci"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TVLSI.2022.3197282"},{"article-title":"The lottery ticket hypothesis: Finding sparse, trainable neural networks","year":"2018","author":"Frankle","key":"ref11"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-023-01898-4"},{"article-title":"Deep compression: Compressing deep neural networks with pruning, trained quantization and huffman coding","year":"2015","author":"Han","key":"ref13"},{"key":"ref14","article-title":"Learning both weights and connections for efficient neural network","volume":"28","author":"Han","year":"2015","journal-title":"Advances in neural information processing systems"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01553"},{"article-title":"Benchmarking neural network robustness to common corruptions and perturbations","volume-title":"Proceedings of the International Conference on Learning Representations","author":"Hendrycks","key":"ref16"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01501"},{"issue":"1","key":"ref18","first-page":"10882","article-title":"Sparsity in deep learning: Pruning and growth for efficient inference and training in neural networks","volume":"22","author":"Hoefler","year":"2021","journal-title":"The Journal of Machine Learning Research"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01535"},{"article-title":"ovit: An accurate second-order pruning framework for vision transformers","year":"2022","author":"Kuznedelev","key":"ref20"},{"key":"ref21","article-title":"Optimal brain damage","volume":"2","author":"LeCun","year":"1989","journal-title":"Advances in neural information processing systems"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20077-9_17"},{"article-title":"Dynamic model pruning with feedback","year":"2020","author":"Lin","key":"ref23"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"ref25","first-page":"6989","article-title":"Do we actually need dense over-parameterization? in-time over-parameterization in sparse training","volume-title":"International Conference on Machine Learning","author":"Liu"},{"article-title":"Rethinking the value of network pruning","year":"2018","author":"Liu","key":"ref26"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/LCA.2020.2979965"},{"article-title":"Accelerating sparse deep neural networks","year":"2021","author":"Mishra","key":"ref28"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1038\/s41467-018-04316-3"},{"key":"ref30","first-page":"8821","article-title":"Zero-shot text-to-image generation","volume-title":"International Conference on Machine Learning","author":"Ramesh"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00359"},{"article-title":"Dominosearch: Find layer-wise fine-grained n:m sparse schemes from dense neural networks","volume-title":"Thirty-Fifth Conference on Neural Information Processing Systems","author":"Sun","key":"ref32"},{"key":"ref33","first-page":"10347","article-title":"Training data-efficient image transformers & distillation through attention","volume-title":"International conference on machine learning","author":"Touvron"},{"article-title":"A closer look at self-supervised lightweight vision transformers","year":"2022","author":"Wang","key":"ref34"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01426"},{"key":"ref36","article-title":"Discovering neural wirings","volume":"32","author":"Wortsman","year":"2019","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01228-1_26"},{"article-title":"Slimmable neural networks","year":"2018","author":"Yu","key":"ref38"},{"article-title":"Point-m2ae: Multi-scale masked autoencoders for hierarchical point cloud pre-training","volume-title":"NeurIPS 2022","author":"Zhang","key":"ref39"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.02085"},{"article-title":"Learning best combination for efficient n:m sparsity","year":"2022","author":"Zhang","key":"ref41"},{"article-title":"Learning n: M fine-grained structured sparse neural networks from scratch","year":"2021","author":"Zhou","key":"ref42"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.544"}],"event":{"name":"2023 IEEE\/CVF International Conference on Computer Vision (ICCV)","start":{"date-parts":[[2023,10,1]]},"location":"Paris, France","end":{"date-parts":[[2023,10,6]]}},"container-title":["2023 IEEE\/CVF International Conference on Computer Vision (ICCV)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10376473\/10376477\/10377674.pdf?arnumber=10377674","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,18]],"date-time":"2024-01-18T01:17:15Z","timestamp":1705540635000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10377674\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,10,1]]},"references-count":43,"URL":"https:\/\/doi.org\/10.1109\/iccv51070.2023.01482","relation":{},"subject":[],"published":{"date-parts":[[2023,10,1]]}}}