{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T21:17:14Z","timestamp":1730323034856,"version":"3.28.0"},"publisher-location":"New York, NY, USA","reference-count":51,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2020,10,12]]},"DOI":"10.1145\/3394171.3413603","type":"proceedings-article","created":{"date-parts":[[2020,10,12]],"date-time":"2020-10-12T09:12:00Z","timestamp":1602493920000},"page":"3986-3994","update-policy":"http:\/\/dx.doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":12,"title":["A Unified Framework for Detecting Audio Adversarial Examples"],"prefix":"10.1145","author":[{"given":"Xia","family":"Du","sequence":"first","affiliation":[{"name":"University of Macau, Macau, Macao"}]},{"given":"Chi-Man","family":"Pun","sequence":"additional","affiliation":[{"name":"University of Macau, Macau, Macao"}]},{"given":"Zheng","family":"Zhang","sequence":"additional","affiliation":[{"name":"Harbin Institute of Technology & University of Macau, Shenzhen, China"}]}],"member":"320","published-online":{"date-parts":[[2020,10,12]]},"reference":[{"key":"e_1_3_2_2_1_1","doi-asserted-by":"publisher","DOI":"10.1121\/1.382599"},{"key":"e_1_3_2_2_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2019.2901195"},{"key":"e_1_3_2_2_3_1","volume-title":"Proceedings of the 35th International Conference on Machine Learning (Proceedings of Machine Learning Research), JenniferDy and Andreas Krause (Eds.)","volume":"80","author":"Athalye Anish","year":"2018"},{"volume-title":"international conference on learning representations (ICLR","year":"2015","author":"Bahdanau Dzmitry","key":"e_1_3_2_2_4_1"},{"key":"e_1_3_2_2_5_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10994-010-5188-5"},{"key":"e_1_3_2_2_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/1128817.1128824"},{"key":"e_1_3_2_2_7_1","doi-asserted-by":"publisher","DOI":"10.1109\/SPW.2018.00009"},{"key":"e_1_3_2_2_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/1015330.1015432"},{"volume-title":"Joint European Conference on Machine Learning and Knowledge Discovery in Databases. Springer, 52--68","year":"2018","author":"Chen Shang-Tse","key":"e_1_3_2_2_9_1"},{"key":"e_1_3_2_2_10_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00175"},{"key":"e_1_3_2_2_11_1","unstructured":"Virginie Gilg Christophe Beaugeant and Bernt Andrassy. 2020. METHODOLOGY FOR THE DESIGN OF A ROBUST VOICE ACTIVITY DETECTOR FOR SPEECH ENHANCEMENT. (04 2020). Virginie Gilg Christophe Beaugeant and Bernt Andrassy. 2020. METHODOLOGY FOR THE DESIGN OF A ROBUST VOICE ACTIVITY DETECTOR FOR SPEECH ENHANCEMENT. (04 2020)."},{"key":"e_1_3_2_2_12_1","doi-asserted-by":"publisher","DOI":"10.5120\/11638-7118"},{"volume-title":"Explaining and Harnessing Adversarial Examples. In International Conference on Learning Representations.","year":"2015","author":"Goodfellow Ian","key":"e_1_3_2_2_13_1"},{"key":"e_1_3_2_2_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6638947"},{"key":"e_1_3_2_2_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/TENCON.1993.327987"},{"key":"e_1_3_2_2_16_1","unstructured":"Awni Hannun Carl Case Jared Casper Bryan Catanzaro Greg Diamos Erich Elsen Ryan Prenger Sanjeev Satheesh Shubho Sengupta Adam Coates etal 2014. Deep speech: Scaling up end-to-end speech recognition. arXiv preprint arXiv:1412.5567 (2014). Awni Hannun Carl Case Jared Casper Bryan Catanzaro Greg Diamos Erich Elsen Ryan Prenger Sanjeev Satheesh Shubho Sengupta Adam Coates et al. 2014. Deep speech: Scaling up end-to-end speech recognition. arXiv preprint arXiv:1412.5567 (2014)."},{"key":"e_1_3_2_2_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/34.58871"},{"volume-title":"Proceedings of the Second International Conference on Learning Representations (ICLR","year":"2014","author":"Hermann Karl Moritz","key":"e_1_3_2_2_18_1"},{"key":"e_1_3_2_2_19_1","unstructured":"IEEE 2019. Targeted adversarial examples for black box audio systems. IEEE. IEEE 2019. Targeted adversarial examples for black box audio systems. IEEE."},{"key":"e_1_3_2_2_20_1","unstructured":"Andrew Ilyas Shibani Santurkar Dimitris Tsipras Logan Engstrom Brandon Tran and Aleksander Madry. 2019. Adversarial examples are not bugs they are features. In Advances in Neural Information Processing Systems. 125--136. Andrew Ilyas Shibani Santurkar Dimitris Tsipras Logan Engstrom Brandon Tran and Aleksander Madry. 2019. Adversarial examples are not bugs they are features. In Advances in Neural Information Processing Systems. 125--136."},{"key":"e_1_3_2_2_21_1","doi-asserted-by":"publisher","DOI":"10.1080\/01621459.1989.10478785"},{"key":"e_1_3_2_2_22_1","doi-asserted-by":"crossref","unstructured":"Matthew A Jaro. 1995. Probabilistic linkage of large public health data files. Statistics in medicine 14 5--7 (1995) 491--498. Matthew A Jaro. 1995. Probabilistic linkage of large public health data files. Statistics in medicine 14 5--7 (1995) 491--498.","DOI":"10.1002\/sim.4780140510"},{"key":"e_1_3_2_2_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDSP.2009.5201259"},{"key":"e_1_3_2_2_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/3343031.3351088"},{"key":"e_1_3_2_2_25_1","doi-asserted-by":"publisher","DOI":"10.1109\/WASPAA.2013.6701894"},{"key":"e_1_3_2_2_26_1","unstructured":"Stepan Komkov and Aleksandr Petiushko. 2019. AdvHat: Real-world adversarial attack on ArcFace Face ID system. arXiv preprint arXiv:1908.08705 (2019). Stepan Komkov and Aleksandr Petiushko. 2019. AdvHat: Real-world adversarial attack on ArcFace Face ID system. arXiv preprint arXiv:1908.08705 (2019)."},{"key":"e_1_3_2_2_27_1","unstructured":"Anders Krogh and Jesper Vedelsby. 1995. Neural network ensembles cross validation and active learning. In Advances in neural information processing systems. 231--238. Anders Krogh and Jesper Vedelsby. 1995. Neural network ensembles cross validation and active learning. In Advances in neural information processing systems. 231--238."},{"key":"e_1_3_2_2_28_1","unstructured":"Alexey Kurakin Ian Goodfellow and Samy Bengio. 2016. Adversarial examples in the physical world. arXiv preprint arXiv:1607.02533 (2016). Alexey Kurakin Ian Goodfellow and Samy Bengio. 2016. Adversarial examples in the physical world. arXiv preprint arXiv:1607.02533 (2016)."},{"key":"e_1_3_2_2_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/3319535.3363246"},{"key":"e_1_3_2_2_30_1","doi-asserted-by":"crossref","unstructured":"Y LeCun Y Bengio and G Hinton. 2015. Deep learning. nature 521 (7553): 436. Google Scholar (2015). Y LeCun Y Bengio and G Hinton. 2015. Deep learning. nature 521 (7553): 436. Google Scholar (2015).","DOI":"10.1038\/nature14539"},{"key":"e_1_3_2_2_31_1","unstructured":"Bowon Lee and Mark Hasegawa-Johnson. 2007. Minimum mean squared error a posteriori estimation of high variance vehicular noise. Biennial on DSP for In-Vehicle and Mobile Systems (2007). Bowon Lee and Mark Hasegawa-Johnson. 2007. Minimum mean squared error a posteriori estimation of high variance vehicular noise. Biennial on DSP for In-Vehicle and Mobile Systems (2007)."},{"volume-title":"Soviet physics doklady","author":"Levenshtein Vladimir I","key":"e_1_3_2_2_32_1"},{"volume-title":"International Conference on Machine Learning. 3896--3904","year":"2019","author":"Li Juncheng","key":"e_1_3_2_2_33_1"},{"key":"e_1_3_2_2_34_1","unstructured":"Shasha Li Ajaya Neupane Sujoy Paul Chengyu Song Srikanth V Krishnamurthy Amit K Roy Chowdhury and Ananthram Swami. 2018. Adversarial perturbations against real-time video classification systems. arXiv preprint arXiv:1807.00458 (2018). Shasha Li Ajaya Neupane Sujoy Paul Chengyu Song Srikanth V Krishnamurthy Amit K Roy Chowdhury and Ananthram Swami. 2018. Adversarial perturbations against real-time video classification systems. arXiv preprint arXiv:1807.00458 (2018)."},{"key":"e_1_3_2_2_35_1","unstructured":"Satoshi Nakamura Kazuo Hiyane Futoshi Asano Takanobu Nishiura and Takeshi Yamada. 2000. Acoustical sound database in real environments for sound scene understanding and hands-free speech recognition. (2000). Satoshi Nakamura Kazuo Hiyane Futoshi Asano Takanobu Nishiura and Takeshi Yamada. 2000. Acoustical sound database in real environments for sound scene understanding and hands-free speech recognition. (2000)."},{"key":"e_1_3_2_2_36_1","unstructured":"Luis Perez and Jason Wang. 2017. The effectiveness of data augmentation in image classification using deep learning. arXiv preprint arXiv:1712.04621 (2017). Luis Perez and Jason Wang. 2017. The effectiveness of data augmentation in image classification using deep learning. arXiv preprint arXiv:1712.04621 (2017)."},{"key":"e_1_3_2_2_37_1","volume-title":"Proceedings of the 36th International Conference on Machine Learning (Proceedings of Machine Learning Research), Kamalika Chaudhuri and Ruslan Salakhutdinov (Eds.)","volume":"97","author":"Qin Yao","year":"2019"},{"key":"e_1_3_2_2_38_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISSPIT.2018.8642623"},{"key":"e_1_3_2_2_39_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8461310"},{"key":"e_1_3_2_2_40_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1998.674443"},{"volume-title":"international conference on learning representations (ICLR","year":"2014","author":"Szegedy Christian","key":"e_1_3_2_2_41_1"},{"key":"e_1_3_2_2_42_1","unstructured":"Pete Warden. 2018. Speech commands: A dataset for limited-vocabulary speech recognition. arXiv preprint arXiv:1804.03209 (2018). Pete Warden. 2018. Speech commands: A dataset for limited-vocabulary speech recognition. arXiv preprint arXiv:1804.03209 (2018)."},{"key":"e_1_3_2_2_43_1","unstructured":"William E Winkler. 1990. String Comparator Metrics and Enhanced Decision Rules in the Fellegi-Sunter Model of Record Linkage. (1990). William E Winkler. 1990. String Comparator Metrics and Enhanced Decision Rules in the Fellegi-Sunter Model of Record Linkage. (1990)."},{"volume-title":"Mitigating Adversarial Effects Through Randomization. In International Conference on Learning Representations.","year":"2018","author":"Xie Cihang","key":"e_1_3_2_2_44_1"},{"key":"e_1_3_2_2_45_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.153"},{"key":"e_1_3_2_2_46_1","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2019.2925934"},{"key":"e_1_3_2_2_47_1","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2019\/741"},{"key":"e_1_3_2_2_48_1","unstructured":"Zhuolin Yang Bo Li Pin-Yu Chen and Dawn Song. 2018. Towards mitigating audio adversarial perturbations. (2018). Zhuolin Yang Bo Li Pin-Yu Chen and Dawn Song. 2018. Towards mitigating audio adversarial perturbations. (2018)."},{"volume-title":"Characterizing Audio Adversarial Examples Using Temporal Dependency. In International Conference on Learning Representations. https:\/\/openreview.net\/forum?id=r1g4E3C9t7","year":"2019","author":"Yang Zhuolin","key":"e_1_3_2_2_49_1"},{"key":"e_1_3_2_2_50_1","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2019.2911164"},{"key":"e_1_3_2_2_51_1","doi-asserted-by":"publisher","DOI":"10.1145\/3240508.3240639"}],"event":{"name":"MM '20: The 28th ACM International Conference on Multimedia","sponsor":["SIGMM ACM Special Interest Group on Multimedia"],"location":"Seattle WA USA","acronym":"MM '20"},"container-title":["Proceedings of the 28th ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3394171.3413603","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,5]],"date-time":"2023-01-05T15:19:37Z","timestamp":1672931977000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3394171.3413603"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,10,12]]},"references-count":51,"alternative-id":["10.1145\/3394171.3413603","10.1145\/3394171"],"URL":"https:\/\/doi.org\/10.1145\/3394171.3413603","relation":{},"subject":[],"published":{"date-parts":[[2020,10,12]]},"assertion":[{"value":"2020-10-12","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}