{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,4,8]],"date-time":"2025-04-08T13:47:05Z","timestamp":1744120025972,"version":"3.37.3"},"reference-count":47,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"2","license":[{"start":{"date-parts":[[2019,5,1]],"date-time":"2019-05-01T00:00:00Z","timestamp":1556668800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2019,5,1]],"date-time":"2019-05-01T00:00:00Z","timestamp":1556668800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2019,5,1]],"date-time":"2019-05-01T00:00:00Z","timestamp":1556668800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"Italian University and Research Consortium"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE J. Sel. Top. Signal Process."],"published-print":{"date-parts":[[2019,5]]},"DOI":"10.1109\/jstsp.2019.2902305","type":"journal-article","created":{"date-parts":[[2019,2,28]],"date-time":"2019-02-28T20:02:01Z","timestamp":1551384121000},"page":"310-322","source":"Crossref","is-referenced-by-count":44,"title":["Polyphonic Sound Event Detection by Using Capsule Neural Networks"],"prefix":"10.1109","volume":"13","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7748-5454","authenticated-orcid":false,"given":"Fabio","family":"Vesperini","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3812-0900","authenticated-orcid":false,"given":"Leonardo","family":"Gabrielli","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2835-7277","authenticated-orcid":false,"given":"Emanuele","family":"Principi","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9374-0128","authenticated-orcid":false,"given":"Stefano","family":"Squartini","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"journal-title":"Keras","year":"2015","author":"chollet","key":"ref39"},{"key":"ref38","first-page":"249","article-title":"Understanding the difficulty of training deep feedforward neural networks","volume":"9","author":"glorot","year":"2010","journal-title":"J Mach Learn Res"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.3390\/app6060162"},{"key":"ref32","first-page":"281","article-title":"Random search for hyper-parameter optimization","volume":"13","author":"bergstra","year":"2012","journal-title":"J Mach Learn Res"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/EUSIPCO.2016.7760424"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.2307\/1267351"},{"article-title":"AdaDelta: an adaptive learning rate method","year":"2012","author":"zeiler","key":"ref37"},{"key":"ref36","first-page":"80","article-title":"Rare sound event detection using 1D convolutional recurrent neural networks","author":"lim","year":"0","journal-title":"Workshop on Detection and Classification of Acoustic Scenes and Events"},{"article-title":"A report on sound event detection with different binaural features","year":"2017","author":"adavanne","key":"ref35"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.23919\/EUSIPCO.2017.8081712"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2011.2159700"},{"article-title":"TensorFlow: Large-scale machine learning on heterogeneous systems","year":"2016","author":"abadi","key":"ref40"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TNN.2002.806626"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2015.2389618"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2011.2109382"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/MLSP.2015.7324337"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6638947"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472669"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2017.2756439"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1186\/s13636-015-0069-2"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2017.2690575"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-15825-4_10"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1016\/j.patrec.2015.06.026"},{"key":"ref27","article-title":"Auditory toolbox","volume":"10","author":"slaney","year":"1998"},{"key":"ref3","first-page":"1218","article-title":"Healthcare audio event classification using hidden Markov models and hierarchical hidden Markov models","author":"peng","year":"0","journal-title":"Proc IEEE Int Conf Multimedia Expo"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.23919\/EUSIPCO.2017.8081512"},{"key":"ref29","first-page":"1929","article-title":"Dropout: A simple way to prevent neural networks from overfitting","volume":"15","author":"srivastava","year":"2014","journal-title":"J Mach Learn Res"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2017.2657381"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2011.2146229"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/WASPAA.2015.7336885"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1145\/2871183"},{"key":"ref9","first-page":"1272","article-title":"Audio context recognition using audio event histograms","author":"heittola","year":"0","journal-title":"Proc Eur Signal Process Conf"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-63450-0"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.23919\/ICIF.2018.8455725"},{"journal-title":"Detection and Classification of Acoustic Scenes and Events","year":"2017","author":"virtanen","key":"ref20"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-00919-9_45"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.23919\/EUSIPCO.2018.8553198"},{"key":"ref47","first-page":"3859","article-title":"Matrix capsules with EM routing","author":"hinton","year":"0","journal-title":"Proc Int Conf Learn Representations"},{"article-title":"A capsule neural networks based approach for bird audio detection","year":"2018","author":"vesperini","key":"ref21"},{"key":"ref42","first-page":"1497","article-title":"Hierarchic ConvNets framework for rare sound event detection","author":"vesperini","year":"0","journal-title":"Proc Eur Signal Process Conf"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-21735-7_6"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.25080\/Majora-7b98e3ed-003"},{"key":"ref23","first-page":"3856","article-title":"Dynamic routing between capsules","author":"sabour","year":"0","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.3390\/s18093153"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-1888"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1145\/3065386"},{"key":"ref25","first-page":"85","article-title":"DCASE2017 challenge setup: Tasks, datasets and baseline system","author":"mesaros","year":"0","journal-title":"Proceedings of the Detection and Classification of Acoustic Scenes and Events 2017 Workshop (DCASE 2017)"}],"container-title":["IEEE Journal of Selected Topics in Signal Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/4200690\/8717740\/08654643.pdf?arnumber=8654643","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,13]],"date-time":"2022-07-13T21:08:15Z","timestamp":1657746495000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8654643\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,5]]},"references-count":47,"journal-issue":{"issue":"2"},"URL":"https:\/\/doi.org\/10.1109\/jstsp.2019.2902305","relation":{},"ISSN":["1932-4553","1941-0484"],"issn-type":[{"type":"print","value":"1932-4553"},{"type":"electronic","value":"1941-0484"}],"subject":[],"published":{"date-parts":[[2019,5]]}}}