{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,4]],"date-time":"2024-09-04T11:43:42Z","timestamp":1725450222498},"reference-count":40,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2013,1,9]],"date-time":"2013-01-09T00:00:00Z","timestamp":1357689600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/2.0"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["J AUDIO SPEECH MUSIC PROC."],"published-print":{"date-parts":[[2013,12]]},"DOI":"10.1186\/1687-4722-2013-1","type":"journal-article","created":{"date-parts":[[2013,1,9]],"date-time":"2013-01-09T16:21:05Z","timestamp":1357748465000},"source":"Crossref","is-referenced-by-count":151,"title":["Context-dependent sound event detection"],"prefix":"10.1186","volume":"2013","author":[{"given":"Toni","family":"Heittola","sequence":"first","affiliation":[]},{"given":"Annamaria","family":"Mesaros","sequence":"additional","affiliation":[]},{"given":"Antti","family":"Eronen","sequence":"additional","affiliation":[]},{"given":"Tuomas","family":"Virtanen","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2013,1,9]]},"reference":[{"key":"70_CR1","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1007\/s007790170019","volume":"5","author":"AK Dey","year":"2001","unstructured":"Dey AK: Understanding and using context. Person. Ubiquit Comput 2001, 5: 4-7. 10.1007\/s007790170019","journal-title":"Ubiquit Comput"},{"key":"70_CR2","doi-asserted-by":"publisher","DOI":"10.1109\/9780470043387","volume-title":"Computational Auditory Scene Analysis: Principles, Algorithms, and Applications","author":"D Wang","year":"2006","unstructured":"Wang D, Brown GJ: Computational Auditory Scene Analysis: Principles, Algorithms, and Applications. Wiley-IEEE Press, New York; 2006."},{"issue":"3","key":"70_CR3","doi-asserted-by":"publisher","first-page":"1026","DOI":"10.1109\/TSA.2005.857575","volume":"14","author":"R Cai","year":"2006","unstructured":"Cai R, Lu L, Hanjalic A, Zhang H, Cai LH: A flexible framework for key audio effects detection and auditory context inference. IEEE Trans. Audio Speech Lang. Process 2006, 14(3):1026-1039.","journal-title":"IEEE Trans. Audio Speech Lang. Process"},{"issue":"2","key":"70_CR4","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/1352012.1352015","volume":"4","author":"M Xu","year":"2008","unstructured":"Xu M, Xu C, Duan L, Jin JS, Luo S: Audio keywords generation for sports video analysis. ACM Trans. Multimed. Comput. Commun. Appl 2008, 4(2):1-23.","journal-title":"ACM Trans. Multimed. Comput. Commun. Appl"},{"key":"70_CR5","doi-asserted-by":"publisher","first-page":"1218","DOI":"10.1109\/ICME.2009.5202720","volume-title":"IEEE International Conference on Multimedia and Expo, 2009. ICME 2009","author":"Y Peng","year":"2009","unstructured":"Peng Y, Lin C, Sun M, Tsai K: Healthcare audio event classification using hidden Markov models and hierarchical hidden Markov models. In IEEE International Conference on Multimedia and Expo, 2009. ICME 2009. IEEE Computer Society, New York, NY, USA; 2009:1218-1221."},{"key":"70_CR6","first-page":"634","volume-title":"IEEE International Conference on Multimedia and Expo","author":"A H\u00e4rm\u00e4","year":"2005","unstructured":"H\u00e4rm\u00e4 A, McKinney MF, Skowronek J: Automatic surveillance of the acoustic activity in our living environment. In IEEE International Conference on Multimedia and Expo. IEEE Computer Society, Amsterdam Netherlands; 2005:634-637."},{"key":"70_CR7","first-page":"165","volume-title":"IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP \u201909","author":"S Ntalampiras","year":"2009","unstructured":"Ntalampiras S, Potamitis I, Fakotakis N: On acoustic surveillance of hazardous situations. In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP \u201909. IEEE Computer Society, Washington, DC, USA; 2009:165-168."},{"issue":"6","key":"70_CR8","doi-asserted-by":"publisher","first-page":"1142","DOI":"10.1109\/TASL.2009.2017438","volume":"17","author":"S Chu","year":"2009","unstructured":"Chu S, Narayanan S, Kuo CCJ: Environmental sound recognition with time-frequency audio features. IEEE Trans. Audio Speech Lang. Process 2009, 17(6):1142-1158.","journal-title":"IEEE Trans. Audio Speech Lang. Process"},{"key":"70_CR9","first-page":"1272","volume-title":"18th European Signal Processing Conference","author":"T Heittola","year":"2010","unstructured":"Heittola T, Mesaros A, Eronen A, Virtanen T: Audio context recognition using audio event histograms. In 18th European Signal Processing Conference. Aalborg, Denmark; 2010:1272-1276."},{"key":"70_CR10","doi-asserted-by":"publisher","first-page":"99","DOI":"10.1109\/ESPA.2012.6152455","volume-title":"2012 IEEE International Conference on Emerging Signal Processing Applications (ESPA)","author":"M Shah","year":"2012","unstructured":"Shah M, Mears B, Chakrabarti C, Spanias A: Lifelogging: archival and retrieval of continuously recorded audio using wearable devices. In 2012 IEEE International Conference on Emerging Signal Processing Applications (ESPA). IEEE Computer Society, Las Vegas, NV, USA; 2012:99-102."},{"issue":"3","key":"70_CR11","doi-asserted-by":"publisher","first-page":"688","DOI":"10.1109\/TASL.2010.2041384","volume":"18","author":"G Wichern","year":"2010","unstructured":"Wichern G, Xue J, Thornburg H, Mechtley B, Spanias A: Segmentation, indexing, and retrieval for environmental and natural sounds. IEEE Trans. Audio Speech Lang. Process 2010, 18(3):688-707.","journal-title":"IEEE Trans. Audio Speech Lang. Process"},{"key":"70_CR12","doi-asserted-by":"crossref","DOI":"10.7551\/mitpress\/1486.001.0001","volume-title":"Auditory Scene Analysis","author":"AS Bregman","year":"1990","unstructured":"Bregman AS: Auditory Scene Analysis. MIT Press, Cambridge MA; 1990."},{"issue":"7","key":"70_CR13","doi-asserted-by":"publisher","first-page":"280","DOI":"10.1016\/j.tics.2007.05.005","volume":"11","author":"M Bar","year":"2007","unstructured":"Bar M: The proactive brain: using analogies and associations to generate predictions. Trends Cogn. Sci 2007, 11(7):280-289. 10.1016\/j.tics.2007.05.005","journal-title":"Trends Cogn. Sci"},{"issue":"12","key":"70_CR14","doi-asserted-by":"publisher","first-page":"520","DOI":"10.1016\/j.tics.2007.09.009","volume":"11","author":"A Oliva","year":"2007","unstructured":"Oliva A, Torralba A: The role of context in object recognition. Trends Cogn. Sci 2007, 11(12):520-527. 10.1016\/j.tics.2007.09.009","journal-title":"Trends Cogn. Sci"},{"key":"70_CR15","first-page":"88","volume-title":"IEEE International Conference on Semantic Computing","author":"M Niessen","year":"2008","unstructured":"Niessen M, van Maanen L, Andringa T: Disambiguating sounds through context. In IEEE International Conference on Semantic Computing. IEEE Computer Society, Santa Clara, CA, USA; 2008:88-95."},{"key":"70_CR16","first-page":"1306","volume-title":"IEEE International Conference on Multimedia and Expo","author":"C Clavel","year":"2005","unstructured":"Clavel C, Ehrette T, Richard G: Events detection for an audio-based surveillance system. In IEEE International Conference on Multimedia and Expo. IEEE Computer Society, Los Alamitos, CA, USA; 2005:1306-1309."},{"key":"70_CR17","doi-asserted-by":"publisher","first-page":"56","DOI":"10.1109\/TFUZZ.2006.889760","volume":"15","author":"H Wu","year":"2007","unstructured":"Wu H, Mendel J: Classification of battlefield ground vehicles using acoustic features and fuzzy logic rule-based classifiers. IEEE Trans. Fuzzy Syst 2007, 15: 56-72.","journal-title":"IEEE Trans. Fuzzy Syst"},{"issue":"9","key":"70_CR18","doi-asserted-by":"publisher","first-page":"1319","DOI":"10.1109\/5.535250","volume":"84","author":"L Atlas","year":"1996","unstructured":"Atlas L, Bernard G, Narayanan S: Applications of time-frequency analysis to signals from manufacturing and machine monitoring sensors. Proc. IEEE 1996, 84(9):1319-1329. 10.1109\/5.535250","journal-title":"Proc. IEEE"},{"key":"70_CR19","doi-asserted-by":"publisher","first-page":"64","DOI":"10.1155\/2007\/38637","volume":"2007","author":"S Fagerlund","year":"2007","unstructured":"Fagerlund S, Bird species recognition using support vector machines: EURASIP J. Appl. Signal Process. 2007, 2007: 64-64.","journal-title":"EURASIP J. Appl. Signal Process"},{"key":"70_CR20","doi-asserted-by":"crossref","first-page":"2689","DOI":"10.21437\/Interspeech.2005-261","volume-title":"Proceedings of Interspeech","author":"F Kraft","year":"2005","unstructured":"Kraft F, Malkin R, Schaaf T, Waibel A: Temporal ICA for classification of acoustic events in a kitchen environment. In Proceedings of Interspeech. International Speech Communication Association, Lisboa, Portugal; 2005:2689-2692."},{"key":"70_CR21","doi-asserted-by":"publisher","first-page":"47","DOI":"10.1007\/11428572_4","volume-title":"Pervasive Computing","author":"J Chen","year":"2005","unstructured":"Chen J, Kam AH, Zhang J, Liu N, Shue L: Bathroom activity monitoring based on sound. In Pervasive Computing. Springer, Berlin; 2005:47-61."},{"issue":"4","key":"70_CR22","doi-asserted-by":"publisher","first-page":"682","DOI":"10.1016\/j.patcog.2005.11.005","volume":"39","author":"A Temko","year":"2006","unstructured":"Temko A, Nadeu C: Classification of acoustic events using SVM-based clustering schemes. Pattern Recognit 2006, 39(4):682-694. 10.1016\/j.patcog.2005.11.005","journal-title":"Pattern Recognit"},{"key":"70_CR23","first-page":"2272","volume-title":"IEEE International Conference on Acoustics, Speech and Signal Processing","author":"TH Dat","year":"2011","unstructured":"Dat TH, Li H: Probabilistic distance SVM with Hellinger-exponential kernel for sound event classification. In IEEE International Conference on Acoustics, Speech and Signal Processing. IEEE Computer Society, Prague, Czech Republic; 2011:2272-2275."},{"key":"70_CR24","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-68585-2","volume-title":"Multimodal Technologies for Perception of Humans: International Evaluation Workshops CLEAR 2007 and RT 2007","author":"R Stiefelhagen","year":"2008","unstructured":"Stiefelhagen R, Bowers R, Fiscus J(eds): Multimodal Technologies for Perception of Humans: International Evaluation Workshops CLEAR 2007 and RT 2007. Springer, Berlin Germany; 2008."},{"key":"70_CR25","doi-asserted-by":"publisher","first-page":"345","DOI":"10.1007\/978-3-540-68585-2_33","volume-title":"Multimodal Technologies for Perception of Humans: International Evaluation Workshops CLEAR 2007 and RT 2007","author":"X Zhou","year":"2008","unstructured":"Zhou X, Zhuang X, Liu M, Tang H, Hasegawa-Johnson M, Huang T: HMM-based acoustic event detection with AdaBoost feature selection. In Multimodal Technologies for Perception of Humans: International Evaluation Workshops CLEAR 2007 and RT 2007. Springer, Berlin, Germany; 2008:345-353."},{"issue":"12","key":"70_CR26","doi-asserted-by":"publisher","first-page":"1543","DOI":"10.1016\/j.patrec.2010.02.005","volume":"31","author":"X Zhuang","year":"2010","unstructured":"Zhuang X, Zhou X, Hasegawa-Johnson MA, Huang TS: Real-world acoustic event detection. Pattern Recognit. Lett. (Pattern Recognition of Non-Speech Audio) 2010, 31(12):1543-1551.","journal-title":"Pattern Recognit. Lett. (Pattern Recognition of Non-Speech Audio)"},{"key":"70_CR27","first-page":"1267","volume-title":"18th European Signal Processing Conference","author":"A Mesaros","year":"2010","unstructured":"Mesaros A, Heittola T, Eronen A, Virtanen T: Acoustic event detection in real-life recordings. In 18th European Signal Processing Conference. Aalborg, Denmark; 2010:1267-1271."},{"issue":"2","key":"70_CR28","doi-asserted-by":"publisher","first-page":"465","DOI":"10.1109\/TASL.2006.881694","volume":"15","author":"M Akbacak","year":"2007","unstructured":"Akbacak M, Hansen JHL: Environmental sniffing: noise knowledge estimation for robust speech systems. IEEE Trans. Audio Speech Lang. Process 2007, 15(2):465-477.","journal-title":"IEEE Trans. Audio Speech Lang. Process"},{"key":"70_CR29","first-page":"1307","volume-title":"19th European Signal Processing Conference","author":"A Mesaros","year":"2011","unstructured":"Mesaros A, Heittola H, Klapuri A: Latent semantic analysis in sound event detection. In 19th European Signal Processing Conference. Barcelona, Spain; 2011:1307-1311."},{"key":"70_CR30","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1109\/TSA.2005.854103","volume":"14","author":"A Eronen","year":"2006","unstructured":"Eronen A, Peltonen V, Tuomi J, Klapuri A, Fagerlund S, Sorsa T, Lorho G, Huopaniemi J: Audio-based context recognition. IEEE Trans. Audio Speech Lang. Process 2006, 14: 321-329.","journal-title":"IEEE Trans. Audio Speech Lang. Process"},{"issue":"2","key":"70_CR31","doi-asserted-by":"publisher","first-page":"881","DOI":"10.1121\/1.2750160","volume":"122","author":"JJ Aucouturier","year":"2007","unstructured":"Aucouturier JJ, Defr\u00e9ville B, Pacher F: The bag-of-frames approach to audio pattern recognition: a sufficient model for urban soundscapes but not for polyphonic music. J. Acoust. Soc. Am 2007, 122(2):881-891. 10.1121\/1.2750160","journal-title":"J. Acoust. Soc. Am"},{"issue":"4","key":"70_CR32","doi-asserted-by":"publisher","first-page":"596","DOI":"10.1109\/TMM.2008.921739","volume":"10","author":"R Cai","year":"2008","unstructured":"Cai R, Lu L, Hanjalic A: Co-clustering for auditory scene categorization. IEEE Trans. Multimed 2008, 10(4):596-606.","journal-title":"IEEE Trans. Multimed"},{"issue":"4","key":"70_CR33","doi-asserted-by":"publisher","first-page":"658","DOI":"10.1109\/TMM.2009.2017607","volume":"11","author":"L Lie","year":"2009","unstructured":"Lie L, Hanjalic A: Text-like segmentation of general audio for content-based retrieval. IEEE Trans. Multimed 2009, 11(4):658-669.","journal-title":"IEEE Trans. Multimed"},{"issue":"2","key":"70_CR34","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1109\/5.18626","volume":"77","author":"LR Rabiner","year":"1989","unstructured":"Rabiner LR: A tutorial on hidden Markov models and selected applications in speech recognition. Proc. IEEE 1989, 77(2):257-286. 10.1109\/5.18626","journal-title":"Proc. IEEE"},{"key":"70_CR35","doi-asserted-by":"publisher","first-page":"72","DOI":"10.1109\/89.365379","volume":"3","author":"D Reynolds","year":"1995","unstructured":"Reynolds D, Rose R: Robust text-independent speaker identification using Gaussian mixture speaker models. IEEE Trans. Speech Audio Process 1995, 3: 72-83. 10.1109\/89.365379","journal-title":"IEEE Trans. Speech Audio Process"},{"issue":"3","key":"70_CR36","doi-asserted-by":"publisher","first-page":"268","DOI":"10.1109\/PROC.1973.9030","volume":"61","author":"GD Forney","year":"1973","unstructured":"Forney GD: The Viterbi algorithm. Proc. IEEE 1973, 61(3):268-278.","journal-title":"Proc. IEEE"},{"key":"70_CR37","doi-asserted-by":"publisher","first-page":"319","DOI":"10.1109\/ASPAA.2005.1540233","volume-title":"Proceedings of the 2005 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics","author":"M Ryyn\u00e4nen","year":"2005","unstructured":"Ryyn\u00e4nen M, Klapuri A: Polyphonic music transcription using note event modeling. In Proceedings of the 2005 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics. IEEE Computer Society, New York, NY, USA; 2005:319-322."},{"key":"70_CR38","doi-asserted-by":"publisher","first-page":"61","DOI":"10.1007\/978-1-84882-054-8_7","volume-title":"Computers in the Human Interaction Loop","author":"A Temko","year":"2009","unstructured":"Temko A, Nadeu C, Macho D, Malkin R, Zieger C, Omologo M: Acoustic event detection and classification. In Computers in the Human Interaction Loop. Edited by: Waibel AH, Stiefelhagen R. Springer, New York; 2009:61-73."},{"key":"70_CR39","first-page":"996","volume-title":"Proceedings of the NAG\/DAGA Meeting 2009","author":"M Grootel","year":"2009","unstructured":"Grootel M, Andringa T, Krijnders J: DARES-G1: database of annotated real-world everyday sounds. In Proceedings of the NAG\/DAGA Meeting 2009. Rotterdam, Netherlands; 2009:996-999."},{"key":"70_CR40","first-page":"36","volume-title":"Workshop on Machine Listening in Multisource Environments, CHiME2011","author":"T Heittola","year":"2011","unstructured":"Heittola T, Mesaros A, Virtanen T, Eronen A: Sound event detection in multisource environments using source separation. In Workshop on Machine Listening in Multisource Environments, CHiME2011. Florence, Italy; 2011:36-40."}],"container-title":["EURASIP Journal on Audio, Speech, and Music Processing"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1186\/1687-4722-2013-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1687-4722-2013-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1687-4722-2013-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,2,5]],"date-time":"2022-02-05T15:36:52Z","timestamp":1644075412000},"score":1,"resource":{"primary":{"URL":"https:\/\/asmp-eurasipjournals.springeropen.com\/articles\/10.1186\/1687-4722-2013-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013,1,9]]},"references-count":40,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2013,12]]}},"alternative-id":["70"],"URL":"https:\/\/doi.org\/10.1186\/1687-4722-2013-1","relation":{},"ISSN":["1687-4722"],"issn-type":[{"value":"1687-4722","type":"electronic"}],"subject":[],"published":{"date-parts":[[2013,1,9]]},"article-number":"1"}}