{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,1]],"date-time":"2024-09-01T22:40:02Z","timestamp":1725230402584},"reference-count":79,"publisher":"Springer Science and Business Media LLC","issue":"12","license":[{"start":{"date-parts":[[2021,6,15]],"date-time":"2021-06-15T00:00:00Z","timestamp":1623715200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2021,6,15]],"date-time":"2021-06-15T00:00:00Z","timestamp":1623715200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Circuits Syst Signal Process"],"published-print":{"date-parts":[[2021,12]]},"DOI":"10.1007\/s00034-021-01753-2","type":"journal-article","created":{"date-parts":[[2021,6,15]],"date-time":"2021-06-15T21:02:17Z","timestamp":1623790937000},"page":"6067-6097","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":7,"title":["Multi-objective Approach to Speech Enhancement Using Tunable Q-Factor-based Wavelet Transform and ANN Techniques"],"prefix":"10.1007","volume":"40","author":[{"ORCID":"http:\/\/orcid.org\/0000-0002-7964-7485","authenticated-orcid":false,"given":"Tusar Kanti","family":"Dash","sequence":"first","affiliation":[]},{"given":"Sandeep Singh","family":"Solanki","sequence":"additional","affiliation":[]},{"given":"Ganapati","family":"Panda","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,6,15]]},"reference":[{"key":"1753_CR1","unstructured":"S. Ayat, M.T. Manzuri, R. Dianat, Wavelet based speech enhancement using a new thresholding algorithm, in Proceedings of 2004 International Symposium on Intelligent Multimedia, Video and Speech Processing, pp. 238\u2013241 (2004)"},{"issue":"12","key":"1753_CR2","doi-asserted-by":"publisher","first-page":"1620","DOI":"10.1016\/j.specom.2006.06.004","volume":"48","author":"M Bahoura","year":"2006","unstructured":"M. Bahoura, J. Rouat, Wavelet speech enhancement based on time-scale adaptation. Speech Commun. 48(12), 1620\u20131637 (2006)","journal-title":"Speech Commun."},{"key":"1753_CR3","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-74524-4","volume-title":"Fundamentals of Speech Enhancement","author":"J Benesty","year":"2018","unstructured":"J. Benesty, Fundamentals of Speech Enhancement (Springer, Berlin, 2018)"},{"key":"1753_CR4","doi-asserted-by":"publisher","first-page":"706","DOI":"10.1016\/j.compeleceng.2017.01.013","volume":"62","author":"A Bhowmick","year":"2017","unstructured":"A. Bhowmick, M. Chandra, Speech enhancement using voiced speech probability based wavelet decomposition. Comput. Electr. Eng. 62, 706\u2013718 (2017)","journal-title":"Comput. Electr. Eng."},{"issue":"4","key":"1753_CR5","doi-asserted-by":"publisher","first-page":"813","DOI":"10.1007\/s10772-017-9448-7","volume":"20","author":"A Bhowmick","year":"2017","unstructured":"A. Bhowmick, M. Chandra, A. Biswas, Speech enhancement using Teager energy operated ERB-like perceptual wavelet packet decomposition. Int. J. Speech Technol. 20(4), 813\u2013827 (2017)","journal-title":"Int. J. Speech Technol."},{"issue":"6","key":"1753_CR6","doi-asserted-by":"publisher","first-page":"1622","DOI":"10.1109\/78.765133","volume":"47","author":"B Carnero","year":"1999","unstructured":"B. Carnero, A. Drygajlo, Perceptual speech coding and enhancement using frame-synchronized fast wavelet packet transform algorithms. IEEE Trans. Signal Process. 47(6), 1622\u20131635 (1999)","journal-title":"IEEE Trans. Signal Process."},{"key":"1753_CR7","doi-asserted-by":"publisher","unstructured":"J. Chen, J. Benesty, Y. Huang, E.J Diethorn, Fundamentals of Noise Reduction. In: Benesty J., Sondhi M.M., Huang Y.A. (eds) Springer Handbook of Speech Processing. Springer Handbooks. Springer, Berlin, Heidelberg (2008). https:\/\/doi.org\/10.1007\/978-3-540-49127-9_43","DOI":"10.1007\/978-3-540-49127-9_43"},{"issue":"2\u20133","key":"1753_CR8","doi-asserted-by":"publisher","first-page":"125","DOI":"10.1023\/B:VLSI.0000015092.19005.62","volume":"36","author":"SH Chen","year":"2004","unstructured":"S.H. Chen, J.F. Wang, Speech enhancement using perceptual wavelet packet decomposition and Teager energy operator. J. VLSI Signal Process. Syst. Signal Image Video Technol. 36(2\u20133), 125\u2013139 (2004)","journal-title":"J. VLSI Signal Process. Syst. Signal Image Video Technol."},{"key":"1753_CR9","volume-title":"Evolutionary Algorithms for Solving Multi-Objective Problems","author":"CAC Coello","year":"2007","unstructured":"C.A.C. Coello, G.B. Lamont, D.A.V. Veldhuizen et al., Evolutionary Algorithms for Solving Multi-Objective Problems, vol. 5 (Springer, Berlin, 2007)"},{"key":"1753_CR10","doi-asserted-by":"crossref","unstructured":"C.C. Coello, M.S. Lechuga, MOPSO: A proposal for multiple objective particle swarm optimization, in Proceedings of the 2002 Congress on Evolutionary Computation. CEC\u201902 (Cat. No. 02TH8600), vol.\u00a02, pp. 1051\u20131056 (2002)","DOI":"10.1109\/CEC.2002.1004388"},{"issue":"2","key":"1753_CR11","doi-asserted-by":"publisher","first-page":"101","DOI":"10.1007\/s10772-010-9073-1","volume":"13","author":"K Daqrouq","year":"2010","unstructured":"K. Daqrouq, I.N. Abu-Isbeih, O. Daoud, E. Khalaf, An investigation of speech enhancement using wavelet filtering method. Int. J. Speech Technol. 13(2), 101\u2013115 (2010)","journal-title":"Int. J. Speech Technol."},{"issue":"12","key":"1753_CR12","first-page":"868","volume":"78","author":"TK Dash","year":"2019","unstructured":"T.K. Dash, S.S. Solanki, Investigation on the effect of the input features in the noise level classification of noisy speech. J. Sci. Ind. Res. 78(12), 868\u2013872 (2019)","journal-title":"J. Sci. Ind. Res."},{"key":"1753_CR13","doi-asserted-by":"publisher","first-page":"465","DOI":"10.1007\/s10470-019-01566-z","volume":"102","author":"TK Dash","year":"2020","unstructured":"T.K. Dash, S.S. Solanki, G. Panda, Improved phase aware speech enhancement using bio-inspired and ANN techniques. Analog Integr. Circ. Sig. Process 102, 465\u2013477 (2020)","journal-title":"Analog Integr. Circ. Sig. Process"},{"key":"1753_CR14","doi-asserted-by":"publisher","unstructured":"T.K. Dash, S.S. Solanki, G. Panda et al. Development of statistical estimators for speech enhancement using multi-objective grey wolf optimizer. Evol. Intel. 14, 767\u2013778 (2021). https:\/\/doi.org\/10.1007\/s12065-020-00446-0","DOI":"10.1007\/s12065-020-00446-0"},{"issue":"3","key":"1753_CR15","doi-asserted-by":"publisher","first-page":"572","DOI":"10.1109\/TASLP.2016.2641904","volume":"25","author":"CS Doire","year":"2017","unstructured":"C.S. Doire, M. Brookes, P.A. Naylor, C.M. Hicks, D. Betts, M.A. Dmour, S.H. Jensen, Single-channel online enhancement of speech corrupted by reverberation and noise. IEEE\/ACM Trans. Audio Speech Lang. Process. 25(3), 572\u2013587 (2017)","journal-title":"IEEE\/ACM Trans. Audio Speech Lang. Process."},{"issue":"3","key":"1753_CR16","doi-asserted-by":"publisher","first-page":"613","DOI":"10.1109\/18.382009","volume":"41","author":"DL Donoho","year":"1995","unstructured":"D.L. Donoho, De-noising by soft-thresholding. IEEE Trans. Inf. Theory 41(3), 613\u2013627 (1995)","journal-title":"IEEE Trans. Inf. Theory"},{"issue":"3","key":"1753_CR17","doi-asserted-by":"publisher","first-page":"425","DOI":"10.1093\/biomet\/81.3.425","volume":"81","author":"DL Donoho","year":"1994","unstructured":"D.L. Donoho, J.M. Johnstone, Ideal spatial adaptation by wavelet shrinkage. Biometrika 81(3), 425\u2013455 (1994)","journal-title":"Biometrika"},{"key":"1753_CR18","doi-asserted-by":"crossref","unstructured":"J.S. Garofolo, L.F. Lamel, W.M. Fisher, J.G. Fiscus, D.S. Pallett, DARPA TIMIT acoustic-phonetic continuous speech corpus CD-ROM. NIST speech disc 1-1.1. NASA STI\/Recon technical report n 93 (1993)","DOI":"10.6028\/NIST.IR.4930"},{"issue":"6","key":"1753_CR19","first-page":"399","volume":"60","author":"D Giannoulis","year":"2012","unstructured":"D. Giannoulis, M. Massberg, J.D. Reiss, Digital dynamic range compressor design\u2014a tutorial and analysis. J. Audio Eng. Soc. 60(6), 399\u2013408 (2012)","journal-title":"J. Audio Eng. Soc."},{"key":"1753_CR20","doi-asserted-by":"publisher","unstructured":"M.M. Goodwin, The STFT, Sinusoidal Models, and Speech Modification. In: Benesty J., Sondhi M.M., Huang Y.A. (eds) Springer Handbook of Speech Processing. Springer Handbooks. Springer, Berlin, Heidelberg (2008). https:\/\/doi.org\/10.1007\/978-3-540-49127-9_12","DOI":"10.1007\/978-3-540-49127-9_12"},{"key":"1753_CR21","doi-asserted-by":"publisher","unstructured":"V. Grancharov, W. Kleijn, Speech Quality Assessment. In: J. Benesty, M.M. Sondhi, Y.A. Huang (eds) Springer Handbook of Speech Processing. Springer Handbooks. Springer, Berlin, Heidelberg. (2008). https:\/\/doi.org\/10.1007\/978-3-540-49127-9_5","DOI":"10.1007\/978-3-540-49127-9_5"},{"key":"1753_CR22","unstructured":"G. Grindlay, Blind Dereverberation of Audio Signals. E4810 Final Project, University of Columbia (2008)"},{"key":"1753_CR23","unstructured":"H.G. Hirsch, D. Pearce, The Aurora experimental framework for the performance evaluation of speech recognition systems under noisy conditions, in ASR2000-Automatic Speech Recognition: Challenges for the new Millenium ISCA Tutorial and Research Workshop (ITRW) (2000)"},{"issue":"1","key":"1753_CR24","doi-asserted-by":"publisher","first-page":"59","DOI":"10.1109\/TSA.2003.819949","volume":"12","author":"Y Hu","year":"2004","unstructured":"Y. Hu, P.C. Loizou, Speech enhancement based on wavelet thresholding the multitaper spectrum. IEEE Trans. Speech Audio Process. 12(1), 59\u201367 (2004)","journal-title":"IEEE Trans. Speech Audio Process."},{"key":"1753_CR25","doi-asserted-by":"crossref","unstructured":"Y. Hu, P.C. Loizou, Evaluation of objective measures for speech enhancement, in Ninth International Conference on Spoken Language Processing (2006)","DOI":"10.21437\/Interspeech.2006-84"},{"issue":"1","key":"1753_CR26","doi-asserted-by":"publisher","first-page":"229","DOI":"10.1109\/TASL.2007.911054","volume":"16","author":"Y Hu","year":"2007","unstructured":"Y. Hu, P.C. Loizou, Evaluation of objective quality measures for speech enhancement. IEEE Trans. Audio Speech Lang. Process. 16(1), 229\u2013238 (2007)","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"issue":"1","key":"1753_CR27","doi-asserted-by":"publisher","first-page":"229","DOI":"10.1109\/TASL.2007.911054","volume":"16","author":"Y Hu","year":"2008","unstructured":"Y. Hu, P.C. Loizou, Evaluation of objective quality measures for speech enhancement. IEEE Trans. Audio Speech Lang. Process. 16(1), 229\u2013238 (2008)","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"key":"1753_CR28","first-page":"1","volume":"5","author":"J Indra","year":"2020","unstructured":"J. Indra, R.K. Shankar, N. Kasthuri, S.G. Manjuri, A modified tunable-Q wavelet transform approach for tamil speech enhancement. IETE J. Res. 5, 1\u201314 (2020)","journal-title":"IETE J. Res."},{"issue":"4","key":"1753_CR29","doi-asserted-by":"publisher","first-page":"445","DOI":"10.1007\/s11265-019-01480-7","volume":"92","author":"MS Islam","year":"2020","unstructured":"M.S. Islam, T.H.A. Mahmud, W.U. Khan, Z. Ye, Supervised single channel speech enhancement based on stationary wavelet transforms and non-negative matrix factorization with concatenated framing process and subband smooth ratio mask. J. Signal Process. Syst. 92(4), 445\u2013458 (2020)","journal-title":"J. Signal Process. Syst."},{"key":"1753_CR30","doi-asserted-by":"crossref","unstructured":"M.T. Islam, C. Shahnaz, W.P. Zhu, M.O. Ahmad, Speech enhancement based on student $$t$$ modeling of Teager energy operated perceptual wavelet packet coefficients and a custom thresholding function. IEEE\/ACM Trans. Audio Speech Langu. Process. 23(11), 1800\u20131811 (2015)","DOI":"10.1109\/TASLP.2015.2443983"},{"key":"1753_CR31","unstructured":"M. Jeub, M. Jeub (2020) Blind Reverberation Time Estimation (https:\/\/www.mathworks.com\/matlabcentral\/fileexchange\/35740-blind-reverberation-time-estimation). MATLAB Central File Exchange. https:\/\/www.mathworks.com\/matlabcentral\/fileexchange\/35740-blind-reverberation-time-estimation"},{"issue":"2","key":"1753_CR32","doi-asserted-by":"publisher","first-page":"123","DOI":"10.1016\/j.specom.2006.12.002","volume":"49","author":"MT Johnson","year":"2007","unstructured":"M.T. Johnson, X. Yuan, Y. Ren, Speech signal enhancement through adaptive wavelet thresholding. Speech Commun. 49(2), 123\u2013133 (2007)","journal-title":"Speech Commun."},{"key":"1753_CR33","doi-asserted-by":"crossref","unstructured":"J. Kennedy, Particle swarm optimization, Encyclopedia Mach. Learning (2010) 4, 760\u2013766","DOI":"10.1007\/978-0-387-30164-8_630"},{"issue":"1","key":"1753_CR34","doi-asserted-by":"publisher","first-page":"873204","DOI":"10.1155\/2008\/873204","volume":"2008","author":"K Khaldi","year":"2008","unstructured":"K. Khaldi, A.O. Boudraa, A. Bouchikhi, M.T.H. Alouane, Speech enhancement via EMD. EURASIP J. Adv. Signal Process. 2008(1), 873204 (2008)","journal-title":"EURASIP J. Adv. Signal Process."},{"issue":"2","key":"1753_CR35","doi-asserted-by":"publisher","first-page":"643","DOI":"10.1007\/s00034-018-0873-x","volume":"38","author":"BK Khonglah","year":"2019","unstructured":"B.K. Khonglah, A. Dey, S.M. Prasanna, Speech enhancement using source information for phoneme recognition of speech with background music. Circuits Syst. Signal Process. 38(2), 643\u2013663 (2019)","journal-title":"Circuits Syst. Signal Process."},{"issue":"3","key":"1753_CR36","doi-asserted-by":"publisher","first-page":"1415","DOI":"10.1121\/1.3179673","volume":"126","author":"U Kjems","year":"2009","unstructured":"U. Kjems, J.B. Boldt, M.S. Pedersen, T. Lunner, D. Wang, Role of mask pattern in intelligibility of ideal binary-masked noisy speech. J. Acousti. Soc. Am. 126(3), 1415\u20131426 (2009)","journal-title":"J. Acousti. Soc. Am."},{"key":"1753_CR37","doi-asserted-by":"publisher","DOI":"10.1002\/9781118393550","volume-title":"An Introduction to Audio Content Analysis: Applications in Signal Processing and Music Informatics","author":"A Lerch","year":"2012","unstructured":"A. Lerch, An Introduction to Audio Content Analysis: Applications in Signal Processing and Music Informatics (Wiley-IEEE Press, New York, 2012)"},{"issue":"11","key":"1753_CR38","doi-asserted-by":"publisher","first-page":"5005","DOI":"10.1007\/s00034-018-0798-4","volume":"37","author":"ZX Li","year":"2018","unstructured":"Z.X. Li, L.R. Dai, Y. Song, I. McLoughlin, A conditional generative model for speech enhancement. Circuits Syst. Signal Process. 37(11), 5005\u20135022 (2018)","journal-title":"Circuits Syst. Signal Process."},{"key":"1753_CR39","doi-asserted-by":"publisher","first-page":"588","DOI":"10.1016\/j.specom.2006.12.006","volume":"49","author":"P Loizou","year":"2007","unstructured":"P. Loizou, NOIZEUS: a noisy speech corpus for evaluation of speech enhancement algorithms. Speech Commun. 49, 588\u2013601 (2007)","journal-title":"Speech Commun."},{"key":"1753_CR40","doi-asserted-by":"publisher","DOI":"10.1201\/9781420015836","volume-title":"Speech Enhancement: Theory and Practice","author":"PC Loizou","year":"2007","unstructured":"P.C. Loizou, Speech Enhancement: Theory and Practice (CRC Press, Cambridge, 2007)"},{"key":"1753_CR41","doi-asserted-by":"publisher","unstructured":"P.C. Loizou, Speech Quality Assessment. In: W. Lin, D. Tao, J. Kacprzyk, Z. Li , E. Izquierdo, H. Wang (eds) Multimedia Analysis, Processing and Communications. Studies in Computational Intelligence, vol 346. Springer, Berlin, Heidelberg (2011). https:\/\/doi.org\/10.1007\/978-3-642-19551-8_23","DOI":"10.1007\/978-3-642-19551-8_23"},{"issue":"1","key":"1753_CR42","doi-asserted-by":"publisher","first-page":"47","DOI":"10.1109\/TASL.2010.2045180","volume":"19","author":"PC Loizou","year":"2011","unstructured":"P.C. Loizou, G. Kim, Reasons why current speech-enhancement algorithms do not improve speech intelligibility and suggested solutions. IEEE Trans. Audio Speech Lang. Process. 19(1), 47\u201356 (2011)","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"key":"1753_CR43","unstructured":"H. L\u00f6llmann, E. Yilmaz, M. Jeub, P. Vary, An improved algorithm for blind reverberation time estimation, in Proceedings of International Workshop on Acoustic Echo and Noise Control (IWAENC), pp. 1\u20134 (2010)"},{"issue":"2\u20133","key":"1753_CR44","doi-asserted-by":"publisher","first-page":"409","DOI":"10.1016\/S0167-6393(03)00011-6","volume":"41","author":"CT Lu","year":"2003","unstructured":"C.T. Lu, H.C. Wang, Enhancement of single channel speech based on masking property and wavelet transform. Speech Commun. 41(2\u20133), 409\u2013427 (2003)","journal-title":"Speech Commun."},{"issue":"3","key":"1753_CR45","doi-asserted-by":"publisher","first-page":"340","DOI":"10.1016\/j.specom.2010.10.005","volume":"53","author":"J Ma","year":"2011","unstructured":"J. Ma, P.C. Loizou, SNR loss: a new objective measure for predicting the intelligibility of noise-suppressed speech. Speech Commun. 53(3), 340\u2013354 (2011)","journal-title":"Speech Commun."},{"issue":"3","key":"1753_CR46","doi-asserted-by":"publisher","first-page":"6800","DOI":"10.1016\/j.eswa.2008.08.008","volume":"36","author":"R Majhi","year":"2009","unstructured":"R. Majhi, G. Panda, G. Sahoo, Development and performance evaluation of FLANN based model for forecasting of stock markets. Expert Syst. Appl. 36(3), 6800\u20136808 (2009)","journal-title":"Expert Syst. Appl."},{"key":"1753_CR47","doi-asserted-by":"publisher","unstructured":"P. Malathi, G.R. Suresh, M. Moorthi et al. Speech Enhancement via Smart Larynx of Variable Frequency for Laryngectomee Patient for Tamil Language Syllables Using RADWT Algorithm. Circuits Syst Signal Process 38, 4202\u20134228 (2019). https:\/\/doi.org\/10.1007\/s00034-019-01055-8","DOI":"10.1007\/s00034-019-01055-8"},{"key":"1753_CR48","doi-asserted-by":"publisher","first-page":"286","DOI":"10.1016\/j.energy.2019.01.087","volume":"172","author":"H Mofid","year":"2019","unstructured":"H. Mofid, H. Jazayeri-Rad, M. Shahbazian, A. Fetanat, Enhancing the performance of a parallel nitrogen expansion liquefaction process (NELP) using the multi-objective particle swarm optimization (MOPSO) algorithm. Energy 172, 286\u2013303 (2019)","journal-title":"Energy"},{"key":"1753_CR49","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.swevo.2013.11.003","volume":"16","author":"SJ Nanda","year":"2014","unstructured":"S.J. Nanda, G. Panda, A survey on nature inspired metaheuristic algorithms for partitional clustering. Swarm Evolut. Comput. 16, 1\u201318 (2014)","journal-title":"Swarm Evolut. Comput."},{"key":"1753_CR50","doi-asserted-by":"crossref","unstructured":"A. Nishad, R.B. Pachori, Instantaneous fundamental frequency estimation of speech signals using tunable-$$Q$$ wavelet transform, in 2018 International Conference on Signal Processing and Communications (SPCOM), pp. 157\u2013161 (2018)","DOI":"10.1109\/SPCOM.2018.8724451"},{"key":"1753_CR51","unstructured":"K.K. Paliwal, L. Alsteris, Usefulness of phase in speech processing, in Proceedings IPSJ Spoken Language Processing Workshop, Gifu, Japan, pp. 1\u20136 (2003)"},{"key":"1753_CR52","unstructured":"Y.H. Pao, Adaptive pattern recognition and neuralnetwork. Addison-Wesley Publishing Company Int.; 1989"},{"issue":"2","key":"1753_CR53","doi-asserted-by":"publisher","first-page":"254","DOI":"10.1109\/3477.752797","volume":"29","author":"JC Patra","year":"1999","unstructured":"J.C. Patra, R.N. Pal, B.N. Chatterji, G. Panda, Identification of nonlinear dynamic systems using functional link artificial neural networks. IEEE Trans. Syst. Man Cybernet. Part B (cybernet) 29(2), 254\u2013262 (1999)","journal-title":"IEEE Trans. Syst. Man Cybernet. Part B (cybernet)"},{"issue":"6","key":"1753_CR54","doi-asserted-by":"publisher","first-page":"1134","DOI":"10.1016\/j.adhoc.2012.03.001","volume":"10","author":"PM Pradhan","year":"2012","unstructured":"P.M. Pradhan, G. Panda, Connectivity constrained wireless sensor deployment using multiobjective evolutionary algorithms and fuzzy decision making. Ad Hoc Netw. 10(6), 1134\u20131145 (2012)","journal-title":"Ad Hoc Netw."},{"key":"1753_CR55","volume-title":"Digital Processing of Speech Signals","author":"LR Rabiner","year":"1978","unstructured":"L.R. Rabiner, R.W. Schafer, Digital Processing of Speech Signals, vol. 100 (Prentice-Hall, Englewood Cliffs, 1978)"},{"key":"1753_CR56","unstructured":"I.T. Recommendation, Perceptual evaluation of speech quality (PESQ): An objective method for end-to-end speech quality assessment of narrow-band telephone networks and speech codecs. Rec. ITU-T P. 862 (2001)"},{"issue":"1","key":"1753_CR57","doi-asserted-by":"publisher","first-page":"316","DOI":"10.1121\/1.2932070","volume":"124","author":"Y Ren","year":"2008","unstructured":"Y. Ren, M.T. Johnson, J. Tao, Perceptually motivated wavelet packet transform for bioacoustic signal enhancement. J. Acoust. Soc. Am. 124(1), 316\u2013327 (2008)","journal-title":"J. Acoust. Soc. Am."},{"key":"1753_CR58","doi-asserted-by":"publisher","first-page":"255","DOI":"10.1016\/j.asoc.2018.10.022","volume":"74","author":"CO Sakar","year":"2019","unstructured":"C.O. Sakar, G. Serbes, A. Gunduz, H.C. Tunc, H. Nizam, B.E. Sakar, M. Tutuncu, T. Aydin, M.E. Isenkul, H. Apaydin, A comparative analysis of speech signal processing algorithms for Parkinson\u2019s disease classification and the use of the tunable Q-factor wavelet transform. Appl. Soft Comput. 74, 255\u2013263 (2019)","journal-title":"Appl. Soft Comput."},{"issue":"12","key":"1753_CR59","doi-asserted-by":"publisher","first-page":"2793","DOI":"10.1016\/j.sigpro.2010.10.018","volume":"91","author":"IW Selesnick","year":"2011","unstructured":"I.W. Selesnick, Resonance-based signal decomposition: a new sparsity-enabled signal analysis method. Sig. Process. 91(12), 2793\u20132809 (2011)","journal-title":"Sig. Process."},{"issue":"8","key":"1753_CR60","doi-asserted-by":"publisher","first-page":"3560","DOI":"10.1109\/TSP.2011.2143711","volume":"59","author":"IW Selesnick","year":"2011","unstructured":"I.W. Selesnick, Wavelet transform with tunable Q-factor. IEEE Trans. Signal Process. 59(8), 3560\u20133575 (2011)","journal-title":"IEEE Trans. Signal Process."},{"issue":"8","key":"1753_CR61","doi-asserted-by":"publisher","first-page":"2412","DOI":"10.1109\/TASL.2011.2136336","volume":"19","author":"GL Sicuranza","year":"2011","unstructured":"G.L. Sicuranza, A. Carini, A generalized FLANN filter for nonlinear active noise control. IEEE Trans. Audio Speech Lang. Process. 19(8), 2412\u20132417 (2011)","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"key":"1753_CR62","doi-asserted-by":"publisher","first-page":"102","DOI":"10.1016\/j.specom.2017.11.004","volume":"96","author":"R Soleymani","year":"2018","unstructured":"R. Soleymani, I.W. Selesnick, D.M. Landsberger, SEDA: a tunable Q-factor wavelet-based noise reduction algorithm for multi-talker babble. Speech Commun. 96, 102\u2013115 (2018)","journal-title":"Speech Commun."},{"key":"1753_CR63","unstructured":"C. Stedman, A matlab implementation of an audio compressor (2012), 2123\u20138227, http:\/\/hdl.handle.net\/2123\/8227"},{"key":"1753_CR64","first-page":"1135","volume":"5","author":"CM Stein","year":"1981","unstructured":"C.M. Stein, Estimation of the mean of a multivariate normal distribution. Ann. Stat. 5, 1135\u20131151 (1981)","journal-title":"Ann. Stat."},{"key":"1753_CR65","doi-asserted-by":"crossref","unstructured":"C.H. Taal, R.C. Hendriks, R. Heusdens, J. Jensen, A short-time objective intelligibility measure for time-frequency weighted noisy speech, in 2010 IEEE International Conference on Acoustics, Speech and Signal Processing, pp. 4214\u20134217 (2010)","DOI":"10.1109\/ICASSP.2010.5495701"},{"key":"1753_CR66","unstructured":"D.S. Trigueros, L. Meng, M. Hartnett, Face recognition: From traditional to deep learning methods. arXiv preprint arXiv:1811.00116 (2018)"},{"key":"1753_CR67","doi-asserted-by":"publisher","first-page":"106547","DOI":"10.1016\/j.knosys.2020.106547","volume":"211","author":"T Tuncer","year":"2021","unstructured":"T. Tuncer, S. Dogan, U.R. Acharya, Automated accurate speech emotion recognition system using twine shuffle pattern and iterative neighborhood component analysis techniques. Knowl. Based Syst. 211, 106547 (2021)","journal-title":"Knowl. Based Syst."},{"issue":"3","key":"1753_CR68","doi-asserted-by":"publisher","first-page":"247","DOI":"10.1016\/0167-6393(93)90095-3","volume":"12","author":"A Varga","year":"1993","unstructured":"A. Varga, H.J. Steeneken, Assessment for automatic speech recognition: II. NOISEX-92: a database and an experiment to study the effect of additive noise on speech recognition systems. Speech Commun. 12(3), 247\u2013251 (1993)","journal-title":"Speech Commun."},{"key":"1753_CR69","unstructured":"E. Vincent, MUSHRAM: a MATLAB interface for MUSHRA listening tests. http:\/\/www.elec.qmul.ac.uk\/people\/emmanuelv\/mushram (2005)"},{"key":"1753_CR70","doi-asserted-by":"crossref","unstructured":"W.D. Voiers, Interdependencies among measures of speech intelligility and speech Quality, in ICASSP\u201980. IEEE International Conference on Acoustics, Speech, and Signal Processing, vol.\u00a05, pp. 703\u2013705 (1980)","DOI":"10.1109\/ICASSP.1980.1170874"},{"key":"1753_CR71","unstructured":"E. Wan, A. Nelson, R. Peterson, Speech enhancement assessment resource (SPEAR) database. CSLU, Oregon Graduate Institute of Science and Technology, Beta version Release v1. 0 (2002)"},{"key":"1753_CR72","doi-asserted-by":"publisher","unstructured":"L. Wang, A. Cavallaro, \u201cDeep Learning Assisted Time-Frequency Processing for Speech Enhancement on Drones\u201d, in IEEE Transactions on Emerging Topics in Computational Intelligence, https:\/\/doi.org\/10.1109\/TETCI.2020.3014934.","DOI":"10.1109\/TETCI.2020.3014934."},{"key":"1753_CR73","doi-asserted-by":"publisher","first-page":"159","DOI":"10.1016\/j.physa.2014.01.020","volume":"400","author":"YH Wang","year":"2014","unstructured":"Y.H. Wang, C.H. Yeh, H.W.V. Young, K. Hu, M.T. Lo, On the computational complexity of the empirical mode decomposition algorithm. Physica A 400, 159\u2013167 (2014)","journal-title":"Physica A"},{"key":"1753_CR74","unstructured":"Y. Xi, L. Bing-wu, Y. Fang, Speech enhancement using bionic wavelet transform and adaptive threshold function, in 2010 Second International Conference on Computational Intelligence and Natural Computing, vol.\u00a01, pp. 265\u2013268 (2010)"},{"key":"1753_CR75","doi-asserted-by":"publisher","first-page":"336","DOI":"10.1016\/j.ijepes.2014.12.010","volume":"67","author":"A Zeinalzadeh","year":"2015","unstructured":"A. Zeinalzadeh, Y. Mohammadi, M.H. Moradi, Optimal multi objective placement and sizing of multiple DGs and shunt capacitor banks simultaneously considering load uncertainty via MOPSO approach. Int. J. Electr. Power Energy Syst. 67, 336\u2013349 (2015)","journal-title":"Int. J. Electr. Power Energy Syst."},{"key":"1753_CR76","doi-asserted-by":"crossref","unstructured":"Y. Zhao, B. Xu, R. Giri, T. Zhang, Perceptually guided speech enhancement using deep neural networks, in 2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 5074\u20135078 (2018)","DOI":"10.1109\/ICASSP.2018.8462593"},{"issue":"1","key":"1753_CR77","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1109\/TASLP.2018.2870742","volume":"27","author":"N Zheng","year":"2018","unstructured":"N. Zheng, X.L. Zhang, Phase-aware speech enhancement based on deep neural networks. IEEE\/ACM Trans. Audio Speech Lang. Process. 27(1), 63\u201376 (2018)","journal-title":"IEEE\/ACM Trans. Audio Speech Lang. Process."},{"issue":"4","key":"1753_CR78","doi-asserted-by":"publisher","first-page":"265","DOI":"10.1016\/j.jfds.2017.05.001","volume":"2","author":"G Zhong","year":"2016","unstructured":"G. Zhong, L.N. Wang, X. Ling, J. Dong, An overview on data representation learning: from traditional feature learning to recent deep learning. J. Finance Data Sci. 2(4), 265\u2013278 (2016)","journal-title":"J. Finance Data Sci."},{"key":"1753_CR79","doi-asserted-by":"publisher","DOI":"10.1002\/9780470680018","volume-title":"Digital Audio Signal Processing","author":"U Z\u00f6lzer","year":"2008","unstructured":"U. Z\u00f6lzer, Digital Audio Signal Processing (Wiley, New York, 2008)"}],"container-title":["Circuits, Systems, and Signal Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00034-021-01753-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00034-021-01753-2\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00034-021-01753-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,1]],"date-time":"2024-09-01T21:45:17Z","timestamp":1725227117000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00034-021-01753-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,6,15]]},"references-count":79,"journal-issue":{"issue":"12","published-print":{"date-parts":[[2021,12]]}},"alternative-id":["1753"],"URL":"https:\/\/doi.org\/10.1007\/s00034-021-01753-2","relation":{},"ISSN":["0278-081X","1531-5878"],"issn-type":[{"type":"print","value":"0278-081X"},{"type":"electronic","value":"1531-5878"}],"subject":[],"published":{"date-parts":[[2021,6,15]]},"assertion":[{"value":"16 June 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 May 2021","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 May 2021","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 June 2021","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}