{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,8]],"date-time":"2024-09-08T14:51:24Z","timestamp":1725807084161},"reference-count":25,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017,3]]},"DOI":"10.1109\/icassp.2017.7953215","type":"proceedings-article","created":{"date-parts":[[2017,6,20]],"date-time":"2017-06-20T17:35:36Z","timestamp":1497980136000},"page":"5535-5539","source":"Crossref","is-referenced-by-count":30,"title":["Non-parallel voice conversion using i-vector PLDA: towards unifying speaker verification and transformation"],"prefix":"10.1109","author":[{"given":"Tomi","family":"Kinnunen","sequence":"first","affiliation":[]},{"given":"Lauri","family":"Juvela","sequence":"additional","affiliation":[]},{"given":"Paavo","family":"Alku","sequence":"additional","affiliation":[]},{"given":"Junichi","family":"Yamagishi","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","first-page":"879","article-title":"A study of speaker adaptation for DNN-based speech synthesis","author":"wu","year":"2015","journal-title":"Proc INTERSPEECH"},{"key":"ref11","first-page":"5120","author":"qian","year":"2011","journal-title":"A frame mapping based HMM approach to cross-lingual voice transformation"},{"key":"ref12","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2008-419","article-title":"On the impact of alignment on voice conversion performance","author":"helander","year":"2008","journal-title":"Proc INTERSPEECH"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TSA.2005.857790"},{"key":"ref14","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2006-613","article-title":"Eigenvoice conversion based on gaussian mixture model","author":"toda","year":"2006","journal-title":"Proc INTERSPEECH"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2012.2225615"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2016.2593263"},{"key":"ref17","article-title":"A small footprint i-vector extractor","author":"kenny","year":"2012","journal-title":"Odyssey 2012 The Speaker and Language Recognition Workshop"},{"key":"ref18","article-title":"VB calibration to improve the interface between phone recognizer and i-vector extractor","author":"br\u00fcmmer","year":"2015","journal-title":"ArXiv e-prints"},{"key":"ref19","article-title":"Joint factor analysis of speaker and session variability: theory and algorithms","author":"kenny","year":"2006","journal-title":"Technical Report CRIM-06\/08-14"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2006.1660175"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/89.661472"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2010.2064307"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1006\/dspr.1999.0361"},{"key":"ref8","first-page":"14","article-title":"Bayesian speaker verification with heavy-tailed priors","author":"kenny","year":"2010","journal-title":"Odyssey 2010 The Speaker and Language Recognition Workshop"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2007.4409052"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2009.08.009"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2009.4960401"},{"key":"ref9","first-page":"34","article-title":"The speaker partitioning problem","author":"br\u00fcmmer","year":"2010","journal-title":"Odyssey 2010 The Speaker and Language Recognition Workshop"},{"key":"ref20","first-page":"464","article-title":"Unifying probabilistic linear discriminant analysis variants in biometric authentication","author":"sizov","year":"2014","journal-title":"Structural Syntactic and Statistical Pattern Recognition-Joint IAPR InternationalWorkshop S+sspr 2014"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/PROC.1975.9792"},{"journal-title":"Perceptual spectral matching utilizing mel-scale filterbanks for statistical parametric speech synthesis with glottal excitation vocoder","year":"2015","author":"juvela","key":"ref21"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICSES.2008.4673475"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2005.10.004"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2006.870086"}],"event":{"name":"2017 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","start":{"date-parts":[[2017,3,5]]},"location":"New Orleans, LA","end":{"date-parts":[[2017,3,9]]}},"container-title":["2017 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7943262\/7951776\/07953215.pdf?arnumber=7953215","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,23]],"date-time":"2023-08-23T23:11:20Z","timestamp":1692832280000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7953215\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,3]]},"references-count":25,"URL":"https:\/\/doi.org\/10.1109\/icassp.2017.7953215","relation":{},"subject":[],"published":{"date-parts":[[2017,3]]}}}