{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,23]],"date-time":"2024-10-23T10:17:03Z","timestamp":1729678623209,"version":"3.28.0"},"reference-count":27,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,3]]},"DOI":"10.1109\/icassp.2016.7472172","type":"proceedings-article","created":{"date-parts":[[2016,6,23]],"date-time":"2016-06-23T21:58:30Z","timestamp":1466719110000},"page":"2722-2726","source":"Crossref","is-referenced-by-count":39,"title":["Improved speaker independent lip reading using speaker adaptive training and deep neural networks"],"prefix":"10.1109","author":[{"given":"Ibrahim","family":"Almajai","sequence":"first","affiliation":[]},{"given":"Stephen","family":"Cox","sequence":"additional","affiliation":[]},{"given":"Richard","family":"Harvey","sequence":"additional","affiliation":[]},{"given":"Yuxuan","family":"Lan","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","first-page":"689","article-title":"Multimodal deep learning","author":"ngiam","year":"2011","journal-title":"Proceedings of the 28th International Conference on Machine Learning"},{"key":"ref11","first-page":"7596","article-title":"Audio-visual deep learning for noise robust speech recognition","author":"jing","year":"2013","journal-title":"Acoustics Speech and Signal Processing (ICASSP) 2013 IEEE International Conference on"},{"key":"ref12","article-title":"Multimodal transfer deep learning for audio visual recognition","author":"moon","year":"2014","journal-title":"arXiv preprint arXiv 1412 3121"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178347"},{"key":"ref14","doi-asserted-by":"crossref","first-page":"722","DOI":"10.1007\/s10489-014-0629-7","article-title":"Audio-visual speech recognition using deep learning","volume":"42","author":"kuniaki","year":"2015","journal-title":"Applied Intelligence"},{"article-title":"Improving lip-reading performance for robust audiovisual speech recognition using dnns","year":"2015","author":"thangthai","key":"ref15"},{"key":"ref16","first-page":"661","article-title":"Maximum likelihood modeling with gaussian distributions for classification","volume":"2","author":"ramesh","year":"1998","journal-title":"Proceedings of the IEEE International Conference on Acoustics Speech and Signal Processing"},{"key":"ref17","doi-asserted-by":"crossref","first-page":"1306","DOI":"10.1109\/JPROC.2003.817150","article-title":"Re-cent advances in the automatic recognition of audiovisual speech","volume":"91","author":"potamianos","year":"2003","journal-title":"Proceedings of the IEEE"},{"key":"ref18","article-title":"Improved feature processing for Deep Neural Networks","author":"shakti","year":"2013","journal-title":"Proc of Interspeech"},{"key":"ref19","first-page":"7","article-title":"Improving visual features for lip-reading","author":"lan","year":"2010","journal-title":"AVSPN"},{"key":"ref4","article-title":"Audio-visual automatic speech recognition: An overview","author":"potamianos","year":"2004","journal-title":"Issues in Visual and Audio-Visual Speech Processing"},{"key":"ref27","doi-asserted-by":"crossref","first-page":"1405","DOI":"10.3758\/BF03212142","article-title":"Effects of talker variability on speechread-ing","volume":"62","author":"deborah","year":"2000","journal-title":"Perception & Psychophysics"},{"key":"ref3","first-page":"179","article-title":"The challenge of multispeaker lip-reading","author":"cox","year":"2008","journal-title":"International Conference on Auditory-Visual Speech Processing"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2013.173"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2012.6288999"},{"key":"ref8","first-page":"89010","article-title":"Recent developments in automated lipreading","volume":"8901","author":"bowden","year":"2013"},{"key":"ref7","article-title":"Re-source management rml 2.0","author":"price","year":"1993","journal-title":"Linguistic Data Consortium Philadelphia"},{"key":"ref2","first-page":"881","article-title":"Automatic lipreading with limited training data","volume":"3","author":"shi-lin","year":"2006","journal-title":"Pattern Recognition 2006 ICPR 2006 18th International Conference on"},{"key":"ref9","doi-asserted-by":"crossref","first-page":"82","DOI":"10.1109\/MSP.2012.2205597","article-title":"Deep neural networks for acoustic modeling in speech recognition: The shared views of four research groups","volume":"29","author":"geoffrey","year":"2012","journal-title":"Signal Processing Magazine IEEE"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/34.982900"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICME.2012.192"},{"journal-title":"The HTK Book (Version 3 2 1)","year":"2002","author":"young","key":"ref22"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2009.5459283"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1044\/jshr.1104.796"},{"key":"ref23","first-page":"1","article-title":"The Kaldi speech recognition toolkit","author":"povey","year":"2011","journal-title":"Proc ASRU"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1997.596119"},{"journal-title":"Confusion modelling for lip-reading","year":"2015","author":"howell","key":"ref25"}],"event":{"name":"2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","start":{"date-parts":[[2016,3,20]]},"location":"Shanghai","end":{"date-parts":[[2016,3,25]]}},"container-title":["2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7465907\/7471614\/07472172.pdf?arnumber=7472172","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,24]],"date-time":"2017-06-24T13:00:25Z","timestamp":1498309225000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7472172\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,3]]},"references-count":27,"URL":"https:\/\/doi.org\/10.1109\/icassp.2016.7472172","relation":{},"subject":[],"published":{"date-parts":[[2016,3]]}}}