{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,12,30]],"date-time":"2024-12-30T18:37:04Z","timestamp":1735583824152,"version":"3.28.0"},"reference-count":25,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,12]]},"DOI":"10.1109\/slt.2016.7846248","type":"proceedings-article","created":{"date-parts":[[2017,2,10]],"date-time":"2017-02-10T10:58:30Z","timestamp":1486724310000},"page":"76-82","source":"Crossref","is-referenced-by-count":24,"title":["Jointly learning to align and convert graphemes to phonemes with neural attention models"],"prefix":"10.1109","author":[{"given":"Shubham","family":"Toshniwal","sequence":"first","affiliation":[]},{"given":"Karen","family":"Livescu","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","article-title":"Bi-directional conversion between graphemes and phonemes using a joint n-gram model","author":"galescu","year":"2001","journal-title":"4th ITRW on Speech Synthesis"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2010.2098440"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1145\/1143844.1143891"},{"key":"ref13","article-title":"Sequence to Sequence Learning with Neural Networks","author":"sutskever","year":"2014","journal-title":"NIPS"},{"key":"ref14","article-title":"Generating Sequences with Recurrent Neural Networks","volume":"abs 1308 850","author":"graves","year":"2013","journal-title":"CoRR"},{"key":"ref15","article-title":"Recurrent Neural Network Regularization","volume":"abs 1409 2329","author":"zaremba","year":"2014","journal-title":"CoRR"},{"key":"ref16","article-title":"Grammar as a Foreign Language","author":"vinyals","year":"2015","journal-title":"NIPS"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D15-1166"},{"key":"ref18","first-page":"2121","article-title":"Adaptive Subgradient Methods for Online Learning and Stochastic Optimization","volume":"12","author":"duchi","year":"2011","journal-title":"JMLR"},{"key":"ref19","first-page":"1929","article-title":"Dropout: a simple way to prevent neural networks from overfitting","volume":"15","author":"nitish","year":"2014","journal-title":"JMLR"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref3","article-title":"Applying Many-to-Many Alignments and Hidden Markov Models to Letter-to-Phoneme Conversion","author":"jiampojamarn","year":"2007","journal-title":"NAACL-HLT"},{"key":"ref6","article-title":"Sequence-to-Sequence Neural Net Models for Grapheme-to-Phoneme Conversion","author":"yao","year":"2015","journal-title":"InterSpeech"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178767"},{"key":"ref8","article-title":"Listen, Attend and Spell","volume":"abs 1508 1211","author":"william","year":"2015","journal-title":"CoRR"},{"key":"ref7","article-title":"Neural Machine Translation by Jointly Learning to Align and Translate","volume":"abs 1409 473","author":"bahdanau","year":"2014","journal-title":"CoRR"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2008.01.002"},{"key":"ref9","article-title":"Show, Attend and Tell: Neural Image Caption Generation with Visual Attention","author":"xu","year":"2015","journal-title":"ICML"},{"key":"ref1","article-title":"Conditional and joint models for grapheme-to-phoneme conversion","author":"chen","year":"2003","journal-title":"Eurospeech"},{"key":"ref20","article-title":"Scheduled Sampling for Sequence Prediction with Recurrent Neural Networks","volume":"abs 1506 3099","author":"bengio","year":"2015","journal-title":"CoRR"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1179"},{"article-title":"TensorFlow: Large-scale machine learning on heterogeneous systems","year":"2015","author":"abadi","key":"ref21"},{"key":"ref24","first-page":"2579","article-title":"Visualizing data using t-SNE","volume":"9","author":"van der maaten","year":"2008","journal-title":"JMLR"},{"key":"ref23","article-title":"Coverage-based neural machine translation","volume":"abs 1601 4811","author":"tu","year":"2016","journal-title":"CoRR"},{"key":"ref25","first-page":"367","article-title":"G2P conversion of proper names using word origin information","author":"waxmonsky","year":"2012","journal-title":"Stroudsburg PA USA NAACL-HLT"}],"event":{"name":"2016 IEEE Spoken Language Technology Workshop (SLT)","start":{"date-parts":[[2016,12,13]]},"location":"San Diego, CA","end":{"date-parts":[[2016,12,16]]}},"container-title":["2016 IEEE Spoken Language Technology Workshop (SLT)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7836849\/7846230\/07846248.pdf?arnumber=7846248","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,7,25]],"date-time":"2017-07-25T15:30:00Z","timestamp":1500996600000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7846248\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,12]]},"references-count":25,"URL":"https:\/\/doi.org\/10.1109\/slt.2016.7846248","relation":{},"subject":[],"published":{"date-parts":[[2016,12]]}}}