{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T14:06:50Z","timestamp":1730297210068,"version":"3.28.0"},"reference-count":36,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,1,9]],"date-time":"2023-01-09T00:00:00Z","timestamp":1673222400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,1,9]],"date-time":"2023-01-09T00:00:00Z","timestamp":1673222400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,1,9]]},"DOI":"10.1109\/slt54892.2023.10023388","type":"proceedings-article","created":{"date-parts":[[2023,1,27]],"date-time":"2023-01-27T18:54:03Z","timestamp":1674845643000},"page":"620-625","source":"Crossref","is-referenced-by-count":2,"title":["Mutual Learning of Single- and Multi-Channel End-to-End Neural Diarization"],"prefix":"10.1109","author":[{"given":"Shota","family":"Horiguchi","sequence":"first","affiliation":[{"name":"Hitachi, Ltd.,Japan"}]},{"given":"Yuki","family":"Takashima","sequence":"additional","affiliation":[{"name":"Hitachi, Ltd.,Japan"}]},{"given":"Shinji","family":"Watanabe","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University,USA"}]},{"given":"Paola","family":"Garcia","sequence":"additional","affiliation":[{"name":"Johns Hopkins University,USA"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2017.2672401"},{"key":"ref2","first-page":"2632","article-title":"Multi-channel end-to-end speech 
recognition","author":"Ochiai","year":"2017","journal-title":"ICML"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8461639"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9054177"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-1428"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/icassp40776.2020.9054577"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2020-1602"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9746749"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2017.8268913"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/asru46091.2019.9003849"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9746876"},{"key":"ref12","doi-asserted-by":"crossref","first-page":"535","DOI":"10.1145\/1150402.1150464","article-title":"Model compression","author":"Bucilua","year":"2006","journal-title":"KDD"},{"article-title":"Distilling the knowledge in a neural network","volume-title":"NIPS Deep Learning and Representation Learning Workshop","author":"Hinton","key":"ref13"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2017.7953173"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-2432"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ISCSLP57327.2022.10038153"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU46091.2019.9003986"},{"key":"ref18","first-page":"5709","article-title":"On spatial features for supervised speech separation and its application to beamforming and robust 
ASR","author":"Wang","year":"2018","journal-title":"ICASSP"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2011.2125954"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/taslp.2022.3162080"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2014-432"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2018.8489456"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/icassp.2018.8461883"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2017-614"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-2517"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU46091.2019.9003776"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2019.8683892"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2017.7953163"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-2440"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053426"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-10706"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2021\/362"},{"key":"ref34","article-title":"MUSAN: A music, speech, and noise corpus","author":"Snyder","year":"2015","journal-title":"arXiv"},{"article-title":"Corpus of spontaneous Japanese: Its design and evaluation","volume-title":"ISCA & IEEE Workshop on Spontaneous Speech Processing and Recognition","author":"Maekawa","key":"ref35"},{"key":"ref36","article-title":"Adam: A method for stochastic optimization","author":"Kingma","year":"2015","journal-title":"ICLR"}],"event":{"name":"2022 IEEE Spoken Language Technology Workshop (SLT)","start":{"date-parts":[[2023,1,9]]},"location":"Doha, Qatar","end":{"date-parts":[[2023,1,12]]}},"container-title":["2022 IEEE Spoken Language 
Technology Workshop (SLT)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10022052\/10022330\/10023388.pdf?arnumber=10023388","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,2,13]],"date-time":"2024-02-13T08:38:40Z","timestamp":1707813520000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10023388\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,1,9]]},"references-count":36,"URL":"https:\/\/doi.org\/10.1109\/slt54892.2023.10023388","relation":{},"subject":[],"published":{"date-parts":[[2023,1,9]]}}}