J. Hershey, Jonathan Le Roux, Shinji Watanabe, Scott Wisdom, Zhuo Chen, Y. Isik
{"title":"Novel Deep Architectures in Speech Processing","authors":"J. Hershey, Jonathan Le Roux, Shinji Watanabe, Scott Wisdom, Zhuo Chen, Y. Isik","doi":"10.1007/978-3-319-64680-0_6","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_6","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"14 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"127121246","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Hakan Erdogan, J. Hershey, Shinji Watanabe, Jonathan Le Roux
{"title":"Deep Recurrent Networks for Separation and Recognition of Single-Channel Speech in Nonstationary Background Audio","authors":"Hakan Erdogan, J. Hershey, Shinji Watanabe, Jonathan Le Roux","doi":"10.1007/978-3-319-64680-0_7","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_7","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"56 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"132990455","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Shinji Watanabe, Takaaki Hori, Yajie Miao, Marc Delcroix, Florian Metze, J. Hershey
{"title":"Toolkits for Robust Speech Processing","authors":"Shinji Watanabe, Takaaki Hori, Yajie Miao, Marc Delcroix, Florian Metze, J. Hershey","doi":"10.1007/978-3-319-64680-0_17","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_17","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"26 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"116112717","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
M. Bacchiani, F. Beaufays, A. Gruenstein, P. Moreno, J. Schalkwyk, Trevor Strohman, H. Zen
{"title":"Speech Research at Google to Enable Universal Speech Interfaces","authors":"M. Bacchiani, F. Beaufays, A. Gruenstein, P. Moreno, J. Schalkwyk, Trevor Strohman, H. Zen","doi":"10.1007/978-3-319-64680-0_18","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_18","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"32 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"123934141","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Yuuki Tachioka, Toshiyuki Hanazawa, Tomohiro Narita, Jun Ishii
{"title":"Advanced ASR Technologies for Mitsubishi Electric Speech Applications","authors":"Yuuki Tachioka, Toshiyuki Hanazawa, Tomohiro Narita, Jun Ishii","doi":"10.1007/978-3-319-64680-0_20","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_20","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"23 5 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"126169983","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Xiong Xiao, Shinji Watanabe, Hakan Erdogan, Michael I. Mandel, Liang Lu, J. Hershey, M. Seltzer, Guoguo Chen, Yu Zhang, Dong Yu
{"title":"Discriminative Beamforming with Phase-Aware Neural Networks for Speech Enhancement and Recognition","authors":"Xiong Xiao, Shinji Watanabe, Hakan Erdogan, Michael I. Mandel, Liang Lu, J. Hershey, M. Seltzer, Guoguo Chen, Yu Zhang, Dong Yu","doi":"10.1007/978-3-319-64680-0_4","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_4","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"63 3 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"132019373","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
V. Mitra, H. Franco, R. Stern, Julien van Hout, L. Ferrer, M. Graciarena, Wen Wang, D. Vergyri, A. Alwan, J. Hansen
{"title":"Robust Features in Deep-Learning-Based Speech Recognition","authors":"V. Mitra, H. Franco, R. Stern, Julien van Hout, L. Ferrer, M. Graciarena, Wen Wang, D. Vergyri, A. Alwan, J. Hansen","doi":"10.1007/978-3-319-64680-0_8","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_8","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"9 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"131887537","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
M. Karafiát, Karel Veselý, Kateřina Žmolíková, Marc Delcroix, Shinji Watanabe, L. Burget, J. Černocký, Igor Szöke
{"title":"Training Data Augmentation and Data Selection","authors":"M. Karafiát, Karel Veselý, Kateřina Žmolíková, Marc Delcroix, Shinji Watanabe, L. Burget, J. Černocký, Igor Szöke","doi":"10.1007/978-3-319-64680-0_10","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_10","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"93 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"131668652","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Multichannel Spatial Clustering Using Model-Based Source Separation","authors":"Michael I. Mandel, J. Barker","doi":"10.1007/978-3-319-64680-0_3","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_3","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"98 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"116182329","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"End-to-End Architectures for Speech Recognition","authors":"Yajie Miao, Florian Metze","doi":"10.1007/978-3-319-64680-0_13","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_13","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"13 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"128590951","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}