Sh. Watanabe, Marc Delcroix, Florian Metze, J. Hershey
{"title":"Preliminaries","authors":"Sh. Watanabe, Marc Delcroix, Florian Metze, J. Hershey","doi":"10.1007/978-3-319-64680-0_1","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_1","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"1 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2021-11-09","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"128852880","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"The CHiME Challenges: Robust Speech Recognition in Everyday Environments","authors":"J. Barker, R. Marxer, E. Vincent, Shinji Watanabe","doi":"10.1007/978-3-319-64680-0_14","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_14","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"29 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2017-11-27","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"132587356","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Distant Speech Recognition Experiments Using the AMI Corpus","authors":"S. Renals, P. Swietojanski","doi":"10.1007/978-3-319-64680-0_16","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_16","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"315 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2017-10-30","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"120908569","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Y. Gong, Yan Huang, Kshitiz Kumar, Jinyu Li, Chaojun Liu, Guoli Ye, Shi-Xiong Zhang, Yong Zhao, Rui Zhao
{"title":"Challenges in and Solutions to Deep Learning Network Acoustic Modeling in Speech Recognition Products at Microsoft","authors":"Y. Gong, Yan Huang, Kshitiz Kumar, Jinyu Li, Chaojun Liu, Guoli Ye, Shi-Xiong Zhang, Yong Zhao, Rui Zhao","doi":"10.1007/978-3-319-64680-0_19","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_19","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"50 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2017-07-26","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"114764366","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Marc Delcroix, Takuya Yoshioka, N. Ito, A. Ogawa, K. Kinoshita, M. Fujimoto, T. Higuchi, S. Araki, T. Nakatani
{"title":"Multichannel Speech Enhancement Approaches to DNN-Based Far-Field Speech Recognition","authors":"Marc Delcroix, Takuya Yoshioka, N. Ito, A. Ogawa, K. Kinoshita, M. Fujimoto, T. Higuchi, S. Araki, T. Nakatani","doi":"10.1007/978-3-319-64680-0_2","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_2","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"10 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2017-07-26","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"133482093","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
K. Kinoshita, Marc Delcroix, S. Gannot, Emanuël Habets, Reinhold Häb-Umbach, Walter Kellermann, Volker Leutnant, R. Maas, T. Nakatani, B. Raj, A. Sehr, Takuya Yoshioka
{"title":"The REVERB Challenge: A Benchmark Task for Reverberation-Robust ASR Techniques","authors":"K. Kinoshita, Marc Delcroix, S. Gannot, Emanuël Habets, Reinhold Häb-Umbach, Walter Kellermann, Volker Leutnant, R. Maas, T. Nakatani, B. Raj, A. Sehr, Takuya Yoshioka","doi":"10.1007/978-3-319-64680-0_15","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_15","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"78 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2017-07-26","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"115816050","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Tara N. Sainath, Ron J. Weiss, K. Wilson, A. Narayanan, M. Bacchiani, Bo Li, Ehsan Variani, Izhak Shafran, A. Senior, K. K. Chin, Ananya Misra, Chanwoo Kim
{"title":"Raw Multichannel Processing Using Deep Neural Networks","authors":"Tara N. Sainath, Ron J. Weiss, K. Wilson, A. Narayanan, M. Bacchiani, Bo Li, Ehsan Variani, Izhak Shafran, A. Senior, K. K. Chin, Ananya Misra, Chanwoo Kim","doi":"10.1007/978-3-319-64680-0_5","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_5","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"48 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"127360846","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
K. Sim, Y. Qian, G. Mantena, Lahiru Samarakoon, Souvik Kundu, Tian Tan
{"title":"Adaptation of Deep Neural Network Acoustic Models for Robust Automatic Speech Recognition","authors":"K. Sim, Y. Qian, G. Mantena, Lahiru Samarakoon, Souvik Kundu, Tian Tan","doi":"10.1007/978-3-319-64680-0_9","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_9","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"36 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"125387672","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Sequence-Discriminative Training of Neural Networks","authors":"Guoguo Chen, Yu Zhang, Dong Yu","doi":"10.1007/978-3-319-64680-0_12","DOIUrl":"https://doi.org/10.1007/978-3-319-64680-0_12","url":null,"abstract":"","PeriodicalId":221985,"journal":{"name":"New Era for Robust Speech Recognition, Exploiting Deep Learning","volume":"604 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"116073681","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}