Hongsheng Chen, Guoliang Chen, Kai-Jyun Chen, Jing Lu
{"title":"Nonlinear residual echo suppression based on dual-stream DPRNN","authors":"Hongsheng Chen, Guoliang Chen, Kai-Jyun Chen, Jing Lu","doi":"10.1186/s13636-021-00221-8","DOIUrl":"https://doi.org/10.1186/s13636-021-00221-8","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":" ","pages":""},"PeriodicalIF":2.4,"publicationDate":"2021-09-07","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"47420006","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Single-channel speech enhancement based on joint constrained dictionary learning","authors":"Linhui Sun, Yunyi Bu, Pingan Li, Zihao Wu","doi":"10.1186/s13636-021-00218-3","DOIUrl":"https://doi.org/10.1186/s13636-021-00218-3","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":" ","pages":""},"PeriodicalIF":2.4,"publicationDate":"2021-07-27","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-021-00218-3","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"43053647","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Alexandru-Lucian Georgescu, Alessandro Pappalardo, H. Cucu, Michaela Blott
{"title":"Performance vs. hardware requirements in state-of-the-art automatic speech recognition","authors":"Alexandru-Lucian Georgescu, Alessandro Pappalardo, H. Cucu, Michaela Blott","doi":"10.1186/s13636-021-00217-4","DOIUrl":"https://doi.org/10.1186/s13636-021-00217-4","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":"2021 1","pages":""},"PeriodicalIF":2.4,"publicationDate":"2021-07-21","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-021-00217-4","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"65687725","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Timestamp-aligning and keyword-biasing end-to-end ASR front-end for a KWS system","authors":"Gui-Xin Shi, Weiqiang Zhang, Guan-Bo Wang, Jing Zhao, Shuzhou Chai, Ze-Yu Zhao","doi":"10.1186/s13636-021-00212-9","DOIUrl":"https://doi.org/10.1186/s13636-021-00212-9","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":" ","pages":""},"PeriodicalIF":2.4,"publicationDate":"2021-07-08","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-021-00212-9","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"45266436","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Tobias Gburrek, Joerg Schmalenstroeer, Reinhold Haeb-Umbach
{"title":"Geometry calibration in wireless acoustic sensor networks utilizing DoA and distance information","authors":"Tobias Gburrek, Joerg Schmalenstroeer, Reinhold Haeb-Umbach","doi":"10.1186/s13636-021-00210-x","DOIUrl":"https://doi.org/10.1186/s13636-021-00210-x","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":" ","pages":""},"PeriodicalIF":2.4,"publicationDate":"2021-07-02","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-021-00210-x","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"48425308","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Residual feedback suppression with extended model-based postfilters","authors":"Marco Gimm, Philipp Bulling, G. Schmidt","doi":"10.1186/s13636-021-00205-8","DOIUrl":"https://doi.org/10.1186/s13636-021-00205-8","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":"2021 1","pages":""},"PeriodicalIF":2.4,"publicationDate":"2021-05-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-021-00205-8","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"65687591","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Neural network-based non-intrusive speech quality assessment using attention pooling function","authors":"Miao Liu, Jing Wang, Weiming Yi, F. Liu","doi":"10.1186/s13636-021-00209-4","DOIUrl":"https://doi.org/10.1186/s13636-021-00209-4","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":"2021 1","pages":""},"PeriodicalIF":2.4,"publicationDate":"2021-05-17","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-021-00209-4","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"65687671","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Frequency-dependent auto-pooling function for weakly supervised sound event detection","authors":"Sichen Liu, Feiran Yang, Yin Cao, Jun Yang","doi":"10.1186/s13636-021-00206-7","DOIUrl":"https://doi.org/10.1186/s13636-021-00206-7","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":"2021 1","pages":""},"PeriodicalIF":2.4,"publicationDate":"2021-05-17","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-021-00206-7","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"65687645","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Points2Sound: from mono to binaural audio using 3D point cloud scenes","authors":"Francesc Llu'is, V. Chatziioannou, A. Hofmann","doi":"10.1186/s13636-022-00265-4","DOIUrl":"https://doi.org/10.1186/s13636-022-00265-4","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":"2022 1","pages":"1-15"},"PeriodicalIF":2.4,"publicationDate":"2021-04-26","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"44744810","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Yuxuan Ke, Andong Li, C. Zheng, Renhua Peng, Xiaodong Li
{"title":"Low-complexity artificial noise suppression methods for deep learning-based speech enhancement algorithms","authors":"Yuxuan Ke, Andong Li, C. Zheng, Renhua Peng, Xiaodong Li","doi":"10.1186/s13636-021-00204-9","DOIUrl":"https://doi.org/10.1186/s13636-021-00204-9","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":"2021 1","pages":"1-15"},"PeriodicalIF":2.4,"publicationDate":"2021-04-12","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-021-00204-9","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"42924847","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}