Gongping Huang, Jingdong Chen, J. Benesty, I. Cohen, Xudong Zhao
{"title":"Steerable differential beamformers with planar microphone arrays","authors":"Gongping Huang, Jingdong Chen, J. Benesty, I. Cohen, Xudong Zhao","doi":"10.1186/s13636-020-00185-1","DOIUrl":"https://doi.org/10.1186/s13636-020-00185-1","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":" ","pages":""},"PeriodicalIF":2.4,"publicationDate":"2020-11-04","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-020-00185-1","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"44203883","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Multichannel speaker interference reduction using frequency domain adaptive filtering","authors":"Patrick Meyer, Samy Elshamy, T. Fingscheidt","doi":"10.1186/s13636-020-00180-6","DOIUrl":"https://doi.org/10.1186/s13636-020-00180-6","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":" ","pages":""},"PeriodicalIF":2.4,"publicationDate":"2020-11-04","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-020-00180-6","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"49656082","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Estimation of acoustic echoes using expectation-maximization methods","authors":"U. Saqib, S. Gannot, J. Jensen","doi":"10.1186/s13636-020-00179-z","DOIUrl":"https://doi.org/10.1186/s13636-020-00179-z","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":"2020 1","pages":""},"PeriodicalIF":2.4,"publicationDate":"2020-08-08","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-020-00179-z","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"65687697","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Joint speaker localization and array calibration using expectation-maximization","authors":"Yuval Dorfan, Ofer Schwartz, S. Gannot","doi":"10.1186/s13636-020-00177-1","DOIUrl":"https://doi.org/10.1186/s13636-020-00177-1","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":"2020 1","pages":""},"PeriodicalIF":2.4,"publicationDate":"2020-06-09","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-020-00177-1","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"65687610","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
L. Nanni, Yandre M. G. Costa, R. L. Aguiar, R. Mangolin, S. Brahnam, C. Silla
{"title":"Ensemble of convolutional neural networks to improve animal audio classification","authors":"L. Nanni, Yandre M. G. Costa, R. L. Aguiar, R. Mangolin, S. Brahnam, C. Silla","doi":"10.1186/s13636-020-00175-3","DOIUrl":"https://doi.org/10.1186/s13636-020-00175-3","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":" ","pages":""},"PeriodicalIF":2.4,"publicationDate":"2020-05-26","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-020-00175-3","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"45629994","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Deep neural networks for automatic speech processing: a survey from large corpora to limited data","authors":"Vincent Roger, Jérôme Farinas, J. Pinquier","doi":"10.1186/s13636-022-00251-w","DOIUrl":"https://doi.org/10.1186/s13636-022-00251-w","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":"2022 1","pages":""},"PeriodicalIF":2.4,"publicationDate":"2020-03-09","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"42908797","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Jing Wang, Jin Wang, Kai Qian, Xiang Xie, Jin-jue Kuang
{"title":"Binaural sound localization based on deep neural network and affinity propagation clustering in mismatched HRTF condition","authors":"Jing Wang, Jin Wang, Kai Qian, Xiang Xie, Jin-jue Kuang","doi":"10.1186/s13636-020-0171-y","DOIUrl":"https://doi.org/10.1186/s13636-020-0171-y","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":"2020 1","pages":""},"PeriodicalIF":2.4,"publicationDate":"2020-02-10","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-020-0171-y","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"65687405","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Segment boundary detection directed attention for online end-to-end speech recognition","authors":"Junfeng Hou, Wu Guo, Yan Song, Lirong Dai","doi":"10.1186/s13636-020-0170-z","DOIUrl":"https://doi.org/10.1186/s13636-020-0170-z","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":"32 1","pages":""},"PeriodicalIF":2.4,"publicationDate":"2020-01-30","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-020-0170-z","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"65687367","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"The aerodynamics of voiced stop closures","authors":"Luis M. T. Jesus, Maria Conceição Costa","doi":"10.1186/s13636-019-0162-z","DOIUrl":"https://doi.org/10.1186/s13636-019-0162-z","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":"12 1","pages":""},"PeriodicalIF":2.4,"publicationDate":"2020-01-28","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-019-0162-z","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"65687470","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Introducing phonetic information to speaker embedding for speaker verification","authors":"Yi Liu, Liang He, Jia Liu, Michael T. Johnson","doi":"10.1186/s13636-019-0166-8","DOIUrl":"https://doi.org/10.1186/s13636-019-0166-8","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":"2019 1","pages":""},"PeriodicalIF":2.4,"publicationDate":"2019-12-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"https://sci-hub-pdf.com/10.1186/s13636-019-0166-8","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"65687558","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}