Yun-Ning Hung, Chih-Wei Wu, Iroro Orife, A. Hipple, W. Wolcott, Alexander Lerch
{"title":"A large TV dataset for speech and music activity detection","authors":"Yun-Ning Hung, Chih-Wei Wu, Iroro Orife, A. Hipple, W. Wolcott, Alexander Lerch","doi":"10.1186/s13636-022-00253-8","DOIUrl":"https://doi.org/10.1186/s13636-022-00253-8","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":"2022 1","pages":""},"PeriodicalIF":2.4,"publicationDate":"2022-09-03","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"65687851","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Alexander Bohlender, Lucas Van Severen, Jonathan Sterckx, N. Madhu
{"title":"DOA-guided source separation with direction-based initialization and time annotations using complex angular central Gaussian mixture models","authors":"Alexander Bohlender, Lucas Van Severen, Jonathan Sterckx, N. Madhu","doi":"10.1186/s13636-022-00246-7","DOIUrl":"https://doi.org/10.1186/s13636-022-00246-7","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":" ","pages":""},"PeriodicalIF":2.4,"publicationDate":"2022-06-18","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"43510647","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Data-based spatial audio processing","authors":"M. Cobos, J. Ahrens, K. Kowalczyk, A. Politis","doi":"10.1186/s13636-022-00248-5","DOIUrl":"https://doi.org/10.1186/s13636-022-00248-5","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":" ","pages":""},"PeriodicalIF":2.4,"publicationDate":"2022-06-08","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"45627222","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Improving sign-algorithm convergence rate using natural gradient for lossless audio compression","authors":"Taiyo Mineo, Hayaru Shouno","doi":"10.1186/s13636-022-00243-w","DOIUrl":"https://doi.org/10.1186/s13636-022-00243-w","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":"2022 1","pages":""},"PeriodicalIF":2.4,"publicationDate":"2022-05-21","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"65687838","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"An overview of machine learning and other data-based methods for spatial audio capture, processing, and reproduction","authors":"M. Cobos, J. Ahrens, K. Kowalczyk, A. Politis","doi":"10.1186/s13636-022-00242-x","DOIUrl":"https://doi.org/10.1186/s13636-022-00242-x","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":" ","pages":""},"PeriodicalIF":2.4,"publicationDate":"2022-05-16","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"48642269","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Automated audio captioning: an overview of recent progress and new challenges","authors":"Xinhao Mei, Xubo Liu, M. Plumbley, Wenwu Wang","doi":"10.1186/s13636-022-00259-2","DOIUrl":"https://doi.org/10.1186/s13636-022-00259-2","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":"2022 1","pages":"1-18"},"PeriodicalIF":2.4,"publicationDate":"2022-05-12","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"49139079","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
P. Gutierrez-Parera, José J. López, J. M. Mora-Merchan, D. Larios
{"title":"Interaural time difference individualization in HRTF by scaling through anthropometric parameters","authors":"P. Gutierrez-Parera, José J. López, J. M. Mora-Merchan, D. Larios","doi":"10.1186/s13636-022-00241-y","DOIUrl":"https://doi.org/10.1186/s13636-022-00241-y","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":" ","pages":""},"PeriodicalIF":2.4,"publicationDate":"2022-05-12","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"48038096","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Heterogeneous separation consistency training for adaptation of unsupervised speech separation","authors":"Jiangyu Han, Yanhua Long","doi":"10.1186/s13636-023-00273-y","DOIUrl":"https://doi.org/10.1186/s13636-023-00273-y","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":" ","pages":""},"PeriodicalIF":2.4,"publicationDate":"2022-04-23","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"45769392","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Jean-Marie Lemercier, J. Thiemann, Raphael Koning, Timo Gerkmann
{"title":"A neural network-supported two-stage algorithm for lightweight dereverberation on hearing devices","authors":"Jean-Marie Lemercier, J. Thiemann, Raphael Koning, Timo Gerkmann","doi":"10.1186/s13636-023-00285-8","DOIUrl":"https://doi.org/10.1186/s13636-023-00285-8","url":null,"abstract":"","PeriodicalId":49309,"journal":{"name":"Journal on Audio Speech and Music Processing","volume":" ","pages":""},"PeriodicalIF":2.4,"publicationDate":"2022-04-06","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"49169410","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":3,"RegionCategory":"计算机科学","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}