H. Subramoni, F. Petrini, Virat Agarwal, D. Pasetto
{"title":"High Performance Topology-Aware Communication in Multicore Processors","authors":"H. Subramoni, F. Petrini, Virat Agarwal, D. Pasetto","doi":"10.1201/b10376-30","DOIUrl":"https://doi.org/10.1201/b10376-30","url":null,"abstract":"","PeriodicalId":411793,"journal":{"name":"Scientific Computing with Multicore and Accelerators","volume":"14 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"132627603","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Dense Linear Algebra for Hybrid GPU-Based Systems","authors":"S. Tomov, J. Dongarra","doi":"10.1201/b10376-5","DOIUrl":"https://doi.org/10.1201/b10376-5","url":null,"abstract":"3.","PeriodicalId":411793,"journal":{"name":"Scientific Computing with Multicore and Accelerators","volume":"24 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"121975674","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Implementing Matrix Multiplication on the Cell B. E","authors":"W. Alvaro, J. Kurzak, J. Dongarra","doi":"10.1201/b10376-3","DOIUrl":"https://doi.org/10.1201/b10376-3","url":null,"abstract":"Dense matrix multiplication is one of the most common numerical operations, especially in the area of dense linear algebra, where it forms the core of many important algorithms, including solvers of linear systems of equations, least square problems, and singular and eigenvalue problems. The Cell B. E. excels in its capabilities to process compute-intensive workloads, like matrix multiplication, in single precision, through its powerful SIMD capabilities. This chapter dissects implementations of two single precision matrix 3","PeriodicalId":411793,"journal":{"name":"Scientific Computing with Multicore and Accelerators","volume":"6 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"114985453","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Implementing Matrix Factorizations on the Cell B. E","authors":"J. Kurzak, J. Dongarra","doi":"10.1201/b10376-4","DOIUrl":"https://doi.org/10.1201/b10376-4","url":null,"abstract":"2.","PeriodicalId":411793,"journal":{"name":"Scientific Computing with Multicore and Accelerators","volume":"53 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"114813149","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
M. Christen, O. Schenk, E. Neufeld, M. Paulides, H. Burkhart
{"title":"Manycore Stencil Computations in Hyperthermia Applications","authors":"M. Christen, O. Schenk, E. Neufeld, M. Paulides, H. Burkhart","doi":"10.1201/b10376-19","DOIUrl":"https://doi.org/10.1201/b10376-19","url":null,"abstract":"","PeriodicalId":411793,"journal":{"name":"Scientific Computing with Multicore and Accelerators","volume":"1 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"128813899","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"BLAS for GPUs","authors":"Rajib Nath, S. Tomov, J. Dongarra","doi":"10.1201/b10376-6","DOIUrl":"https://doi.org/10.1201/b10376-6","url":null,"abstract":"","PeriodicalId":411793,"journal":{"name":"Scientific Computing with Multicore and Accelerators","volume":"64 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"1900-01-01","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"131641028","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}