Zongjing Chen, Kangjin Huang, Yonggang Che, Chuanfu Xu, Jian Zhang, Z. Dai, Ming Li
{"title":"Extending OP2 framework to support portable parallel programming of complex applications","authors":"Zongjing Chen, Kangjin Huang, Yonggang Che, Chuanfu Xu, Jian Zhang, Z. Dai, Ming Li","doi":"10.1007/s42514-023-00174-8","DOIUrl":"https://doi.org/10.1007/s42514-023-00174-8","url":null,"abstract":"","PeriodicalId":29895,"journal":{"name":"CCF Transactions on High Performance Computing","volume":"2 2","pages":""},"PeriodicalIF":0.9,"publicationDate":"2023-12-07","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"138591803","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Leveraging simulation of high performance computing systems with node simulation using architecture simulator","authors":"Fang Lin, Yi Liu, Xin Wang, Xueyan Gai","doi":"10.1007/s42514-023-00173-9","DOIUrl":"https://doi.org/10.1007/s42514-023-00173-9","url":null,"abstract":"","PeriodicalId":29895,"journal":{"name":"CCF Transactions on High Performance Computing","volume":"23 11","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2023-11-13","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"136281968","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Shiyang Li, Jingyu Zhu, Jiaxun Han, Yuting Peng, Zhuoran Wang, Xiaoli Gong, Gang Wang, Jin Zhang, Xuqiang Wang
{"title":"OneGraph: a cross-architecture framework for large-scale graph computing on GPUs based on oneAPI","authors":"Shiyang Li, Jingyu Zhu, Jiaxun Han, Yuting Peng, Zhuoran Wang, Xiaoli Gong, Gang Wang, Jin Zhang, Xuqiang Wang","doi":"10.1007/s42514-023-00172-w","DOIUrl":"https://doi.org/10.1007/s42514-023-00172-w","url":null,"abstract":"","PeriodicalId":29895,"journal":{"name":"CCF Transactions on High Performance Computing","volume":" 10","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2023-11-09","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"135241910","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Conflict-aware workload co-execution on SX-aurora TSUBASA","authors":"Riku Nunokawa, Yoichi Shimomura, Mulya Agung, Ryusuke Egawa, Hiroyuki Takizawa","doi":"10.1007/s42514-023-00171-x","DOIUrl":"https://doi.org/10.1007/s42514-023-00171-x","url":null,"abstract":"Abstract NEC SX-Aurora TSUBASA (SX-AT) is the latest vector supercomputer, consisting of host processors called Vector Hosts (VHs) and vector processors called Vector Engines (VEs). The goal of this work is to simultaneously use both VHs and VEs to increase the resource utilization and improve the system throughput by co-executing more workloads. One difficulty is that performance interferences among VH and VE workloads could occur because they share some computing resources and potentially compete to use the same resource at the same time, so-called resource conflicts. To achieve efficient workload co-execution, first, this paper experimentally investigates the performance interference between a VH and a VE, when each of the two processors executes a different workload. It is empirically shown that the frequency of system calls from the VE workload could be a good indicator to predict if the co-execution could cause severe performance interference, even though monitoring system calls requires a huge runtime overhead and it is impractical to simply use it for decision making of co-execution. Then, this paper proposes a workload co-execution strategy based on a practical approach to identifying a pair of VE and VH workloads that could cause severe performance interferences. Our evaluation results clearly demonstrate that the system call frequency can be used to predict if the workload can affect the performance of another co-executing workload, and VH’s CPU load can be a good approximation of the system call frequency. The proposed approach based on the CPU loads could accurately identify a pair of workloads causing frequent resource conflicts, and thus reduce the risk of severe performance interferences between co-executing workloads on an SX-AT system, resulting in shorter makespan without significantly increasing the turn-around time.","PeriodicalId":29895,"journal":{"name":"CCF Transactions on High Performance Computing","volume":"440 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2023-10-05","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"135480691","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Yueyuan Zhou, ZiYi Ren, En Shao, Lixian Ma, Qiang Hu, Leping Wang, Guangming Tan
{"title":"FILL: a heterogeneous resource scheduling system addressing the low throughput problem in GROMACS","authors":"Yueyuan Zhou, ZiYi Ren, En Shao, Lixian Ma, Qiang Hu, Leping Wang, Guangming Tan","doi":"10.1007/s42514-023-00169-5","DOIUrl":"https://doi.org/10.1007/s42514-023-00169-5","url":null,"abstract":"","PeriodicalId":29895,"journal":{"name":"CCF Transactions on High Performance Computing","volume":"316 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2023-09-23","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"135959455","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Lu Bai, Weixing Ji, Qinyuan Li, Xilai Yao, Wei Xin, Wanyi Zhu
{"title":"ConvDarts: a fast and exact convolutional algorithm selector for deep learning frameworks","authors":"Lu Bai, Weixing Ji, Qinyuan Li, Xilai Yao, Wei Xin, Wanyi Zhu","doi":"10.1007/s42514-023-00167-7","DOIUrl":"https://doi.org/10.1007/s42514-023-00167-7","url":null,"abstract":"","PeriodicalId":29895,"journal":{"name":"CCF Transactions on High Performance Computing","volume":"22 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2023-09-20","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"136308147","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Shaojie Tan, Qingcai Jiang, Zhenwei Cao, Xiaoyu Hao, Junshi Chen, Hong An
{"title":"Uncovering the performance bottleneck of modern HPC processor with static code analyzer: a case study on Kunpeng 920","authors":"Shaojie Tan, Qingcai Jiang, Zhenwei Cao, Xiaoyu Hao, Junshi Chen, Hong An","doi":"10.1007/s42514-023-00160-0","DOIUrl":"https://doi.org/10.1007/s42514-023-00160-0","url":null,"abstract":"","PeriodicalId":29895,"journal":{"name":"CCF Transactions on High Performance Computing","volume":"15 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2023-09-15","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"135395212","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}