% Conference paper in the ICASI 2015 proceedings (CRC Press/Balkema, 2016), pp. 243--247.
% LaTeX specials in free-text fields are escaped and title acronyms are brace-protected.
@inproceedings{b20e2d2bd99f49af841e8b5e0aece20c,
title = "An {HSAIL} {ISA} conformed {GPU} platform",
abstract = "This paper presents a GPU platform based on the HSA (Heterogeneous System Architecture). The platform contains the OpenCL programming interface, a cycle-level HSAIL GPU simulator, and a finalizer that is able to translate the HSAIL code to our custom binary ISA. The system platform is able to run OpenCL applications, and the results are verified with the real GPU hardware. To improve the scheduling efficiency, we explore warp scheduling policies on our platform including Fair Round-Robin, Loose Round-Robin, Two-Level, and Greedy-Then-Oldest. We found that these algorithms are not optimal in using the load/store units. We propose a Memory Access First (MAF) mechanism which can be adopted to the Two-Level and Greedy-Then-Oldest scheduling policies to reduce the idle time of the load/store units. With the proposed mechanism, the warp scheduler can remove 23 to 34 percent of load/store unit idle time and improve the GPU performance by about 16\%.",
author = "Chen, {Heng Yi} and Chen, {Chung Ho} and Huang, {Yun Chi} and Hsu, {Kuan Chieh} and Wang, {Chen Chieh}",
note = "Funding Information: This work was in part supported by the Ministry of Science and Technology, Taiwan, MOST 104-2220-E-006-013. Publisher Copyright: {\textcopyright} 2016 Taylor \& Francis Group.; International Conference on Applied System Innovation, ICASI 2015 ; Conference date: 22-05-2015 Through 27-05-2015",
year = "2016",
doi = "10.1201/b21811-52",
language = "English",
isbn = "9781138028937",
publisher = "CRC Press/Balkema",
pages = "243--247",
editor = "Meen, Teen-Hang and Prior, {Stephen D.} and Lam, {Artde Donald Kin-Tak}",
booktitle = "Applied System Innovation - Proceedings of the International Conference on Applied System Innovation, {ICASI} 2015",
}