% Conference paper (ISCAS 2016): dynamic stack-based SIMD re-convergence for GPGPUs.
% Acronyms in title/booktitle/series are brace-protected so that styles which
% apply sentence casing keep their capitalisation. The percent sign in the
% abstract is escaped so the field is safe if a style writes it into the .bbl.
% month/day record the date given by the exporting database; the conference
% dates themselves are stated in the note field.
@inproceedings{f967a1c9981148289d88530c85ed8cf9,
  author    = {Huang, {Yun Chi} and Hsu, {Kuan Chieh} and Hsieh, {Wan Shan} and Wang, {Chen Chieh} and Lu, {Chia Han} and Chen, {Chung Ho}},
  title     = {Dynamic {SIMD} re-convergence with paired-path comparison},
  booktitle = {{ISCAS} 2016 - {IEEE} International Symposium on Circuits and Systems},
  series    = {Proceedings - {IEEE} International Symposium on Circuits and Systems},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  pages     = {233--236},
  year      = {2016},
  month     = jul,
  day       = {29},
  doi       = {10.1109/ISCAS.2016.7527213},
  language  = {English},
  note      = {Publisher Copyright: {\textcopyright} 2016 IEEE.; 2016 IEEE International Symposium on Circuits and Systems, ISCAS 2016 ; Conference date: 22-05-2016 Through 25-05-2016},
  abstract  = {SIMD divergence is one of the critical factors that decrease the hardware utilization in contemporary GPGPUs (General Purpose Graphic Processor Unit). Both the reconvergence scheme and control flow detection have to be well considered. In the emerging HSA (Heterogeneous System Architecture) platform, we develop an effective dynamic stack-based re-convergence scheme that can be implemented without the insertion of re-convergence instructions generated by the finalizer. The stack keeps track of the minimal necessary information of the taken and non-taken paths; the additional end-of-branch instruction insertion is no longer required under our design. Using the scheme we propose, the divergent warp dynamically re-converges at opportunistic re-convergence points. The activity factor improves for 13.36\% on average from opportunistic early re-convergence in the unstructured control flow. Our design has eased the development of a finalizer that no longer needs to reason about the reconvergence point after a branch divergence, especially for unstructured control flow.},
}