@inproceedings{26ce1af6c9144feaa685da5d2000d024,
title = "A Deep Q-Learning Approach for GPU Task Scheduling",
abstract = "Efficient utilization of resources is critical to system performance and effectiveness for high performance computing systems. In a graphics processing unit (GPU)-based system, one method for enabling higher utilization is concurrent kernel execution-allowing multiple independent kernels to simultaneously execute on the GPU. However, resource contention due to the manner in which kernel tasks are scheduled may still lead to suboptimal task performance and utilization. In this work, we present a deep Q-learning approach to identify an ordering for a given set of tasks which achieves near-optimal average task performance and high resource utilization. Our solution outperforms other similar approaches and has additional benefit of being adaptable to dynamic task characteristics or GPU resource configurations.",
keywords = "GPU, concurrent kernel execution, deep Q-learning, kernel scheduling",
author = "Luley, {Ryan S.} and Qinru Qiu",
note = "Publisher Copyright: {\textcopyright} 2020 IEEE.; 2020 IEEE High Performance Extreme Computing Conference, HPEC 2020 ; Conference date: 21-09-2020 Through 25-09-2020",
year = "2020",
month = sep,
day = "22",
doi = "10.1109/HPEC43674.2020.9286238",
language = "English (US)",
series = "2020 IEEE High Performance Extreme Computing Conference, HPEC 2020",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
booktitle = "2020 IEEE High Performance Extreme Computing Conference, HPEC 2020",
}