Integrated CPU-GPU architectures provide excellent acceleration capabilities for data-parallel applications on embedded platforms while meeting size, weight and power (SWaP) requirements. However, sharing of main memory between CPU applications and GPU kernels can severely affect the execution of GPU kernels and diminish the performance gain provided by the GPU. For example, on the NVIDIA Jetson TX2 platform, an integrated CPU-GPU architecture, we observed that, in the worst case, the GPU kernels can suffer as much as a 3X slowdown in the presence of co-running memory-intensive CPU applications. In this paper, we propose a software mechanism, which we call BWLOCK++, to protect the performance of GPU kernels from co-scheduled memory-intensive CPU applications.
% Conference paper in the ECRTS 2018 proceedings (LIPIcs series, volume 106).
% Only the acronyms in the title are brace-protected, so bibliography styles
% remain free to apply their own casing to the rest of the title.
% The pages field uses the article-number form "19:1--19:22" given by the source.
@inproceedings{ali_et_al:LIPIcs.ECRTS.2018.19,
  author    = {Ali, Waqar and Yun, Heechul},
  title     = {Protecting Real-Time {GPU} Kernels on Integrated {CPU-GPU} {SoC} Platforms},
  booktitle = {30th Euromicro Conference on Real-Time Systems (ECRTS 2018)},
  editor    = {Altmeyer, Sebastian},
  series    = {Leibniz International Proceedings in Informatics (LIPIcs)},
  volume    = {106},
  pages     = {19:1--19:22},
  publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik},
  address   = {Dagstuhl, Germany},
  year      = {2018},
  isbn      = {978-3-95977-075-0},
  issn      = {1868-8969},
  doi       = {10.4230/LIPIcs.ECRTS.2018.19},
  url       = {https://drops.dagstuhl.de/entities/document/10.4230/LIPIcs.ECRTS.2018.19},
  urn       = {urn:nbn:de:0030-drops-89833},
  annote    = {Keywords: GPU, memory bandwidth, resource contention, CPU throttling, fair scheduler},
}
Feedback for Dagstuhl Publishing