This paper presents a real-time locking protocol whose design was motivated by the goal of enabling safe GPU sharing in time-sliced component-based systems. This locking protocol enables a GPU to be shared concurrently across, and utilized within, isolated components with predictable execution times. It relies on a novel resizing technique where GPU work is dimensioned on-the-fly to run on partitions of an NVIDIA GPU. This technique can be applied to any component that internally utilizes global CPU scheduling. The proposed locking protocol enables increased GPU parallelism and reduces GPU capacity loss with analytically provable benefits.
@Article{ali_et_al:DARTS.10.1.1, author = {Ali, Syed W. and Tong, Zelin and Goh, Joseph and Anderson, James H.}, title = {{Predictable GPU Sharing in Component-Based Real-Time Systems (Artifact)}}, pages = {1:1--1:5}, journal = {Dagstuhl Artifacts Series}, ISBN = {978-3-95977-327-0}, ISSN = {2509-8195}, year = {2024}, volume = {10}, number = {1}, editor = {Ali, Syed W. and Tong, Zelin and Goh, Joseph and Anderson, James H.}, publisher = {Schloss Dagstuhl -- Leibniz-Zentrum f{\"u}r Informatik}, address = {Dagstuhl, Germany}, URL = {https://drops.dagstuhl.de/entities/document/10.4230/DARTS.10.1.1}, URN = {urn:nbn:de:0030-drops-203236}, doi = {10.4230/DARTS.10.1.1}, annote = {Keywords: GPU locking protocols, real-time locking protocols, priority-inversion blocking, component-based systems} }
59602553fb34de203b253b31a96c9cf4
(Get MD5 Sum)
Feedback for Dagstuhl Publishing