[SYCL][CUDA] Bounds check on kernel launch

Steffen Larsen · Steffen Larsen · commit 7764648dca64 · 2020-02-25T14:50:44.000Z
Signed-off-by: Steffen Larsen &lt;steffen.larsen@codeplay.com&gt;
diff --git a/sycl/plugins/cuda/pi_cuda.cpp b/sycl/plugins/cuda/pi_cuda.cpp
@@ -1788,6 +1788,19 @@ pi_result cuda_piEnqueueKernelLaunch(
       }
     }
 
+    size_t maxThreadsPerBlock[3] = {};
+    retError = cuda_piDeviceGetInfo(command_queue->device_,
+                                    PI_DEVICE_INFO_MAX_WORK_ITEM_SIZES,
+                                    sizeof(maxThreadsPerBlock),
+                                    maxThreadsPerBlock, nullptr);
+    assert(retError == PI_SUCCESS);
+
+    for (size_t i = 0; i < work_dim; i++) {
+      if(size_t(threadsPerBlock[i]) > maxThreadsPerBlock[i]) {
+        return PI_INVALID_WORK_GROUP_SIZE;
+      }
+    }
+
     int blocksPerGrid[3] = { 1, 1, 1 };
 
     for (size_t i = 0; i < work_dim; i++) {