Made launch_kernel() return immediately, instead of generating CUDA errors, when asked to launch a kernel of size 0 (i.e. when m.num == 0).

909ca040 · Davis King · f5abfca1 · 909ca040
Commit 909ca040 authored Apr 30, 2016 by Davis King
Hide whitespace changes
Inline Side-by-side

Showing with 2 additions and 0 deletions

cuda_utils.h dlib/dnn/cuda_utils.h +2 -0

No files found.
--- a/dlib/dnn/cuda_utils.h
+++ b/dlib/dnn/cuda_utils.h
@@ -167,6 +167,8 @@ namespace dlib
                  launch_kernel().  
        !*/
        {
+            if (m.num == 0)
+                return;
            int num_blocks, num_threads;
            CHECK_CUDA(cudaOccupancyMaxPotentialBlockSize(&num_blocks,&num_threads,K));
            // Check if the job is really small and we don't really need to launch a kernel