Added tensor spec.

99e948db · Davis King · 37d493e2 · 99e948db · 99e948db · 99e948db
Commit 99e948db authored Oct 21, 2015 by Davis King
Expand all Hide whitespace changes
Inline Side-by-side

Showing 3 changed files with 10 additions and 9 deletions

gpu_data_abstract.h dlib/dnn/gpu_data_abstract.h +9 -9

tensor.h dlib/dnn/tensor.h +1 -0

tensor_abstract.h dlib/dnn/tensor_abstract.h +0 -0

No files found.
--- a/dlib/dnn/gpu_data_abstract.h
+++ b/dlib/dnn/gpu_data_abstract.h
@@ -16,23 +16,23 @@ namespace dlib
        /*!
            WHAT THIS OBJECT REPRESENTS
                This object is a block of size() floats, all stored contiguously in memory.
-                In particular, it keeps two copies of the floats, one on the host CPU side
+                Importantly, it keeps two copies of the floats, one on the host CPU side
                and another on the GPU device side. It automatically performs the necessary
                host/device transfers to keep these two copies of the data in sync.
-                All transfers to the device happen asynchronously so that CUDA kernel
+                All transfers to the device happen asynchronously with respect to the
-                computations can overlap with data transfers.  However, any transfers from
+                default CUDA stream so that CUDA kernel computations can overlap with data
-                the device to the host happen synchronously in the default CUDA stream.
+                transfers.  However, any transfers from the device to the host happen
-                Therefore, you should perform all your CUDA kernel launches on the default
+                synchronously in the default CUDA stream.  Therefore, you should perform
-                stream so that transfers back to the host do not happen before the
+                all your CUDA kernel launches on the default stream so that transfers back
-                computations have completed.
+                to the host do not happen before the relevant computations have completed.
                If DLIB_USE_CUDA is not #defined then this object will not use CUDA at all.
                Instead, it will simply store one host side memory block of floats.  
            THREAD SAFETY
-                This object is not thread-safe.  Don't touch it from multiple threads at
+                Instances of this object are not thread-safe.  So don't touch one from
-                the same time.
+                multiple threads at the same time.
        !*/
    public:

--- a/dlib/dnn/tensor.h
+++ b/dlib/dnn/tensor.h
@@ -367,6 +367,7 @@ namespace dlib
        const tensor& b
    )
    {
+        // TODO, do on GPU?
        DLIB_CASSERT(a.size() == b.size(), "");
        const float* da = a.host();
        const float* db = b.host();

--- a/dlib/dnn/tensor_abstract.h
+++ b/dlib/dnn/tensor_abstract.h