Commit 8062663c authored by Davis King

Added cpu version of add() and also added new add_bias_gradient() function.

parent 20d46fc5
@@ -68,6 +68,77 @@ namespace dlib
    }
}
void add(
    float beta,
    tensor& dest,
    float alpha,
    const tensor& src
)
{
    DLIB_CASSERT(
        (dest.num_samples()==src.num_samples() || src.num_samples()==1) &&
        (dest.nr()==src.nr() || src.nr()==1) &&
        (dest.nc()==src.nc() || src.nc()==1) &&
        (dest.k()==src.k() || src.k()==1) &&
        is_same_object(src,dest) == false , "");

    if (beta == 0 && alpha == 0)
    {
        dest = 0;
        return;
    }

    auto d = dest.host();
    auto s = src.host();

    // Compute dest = beta*dest + alpha*src, broadcasting src along any
    // dimension where it has size 1.
    for (long n = 0; n < dest.num_samples(); ++n)
    {
        const auto sn = src.num_samples()==1 ? 0:n;
        for (long k = 0; k < dest.k(); ++k)
        {
            const auto sk = src.k()==1 ? 0:k;
            for (long r = 0; r < dest.nr(); ++r)
            {
                const auto sr = src.nr()==1 ? 0:r;
                for (long c = 0; c < dest.nc(); ++c)
                {
                    const auto sc = src.nc()==1 ? 0:c;
                    const auto s_idx = ((sn*src.k() + sk)*src.nr() + sr)*src.nc() + sc;
                    *d = beta*(*d) + alpha*s[s_idx];
                    ++d;
                }
            }
        }
    }
}
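For illustration only, here is a minimal usage sketch of the broadcasting behavior. It assumes dlib's resizable_tensor and that cpu::add is reachable through the usual dlib headers; the include path and function name add_broadcast_example are assumptions for this sketch, not part of the commit. A src with num_samples()==1 acts as a per-sample bias added to every sample of dest:

#include <dlib/dnn.h>   // assumed header pulling in tensor and the cpu:: routines

void add_broadcast_example()
{
    using namespace dlib;

    // dest: 2 samples of shape k=3, nr=1, nc=1.  src: one sample with k=3,
    // so it is broadcast across the sample dimension of dest.
    resizable_tensor dest(2,3,1,1), src(1,3,1,1);
    dest = 1;
    src.host()[0] = 10; src.host()[1] = 20; src.host()[2] = 30;

    cpu::add(1, dest, 1, src);   // dest = 1*dest + 1*src for every sample

    // dest.host() now holds 11,21,31, 11,21,31.
}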
// ----------------------------------------------------------------------------------------
void add_bias_gradient (
    tensor& grad,
    const tensor& gradient_input
)
{
    DLIB_CASSERT(
        grad.num_samples() == 1 &&
        gradient_input.k() == grad.k() &&
        gradient_input.nr() == grad.nr() &&
        gradient_input.nc() == grad.nc() &&
        gradient_input.size() > 0,"");

    auto out = grad.host();
    auto in = gradient_input.host();

    // Copy the first sample of gradient_input into grad, then accumulate
    // the remaining samples on top of it.
    for (size_t i = 0; i < grad.size(); ++i)
        out[i] = *in++;
    for (long n = 1; n < gradient_input.num_samples(); ++n)
    {
        for (size_t i = 0; i < grad.size(); ++i)
            out[i] += *in++;
    }
}
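And a corresponding sanity check, under the same assumptions as the sketch above (the function name is again hypothetical): grad ends up holding the element-wise sum of gradient_input over its sample dimension, which is the gradient of a broadcast bias add:

void add_bias_gradient_example()
{
    using namespace dlib;

    // 4 samples, each of shape k=2, nr=1, nc=1, every element equal to 1.
    resizable_tensor gradient_input(4,2,1,1), grad(1,2,1,1);
    gradient_input = 1;

    cpu::add_bias_gradient(grad, gradient_input);

    // Each element of grad sums over the 4 samples, so
    // grad.host()[0] == 4 and grad.host()[1] == 4.
}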
// -----------------------------------------------------------------------------------

void affine_transform(
...
@@ -26,6 +26,18 @@ namespace dlib
    const tensor& src2
);
void add(
    float beta,
    tensor& dest,
    float alpha,
    const tensor& src
);

void add_bias_gradient (
    tensor& grad,
    const tensor& gradient_input
);
// -----------------------------------------------------------------------------------

void affine_transform(
...
@@ -259,8 +259,7 @@ namespace dlib { namespace tt
#ifdef DLIB_USE_CUDA
    cuda::add(beta,dest,alpha,src);
#else
    cpu::add(beta,dest,alpha,src);
#endif
}
@@ -279,6 +278,22 @@ namespace dlib { namespace tt
#endif
}
// ----------------------------------------------------------------------------------------
void add_bias_gradient (
    tensor& grad,
    const tensor& gradient_input
)
{
#ifdef DLIB_USE_CUDA
    // TODO
    DLIB_CASSERT(false,"");
    //cuda::add_bias_gradient(grad,gradient_input);
#else
    cpu::add_bias_gradient(grad,gradient_input);
#endif
}
// ----------------------------------------------------------------------------------------
// ----------------------------------------------------------------------------------------

...
@@ -406,7 +406,29 @@ namespace dlib { namespace tt
        - gradient_input.size() > 0
        - is_same_object(grad,gradient_input) == false
    ensures
        - let BIAS be a tensor with the same dimensions as grad.
        - let OUT be the output of add(1,OUT,1,BIAS)
        - let f(gradient_input,BIAS) == dot(gradient_input,OUT)
        - Then this function computes the gradient of f() with respect to BIAS and
          assigns it to grad.
!*/
// ----------------------------------------------------------------------------------------
void add_bias_gradient (
    tensor& grad,
    const tensor& gradient_input
);
/*!
    requires
        - grad.num_samples() == 1
        - gradient_input.k() == grad.k()
        - gradient_input.nr() == grad.nr()
        - gradient_input.nc() == grad.nc()
        - gradient_input.size() > 0
        - is_same_object(grad,gradient_input) == false
    ensures
        - let BIAS be a tensor with the same dimensions as grad.
        - let OUT be the output of add(1,OUT,1,BIAS)
        - let f(gradient_input,BIAS) == dot(gradient_input,OUT)
        - Then this function computes the gradient of f() with respect to BIAS and
          assigns it to grad.
...
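As a side note on the ensures clause: since f(gradient_input,BIAS) == dot(gradient_input,OUT) is linear in BIAS, and BIAS is broadcast across the sample dimension, the gradient reduces to a per-element sum over samples,

\[
\frac{\partial f}{\partial \mathrm{BIAS}[k,r,c]} \;=\; \sum_{n=0}^{N-1} \mathrm{gradient\_input}[n,k,r,c],
\qquad N = \texttt{gradient\_input.num\_samples()},
\]

which is exactly what the CPU implementation above computes by copying the first sample into grad and accumulating the rest.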