Commit cb2f9de6 authored by Davis King

Added part of the tensor_tools implementations

parent 76433858
dlib/CMakeLists.txt
@@ -138,6 +138,7 @@ if (NOT TARGET dlib)
if (COMPILER_CAN_DO_CPP_11)
set(source_files ${source_files}
dnn/cpu_dlib.cpp
dnn/tensor_tools.cpp
)
endif()

dlib/all/source.cpp
@@ -21,6 +21,7 @@
// Stuff that requires C++11
#if __cplusplus >= 201103
#include "../dnn/cpu_dlib.cpp"
#include "../dnn/tensor_tools.cpp"
#endif
#ifndef DLIB_ISO_CPP_ONLY

dlib/dnn.h
@@ -11,6 +11,7 @@
#include "dnn/solvers.h"
#include "dnn/trainer.h"
#include "dnn/cpu_dlib.h"
#include "dnn/tensor_tools.h"
#endif // DLIB_DNn_

dlib/dnn/cpu_dlib.h
@@ -91,6 +91,9 @@ namespace dlib
}
}
#ifdef NO_MAKEFILE
#include "cpu_dlib.cpp"
#endif
#endif // DLIB_DNN_CPU_H_

dlib/dnn/tensor_tools.cpp
// Copyright (C) 2015 Davis E. King (davis@dlib.net)
// License: Boost Software License See LICENSE.txt for the full license.
#ifndef DLIB_TeNSOR_TOOLS_CPP_
#define DLIB_TeNSOR_TOOLS_CPP_
#include "tensor_tools.h"
#include "cpu_dlib.h"
namespace dlib { namespace tt
{
// ----------------------------------------------------------------------------------------
void gemm (
float beta,
tensor& dest,
float alpha,
const tensor& lhs,
bool trans_lhs,
const tensor& rhs,
bool trans_rhs
)
{
#ifdef DLIB_USE_CUDA
cuda::gemm(beta, dest, alpha, lhs, trans_lhs, rhs, trans_rhs);
#else
if (trans_lhs && trans_rhs)
dest = alpha*trans(mat(lhs))*trans(mat(rhs)) + beta*mat(dest);
else if (!trans_lhs && trans_rhs)
dest = alpha*mat(lhs)*trans(mat(rhs)) + beta*mat(dest);
else if (trans_lhs && !trans_rhs)
dest = alpha*trans(mat(lhs))*mat(rhs) + beta*mat(dest);
else
dest = alpha*mat(lhs)*mat(rhs) + beta*mat(dest);
#endif
}
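// A minimal usage sketch (illustrative only, not part of this commit): with
// trans_lhs and trans_rhs both false, gemm() computes
// dest = alpha*lhs*rhs + beta*dest, so an ordinary matrix product looks like:
//
//     resizable_tensor lhs(2,3), rhs(3,4), dest(2,4);
//     tensor_rand rnd;
//     rnd.fill_uniform(lhs);
//     rnd.fill_uniform(rhs);
//     gemm(0, dest, 1, lhs, false, rhs, false);
//     // now mat(dest) == mat(lhs)*mat(rhs)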
// ----------------------------------------------------------------------------------------
// ----------------------------------------------------------------------------------------
tensor_rand::
tensor_rand(
unsigned long long seed
)
{
// TODO: use the given seed to initialize the underlying random number generator.
}
void tensor_rand::
fill_gaussian (
tensor& data,
float mean,
float stddev
)
{
// The even-size requirement comes from the curand based implementation.
DLIB_CASSERT(data.size()%2 == 0,"");
#ifdef DLIB_USE_CUDA
rnd.fill_gaussian(data, mean, stddev);
#else
for (auto& x : data)
x = rnd.get_random_gaussian()*stddev + mean;
#endif
}
void tensor_rand::
fill_uniform (
tensor& data
)
{
#ifdef DLIB_USE_CUDA
rnd.fill_uniform(data);
#else
for (auto& x : data)
x = rnd.get_random_float();
#endif
}
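// Usage sketch (illustrative only, not part of this commit):
//
//     tensor_rand rnd(1234);         // or tensor_rand rnd; to seed with 0
//     resizable_tensor t(4,10);
//     rnd.fill_gaussian(t, 0, 1);    // note: t.size() must be even
//     rnd.fill_uniform(t);           // values fall in (0.0, 1.0]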
// ----------------------------------------------------------------------------------------
// ----------------------------------------------------------------------------------------
void multiply (
tensor& dest,
const tensor& src
)
{
DLIB_CASSERT(have_same_dimensions(dest,src),"");
#ifdef DLIB_USE_CUDA
cuda::multiply(dest, src);
#else
cpu::multiply(dest, src);
#endif
}
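// Sketch of the intended semantics (stated here for exposition, not quoted
// from this commit's spec): multiply() performs a pointwise product over two
// tensors of identical dimensions, i.e. dest(i) = dest(i)*src(i) for every
// element index i.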
// ----------------------------------------------------------------------------------------
void affine_transform(
resizable_tensor& dest,
const tensor& src,
const float A,
const float B
)
{
#ifdef DLIB_USE_CUDA
cuda::affine_transform(dest,src,A,B);
#else
cpu::affine_transform(dest,src,A,B);
#endif
}
// ----------------------------------------------------------------------------------------
void affine_transform(
resizable_tensor& dest,
const tensor& src,
const tensor& A,
const tensor& B
)
{
#ifdef DLIB_USE_CUDA
cuda::affine_transform(dest,src,A,B);
#else
cpu::affine_transform(dest,src,A,B);
#endif
}
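// Both overloads apply a pointwise linear map.  An illustrative sketch of the
// scalar version (the names below are only for exposition):
//
//     resizable_tensor dest, src(2,5);
//     tensor_rand rnd;
//     rnd.fill_uniform(src);
//     affine_transform(dest, src, 2.0f, 1.0f);
//     // each element of dest is now 2*src + 1
//
// The second overload takes the A and B coefficients per element from tensors
// instead of using a single pair of scalars.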
// ----------------------------------------------------------------------------------------
void batch_normalize (
resizable_tensor& dest,
resizable_tensor& means,
resizable_tensor& vars,
const tensor& src,
const tensor& gamma,
const tensor& beta
)
{
#ifdef DLIB_USE_CUDA
cuda::batch_normalize(dest,means,vars,src,gamma,beta);
#else
cpu::batch_normalize(dest,means,vars,src,gamma,beta);
#endif
}
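// In sketch form (standard batch normalization, stated for exposition; eps
// denotes a small constant added for numerical stability), for each sample i
// and element position k:
//
//     means(k)  = average over i of src(i,k)
//     vars(k)   = variance over i of src(i,k)
//     dest(i,k) = gamma(k)*(src(i,k) - means(k))/sqrt(vars(k) + eps) + beta(k)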
// ----------------------------------------------------------------------------------------
void batch_normalize_gradient (
const tensor& gradient_input,
const tensor& means,
const tensor& vars,
const tensor& src,
const tensor& gamma,
tensor& src_grad,
tensor& gamma_grad,
tensor& beta_grad
)
{
#ifdef DLIB_USE_CUDA
cuda::batch_normalize_gradient(gradient_input,means,vars,src,gamma,
src_grad,gamma_grad,beta_grad);
#else
cpu::batch_normalize_gradient(gradient_input,means,vars,src,gamma,
src_grad,gamma_grad,beta_grad);
#endif
}
// ----------------------------------------------------------------------------------------
void batch_normalize_conv (
resizable_tensor& dest,
resizable_tensor& means,
resizable_tensor& vars,
const tensor& src,
const tensor& gamma,
const tensor& beta
)
{
#ifdef DLIB_USE_CUDA
cuda::batch_normalize_conv(dest,means,vars,src,gamma,beta);
#else
cpu::batch_normalize_conv(dest,means,vars,src,gamma,beta);
#endif
}
// ----------------------------------------------------------------------------------------
void batch_normalize_conv_gradient (
const tensor& gradient_input,
const tensor& means,
const tensor& vars,
const tensor& src,
const tensor& gamma,
tensor& src_grad,
tensor& gamma_grad,
tensor& beta_grad
)
{
#ifdef DLIB_USE_CUDA
cuda::batch_normalize_conv_gradient(gradient_input,means,vars,src,gamma,
src_grad,gamma_grad,beta_grad);
#else
cpu::batch_normalize_conv_gradient(gradient_input,means,vars,src,gamma,
src_grad,gamma_grad,beta_grad);
#endif
}
// ----------------------------------------------------------------------------------------
void threshold (
tensor& data,
float thresh
)
{
#ifdef DLIB_USE_CUDA
cuda::threshold(data,thresh);
#else
cpu::threshold(data,thresh);
#endif
}
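// Illustrative example (not quoted from this commit's spec): threshold()
// binarizes data in place, setting each element to 1 if it is above thresh
// and to 0 otherwise.  Applied to the values {-1.0, 0.2, 0.7} with
// thresh == 0.5, data becomes {0, 0, 1}.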
// ----------------------------------------------------------------------------------------
void add(
float beta,
tensor& dest,
float alpha,
const tensor& src
)
{
#ifdef DLIB_USE_CUDA
cuda::add(beta,dest,alpha,src);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
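// Sketch of the intended semantics (only the CUDA path exists at this point):
// add() computes dest = beta*dest + alpha*src, following the same beta/alpha
// convention as gemm() above.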
// ----------------------------------------------------------------------------------------
void add_conv_bias_gradient (
tensor& grad,
const tensor& gradient_input
)
{
#ifdef DLIB_USE_CUDA
cuda::add_conv_bias_gradient(grad,gradient_input);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
// ----------------------------------------------------------------------------------------
// ----------------------------------------------------------------------------------------
tensor_conv::
tensor_conv()
{
}
void tensor_conv::
clear(
)
{
#ifdef DLIB_USE_CUDA
impl.clear();
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
void tensor_conv::
setup(
const tensor& data,
const tensor& filters,
int stride_y,
int stride_x
)
{
#ifdef DLIB_USE_CUDA
impl.setup(data, filters, stride_y, stride_x);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
void tensor_conv::
operator() (
resizable_tensor& output,
const tensor& data,
const tensor& filters
)
{
#ifdef DLIB_USE_CUDA
impl(output, data, filters);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
void tensor_conv::
get_gradient_for_data (
const tensor& gradient_input,
const tensor& filters,
tensor& data_gradient
)
{
#ifdef DLIB_USE_CUDA
impl.get_gradient_for_data(gradient_input, filters, data_gradient);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
void tensor_conv::
get_gradient_for_filters (
const tensor& gradient_input,
const tensor& data,
tensor& filters_gradient
)
{
#ifdef DLIB_USE_CUDA
impl.get_gradient_for_filters(gradient_input, data, filters_gradient);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
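// A usage sketch for tensor_conv (illustrative only; at this point in the
// commit only the CUDA implementation is wired up):
//
//     tensor_conv conv;
//     resizable_tensor data(10, 3, 28, 28);     // 10 samples of 3x28x28
//     resizable_tensor filters(16, 3, 5, 5);    // 16 filters of size 3x5x5
//     conv.setup(data, filters, 1, 1);          // stride_y == stride_x == 1
//     resizable_tensor output;
//     conv(output, data, filters);              // output is 10x16x24x24, assuming no padding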
// ----------------------------------------------------------------------------------------
// ----------------------------------------------------------------------------------------
max_pool::
max_pool (
)
{
}
void max_pool::
clear(
)
{
#ifdef DLIB_USE_CUDA
impl.clear();
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
void max_pool::
setup(
int window_height,
int window_width,
int stride_y,
int stride_x
)
{
#ifdef DLIB_USE_CUDA
impl.setup(window_height, window_width, stride_y, stride_x);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
void max_pool::
operator() (
resizable_tensor& dest,
const tensor& src
)
{
#ifdef DLIB_USE_CUDA
impl(dest, src);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
void max_pool::
get_gradient(
const tensor& gradient_input,
const tensor& dest,
const tensor& src,
tensor& grad
)
{
#ifdef DLIB_USE_CUDA
impl.get_gradient(gradient_input, dest, src, grad);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
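// A usage sketch for max_pool (illustrative only; as with tensor_conv, only
// the CUDA path is implemented here):
//
//     max_pool mp;
//     mp.setup(2, 2, 2, 2);                // 2x2 windows with stride 2
//     resizable_tensor dest, src(10, 3, 28, 28);
//     mp(dest, src);                       // dest becomes 10x3x14x14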
// ----------------------------------------------------------------------------------------
// ----------------------------------------------------------------------------------------
void softmax (
resizable_tensor& dest,
const tensor& src
)
{
#ifdef DLIB_USE_CUDA
cuda::softmax(dest,src);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
void softmax_gradient (
tensor& grad,
const tensor& softmaxed_data,
const tensor& gradient_input
)
{
#ifdef DLIB_USE_CUDA
cuda::softmax_gradient(grad, softmaxed_data, gradient_input);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
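// Sketch of the standard definition (for exposition): softmax() computes, for
// each sample and each spatial location, dest = exp(src)/sum(exp(src)) with
// the sum running over the k channels.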
// ----------------------------------------------------------------------------------------
void sigmoid (
resizable_tensor& dest,
const tensor& src
)
{
#ifdef DLIB_USE_CUDA
cuda::sigmoid(dest,src);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
void sigmoid_gradient (
tensor& grad,
const tensor& dest,
const tensor& src,
const tensor& gradient_input
)
{
#ifdef DLIB_USE_CUDA
cuda::sigmoid_gradient(grad, dest, src, gradient_input);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
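// For reference (standard definitions, not quoted from this commit):
// sigmoid() computes dest(i) = 1/(1 + exp(-src(i))), and since the derivative
// of the sigmoid at a point with output d is d*(1 - d), sigmoid_gradient()
// scales gradient_input accordingly.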
// ----------------------------------------------------------------------------------------
void relu (
resizable_tensor& dest,
const tensor& src
)
{
#ifdef DLIB_USE_CUDA
cuda::relu(dest,src);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
void relu_gradient (
tensor& grad,
const tensor& dest,
const tensor& src,
const tensor& gradient_input
)
{
#ifdef DLIB_USE_CUDA
cuda::relu_gradient(grad, dest, src, gradient_input);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
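// For reference (standard definitions): relu() computes
// dest(i) = max(0, src(i)), and relu_gradient() passes gradient_input(i)
// through to grad(i) wherever dest(i) > 0 and contributes 0 elsewhere.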
// ----------------------------------------------------------------------------------------
void tanh (
resizable_tensor& dest,
const tensor& src
)
{
#ifdef DLIB_USE_CUDA
cuda::tanh(dest,src);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
void tanh_gradient (
tensor& grad,
const tensor& dest,
const tensor& src,
const tensor& gradient_input
)
{
#ifdef DLIB_USE_CUDA
cuda::tanh_gradient(grad, dest, src, gradient_input);
#else
// TODO
DLIB_CASSERT(false,"");
#endif
}
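// For reference (standard definition): tanh() applies the hyperbolic tangent
// pointwise, and since d/dx tanh(x) = 1 - tanh(x)^2, tanh_gradient() scales
// gradient_input by (1 - dest*dest).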
// ----------------------------------------------------------------------------------------
}}
#endif // DLIB_TeNSOR_TOOLS_CPP_

dlib/dnn/tensor_tools.h
@@ -4,8 +4,12 @@
#define DLIB_TeNSOR_TOOLS_H_
#include "tensor.h"
#include "cudnn_dlibapi.h"
#include "cublas_dlibapi.h"
#include "curand_dlibapi.h"
#include "../rand.h"
-namespace dlib
+namespace dlib { namespace tt
{
// ----------------------------------------------------------------------------------------
@@ -37,7 +41,51 @@ namespace dlib
class tensor_rand
{
/*!
WHAT THIS OBJECT REPRESENTS
This is a tool for filling a tensor with random numbers.
Note that the sequence of random numbers output by this object is different
when dlib is compiled with DLIB_USE_CUDA. So you should not write code
that depends on any specific sequence of numbers coming out of a
tensor_rand.
!*/
public:
// not copyable
tensor_rand(const tensor_rand&) = delete;
tensor_rand& operator=(const tensor_rand&) = delete;
tensor_rand() : tensor_rand(0) {}
tensor_rand(unsigned long long seed);
void fill_gaussian (
tensor& data,
float mean,
float stddev
);
/*!
requires
- data.size()%2 == 0
ensures
- Fills data with random numbers drawn from a Gaussian distribution
with the given mean and standard deviation.
!*/
void fill_uniform (
tensor& data
);
/*!
ensures
- Fills data with uniform random numbers in the range (0.0, 1.0].
!*/
#ifdef DLIB_USE_CUDA
cuda::curand_generator rnd;
#else
dlib::rand rnd;
#endif
};
// ----------------------------------------------------------------------------------------
@@ -278,13 +326,13 @@ namespace dlib
// ----------------------------------------------------------------------------------------
-class conv
+class tensor_conv
{
public:
-conv(const conv&) = delete;
-conv& operator=(const conv&) = delete;
+tensor_conv(const tensor_conv&) = delete;
+tensor_conv& operator=(const tensor_conv&) = delete;
-conv();
+tensor_conv();
void clear(
);
@@ -302,9 +350,6 @@ namespace dlib
- stride_x > 0
!*/
-~conv (
-);
void operator() (
resizable_tensor& output,
const tensor& data,
@@ -362,6 +407,11 @@ namespace dlib
!*/
private:
#ifdef DLIB_USE_CUDA
cuda::tensor_conv impl;
#else
// TODO
#endif
};
@@ -379,9 +429,6 @@ namespace dlib
max_pool (
);
-~max_pool(
-);
void clear(
);
@@ -429,6 +476,11 @@ namespace dlib
!*/
private:
#ifdef DLIB_USE_CUDA
cuda::max_pool impl;
#else
// TODO
#endif
};
// ----------------------------------------------------------------------------------------
@@ -564,8 +616,11 @@ namespace dlib
// ----------------------------------------------------------------------------------------
}
-}
+}}
#ifdef NO_MAKEFILE
#include "tensor_tools.cpp"
#endif
#endif // DLIB_TeNSOR_TOOLS_H_