mirror of https://github.com/davisking/dlib.git
Moved log1pexp() and randomize_parameters() from core.h into utilities.h
parent 6578c1b574
commit 172647f87c
@@ -112,23 +112,6 @@ namespace dlib
         }
     }
 
-// ----------------------------------------------------------------------------------------
-
-    inline double log1pexp(double x)
-    {
-        using std::exp;
-        using namespace std; // Do this instead of using std::log1p because some compilers
-                             // error out otherwise (E.g. gcc 4.9 in cygwin)
-        if (x <= -37)
-            return exp(x);
-        else if (-37 < x && x <= 18)
-            return log1p(exp(x));
-        else if (18 < x && x <= 33.3)
-            return x + exp(-x);
-        else
-            return x;
-    }
-
 // ----------------------------------------------------------------------------------------
 
     // Tell us if T is one of the special layer types (i.e. add_layer, repeat, add_tag_layer, or
@@ -442,24 +425,6 @@ namespace dlib
         {
             return item;
         }
-
-// ----------------------------------------------------------------------------------------
-
-    inline void randomize_parameters (
-        tensor& params,
-        unsigned long num_inputs_and_outputs,
-        dlib::rand& rnd
-    )
-    {
-        for (auto& val : params)
-        {
-            // Draw a random number to initialize the layer according to formula (16)
-            // from Understanding the difficulty of training deep feedforward neural
-            // networks by Xavier Glorot and Yoshua Bengio.
-            val = 2*rnd.get_random_float()-1;
-            val *= std::sqrt(6.0/(num_inputs_and_outputs));
-        }
-    }
-
 // ----------------------------------------------------------------------------------------
 
     template <typename T>
@@ -16,23 +16,6 @@ namespace dlib
 
 // ----------------------------------------------------------------------------------------
 
-    void randomize_parameters (
-        tensor& params,
-        unsigned long num_inputs_and_outputs,
-        dlib::rand& rnd
-    );
-    /*!
-        ensures
-            - This function assigns random values into params based on the given random
-              number generator. In particular, it uses the parameter initialization method
-              of formula 16 from the paper "Understanding the difficulty of training deep
-              feedforward neural networks" by Xavier Glorot and Yoshua Bengio.
-            - It is assumed that the total number of inputs and outputs from the layer is
-              num_inputs_and_outputs. That is, you should set num_inputs_and_outputs to
-              the sum of the dimensionalities of the vectors going into and out of the
-              layer that uses params as its parameters.
-    !*/
-
     template <
        typename... T
        >
@@ -58,15 +41,6 @@ namespace dlib
             a non-std::tuple object is found.
     !*/
 
-    double log1pexp(
-        double x
-    );
-    /*!
-        ensures
-            - returns log(1+exp(x))
-              (except computes it using a numerically accurate method)
-    !*/
-
 // ----------------------------------------------------------------------------------------
 
     template <typename T>
@@ -12,6 +12,7 @@
 #include "../string.h"
 #include "tensor_tools.h"
 #include "../vectorstream.h"
+#include "utilities.h"
 
 
 namespace dlib
@@ -9,6 +9,41 @@
 namespace dlib
 {
 
+// ----------------------------------------------------------------------------------------
+
+    inline double log1pexp(double x)
+    {
+        using std::exp;
+        using namespace std; // Do this instead of using std::log1p because some compilers
+                             // error out otherwise (E.g. gcc 4.9 in cygwin)
+        if (x <= -37)
+            return exp(x);
+        else if (-37 < x && x <= 18)
+            return log1p(exp(x));
+        else if (18 < x && x <= 33.3)
+            return x + exp(-x);
+        else
+            return x;
+    }
+
+// ----------------------------------------------------------------------------------------
+
+    inline void randomize_parameters (
+        tensor& params,
+        unsigned long num_inputs_and_outputs,
+        dlib::rand& rnd
+    )
+    {
+        for (auto& val : params)
+        {
+            // Draw a random number to initialize the layer according to formula (16)
+            // from Understanding the difficulty of training deep feedforward neural
+            // networks by Xavier Glorot and Yoshua Bengio.
+            val = 2*rnd.get_random_float()-1;
+            val *= std::sqrt(6.0/(num_inputs_and_outputs));
+        }
+    }
+
 // ----------------------------------------------------------------------------------------
 
     namespace impl
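The branches in the log1pexp() definition added above are the standard numerically stable evaluation of log(1+exp(x)): for x <= -37 the result equals exp(x) to double precision; for moderate x, log1p(exp(x)) is safe to compute directly; for 18 < x <= 33.3 the identity log(1+exp(x)) = x + log(1+exp(-x)) ~= x + exp(-x) avoids overflowing exp(x); and past 33.3, exp(-x) no longer affects the result at double precision. Below is a minimal standalone sketch (plain C++ with the same thresholds; it is not part of this commit and does not use the dlib headers) contrasting the stable form with the naive formula:

#include <cmath>
#include <cstdio>

static double log1pexp(double x)
{
    if (x <= -37)
        return std::exp(x);              // log(1+exp(x)) == exp(x) to double precision
    else if (x <= 18)
        return std::log1p(std::exp(x));  // exp(x) is small enough to compute directly
    else if (x <= 33.3)
        return x + std::exp(-x);         // log(1+exp(x)) = x + log(1+exp(-x)) ~= x + exp(-x)
    else
        return x;                        // exp(-x) is negligible relative to x
}

int main()
{
    const double xs[] = {-40.0, 0.0, 20.0, 800.0};
    for (double x : xs)
    {
        // The naive form rounds 1+exp(-40) to exactly 1 (giving 0) and
        // overflows exp(800) to inf; the stable form does neither.
        const double naive = std::log(1 + std::exp(x));
        std::printf("x = %6.1f   naive = %-12g   stable = %g\n", x, naive, log1pexp(x));
    }
    return 0;
}

On a typical IEEE-754 machine the naive form prints 0 for x = -40 (the true value is about 4.25e-18) and inf for x = 800, while the stable form returns 4.25e-18 and 800.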
@@ -8,6 +8,36 @@
 namespace dlib
 {
 
+// ----------------------------------------------------------------------------------------
+
+    double log1pexp(
+        double x
+    );
+    /*!
+        ensures
+            - returns log(1+exp(x))
+              (except computes it using a numerically accurate method)
+    !*/
+
+// ----------------------------------------------------------------------------------------
+
+    void randomize_parameters (
+        tensor& params,
+        unsigned long num_inputs_and_outputs,
+        dlib::rand& rnd
+    );
+    /*!
+        ensures
+            - This function assigns random values into params based on the given random
+              number generator. In particular, it uses the parameter initialization method
+              of formula 16 from the paper "Understanding the difficulty of training deep
+              feedforward neural networks" by Xavier Glorot and Yoshua Bengio.
+            - It is assumed that the total number of inputs and outputs from the layer is
+              num_inputs_and_outputs. That is, you should set num_inputs_and_outputs to
+              the sum of the dimensionalities of the vectors going into and out of the
+              layer that uses params as its parameters.
+    !*/
+
 // ----------------------------------------------------------------------------------------
 
     template <typename net_type>
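The randomize_parameters() contract above is the Glorot/Xavier uniform initialization: with n = num_inputs_and_outputs (fan-in plus fan-out), each parameter is drawn from the uniform interval [-sqrt(6/n), +sqrt(6/n)], which is formula 16 of the cited paper. A minimal standalone sketch of the same scheme follows, with std::mt19937 standing in for dlib::rand and std::vector<float> standing in for tensor (both stand-ins are illustrative assumptions, not the dlib API):

#include <algorithm>
#include <cmath>
#include <cstdio>
#include <random>
#include <vector>

// Same arithmetic as the definition added in this commit: map a uniform
// [0,1) draw onto [-1,1) via 2*u-1, then scale by sqrt(6/n).
void randomize_parameters(std::vector<float>& params,
                          unsigned long num_inputs_and_outputs,
                          std::mt19937& rnd)
{
    std::uniform_real_distribution<float> u(0.f, 1.f);
    const float limit = std::sqrt(6.0/num_inputs_and_outputs);
    for (auto& val : params)
        val = (2*u(rnd) - 1)*limit;   // uniform on [-limit, +limit)
}

int main()
{
    // A fully connected layer with 100 inputs and 50 outputs passes
    // num_inputs_and_outputs = 100 + 50 = 150.
    std::vector<float> params(100*50);
    std::mt19937 rnd(0);
    randomize_parameters(params, 150, rnd);

    const auto mm = std::minmax_element(params.begin(), params.end());
    std::printf("limit = %g, observed range = [%g, %g]\n",
                std::sqrt(6.0/150), *mm.first, *mm.second);
    return 0;
}

Here sqrt(6/150) = 0.2, so every value lands in [-0.2, 0.2); keeping the interval proportional to 1/sqrt(fan_in + fan_out) keeps activation and gradient variances roughly constant across layers, which is the point of the Glorot scheme.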