mi-neural-nets/a00093_source.html

 #ifndef SRC_MLNN_SOFTMAX_HPP_

 #define SRC_MLNN_SOFTMAX_HPP_


 #include <mlnn/layer/Layer.hpp>


 namespace mic {

 namespace mlnn {

 namespace cost_function {


 /**
  * \brief Softmax activation function layer.
  *
  * The layer has identical input and output dimensions. For every column of
  * the input state s["x"] it writes the normalised exponentials of that column
  * into the output state s["y"].
  *
  * Three scratch matrices are kept in the layer memory `m`:
  *  - "e"   : exponentials of the (max-shifted) inputs,
  *  - "sum" : per-column sums of "e",
  *  - "max" : per-column maxima of the inputs.
  *
  * \tparam eT Element type used by the layer matrices (float by default).
  */
 template <typename eT=float>
 class Softmax : public mic::mlnn::Layer<eT> {
 public:

     /**
      * \brief Creates a softmax layer operating on a vector of the given size.
      *
      * Delegates to the (height, width, depth) constructor with width = depth = 1.
      *
      * \param size_ Number of inputs (and outputs).
      * \param name_ Name of the layer.
      */
     Softmax(size_t size_, std::string name_ = "Softmax") :
         Softmax(size_, 1, 1, name_)
     {
     }

     /**
      * \brief Creates a softmax layer whose output dimensions equal its input dimensions.
      *
      * \param height_ Height of the input (and output).
      * \param width_ Width of the input (and output).
      * \param depth_ Depth of the input (and output).
      * \param name_ Name of the layer.
      */
     Softmax(size_t height_, size_t width_, size_t depth_,
             std::string name_ = "Softmax") :
         Layer<eT>(height_, width_, depth_,
                 height_, width_, depth_,
                 LayerTypes::Softmax, name_)
     {
         // Register the scratch ("temporary") matrices, initially one column wide.
         m.add("e", Layer<eT>::inputSize(), 1);
         m.add("sum", 1, 1);
         m.add("max", 1, 1);
     }

     /// Virtual destructor - empty.
     virtual ~Softmax() { }

     /**
      * \brief Resizes the layer, including its scratch matrices, to a new batch size.
      *
      * \param batch_size_ New number of columns (samples in a batch).
      */
     virtual void resizeBatch(size_t batch_size_) {
         // Let the parent class resize whatever it manages.
         Layer<eT>::resizeBatch(batch_size_);

         // Keep the row counts of the scratch matrices, change only the column count.
         m["e"]->resize(m["e"]->rows(), batch_size_);
         m["sum"]->resize(m["sum"]->rows(), batch_size_);
         m["max"]->resize(m["max"]->rows(), batch_size_);
     }

     /**
      * \brief Forward pass: y = exp(x - max(x)) / sum(exp(x - max(x))), computed per column.
      *
      * Subtracting the column maximum before exponentiation prevents overflow
      * (see http://eric-yuan.me/softmax/) and does not change the result.
      *
      * \param test_ Not used by this layer.
      */
     void forward(bool test_ = false) {
         mic::types::MatrixPtr<eT> x = s["x"];
         mic::types::MatrixPtr<eT> y = s["y"];
         mic::types::MatrixPtr<eT> e = m["e"];
         mic::types::MatrixPtr<eT> max = m["max"];
         mic::types::MatrixPtr<eT> sum = m["sum"];

         const size_t rows = static_cast<size_t>(y->rows());
         const size_t cols = static_cast<size_t>(y->cols());

         // Per-column maxima, used to shift the inputs.
         (*max) = x->colwise().maxCoeff();

         // Exponentials of the shifted inputs.
         for (size_t j = 0; j < cols; j++) {
             const eT column_max = (*max)(j);
             for (size_t i = 0; i < rows; i++)
                 (*e)(i, j) = std::exp( (*x)(i, j) - column_max );
         }//: for

         // Per-column normalisation constants.
         (*sum) = e->colwise().sum();

         // Normalise every column so that it sums up to one.
         for (size_t j = 0; j < cols; j++) {
             const eT column_sum = (*sum)(j);
             for (size_t i = 0; i < rows; i++)
                 (*y)(i, j) = (*e)(i, j) / column_sum;
         }//: for
     }

     /**
      * \brief Backward pass: propagates the gradient g["y"] to g["x"].
      *
      * Every softmax output depends on every input of the same column, so the
      * Jacobian is dy_i/dx_k = y_i * (delta_ik - y_k). Multiplying it by the
      * incoming gradient gives, for each column:
      *
      *     dx_i = y_i * (dy_i - sum_k(dy_k * y_k))
      *
      * Using only the diagonal term y_i * (1 - y_i) would drop the coupling
      * between the outputs and yield a wrong gradient.
      *
      * NOTE(review): assumes g["x"] and g["y"] have the same shape as s["y"]
      * (the layer is constructed with equal input and output dimensions).
      */
     void backward() {
         mic::types::MatrixPtr<eT> y = s["y"];
         mic::types::MatrixPtr<eT> dx = g["x"];
         mic::types::MatrixPtr<eT> dy = g["y"];

         const size_t rows = static_cast<size_t>(y->rows());
         const size_t cols = static_cast<size_t>(y->cols());

         for (size_t j = 0; j < cols; j++) {
             // Inner product <dy, y> of the current column (sample).
             eT weighted = 0;
             for (size_t i = 0; i < rows; i++)
                 weighted += (*dy)(i, j) * (*y)(i, j);

             // Jacobian-vector product for the current column.
             for (size_t i = 0; i < rows; i++)
                 (*dx)(i, j) = (*y)(i, j) * ((*dy)(i, j) - weighted);
         }//: for
     }

     /**
      * \brief Parameter update - does nothing, as the body is empty.
      *
      * \param alpha_ Unused.
      * \param decay_ Unused.
      */
     virtual void update(eT alpha_, eT decay_  = 0.0f) { }

     // Unhide the overloaded methods inherited from the template class Layer via "using" statement.
     using Layer<eT>::forward;
     using Layer<eT>::backward;

 protected:
     // Unhide the fields inherited from the template class Layer via "using" statement.
     using Layer<eT>::g;
     using Layer<eT>::s;
     using Layer<eT>::m;

 private:
     // Friend class - required for using boost serialization.
     template<typename tmp> friend class mic::mlnn::MultiLayerNeuralNetwork;

     /// Private default constructor, accessible to the befriended network class.
     /// Declared with the injected class name: a template-id here is ill-formed since C++20.
     Softmax() : Layer<eT>() { }

 };


 } /* namespace cost_function */

 } /* namespace mlnn */

 } /* namespace mic */


 #endif /* SRC_MLNN_SOFTMAX_HPP_ */

mic::mlnn::cost_function::Softmax::Softmax
Softmax(size_t height_, size_t width_, size_t depth_, std::string name_="Softmax")
Definition: Softmax.hpp:60

mic::mlnn::cost_function::Softmax::resizeBatch
virtual void resizeBatch(size_t batch_size_)
Definition: Softmax.hpp:82

mic::mlnn::cost_function::Softmax::backward
void backward()
Definition: Softmax.hpp:124

mic::mlnn::Layer::resizeBatch
virtual void resizeBatch(size_t batch_size_)
Definition: Layer.hpp:199

mic::mlnn::cost_function::Softmax
Softmax activation function.
Definition: Softmax.hpp:38

mic::mlnn::MultiLayerNeuralNetwork
Class representing a multi-layer neural network.
Definition: Layer.hpp:86

mic::mlnn::LayerTypes
LayerTypes
Enumeration of possible layer types.
Definition: Layer.hpp:58

mic::mlnn::Layer::s
mic::types::MatrixArray< eT > s
States - contains input [x] and output [y] matrices.
Definition: Layer.hpp:753

mic::mlnn::Layer::g
mic::types::MatrixArray< eT > g
Gradients - contains input [x] and output [y] matrices.
Definition: Layer.hpp:756

mic::mlnn::cost_function::Softmax::forward
void forward(bool test_=false)
Definition: Softmax.hpp:94

mic::mlnn::Layer
Definition: Layer.hpp:94

mic::mlnn::cost_function::Softmax::Softmax
Softmax(size_t size_, std::string name_="Softmax")
Definition: Softmax.hpp:46

mic::mlnn::cost_function::Softmax::update
virtual void update(eT alpha_, eT decay_=0.0f)
Definition: Softmax.hpp:143

Layer.hpp
Contains a template class representing a layer.

mic::mlnn::Layer::m
mic::types::MatrixArray< eT > m
Memory - a list of temporary parameters, to be used by the derived classes.
Definition: Layer.hpp:762

mic::mlnn::cost_function::Softmax::~Softmax
virtual ~Softmax()
Definition: Softmax.hpp:76