mi-neural-nets/a00091_source.html

 #ifndef SRC_MLNN_POOLING_HPP_

 #define SRC_MLNN_POOLING_HPP_


 #include <mlnn/layer/Layer.hpp>


 namespace mic {

 namespace mlnn {

 namespace convolution {


 /*!
  * \brief Layer performing max pooling over non-overlapping square windows.
  *
  * Each input channel is divided into windows of window_size x window_size
  * elements (stride equal to the window size). For every window the maximum
  * value is copied to the output and the flat address of the winning input
  * element is remembered in the "pooling_map" memory array, so that backward()
  * can route the gradient back to exactly that element.
  *
  * Output height/width are computed with integer division
  * (input / window_size); when an input dimension is not a multiple of the
  * window size, the trailing rows/columns that do not fill a whole window are
  * ignored.
  *
  * \tparam eT Element type of the matrices (float by default).
  */
 template <typename eT=float>
 class MaxPooling : public mic::mlnn::Layer<eT> {
 public:

     /*!
      * \brief Creates the pooling layer.
      * \param input_height_ Height of a single input channel.
      * \param input_width_ Width of a single input channel.
      * \param depth_ Number of channels (the same for input and output).
      * \param window_size_ Edge length of the square pooling window.
      *        NOTE(review): must be non-zero - it is used as a divisor below.
      * \param name_ Name of the layer.
      */
     MaxPooling(size_t input_height_, size_t input_width_, size_t depth_,
             size_t window_size_,
             std::string name_ = "MaxPooling") :
         Layer<eT>(input_height_, input_width_, depth_,
                 (input_height_ / window_size_), (input_width_ / window_size_), depth_,
                 LayerTypes::MaxPooling, name_),
                 window_size(window_size_)
     {
         // Mapping from output to input - every cell will contain the flat address
         // of the input element that was selected as the maximum.
         m.add("pooling_map", Layer<eT>::outputSize(), 1);
     }

     /*!
      * \brief Virtual destructor - empty.
      */
     virtual ~MaxPooling() {}

     /*!
      * \brief Resizes the layer buffers (including the pooling map) to a new batch size.
      * \param batch_size_ New size of the (mini)batch.
      */
     virtual void resizeBatch(size_t batch_size_) {
         // Call base Layer resize.
         Layer<eT>::resizeBatch(batch_size_);

         // Reshape the pooling map: one column per sample in the batch.
         m["pooling_map"]->resize(Layer<eT>::outputSize(), batch_size_);
     }

     /*!
      * \brief Forward pass: reads s['x'], writes the window maxima to s['y']
      *        and fills the pooling map.
      * \param test_ Not used by this layer.
      */
     void forward(bool test_ = false) {
         LOG(LTRACE) << "MaxPooling::forward\n";

         // Get pointer to input batch.
         mic::types::MatrixPtr<eT> batch_x = s['x'];

         // Get pointer to output batch and reset it.
         mic::types::MatrixPtr<eT> batch_y = s['y'];
         batch_y->setZero();

         // Get pointer to the output->input address map and reset it.
         mic::types::MatrixPtr<eT> pooling_map = m["pooling_map"];
         pooling_map->setZero();

         // TODO: should work for more channels - but requires testing!
         //assert(input_depth == 1);

         // The batch loop is distributed between OpenMP threads. Notes kept from the
         // original author on why this is considered safe:
         // * pooling map is shared, but every (sample, channel, window) writes a different address,
         // * temporary buffers returned by the lazyReturn* helpers are said to be OMP-secured
         //   (NOTE(review): not verifiable from this file),
         // * the per-window work is additionally serialized by the critical section below.
         #pragma omp parallel for
         for (size_t ib = 0; ib < batch_size; ib++) {
             // Get input sample from batch.
             mic::types::MatrixPtr<eT> xs = lazyReturnInputSample(batch_x, ib);

             // Iterate through input/output channels.
             for (size_t ic = 0; ic < input_depth; ic++) {
                 // Get input channel from input sample.
                 mic::types::MatrixPtr<eT> xc = lazyReturnInputChannel(xs, ib, ic);

                 // Iterate through the OUTPUT cells and derive the window origin from them.
                 // Bounding the loops by the output dimensions guarantees that every window
                 // lies fully inside the input channel and that the output address stays in
                 // range, also when the input size is not a multiple of window_size.
                 for (size_t oh = 0; oh < output_height; oh++) {
                     const size_t ih = oh * window_size;

                     for (size_t ow = 0; ow < output_width; ow++) {
                         const size_t iw = ow * window_size;

                         #pragma omp critical
                         {
                             // Get value and location (relative to the window) of the max element.
                             size_t maxRow, maxCol;
                             eT max_val = xc->block(ih, iw, window_size, window_size).maxCoeff(&maxRow, &maxCol);

                             // Calculate "absolute" addresses within the whole batch:
                             // sample offset + channel offset + column * height + row.
                             size_t ia = (ib * Layer<eT>::inputSize()) + ic * input_height * input_width + (iw + maxCol) * input_height + (ih + maxRow);
                             size_t oa = (ib * Layer<eT>::outputSize()) + ic * output_height * output_width + (ow) * output_height + (oh);

                             // Map output to input.
                             // NOTE(review): the address is stored as eT; for eT=float integers are
                             // exactly representable only up to 2^24 - confirm batches stay below that.
                             (*pooling_map)[oa] = ia;

                             // Copy value to output.
                             (*batch_y)[oa] = max_val;
                         }

                     }//: for width
                 }//: for height
             }//: for channels
         }//: for batch

         LOG(LTRACE) << "MaxPooling::forward end\n";
     }

     /*!
      * \brief Backward pass: zeroes g['x'] and copies every element of g['y']
      *        to the input address stored in the pooling map by forward().
      */
     void backward() {
         LOG(LTRACE) << "MaxPooling::backward\n";

         // Get pointer to dy batch.
         mic::types::MatrixPtr<eT> batch_dy = g['y'];

         // Get pointer to dx batch - elements that were not selected as maxima keep zero gradient.
         mic::types::MatrixPtr<eT> batch_dx = g['x'];
         batch_dx->setZero();

         mic::types::MatrixPtr<eT> pooling_map = m["pooling_map"];

         // Total number of output elements in the whole batch (loop invariant).
         const size_t total_outputs = batch_size * Layer<eT>::outputSize();

         // Iterate through all outputs of the batch.
         #pragma omp parallel for
         for (size_t oi = 0; oi < total_outputs; oi++) {
             // Map outputs to inputs: the map holds the input address stored as eT.
             (*batch_dx)[static_cast<size_t>((*pooling_map)[oi])] = (*batch_dy)[oi];
         }//: for outputs

         LOG(LTRACE) << "MaxPooling::backward end\n";
     }

     /*!
      * \brief Does nothing - the body is empty.
      * \param alpha_ Not used.
      * \param decay_ Not used.
      */
     void update(eT alpha_, eT decay_  = 0.0f) { }

     // Unhide the overloaded methods inherited from the template class Layer via "using" statement.
     using Layer<eT>::forward;
     using Layer<eT>::backward;

 protected:
     // Unhide the fields inherited from the template class Layer via "using" statement.
     using Layer<eT>::g;
     using Layer<eT>::s;
     using Layer<eT>::p;
     using Layer<eT>::m;

     // Uncover "sizes" for visualization.
     using Layer<eT>::input_height;
     using Layer<eT>::input_width;
     using Layer<eT>::input_depth;
     using Layer<eT>::output_height;
     using Layer<eT>::output_width;
     using Layer<eT>::output_depth;
     using Layer<eT>::batch_size;

     using Layer<eT>::lazyReturnInputSample;
     using Layer<eT>::lazyReturnOutputSample;
     using Layer<eT>::lazyReturnInputChannel;
     using Layer<eT>::lazyReturnOutputChannel;

     /// Edge length of the square pooling window (also used as the stride).
     size_t window_size;

 private:
     // Friend class - required for using boost serialization.
     template<typename tmp> friend class mic::mlnn::MultiLayerNeuralNetwork;

     /*!
      * \brief Private default constructor, accessible to the befriended
      *        MultiLayerNeuralNetwork. Initializes window_size to 0 so that
      *        the field never holds an indeterminate value.
      */
     MaxPooling() : Layer<eT> (), window_size(0) { }

 };


 } /* namespace convolution */

 } /* namespace mlnn */

 } /* namespace mic */


 #endif /* SRC_MLNN_POOLING_HPP_ */

mic::mlnn::Layer::inputSize
size_t inputSize()
Returns size (length) of inputs.
Definition: Layer.hpp:255

mic::mlnn::Layer::lazyReturnInputChannel
mic::types::MatrixPtr< eT > lazyReturnInputChannel(mic::types::MatrixPtr< eT > sample_ptr_, size_t sample_number_, size_t channel_number_)
Definition: Layer.hpp:519

mic::mlnn::convolution::MaxPooling
Layer performing max pooling.
Definition: MaxPooling.hpp:39

mic::mlnn::Layer::input_depth
size_t input_depth
Number of channels of the input (e.g. 3 for RGB images).
Definition: Layer.hpp:732

mic::mlnn::convolution::MaxPooling::update
void update(eT alpha_, eT decay_=0.0f)
Definition: MaxPooling.hpp:183

mic::mlnn::Layer::batch_size
size_t batch_size
Size (length) of (mini)batch.
Definition: Layer.hpp:744

mic::mlnn::Layer::outputSize
size_t outputSize()
Returns size (length) of outputs.
Definition: Layer.hpp:260

mic::mlnn::convolution::MaxPooling::forward
void forward(bool test_=false)
Definition: MaxPooling.hpp:82

mic::mlnn::convolution::MaxPooling::window_size
size_t window_size
Definition: MaxPooling.hpp:213

mic::mlnn::Layer::resizeBatch
virtual void resizeBatch(size_t batch_size_)
Definition: Layer.hpp:199

mic::mlnn::Layer::input_height
size_t input_height
Height of the input (e.g. 28 for MNIST).
Definition: Layer.hpp:726

mic::mlnn::MultiLayerNeuralNetwork
Class representing a multi-layer neural network.
Definition: Layer.hpp:86

mic::mlnn::LayerTypes
LayerTypes
Enumeration of possible layer types.
Definition: Layer.hpp:58

mic::mlnn::Layer::s
mic::types::MatrixArray< eT > s
States - contains input [x] and output [y] matrices.
Definition: Layer.hpp:753

mic::mlnn::Layer::g
mic::types::MatrixArray< eT > g
Gradients - contains input [x] and output [y] matrices.
Definition: Layer.hpp:756

mic::mlnn::convolution::MaxPooling::backward
void backward()
Definition: MaxPooling.hpp:152

mic::mlnn::convolution::MaxPooling::resizeBatch
virtual void resizeBatch(size_t batch_size_)
Definition: MaxPooling.hpp:72

mic::mlnn::Layer::lazyReturnInputSample
mic::types::MatrixPtr< eT > lazyReturnInputSample(mic::types::MatrixPtr< eT > batch_ptr_, size_t sample_number_)
Definition: Layer.hpp:460

mic::mlnn::convolution::MaxPooling::~MaxPooling
virtual ~MaxPooling()
Definition: MaxPooling.hpp:66

mic::mlnn::Layer::input_width
size_t input_width
Width of the input (e.g. 28 for MNIST).
Definition: Layer.hpp:729

mic::mlnn::Layer::output_height
size_t output_height
Number of receptive fields in a single channel - vertical direction.
Definition: Layer.hpp:735

mic::mlnn::Layer
Definition: Layer.hpp:94

mic::mlnn::convolution::MaxPooling::MaxPooling
MaxPooling(size_t input_height_, size_t input_width_, size_t depth_, size_t window_size_, std::string name_="MaxPooling")
Definition: MaxPooling.hpp:51

mic::mlnn::Layer::output_width
size_t output_width
Number of receptive fields in a single channel - horizontal direction.
Definition: Layer.hpp:738

Layer.hpp
Contains a template class representing a layer.

mic::mlnn::Layer::m
mic::types::MatrixArray< eT > m
Memory - a list of temporary parameters, to be used by the derived classes.
Definition: Layer.hpp:762