// MachineIntelligenceCore:NeuralNets — mnist_simple_mlnn.cpp
// (Doxygen-generated source listing; see the project documentation for this file.)
1 
16 /*
17 * @Author: kmrocki/tkornuta
18 * @Date: 2016-02-24 09:43:05
19 */
20 
21 #include <logger/Log.hpp>
22 #include <logger/ConsoleOutput.hpp>
23 using namespace mic::logger;
24 
25 #include <iomanip>
26 
27 #include <importers/MNISTMatrixImporter.hpp>
28 #include <encoders/MatrixXfMatrixXfEncoder.hpp>
29 #include <encoders/UIntMatrixXfEncoder.hpp>
30 
32 
33 // Using multi layer neural networks
34 using namespace mic::mlnn;
35 using namespace mic::types;
36 
37 int main() {
38  // Task parameters.
39  size_t batch_size = 20;
40  size_t iterations = 60000/batch_size;
41 
42  // Set console output.
43  LOGGER->addOutput(new ConsoleOutput());
44 // LOGGER->setSeverityLevel(LTRACE);
45 
46  // Create a simple NN for classification (should give around 95.3% accuracy)
47  //MNIST - 28x28 -> 256 -> 100 -> 10
48  BackpropagationNeuralNetwork<float> nn("3layerReLUSofmax");
49  /*nn.pushLayer(new Linear<float>(28 * 28, 256));
50  nn.pushLayer(new ReLU<float>(256));
51  nn.pushLayer(new Linear<float>(256, 100));
52  nn.pushLayer(new ReLU<float>(100));
53  nn.pushLayer(new Linear<float>(100, 10));
54  nn.pushLayer(new Softmax<float>(10));
55  */
56  nn.pushLayer(new mic::mlnn::convolution::Convolution<float>(28, 28, 1, 20, 14, 7));
57  nn.pushLayer(new ReLU<float>(180));
58  nn.pushLayer(new Linear<float>(180, 10));
59  nn.pushLayer(new Softmax<float>(10));
60  nn.verify();
61 
62  //[60000, 784]
63  // Load the MNIST training...
64  mic::importers::MNISTMatrixImporter<float> training;
65  // Manually set paths. DEPRICATED! Used here only for simplification of the test.
66  training.setDataFilename("../data/mnist/train-images.idx3-ubyte");
67  training.setLabelsFilename("../data/mnist/train-labels.idx1-ubyte");
68  training.setBatchSize(batch_size);
69 
70  if (!training.importData())
71  return -1;
72 
73  // ... and test datasets.
74  mic::importers::MNISTMatrixImporter<float> test;
75  // Manually set paths. DEPRICATED! Used here only for simplification of the test.
76  test.setDataFilename("../data/mnist/t10k-images.idx3-ubyte");
77  test.setLabelsFilename("../data/mnist/t10k-labels.idx1-ubyte");
78  test.setBatchSize(batch_size);
79 
80  if (!test.importData())
81  return -1;
82 
83  // Initialize the encoders.
84  mic::encoders::MatrixXfMatrixXfEncoder mnist_encoder(28, 28);
85  mic::encoders::UIntMatrixXfEncoder label_encoder(10);
86 
87 
88  LOG(LSTATUS) << "Starting the training of neural network...";
89  float learning_rate = 0.001;
90  MatrixXfPtr encoded_batch, encoded_targets;
91 
92  // Perform the training.
93  for (size_t ii = 0; ii < iterations; ii++) {
94  LOG(LINFO) << "Batch " << std::setw(4) << ii << "/" << std::setw(4) << iterations;
95 
96  // Get random batch [784 x batch_size].
97  MNISTBatch<float> rand_batch = training.getRandomBatch();
98  encoded_batch = mnist_encoder.encodeBatch(rand_batch.data());
99  encoded_targets = label_encoder.encodeBatch(rand_batch.labels());
100 
101  // Train network with batch.
102  float loss = nn.train (encoded_batch, encoded_targets, learning_rate);
103  LOG(LINFO) << "Training: loss = " << std::setprecision(8) << loss;
104  }//: for
105  LOG(LSTATUS) << "Training finished";
106 
107  // Check performance on the test dataset.
108  LOG(LSTATUS) << "Calculating performance for test dataset...";
109  size_t correct = 0;
110  float loss = 0.0;
111  test.setNextSampleIndex(0);
112  while(!test.isLastBatch()) {
113 
114  // Get next batch [784 x batch_size].
115  MNISTBatch<float> next_batch = test.getNextBatch();
116  encoded_batch = mnist_encoder.encodeBatch(next_batch.data());
117  encoded_targets = label_encoder.encodeBatch(next_batch.labels());
118 
119  // Test network response.
120  // Skip dropout layers at test time
121  nn.forward(encoded_batch, true);
122  // Get predictions.
123  mic::types::MatrixXfPtr encoded_predictions = nn.getPredictions();
124  // Calculate the loss and correct predictions.
125  loss += nn.calculateMeanLoss(encoded_targets, encoded_predictions);
126  correct += nn.countCorrectPredictions(encoded_targets, encoded_predictions);
127 
128  }//: while
129  double test_acc = (double)correct / (double)(test.size());
130  LOG(LINFO) << "Test : loss = " << std::setprecision(3) << loss << " correct = " << std::setprecision(3) << 100.0 * test_acc << " %";
131 
132  // Check performance on the training dataset.
133  LOG(LSTATUS) << "Calculating performance for the training dataset...";
134  correct = 0;
135  loss = 0;
136  training.setNextSampleIndex(0);
137  while(!training.isLastBatch()) {
138 
139  // Get next batch [784 x batch_size].
140  MNISTBatch<float> next_batch = training.getNextBatch();
141  encoded_batch = mnist_encoder.encodeBatch(next_batch.data());
142  encoded_targets = label_encoder.encodeBatch(next_batch.labels());
143 
144  // Test network response.
145  // Skip dropout layers at test time
146  nn.forward(encoded_batch, true);
147  // Get predictions.
148  mic::types::MatrixXfPtr encoded_predictions = nn.getPredictions();
149  // Calculate the loss and correct predictions.
150  loss += nn.calculateMeanLoss(encoded_targets, encoded_predictions);
151  correct += nn.countCorrectPredictions(encoded_targets, encoded_predictions);
152  }
153  double train_acc = (double)correct / (double)(training.size());
154  LOG(LINFO) << "Train : loss = " << std::setprecision(3) << loss << " correct = " << std::setprecision(3) << 100.0 * train_acc << " %";
155 
156 }
mic::encoders::UIntMatrixXfEncoder * label_encoder
Label-to-matrix encoder (one-hot).
int main()
size_t countCorrectPredictions(mic::types::MatrixPtr< eT > targets_, mic::types::MatrixPtr< eT > predictions_)
mic::types::MatrixPtr< eT > getPredictions()
eT train(mic::types::MatrixPtr< eT > encoded_batch_, mic::types::MatrixPtr< eT > encoded_targets_, eT learning_rate_, eT decay_=0.0f)
const size_t batch_size
void forward(mic::types::MatrixPtr< eT > input_data, bool skip_dropout=false)
mic::encoders::ColMatrixEncoder< double > * mnist_encoder
MNIST matrix encoder.
eT calculateMeanLoss(mic::types::MatrixPtr< eT > encoded_targets_, mic::types::MatrixPtr< eT > encoded_predictions_)