#include <cypress/cypress.hpp>

#include <algorithm>
#include <cassert>
#include <chrono>
#include <cmath>
#include <random>
#include <string>
#include <vector>

using cypress::Json;
using cypress::Matrix;
using cypress::Real;
// Mean squared error loss.
class MSE {
public:
    static Real calc_loss(const uint16_t label,
                          const std::vector<Real> &output)
    {
        Real res = 0.0;
        for (size_t neuron = 0; neuron < output.size(); neuron++) {
            if (label == neuron) {
                res += (output[neuron] - 1.0) * (output[neuron] - 1.0);
            } else {
                res += output[neuron] * output[neuron];
            }
        }
        res = sqrt(res / Real(output.size()));
        return res;
    }

    static std::vector<Real> calc_error(const uint16_t label,
                                        const std::vector<Real> &output)
    {
        std::vector<Real> res(output.size(), 0.0);
        for (size_t neuron = 0; neuron < output.size(); neuron++) {
            if (label == neuron) {
                res[neuron] = output[neuron] - 1.0;
            } else {
                res[neuron] = output[neuron] - 0.0;
            }
        }
        return res;
    }
};
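// Usage sketch (hypothetical helper, not part of the original header): for a
// three-neuron output and target label 1, calc_loss measures the RMS
// distance to the one-hot target and calc_error gives the per-neuron error.
inline void example_mse_usage()
{
    std::vector<Real> output = {0.1, 0.9, 0.0};
    Real loss = MSE::calc_loss(1, output);
    // loss == sqrt((0.1 * 0.1 + (-0.1) * (-0.1) + 0.0) / 3.0)
    std::vector<Real> error = MSE::calc_error(1, output);
    // error == {0.1, -0.1, 0.0}
}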
// Categorical hinge loss. Use if weights are restricted to be > 0.
class CatHinge {
public:
    static Real calc_loss(const uint16_t label,
                          const std::vector<Real> &output)
    {
        Real res = 0.0;
        for (size_t neuron = 0; neuron < output.size(); neuron++) {
            if (label == neuron) {
                res += std::max(0.0, 1.0 - Real(output[neuron]));
            } else {
                res += std::max(0.0, 1.0 + Real(output[neuron]));
            }
        }
        return res;
    }

    static std::vector<Real> calc_error(const uint16_t label,
                                        const std::vector<Real> &output)
    {
        // Find the largest output that does not belong to the correct label
        std::vector<Real> vec = output;
        vec[label] = -0.0;
        auto neg_elem = std::max_element(vec.begin(), vec.end());
        auto index = std::distance(vec.begin(), neg_elem);
        auto res = std::vector<Real>(output.size(), 0.0);
        // The gradient is non-zero only if the margin of 1 is violated
        if ((*neg_elem) - output[label] + 1 >= 0.0) {
            res[label] = -1.0;
            if (label != index) {
                res[index] = +1.0;
            }
        }
        return res;
    }
};
// ActivationFunction ReLU: Rectified Linear Unit.
class ReLU {
public:
    static inline std::vector<Real> function(std::vector<Real> input)
    {
        for (auto &i : input) {
            i = i > 0.0 ? i : 0.0;
        }
        return input;
    }

    static inline std::vector<Real> derivative(std::vector<Real> input)
    {
        for (auto &i : input) {
            i = i >= 0 ? 1.0 : 0.0;
        }
        return input;
    }
};
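// Usage sketch (hypothetical helper): ReLU::function clamps negative
// activations to zero; ReLU::derivative yields the 0/1 mask that backprop
// multiplies into the error signal.
inline void example_relu_usage()
{
    std::vector<Real> pre = {-0.5, 0.0, 2.0};
    auto act = ReLU::function(pre);    // {0.0, 0.0, 2.0}
    auto grad = ReLU::derivative(pre); // {0.0, 1.0, 1.0}
}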
// Constraint for weights in neural network: No constraint.
class NoConstraint {
public:
    void setup(std::vector<cypress::Matrix<Real>> &) {}
    static void constrain_weights(std::vector<cypress::Matrix<Real>> &) {}
};
// Constraint for weights in neural network: Only weights > 0.
class PositiveWeights {
public:
    void setup(std::vector<cypress::Matrix<Real>> &) {}
    void constrain_weights(std::vector<cypress::Matrix<Real>> &layers)
    {
        for (auto &i : layers) {
            for (size_t j = 0; j < i.size(); j++) {
                if (i[j] < 0.0) {
                    i[j] = 0.0;
                }
            }
        }
    }
};
// Constraint keeping weights positive and bounded (reconstructed from the
// surrounding documentation; the exact limit logic was elided).
class PositiveLimitedWeights {
public:
    Real m_max = 0.0;

    void setup(std::vector<cypress::Matrix<Real>> &layers)
    {
        // Remember the largest weight found at setup time
        for (auto &layer : layers) {
            for (size_t i = 0; i < layer.size(); i++) {
                if (layer[i] > m_max) {
                    m_max = layer[i];
                }
            }
        }
    }

    void constrain_weights(std::vector<cypress::Matrix<Real>> &layers)
    {
        for (auto &i : layers) {
            for (size_t j = 0; j < i.size(); j++) {
                if (i[j] < 0.0) {
                    i[j] = 0.0;
                }
                if (i[j] > m_max) {
                    i[j] = m_max;
                }
            }
        }
    }
};
// Base class for Multi Layer Networks (currently Perceptron only).
// Allows us to use polymorphism with the templated MLP class below.
class MLPBase {
public:
    virtual Real max_weight() const = 0;
    virtual Real min_weight() const = 0;
    virtual Real max_weight_abs() const = 0;
    virtual Real conv_max_weight(size_t layer_id = 0) const = 0;
    virtual const size_t &epochs() const = 0;
    virtual const size_t &batchsize() const = 0;
    virtual const Real &learnrate() const = 0;
    virtual const mnist_helper::MNIST_DATA &mnist_train_set() = 0;
    virtual const mnist_helper::MNIST_DATA &mnist_test_set() = 0;
    virtual const std::vector<cypress::Matrix<Real>> &get_weights() = 0;
    virtual const std::vector<mnist_helper::CONVOLUTION_LAYER>
        &get_conv_layers() = 0;
    virtual const std::vector<mnist_helper::POOLING_LAYER>
        &get_pooling_layers() = 0;
    virtual const std::vector<size_t> &get_layer_sizes() = 0;
    virtual const std::vector<mnist_helper::LAYER_TYPE> &get_layer_types() = 0;
    virtual void scale_down_images(size_t pooling_size = 3) = 0;
    virtual inline bool correct(const uint16_t label,
                                const std::vector<Real> &output) const = 0;
    virtual std::vector<std::vector<std::vector<Real>>> forward_path(
        const std::vector<size_t> &indices, const size_t start) const = 0;
    virtual Real forward_path_test() const = 0;
    virtual void backward_path(
        const std::vector<size_t> &indices, const size_t start,
        const std::vector<std::vector<std::vector<Real>>> &activations,
        bool last_only = false) = 0;
    virtual void backward_path_2(
        const std::vector<uint16_t> &labels,
        const std::vector<std::vector<std::vector<Real>>> &activations,
        bool last_only = false) = 0;
    virtual size_t accuracy(
        const std::vector<std::vector<std::vector<Real>>> &activations,
        const std::vector<size_t> &indices, const size_t start) = 0;
    virtual void train(unsigned seed = 0) = 0;
    virtual ~MLPBase() = default;
};
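// Usage sketch: the point of MLPBase is that differently templated MLP
// instantiations can be driven through a single pointer type, e.g.
// (hypothetical, using the loss and activation classes above and the MLP
// template below):
//
//   std::shared_ptr<MLPBase> net =
//       std::make_shared<MLP<MSE, ReLU>>(std::vector<size_t>{784, 100, 10});
//   net->train();
//   Real test_accuracy = net->forward_path_test();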
// The standard densely connected multilayer Perceptron. Template arguments
// provide the loss function, the activation function of the neurons, and a
// constraint applied to the weights.
template <typename Loss = MSE, typename ActivationFunction = ReLU,
          typename Constraint = NoConstraint>
class MLP : public MLPBase {
protected:
    std::vector<cypress::Matrix<Real>> m_layers;
    std::vector<size_t> m_layer_sizes;
    std::vector<mnist_helper::LAYER_TYPE> m_layer_types;
    std::vector<mnist_helper::CONVOLUTION_LAYER> m_filters;
    std::vector<mnist_helper::POOLING_LAYER> m_pools;
    size_t m_epochs = 20;
    size_t m_batchsize = 100;
    Real learn_rate = 0.01;
    mnist_helper::MNIST_DATA m_mnist;
    mnist_helper::MNIST_DATA m_mnist_test;
    Constraint m_constraint;

public:
    // Constructor for random initialization.
    MLP(std::vector<size_t> layer_sizes, size_t epochs = 20,
        size_t batchsize = 100, Real learn_rate = 0.01)
        : m_layer_sizes(layer_sizes),
          m_epochs(epochs),
          m_batchsize(batchsize),
          learn_rate(learn_rate)
    {
        for (size_t i = 0; i < layer_sizes.size() - 1; i++) {
            m_layers.emplace_back(
                Matrix<Real>(layer_sizes[i], layer_sizes[i + 1]));
        }
        int seed = std::chrono::system_clock::now().time_since_epoch().count();
        auto rng = std::default_random_engine(seed);
        std::normal_distribution<Real> distribution(0.0, 1.0);
        for (auto &layer : m_layers) {
            // He initialization: scale the normal draw by sqrt(2 / fan_in)
            auto scale = std::sqrt(2.0 / double(layer.rows()));
            for (size_t i = 0; i < layer.size(); i++) {
                layer[i] = distribution(rng) * scale;
            }
        }
        // ...
        m_constraint.setup(m_layers);
    }
    // Constructs the network from a Json object. The repository provides
    // Python scripts to create these from a Keras model.
    MLP(Json &data, size_t epochs = 20, size_t batchsize = 100,
        Real learn_rate = 0.01, bool random = false,
        Constraint constraint = Constraint())
        : m_epochs(epochs),
          m_batchsize(batchsize),
          learn_rate(learn_rate),
          m_constraint(constraint)
    {
        int seed = std::chrono::system_clock::now().time_since_epoch().count();
        auto rng = std::default_random_engine(seed);
        std::normal_distribution<Real> distribution(0.0, 1.0);
        for (auto &layer : data["netw"]) {
            if (layer["class_name"].get<std::string>() == "Dense") {
                auto &json = layer["weights"];
                m_layers.emplace_back(
                    Matrix<Real>(json.size(), json[0].size()));
                auto &weights = m_layers.back();
                auto scale = std::sqrt(2.0 / double(weights.rows()));
                for (size_t i = 0; i < json.size(); i++) {
                    for (size_t j = 0; j < json[i].size(); j++) {
                        if (!random) {
                            weights(i, j) = json[i][j].get<Real>();
                        } else {
                            // Re-initialize randomly instead of loading
                            weights(i, j) = distribution(rng) * scale;
                        }
                    }
                }
                m_layer_sizes.emplace_back(m_layers.back().rows());
                // (enumerator names assumed)
                m_layer_types.emplace_back(mnist_helper::LAYER_TYPE::Dense);
                cypress::global_logger().debug(
                    "MNIST", "Dense layer detected with size " +
                                 std::to_string(weights.rows()) + " times " +
                                 std::to_string(weights.cols()));
            }
            else if (layer["class_name"].get<std::string>() == "Conv2D") {
                auto &json = layer["weights"];
                size_t kernel_x = json.size();
                size_t kernel_y = json[0].size();
                size_t kernel_z = json[0][0].size();
                size_t output = json[0][0][0].size();
                size_t stride = layer["stride"];
                size_t padding = layer["padding"] == "valid" ? 0 : 1;
                std::vector<size_t> input_sizes;
                std::vector<size_t> output_sizes;
                if (!layer["input_shape_x"].empty()) {
                    input_sizes.push_back(layer["input_shape_x"]);
                    input_sizes.push_back(layer["input_shape_y"]);
                    input_sizes.push_back(layer["input_shape_z"]);
                }
                else if (m_layer_types.back() ==
                         mnist_helper::LAYER_TYPE::Conv2D) {
                    input_sizes.push_back(m_filters.back().output_sizes[0]);
                    input_sizes.push_back(m_filters.back().output_sizes[1]);
                    input_sizes.push_back(m_filters.back().output_sizes[2]);
                }
                else if (m_layer_types.back() ==
                         mnist_helper::LAYER_TYPE::Pooling) {
                    input_sizes.push_back(m_pools.back().output_sizes[0]);
                    input_sizes.push_back(m_pools.back().output_sizes[1]);
                    input_sizes.push_back(m_pools.back().output_sizes[2]);
                }
                else {
                    throw std::runtime_error(
                        "Conv after Dense layer not implemented!");
                }
                // Output size per spatial dim: (in - kernel + 2*pad)/stride + 1
                output_sizes.push_back(
                    (input_sizes[0] - kernel_x + 2 * padding) / stride + 1);
                output_sizes.push_back(
                    (input_sizes[1] - kernel_y + 2 * padding) / stride + 1);
                output_sizes.push_back(output);
                mnist_helper::CONVOLUTION_FILTER filter(
                    kernel_x,
                    std::vector<std::vector<std::vector<Real>>>(
                        kernel_y,
                        std::vector<std::vector<Real>>(
                            kernel_z, std::vector<Real>(output))));
                // (field order assumed)
                mnist_helper::CONVOLUTION_LAYER conv = {
                    filter, input_sizes, output_sizes, stride, padding};
                m_filters.emplace_back(conv);
                auto &weights = m_filters.back().filter;
                for (size_t i = 0; i < json.size(); i++) {
                    for (size_t j = 0; j < json[i].size(); j++) {
                        for (size_t k = 0; k < json[i][j].size(); k++) {
                            for (size_t l = 0; l < json[i][j][k].size(); l++) {
                                weights[i][j][k][l] =
                                    json[i][j][k][l].get<Real>();
                            }
                        }
                    }
                }
                m_layer_sizes.emplace_back(
                    input_sizes[0] * input_sizes[1] * input_sizes[2]);
                m_layer_types.emplace_back(mnist_helper::LAYER_TYPE::Conv2D);
                cypress::global_logger().debug(
                    "MNIST", "Conv layer detected with size (" +
                                 std::to_string(json.size()) + "," +
                                 std::to_string(json[0].size()) + "," +
                                 std::to_string(json[0][0].size()) + "," +
                                 std::to_string(json[0][0][0].size()) + ")");
            }
            else if (layer["class_name"].get<std::string>() ==
                     "MaxPooling2D") {
                std::vector<size_t> size = layer["size"];
                size_t stride = layer["stride"];
                std::vector<size_t> input_sizes;
                std::vector<size_t> output_sizes;
                if (m_layer_types.empty()) {
                    throw std::runtime_error(
                        "Pooling layer must not be the first layer!");
                }
                else if (m_layer_types.back() ==
                         mnist_helper::LAYER_TYPE::Conv2D) {
                    input_sizes.push_back(m_filters.back().output_sizes[0]);
                    input_sizes.push_back(m_filters.back().output_sizes[1]);
                    input_sizes.push_back(m_filters.back().output_sizes[2]);
                }
                else if (m_layer_types.back() ==
                         mnist_helper::LAYER_TYPE::Pooling) {
                    input_sizes.push_back(m_pools.back().output_sizes[0]);
                    input_sizes.push_back(m_pools.back().output_sizes[1]);
                    input_sizes.push_back(m_pools.back().output_sizes[2]);
                }
                else {
                    throw std::runtime_error(
                        "Pooling after Dense not implemented!");
                }
                // Pooling uses no padding: (in - size) / stride + 1
                output_sizes.push_back((input_sizes[0] - size[0]) / stride + 1);
                output_sizes.push_back((input_sizes[1] - size[1]) / stride + 1);
                output_sizes.push_back(input_sizes[2]);
                // (field order assumed)
                mnist_helper::POOLING_LAYER pool = {input_sizes, output_sizes,
                                                    size, stride};
                m_pools.emplace_back(pool);
                m_layer_sizes.emplace_back(
                    input_sizes[0] * input_sizes[1] * input_sizes[2]);
                m_layer_types.emplace_back(mnist_helper::LAYER_TYPE::Pooling);
                cypress::global_logger().debug(
                    "MNIST", "Pooling layer detected with size (" +
                                 std::to_string(size[0]) + ", " +
                                 std::to_string(size[1]) + ") and stride " +
                                 std::to_string(stride));
            }
            else {
                throw std::runtime_error("Unknown layer type");
            }
        }
        m_layer_sizes.push_back(m_layers.back().cols());
        // ...
        m_constraint.setup(m_layers);
    }
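    // Sketch of the Json layout the constructor above expects (inferred from
    // the parsing code; the exporting Python scripts define the
    // authoritative format):
    //
    //   { "netw": [
    //       { "class_name": "Conv2D", "weights": [[[[...]]]],
    //         "stride": 1, "padding": "valid",
    //         "input_shape_x": 28, "input_shape_y": 28, "input_shape_z": 1 },
    //       { "class_name": "MaxPooling2D", "size": [2, 2], "stride": 2 },
    //       { "class_name": "Dense", "weights": [[...], ...] }
    //   ] }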
    // Return the largest weight in the network.
    Real max_weight() const override
    {
        Real max = 0.0;
        for (auto &layer : m_layers) {
            for (size_t i = 0; i < layer.size(); i++) {
                max = layer[i] > max ? layer[i] : max;
            }
        }
        return max;
    }
    // Return the largest weight in the requested convolution layer.
    Real conv_max_weight(size_t layer_id = 0) const override
    {
        Real max = 0.0;
        auto layer = m_filters[layer_id];
        auto filter = layer.filter;
        for (size_t f = 0; f < layer.output_sizes[2]; f++) {
            for (size_t x = 0; x < filter.size(); x++) {
                for (size_t y = 0; y < filter[0].size(); y++) {
                    for (size_t z = 0; z < filter[0][0].size(); z++) {
                        max = filter[x][y][z][f] > max ? filter[x][y][z][f]
                                                       : max;
                    }
                }
            }
        }
        return max;
    }
    // Return the smallest weight in the network.
    Real min_weight() const override
    {
        Real min = 0.0;
        for (auto &layer : m_layers) {
            for (size_t i = 0; i < layer.size(); i++) {
                min = layer[i] < min ? layer[i] : min;
            }
        }
        return min;
    }
    // Return the largest absolute weight in the network.
    Real max_weight_abs() const override
    {
        Real max = 0.0;
        for (auto &layer : m_layers) {
            for (size_t i = 0; i < layer.size(); i++) {
                max = std::abs(layer[i]) > max ? std::abs(layer[i]) : max;
            }
        }
        return max;
    }
    const size_t &epochs() const override { return m_epochs; }
    const size_t &batchsize() const override { return m_batchsize; }
    const Real &learnrate() const override { return learn_rate; }
    // ...

    // Return the number of neurons per layer.
    const std::vector<size_t> &get_layer_sizes() override
    {
        return m_layer_sizes;
    }

    const std::vector<mnist_helper::LAYER_TYPE> &get_layer_types() override
    {
        return m_layer_types;
    }
    // Implements matrix-vector multiplication: res = mat * vec.
    static inline std::vector<Real> mat_X_vec(const Matrix<Real> &mat,
                                              const std::vector<Real> &vec)
    {
        assert(mat.cols() == vec.size());
        std::vector<Real> res(mat.rows(), 0.0);
        for (size_t i = 0; i < mat.rows(); i++) {
            for (size_t j = 0; j < mat.cols(); j++) {
                res[i] += mat(i, j) * vec[j];
            }
        }
        return res;
    }
    // Implements transposed matrix-vector multiplication: res = mat^T * vec.
    static inline std::vector<Real> mat_trans_X_vec(
        const Matrix<Real> &mat, const std::vector<Real> &vec)
    {
        assert(mat.rows() == vec.size());
        std::vector<Real> res(mat.cols(), 0.0);
        for (size_t i = 0; i < mat.cols(); i++) {
            for (size_t j = 0; j < mat.rows(); j++) {
                res[i] += mat(j, i) * vec[j];
            }
        }
        return res;
    }
    // Vector-vector multiplication, component-wise.
    static inline std::vector<Real> vec_X_vec_comp(
        const std::vector<Real> &vec1, const std::vector<Real> &vec2)
    {
        assert(vec1.size() == vec2.size());
        std::vector<Real> res(vec1.size());
        for (size_t i = 0; i < vec1.size(); i++) {
            res[i] = vec1[i] * vec2[i];
        }
        return res;
    }
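    // Quick numeric check (hypothetical helper, not in the original header):
    // for M = [[1, 2], [3, 4]] and v = {1, 1}, mat_X_vec yields M*v = {3, 7},
    // mat_trans_X_vec yields M^T*v = {4, 6}, and vec_X_vec_comp multiplies
    // the two results element-wise.
    static inline void example_matvec_usage()
    {
        Matrix<Real> m(2, 2);
        m(0, 0) = 1.0;
        m(0, 1) = 2.0;
        m(1, 0) = 3.0;
        m(1, 1) = 4.0;
        std::vector<Real> v = {1.0, 1.0};
        auto mv = mat_X_vec(m, v);         // {3.0, 7.0}
        auto mtv = mat_trans_X_vec(m, v);  // {4.0, 6.0}
        auto cw = vec_X_vec_comp(mv, mtv); // {12.0, 42.0}
    }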
    // Checks whether the output of the network was correct, i.e. whether the
    // neuron with the highest activation matches the label.
    inline bool correct(const uint16_t label,
                        const std::vector<Real> &output) const override
    {
        auto it = std::max_element(output.begin(), output.end());
        auto out = std::distance(output.begin(), it);
        return size_t(out) == size_t(label);
    }
    // Updates the weight matrix based on the error in this layer and the
    // output of the previous layer.
    static void update_mat(Matrix<Real> &mat, const std::vector<Real> &errors,
                           const std::vector<Real> &pre_output,
                           const size_t sample_num, const Real learn_rate)
    {
        assert(mat.rows() == pre_output.size());
        assert(mat.cols() == errors.size());
        Real sample_num_r(sample_num);
        for (size_t i = 0; i < mat.rows(); i++) {
            for (size_t j = 0; j < mat.cols(); j++) {
                mat(i, j) = mat(i, j) - learn_rate * pre_output[i] *
                                            errors[j] / sample_num_r;
            }
        }
    }
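    // A worked view of the update rule above (mini-batch SGD):
    //   w_ij <- w_ij - learn_rate * pre_output_i * error_j / sample_num
    // i.e. each weight moves against the outer product of the previous
    // layer's activation and the back-propagated error, averaged over the
    // batch size.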
    // Forward path of the network (inference).
    virtual std::vector<std::vector<std::vector<Real>>> forward_path(
        const std::vector<size_t> &indices, const size_t start) const override
    {
        if (!m_filters.empty()) {
            throw std::runtime_error(
                "Conv layer not supported in forward_path function!");
        }
        if (!m_pools.empty()) {
            throw std::runtime_error(
                "Pooling layer not supported in forward_path function!");
        }
        auto &input = std::get<0>(m_mnist);
        std::vector<std::vector<std::vector<Real>>> res;
        std::vector<std::vector<Real>> activations;
        for (auto size : m_layer_sizes) {
            activations.emplace_back(std::vector<Real>(size, 0.0));
        }
        for (size_t sample = 0; sample < m_batchsize; sample++) {
            res.emplace_back(activations);
        }
        for (size_t sample = 0; sample < m_batchsize; sample++) {
            if (start + sample >= indices.size()) {
                break;
            }
            res[sample][0] = input[indices[start + sample]];
            for (size_t layer = 0; layer < m_layers.size(); layer++) {
                res[sample][layer + 1] = ActivationFunction::function(
                    mat_trans_X_vec(m_layers[layer], res[sample][layer]));
            }
        }
        return res;
    }
    // Forward path of the test data; returns the accuracy on the test set.
    virtual Real forward_path_test() const override
    {
        if (!m_filters.empty()) {
            throw std::runtime_error(
                "Conv layer not supported in forward_path_test function!");
        }
        if (!m_pools.empty()) {
            throw std::runtime_error(
                "Pooling layer not supported in forward_path_test function!");
        }
        auto &input = std::get<0>(m_mnist_test);
        auto &labels = std::get<1>(m_mnist_test);
        std::vector<std::vector<Real>> activations;
        for (auto size : m_layer_sizes) {
            activations.emplace_back(std::vector<Real>(size, 0.0));
        }
        size_t sum = 0;
        for (size_t sample = 0; sample < input.size(); sample++) {
            activations[0] = input[sample];
            for (size_t layer = 0; layer < m_layers.size(); layer++) {
                activations[layer + 1] = ActivationFunction::function(
                    mat_trans_X_vec(m_layers[layer], activations[layer]));
            }
            if (correct(labels[sample], activations.back())) {
                sum++;
            }
        }
        return Real(sum) / Real(labels.size());
    }
    // Implementation of backpropagation.
    virtual void backward_path(
        const std::vector<size_t> &indices, const size_t start,
        const std::vector<std::vector<std::vector<Real>>> &activations,
        bool last_only = false) override
    {
        assert(m_batchsize == activations.size());
        if (!m_filters.empty()) {
            throw std::runtime_error(
                "Conv layer not supported in backward_path function!");
        }
        if (!m_pools.empty()) {
            throw std::runtime_error(
                "Pooling layer not supported in backward_path function!");
        }
        const auto &labels = std::get<1>(m_mnist);
        const std::vector<cypress::Matrix<cypress::Real>> orig_weights =
            m_layers;
        for (size_t sample = 0; sample < m_batchsize; sample++) {
            if (start + sample >= indices.size()) {
                break;
            }
            const auto &activ = activations[sample];
            auto error = vec_X_vec_comp(
                Loss::calc_error(labels[indices[start + sample]],
                                 activ.back()),
                ActivationFunction::derivative(activ.back()));
            update_mat(m_layers.back(), error, activ[activ.size() - 2],
                       m_batchsize, learn_rate);
            if (!last_only) {
                for (size_t inv_layer = 1; inv_layer < m_layers.size();
                     inv_layer++) {
                    size_t layer_id = m_layers.size() - inv_layer - 1;
                    error = vec_X_vec_comp(
                        mat_X_vec(orig_weights[layer_id + 1], error),
                        ActivationFunction::derivative(activ[layer_id + 1]));
                    update_mat(m_layers[layer_id], error, activ[layer_id],
                               m_batchsize, learn_rate);
                }
            }
        }
        m_constraint.constrain_weights(m_layers);
    }
    // Implementation of backprop, adapted for usage in SNNs: activations are
    // indexed [layer][sample] instead of [sample][layer].
    virtual void backward_path_2(
        const std::vector<uint16_t> &labels,
        const std::vector<std::vector<std::vector<Real>>> &activations,
        bool last_only = false) override
    {
        assert(m_batchsize == activations.back().size());
        if (!m_filters.empty()) {
            throw std::runtime_error(
                "Conv layer not supported in backward_path_2 function!");
        }
        if (!m_pools.empty()) {
            throw std::runtime_error(
                "Pooling layer not supported in backward_path_2 function!");
        }
        const auto orig_weights = m_layers;
        for (size_t sample = 0; sample < m_batchsize; sample++) {
            auto error = vec_X_vec_comp(
                Loss::calc_error(labels[sample], activations.back()[sample]),
                ActivationFunction::derivative(activations.back()[sample]));
            update_mat(m_layers.back(), error,
                       activations[activations.size() - 2][sample],
                       m_batchsize, learn_rate);
            if (!last_only) {
                for (size_t inv_layer = 1; inv_layer < m_layers.size();
                     inv_layer++) {
                    size_t layer_id = m_layers.size() - inv_layer - 1;
                    error = vec_X_vec_comp(
                        mat_X_vec(orig_weights[layer_id + 1], error),
                        ActivationFunction::derivative(
                            activations[layer_id + 1][sample]));
                    update_mat(m_layers[layer_id], error,
                               activations[layer_id][sample], m_batchsize,
                               learn_rate);
                }
            }
        }
        m_constraint.constrain_weights(m_layers);
    }
    // Calculate the number of correct classifications from the given network
    // output.
    virtual size_t accuracy(
        const std::vector<std::vector<std::vector<Real>>> &activations,
        const std::vector<size_t> &indices, const size_t start) override
    {
        assert(activations.size() == m_batchsize);
        auto &labels = std::get<1>(m_mnist);
        size_t sum = 0;
        for (size_t sample = 0; sample < m_batchsize; sample++) {
            if (start + sample >= indices.size()) {
                break;
            }
            if (correct(labels[indices[start + sample]],
                        activations[sample].back())) {
                sum++;
            }
        }
        return sum;
    }
    // Starts the full training process.
    void train(unsigned seed = 0) override
    {
        std::vector<size_t> indices(std::get<0>(m_mnist).size());
        m_constraint.constrain_weights(m_layers);
        for (size_t i = 0; i < indices.size(); i++) {
            indices[i] = i;
        }
        if (seed == 0) {
            seed = std::chrono::system_clock::now().time_since_epoch().count();
        }
        auto rng = std::default_random_engine{seed};
        for (size_t epoch = 0; epoch < m_epochs; epoch++) {
            size_t correct = 0;
            std::shuffle(indices.begin(), indices.end(), rng);
            for (size_t current_idx = 0;
                 current_idx < std::get<1>(m_mnist).size();
                 current_idx += m_batchsize) {
                auto activations = forward_path(indices, current_idx);
                correct += accuracy(activations, indices, current_idx);
                backward_path(indices, current_idx, activations);
                m_constraint.constrain_weights(m_layers);
            }
            cypress::global_logger().info(
                "MLP", "Accuracy of epoch " + std::to_string(epoch) + ": " +
                           std::to_string(Real(correct) /
                                          Real(std::get<1>(m_mnist).size())));
        }
    }
};
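// End-to-end usage sketch (hypothetical; assumes the MNIST files are located
// where load_data expects them): train a 784-100-10 perceptron with the
// defaults and log the test accuracy.
//
//   MLP<MSE, ReLU> net({784, 100, 10}, /*epochs=*/20, /*batchsize=*/100,
//                      /*learn_rate=*/0.01);
//   net.train(1234);  // fixed seed for a reproducible shuffle
//   cypress::global_logger().info(
//       "MLP", "Test accuracy: " + std::to_string(net.forward_path_test()));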