mean_pooling.hpp
/**
 * @file mean_pooling.hpp
 *
 * Definition of the MeanPooling layer class.
 */
#ifndef MLPACK_METHODS_ANN_LAYER_MEAN_POOLING_HPP
#define MLPACK_METHODS_ANN_LAYER_MEAN_POOLING_HPP

#include <mlpack/prereqs.hpp>

namespace mlpack {
namespace ann {
/**
 * Implementation of the MeanPooling layer.
 *
 * @tparam InputDataType Type of the input data (arma::colvec, arma::mat,
 *         arma::sp_mat or arma::cube).
 * @tparam OutputDataType Type of the output data (arma::colvec, arma::mat,
 *         arma::sp_mat or arma::cube).
 */
template <
    typename InputDataType = arma::mat,
    typename OutputDataType = arma::mat
>
class MeanPooling
{
 public:
  //! Create the MeanPooling object.
  MeanPooling();

  /**
   * Create the MeanPooling object using the specified parameters.
   *
   * @param kernelWidth Width of the pooling window.
   * @param kernelHeight Height of the pooling window.
   * @param strideWidth Width of the stride operation.
   * @param strideHeight Height of the stride operation.
   * @param floor If true the output size is rounded down (partial windows
   *        are ignored); otherwise it is rounded up.
   */
  MeanPooling(const size_t kernelWidth,
              const size_t kernelHeight,
              const size_t strideWidth = 1,
              const size_t strideHeight = 1,
              const bool floor = true);

  /**
   * Ordinary feed forward pass of a neural network, evaluating the function
   * f(x) by propagating the activity forward through f.
   *
   * @param input Input data used for evaluating the specified function.
   * @param output Resulting output activation.
   */
  template<typename eT>
  void Forward(const arma::Mat<eT>& input, arma::Mat<eT>& output);

  /**
   * Ordinary feed backward pass of a neural network, using 3rd-order tensors
   * as input, calculating the function f(x) by propagating x backwards
   * through f, using the results from the feed forward pass.
   *
   * @param input The propagated input activation (unused).
   * @param gy The backpropagated error.
   * @param g The calculated gradient.
   */
  template<typename eT>
  void Backward(const arma::Mat<eT>& /* input */,
                const arma::Mat<eT>& gy,
                arma::Mat<eT>& g);

  //! Get the output parameter.
  OutputDataType const& OutputParameter() const { return outputParameter; }
  //! Modify the output parameter.
  OutputDataType& OutputParameter() { return outputParameter; }

  //! Get the delta.
  OutputDataType const& Delta() const { return delta; }
  //! Modify the delta.
  OutputDataType& Delta() { return delta; }

  //! Get the input width.
  size_t const& InputWidth() const { return inputWidth; }
  //! Modify the input width.
  size_t& InputWidth() { return inputWidth; }

  //! Get the input height.
  size_t const& InputHeight() const { return inputHeight; }
  //! Modify the input height.
  size_t& InputHeight() { return inputHeight; }

  //! Get the output width.
  size_t const& OutputWidth() const { return outputWidth; }
  //! Modify the output width.
  size_t& OutputWidth() { return outputWidth; }

  //! Get the output height.
  size_t const& OutputHeight() const { return outputHeight; }
  //! Modify the output height.
  size_t& OutputHeight() { return outputHeight; }

  //! Get the input size.
  size_t InputSize() const { return inSize; }

  //! Get the output size.
  size_t OutputSize() const { return outSize; }

  //! Get the kernel width.
  size_t KernelWidth() const { return kernelWidth; }
  //! Modify the kernel width.
  size_t& KernelWidth() { return kernelWidth; }

  //! Get the kernel height.
  size_t KernelHeight() const { return kernelHeight; }
  //! Modify the kernel height.
  size_t& KernelHeight() { return kernelHeight; }

  //! Get the stride width.
  size_t StrideWidth() const { return strideWidth; }
  //! Modify the stride width.
  size_t& StrideWidth() { return strideWidth; }

  //! Get the stride height.
  size_t StrideHeight() const { return strideHeight; }
  //! Modify the stride height.
  size_t& StrideHeight() { return strideHeight; }

  //! Get the value of the rounding operation.
  bool const& Floor() const { return floor; }
  //! Modify the value of the rounding operation.
  bool& Floor() { return floor; }

  //! Get the value of the deterministic parameter.
  bool Deterministic() const { return deterministic; }
  //! Modify the value of the deterministic parameter.
  bool& Deterministic() { return deterministic; }

  //! Get the size of the weights.
  size_t WeightSize() const { return 0; }

  /**
   * Serialize the layer.
   */
  template<typename Archive>
  void serialize(Archive& ar, const uint32_t /* version */);

 private:
  /**
   * Apply pooling to the input and store the results.
   *
   * @param input The input on which to apply the pooling rule.
   * @param output The pooled result.
   */
  template<typename eT>
  void Pooling(const arma::Mat<eT>& input, arma::Mat<eT>& output)
  {
    // Build a two-dimensional prefix sum (summed-area table) of the input,
    // so the sum over any rectangular window can be recovered with at most
    // four lookups.
    arma::Mat<eT> inputPre = input;

    for (size_t i = 1; i < input.n_cols; ++i)
      inputPre.col(i) += inputPre.col(i - 1);

    for (size_t i = 1; i < input.n_rows; ++i)
      inputPre.row(i) += inputPre.row(i - 1);

    for (size_t j = 0, colidx = 0; j < output.n_cols;
         ++j, colidx += strideHeight)
    {
      for (size_t i = 0, rowidx = 0; i < output.n_rows;
           ++i, rowidx += strideWidth)
      {
        double val = 0.0;
        size_t rowEnd = rowidx + kernelWidth - 1;
        size_t colEnd = colidx + kernelHeight - 1;

        // Clamp windows that extend past the input boundary.
        if (rowEnd > input.n_rows - 1)
          rowEnd = input.n_rows - 1;
        if (colEnd > input.n_cols - 1)
          colEnd = input.n_cols - 1;

        // Recover the window sum from the prefix sums by inclusion-
        // exclusion, then divide by the (possibly clamped) window area.
        const size_t kernelArea = (rowEnd - rowidx + 1) *
            (colEnd - colidx + 1);
        val += inputPre(rowEnd, colEnd);
        if (rowidx >= 1)
        {
          if (colidx >= 1)
            val += inputPre(rowidx - 1, colidx - 1);
          val -= inputPre(rowidx - 1, colEnd);
        }
        if (colidx >= 1)
          val -= inputPre(rowEnd, colidx - 1);

        output(i, j) = val / kernelArea;
      }
    }
  }
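  // Worked example for Pooling() above: with input = [1 2; 3 4], kernel
  // 2x2 and stride 1, the prefix sums give inputPre = [1 3; 4 10], and the
  // single output element is inputPre(1, 1) / 4 = 10 / 4 = 2.5, the mean of
  // all four inputs.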

  /**
   * Apply unpooling to the input and store the results.
   *
   * @param input The input on which to apply the unpooling rule.
   * @param error The error of the output.
   * @param output The unpooled result.
   */
  template<typename eT>
  void Unpooling(const arma::Mat<eT>& input,
                 const arma::Mat<eT>& error,
                 arma::Mat<eT>& output)
  {
    // This condition comes from comparing the number of operations in the
    // brute-force method with the prefix-sum method. Let the area of `error`
    // be errorArea and the area of the kernel be kernelArea. The brute-force
    // method needs `errorArea * kernelArea` operations in total, since it
    // performs `kernelArea` operations for each element of `error`. The
    // prefix-sum method needs `4 * errorArea + 2 * inputArea` operations,
    // where the `2 * inputArea` term comes from the two prefix sums
    // performed (column-wise and row-wise). We use this comparison to decide
    // which method to use.
    const bool condition = (error.n_elem * kernelHeight * kernelWidth) >
        (4 * error.n_elem + 2 * input.n_elem);

    if (condition)
    {
      // If this condition holds then, in theory, the prefix-sum method of
      // unpooling is faster. The aim of unpooling is to add
      // `error(i, j) / kernelArea` to the corresponding window of the
      // output, which costs `kernelArea` additions per error element, i.e.
      // `error.n_elem * kernelArea` operations in total for the brute-force
      // method.
      //
      // The prefix-sum idea, first in 1-D: let the input be the array
      // `[0, 0, 0, 0, 0, 0, 0, 0, 0, 0]` of size 10, and suppose we want to
      // add 10 to every index from 1 to 5. The brute-force method loops from
      // index 1 to index 5 and adds 10 to each element. The prefix-sum
      // method instead adds +10 at index 1 and -10 at index (5 + 1), so the
      // array becomes `[0, +10, 0, 0, 0, 0, -10, 0, 0, 0]`, and then takes
      // the prefix sum `input[i] += input[i - 1]`, after which the array is
      // `[0, +10, +10, +10, +10, +10, 0, 0, 0, 0]`. So this method costs
      // two additions plus one prefix pass. More generally, for `k` such
      // range updates the brute-force method needs `k * size(subarray)`
      // operations, while the prefix-sum method needs `2 * k` additions plus
      // a single prefix pass performed once at the end.
      //
      // Now for a 2-D matrix: say we want to add `e` to all elements of
      // input(x1 : x2, y1 : y2), so that
      // inputArea = (x2 - x1 + 1) * (y2 - y1 + 1). The prefix-sum method
      // performs the following operations:
      //   1. Add `+e` to input(x1, y1).
      //   2. Add `-e` to input(x2 + 1, y1).
      //   3. Add `-e` to input(x1, y2 + 1).
      //   4. Add `+e` to input(x2 + 1, y2 + 1).
      //   5. Take the prefix sum over columns, i.e.
      //      input(i, j) += input(i, j - 1).
      //   6. Take the prefix sum over rows, i.e.
      //      input(i, j) += input(i - 1, j).
      // For `k` such updates the brute-force method needs `kernelArea * k`
      // operations, while the prefix-sum method needs `4 * k` plus the two
      // prefix passes.
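      // Concrete check (a worked example): to add e = 6 to
      // input(0 : 1, 0 : 1) of a 3x3 zero matrix, place +6 at (0, 0),
      // -6 at (2, 0), -6 at (0, 2) and +6 at (2, 2); after the column-wise
      // and row-wise prefix sums, every element of the top-left 2x2 block
      // is 6 and the rest are 0.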

      for (size_t j = 0, colidx = 0; j < input.n_cols;
           j += strideHeight, ++colidx)
      {
        for (size_t i = 0, rowidx = 0; i < input.n_rows;
             i += strideWidth, ++rowidx)
        {
          // We have to add error(rowidx, colidx) / kernelArea to
          // output(span(i, rowEnd), span(j, colEnd)). With the prefix-sum
          // method this becomes four point updates:
          //
          //   1. Add +error(rowidx, colidx) / kernelArea to output(i, j).
          //   2. Add -error(rowidx, colidx) / kernelArea to
          //      output(rowEnd + 1, j).
          //   3. Add -error(rowidx, colidx) / kernelArea to
          //      output(i, colEnd + 1).
          //   4. Add +error(rowidx, colidx) / kernelArea to
          //      output(rowEnd + 1, colEnd + 1).
          //
          // followed by a row-wise and a column-wise prefix sum, performed
          // once after all updates.

          size_t rowEnd = i + kernelWidth - 1;
          size_t colEnd = j + kernelHeight - 1;

          if (rowEnd > input.n_rows - 1)
          {
            if (floor)
              continue;
            rowEnd = input.n_rows - 1;
          }

          if (colEnd > input.n_cols - 1)
          {
            if (floor)
              continue;
            colEnd = input.n_cols - 1;
          }

          const size_t kernelArea = (rowEnd - i + 1) * (colEnd - j + 1);
          output(i, j) += error(rowidx, colidx) / kernelArea;

          if (rowEnd + 1 < input.n_rows)
          {
            output(rowEnd + 1, j) -= error(rowidx, colidx) / kernelArea;

            if (colEnd + 1 < input.n_cols)
              output(rowEnd + 1, colEnd + 1) += error(rowidx, colidx) /
                  kernelArea;
          }

          if (colEnd + 1 < input.n_cols)
            output(i, colEnd + 1) -= error(rowidx, colidx) / kernelArea;
        }
      }

      // Apply the deferred prefix sums, row-wise then column-wise.
      for (size_t i = 1; i < input.n_rows; ++i)
        output.row(i) += output.row(i - 1);

      for (size_t j = 1; j < input.n_cols; ++j)
        output.col(j) += output.col(j - 1);
    }
    else
    {
      // Brute-force method: spread each error value uniformly over its
      // input window.
      arma::Mat<eT> unpooledError;
      for (size_t j = 0, colidx = 0; j < input.n_cols;
           j += strideHeight, ++colidx)
      {
        for (size_t i = 0, rowidx = 0; i < input.n_rows;
             i += strideWidth, ++rowidx)
        {
          size_t rowEnd = i + kernelWidth - 1;
          size_t colEnd = j + kernelHeight - 1;

          if (rowEnd > input.n_rows - 1)
          {
            if (floor)
              continue;
            rowEnd = input.n_rows - 1;
          }

          if (colEnd > input.n_cols - 1)
          {
            if (floor)
              continue;
            colEnd = input.n_cols - 1;
          }

          arma::Mat<eT> inputArea = input(arma::span(i, rowEnd),
                                          arma::span(j, colEnd));

          unpooledError = arma::Mat<eT>(inputArea.n_rows, inputArea.n_cols);
          unpooledError.fill(error(rowidx, colidx) / inputArea.n_elem);

          output(arma::span(i, i + inputArea.n_rows - 1),
                 arma::span(j, j + inputArea.n_cols - 1)) += unpooledError;
        }
      }
    }
  }

  //! Locally-stored width of the pooling window.
  size_t kernelWidth;

  //! Locally-stored height of the pooling window.
  size_t kernelHeight;

  //! Locally-stored width of the stride operation.
  size_t strideWidth;

  //! Locally-stored height of the stride operation.
  size_t strideHeight;

  //! Rounding operation used to compute the output dimensions.
  bool floor;

  //! Locally-stored number of input units.
  size_t inSize;

  //! Locally-stored number of output units.
  size_t outSize;

  //! Locally-stored input width.
  size_t inputWidth;

  //! Locally-stored input height.
  size_t inputHeight;

  //! Locally-stored output width.
  size_t outputWidth;

  //! Locally-stored output height.
  size_t outputHeight;

  //! Locally-stored reset parameter used to initialize the layer once.
  bool reset;

  //! If true, the layer runs in deterministic (testing) mode.
  bool deterministic;

  //! Locally-stored batch size.
  size_t batchSize;

  //! Locally-stored temporary output, arranged as a cube.
  arma::cube outputTemp;

  //! Locally-stored transformed input parameter.
  arma::cube inputTemp;

  //! Locally-stored transformed gradient parameter.
  arma::cube gTemp;

  //! Locally-stored delta object.
  OutputDataType delta;

  //! Locally-stored gradient object.
  OutputDataType gradient;

  //! Locally-stored output parameter object.
  OutputDataType outputParameter;
}; // class MeanPooling

} // namespace ann
} // namespace mlpack

// Include implementation.
#include "mean_pooling_impl.hpp"

#endif
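
To make the summed-area-table idea used by Pooling() concrete, here is a minimal standalone sketch, assuming only Armadillo; the function name meanPool2x2 and the fixed 2x2 kernel with stride 2 are illustrative choices, not part of this header:

#include <armadillo>

// Minimal mean pooling with a 2x2 kernel and stride 2, using a summed-area
// table (2-D prefix sums), as in MeanPooling::Pooling().
arma::mat meanPool2x2(const arma::mat& input)
{
  // Cumulative sums down each column, then across each row, give the
  // summed-area table: pre(r, c) = sum of input(0:r, 0:c).
  arma::mat pre = arma::cumsum(arma::cumsum(input, 0), 1);

  arma::mat output(input.n_rows / 2, input.n_cols / 2);
  for (arma::uword j = 0; j < output.n_cols; ++j)
  {
    for (arma::uword i = 0; i < output.n_rows; ++i)
    {
      const arma::uword r = 2 * i + 1;  // Bottom row of the window.
      const arma::uword c = 2 * j + 1;  // Rightmost column of the window.
      double sum = pre(r, c);
      if (i > 0)
        sum -= pre(r - 2, c);           // Remove the rows above the window.
      if (j > 0)
        sum -= pre(r, c - 2);           // Remove the columns to the left.
      if (i > 0 && j > 0)
        sum += pre(r - 2, c - 2);       // Add back the doubly-removed block.
      output(i, j) = sum / 4.0;         // Mean over the 2x2 window.
    }
  }
  return output;
}

int main()
{
  arma::mat x = { {  1,  2,  3,  4 },
                  {  5,  6,  7,  8 },
                  {  9, 10, 11, 12 },
                  { 13, 14, 15, 16 } };
  // Expected output: [[3.5, 5.5], [11.5, 13.5]].
  meanPool2x2(x).print("pooled:");
}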