tesseract-ocr.github.io/5.3.3/a01028_source.html

// File:        weightmatrix.h

// Description: Hides distinction between float/int implementations.

// Author:      Ray Smith

//

// (C) Copyright 2014, Google Inc.

// Licensed under the Apache License, Version 2.0 (the "License");

// you may not use this file except in compliance with the License.

// You may obtain a copy of the License at

// http://www.apache.org/licenses/LICENSE-2.0

// Unless required by applicable law or agreed to in writing, software

// distributed under the License is distributed on an "AS IS" BASIS,

// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

// See the License for the specific language governing permissions and

// limitations under the License.


#ifndef TESSERACT_LSTM_WEIGHTMATRIX_H_

#define TESSERACT_LSTM_WEIGHTMATRIX_H_


#include <memory>

#include <vector>

#include "intsimdmatrix.h"

#include "matrix.h"

#include "tesstypes.h"

#include "tprintf.h"


namespace tesseract {


// Convenience instantiation of GENERIC_2D_ARRAY<TFloat> with additional

// operations to write a strided vector, so the transposed form of the input

// is memory-contiguous.

class TransposedArray : public GENERIC_2D_ARRAY<TFloat> {

public:

  // Copies the whole input transposed, converted to TFloat, into *this.

  void Transpose(const GENERIC_2D_ARRAY<TFloat> &input);

  // Writes a vector of data representing a timestep (gradients or sources).

  // The data is assumed to be of size1 in size (the strided dimension).

  ~TransposedArray() override;

  void WriteStrided(int t, const float *data) {

    int size1 = dim1();

    for (int i = 0; i < size1; ++i) {

      put(i, t, data[i]);

    }

  }

  void WriteStrided(int t, const double *data) {

    int size1 = dim1();

    for (int i = 0; i < size1; ++i) {

      put(i, t, data[i]);

    }

  }

  // Prints the first and last num elements of the un-transposed array.

  void PrintUnTransposed(int num) {

    int num_features = dim1();

    int width = dim2();

    for (int y = 0; y < num_features; ++y) {

      for (int t = 0; t < width; ++t) {

        if (num == 0 || t < num || t + num >= width) {

          tprintf(" %g", static_cast<double>((*this)(y, t)));

        }

      }

      tprintf("\n");

    }

  }

}; // class TransposedArray


// Generic weight matrix for network layers. Can store the matrix as either

// an array of floats or int8_t. Provides functions to compute the forward and

// backward steps with the matrix and updates to the weights.

class WeightMatrix {

public:

  WeightMatrix() : int_mode_(false), use_adam_(false) {}

  // Sets up the network for training. Initializes weights using weights of

  // scale `range` picked according to the random number generator `randomizer`.

  // Note the order is outputs, inputs, as this is the order of indices to

  // the matrix, so the adjacent elements are multiplied by the input during

  // a forward operation.

  int InitWeightsFloat(int no, int ni, bool use_adam, float weight_range, TRand *randomizer);

  // Changes the number of outputs to the size of the given code_map, copying

  // the old weight matrix entries for each output from code_map[output] where

  // non-negative, and uses the mean (over all outputs) of the existing weights

  // for all outputs with negative code_map entries. Returns the new number of

  // weights.

  int RemapOutputs(const std::vector<int> &code_map);


  // Converts a float network to an int network. Each set of input weights that

  // corresponds to a single output weight is converted independently:

  // Compute the max absolute value of the weight set.

  // Scale so the max absolute value becomes INT8_MAX.

  // Round to integer.

  // Store a multiplicative scale factor (as a float) that will reproduce

  // the original value, subject to rounding errors.

  void ConvertToInt();

  // Returns the size rounded up to an internal factor used by the SIMD

  // implementation for its input.

  int RoundInputs(int size) const {

    if (!int_mode_ || !IntSimdMatrix::intSimdMatrix) {

      return size;

    }

    return IntSimdMatrix::intSimdMatrix->RoundInputs(size);

  }


  // Accessors.

  bool is_int_mode() const {

    return int_mode_;

  }

  int NumOutputs() const {

    return int_mode_ ? wi_.dim1() : wf_.dim1();

  }

  // Provides one set of weights. Only used by peep weight maxpool.

  const TFloat *GetWeights(int index) const {

    return wf_[index];

  }

  // Provides access to the deltas (dw_).

  TFloat GetDW(int i, int j) const {

    return dw_(i, j);

  }


  // Allocates any needed memory for running Backward, and zeroes the deltas,

  // thus eliminating any existing momentum.

  void InitBackward();


  // Writes to the given file. Returns false in case of error.

  bool Serialize(bool training, TFile *fp) const;

  // Reads from the given file. Returns false in case of error.

  bool DeSerialize(bool training, TFile *fp);

  // As DeSerialize, but reads an old (float) format WeightMatrix for

  // backward compatibility.

  bool DeSerializeOld(bool training, TFile *fp);


  // Computes matrix.vector v = Wu.

  // u is of size W.dim2() - 1 and the output v is of size W.dim1().

  // u is imagined to have an extra element at the end with value 1, to

  // implement the bias, but it doesn't actually have it.

  // Asserts that the call matches what we have.

  void MatrixDotVector(const TFloat *u, TFloat *v) const;

  void MatrixDotVector(const int8_t *u, TFloat *v) const;

  // MatrixDotVector for peep weights, MultiplyAccumulate adds the

  // component-wise products of *this[0] and v to inout.

  void MultiplyAccumulate(const TFloat *v, TFloat *inout);

  // Computes vector.matrix v = uW.

  // u is of size W.dim1() and the output v is of size W.dim2() - 1.

  // The last result is discarded, as v is assumed to have an imaginary

  // last value of 1, as with MatrixDotVector.

  void VectorDotMatrix(const TFloat *u, TFloat *v) const;

  // Fills dw_[i][j] with the dot product u[i][] . v[j][], using elements

  // from u and v, starting with u[i][offset] and v[j][offset].

  // Note that (matching MatrixDotVector) v[last][] is missing, presumed 1.0.

  // Runs parallel if requested. Note that inputs must be transposed.

  void SumOuterTransposed(const TransposedArray &u, const TransposedArray &v, bool parallel);

  // Updates the weights using the given learning rate, momentum and adam_beta.

  // num_samples is used in the Adam correction factor.

  void Update(float learning_rate, float momentum, float adam_beta, int num_samples);

  // Adds the dw_ in other to the dw_ is *this.

  void AddDeltas(const WeightMatrix &other);

  // Sums the products of weight updates in *this and other, splitting into

  // positive (same direction) in *same and negative (different direction) in

  // *changed.

  void CountAlternators(const WeightMatrix &other, TFloat *same, TFloat *changed) const;


  void Debug2D(const char *msg);


private:

  // Choice between float and 8 bit int implementations.

  GENERIC_2D_ARRAY<TFloat> wf_;

  GENERIC_2D_ARRAY<int8_t> wi_;

  // Transposed copy of wf_, used only for Backward, and set with each Update.

  TransposedArray wf_t_;

  // Which of wf_ and wi_ are we actually using.

  bool int_mode_;

  // True if we are running adam in this weight matrix.

  bool use_adam_;

  // If we are using wi_, then scales_ is a factor to restore the row product

  // with a vector to the correct range.

  std::vector<TFloat> scales_;

  // Weight deltas. dw_ is the new delta, and updates_ the momentum-decaying

  // amount to be added to wf_/wi_.

  GENERIC_2D_ARRAY<TFloat> dw_;

  GENERIC_2D_ARRAY<TFloat> updates_;

  // Iff use_adam_, the sum of squares of dw_. The number of samples is

  // given to Update(). Serialized iff use_adam_.

  GENERIC_2D_ARRAY<TFloat> dw_sq_sum_;

  // The weights matrix reorganized in whatever way suits this instance.

  std::vector<int8_t> shaped_w_;

};


} // namespace tesseract.


#endif // TESSERACT_LSTM_WEIGHTMATRIX_H_

tprintf.h

tesstypes.h

matrix.h

intsimdmatrix.h

y
const double y
Definition: gmock-matchers_test.cc:4028

i
int i
Definition: gmock-matchers_test.cc:718

tesseract
Definition: baseapi.h:39

tesseract::tprintf
void tprintf(const char *format,...)
Definition: tprintf.cpp:41

tesseract::TFloat
double TFloat
Definition: tesstypes.h:39

tesseract::GENERIC_2D_ARRAY
Definition: matrix.h:51

tesseract::GENERIC_2D_ARRAY< TFloat >::dim2
int dim2() const
Definition: matrix.h:243

tesseract::GENERIC_2D_ARRAY< TFloat >::put
void put(ICOORD pos, const TFloat &thing)
Definition: matrix.h:260

tesseract::GENERIC_2D_ARRAY< TFloat >::dim1
int dim1() const
Definition: matrix.h:240

tesseract::IntSimdMatrix::RoundInputs
int RoundInputs(int size) const
Definition: intsimdmatrix.h:70

tesseract::IntSimdMatrix::intSimdMatrix
static const IntSimdMatrix * intSimdMatrix
Definition: intsimdmatrix.h:115

tesseract::TRand
Definition: helpers.h:61

tesseract::TFile
Definition: serialis.h:61

tesseract::TransposedArray
Definition: weightmatrix.h:33

tesseract::TransposedArray::~TransposedArray
~TransposedArray() override

tesseract::TransposedArray::Transpose
void Transpose(const GENERIC_2D_ARRAY< TFloat > &input)
Definition: weightmatrix.cpp:114

tesseract::TransposedArray::WriteStrided
void WriteStrided(int t, const double *data)
Definition: weightmatrix.h:46

tesseract::TransposedArray::WriteStrided
void WriteStrided(int t, const float *data)
Definition: weightmatrix.h:40

tesseract::TransposedArray::PrintUnTransposed
void PrintUnTransposed(int num)
Definition: weightmatrix.h:53

tesseract::WeightMatrix
Definition: weightmatrix.h:70

tesseract::WeightMatrix::NumOutputs
int NumOutputs() const
Definition: weightmatrix.h:107

tesseract::WeightMatrix::SumOuterTransposed
void SumOuterTransposed(const TransposedArray &u, const TransposedArray &v, bool parallel)
Definition: weightmatrix.cpp:429

tesseract::WeightMatrix::Serialize
bool Serialize(bool training, TFile *fp) const
Definition: weightmatrix.cpp:238

tesseract::WeightMatrix::WeightMatrix
WeightMatrix()
Definition: weightmatrix.h:72

tesseract::WeightMatrix::DeSerializeOld
bool DeSerializeOld(bool training, TFile *fp)
Definition: weightmatrix.cpp:342

tesseract::WeightMatrix::MultiplyAccumulate
void MultiplyAccumulate(const TFloat *v, TFloat *inout)
Definition: weightmatrix.cpp:405

tesseract::WeightMatrix::InitWeightsFloat
int InitWeightsFloat(int no, int ni, bool use_adam, float weight_range, TRand *randomizer)
Definition: weightmatrix.cpp:130

tesseract::WeightMatrix::Update
void Update(float learning_rate, float momentum, float adam_beta, int num_samples)
Definition: weightmatrix.cpp:460

tesseract::WeightMatrix::GetDW
TFloat GetDW(int i, int j) const
Definition: weightmatrix.h:115

tesseract::WeightMatrix::GetWeights
const TFloat * GetWeights(int index) const
Definition: weightmatrix.h:111

tesseract::WeightMatrix::InitBackward
void InitBackward()
Definition: weightmatrix.cpp:217

tesseract::WeightMatrix::Debug2D
void Debug2D(const char *msg)
Definition: weightmatrix.cpp:527

tesseract::WeightMatrix::is_int_mode
bool is_int_mode() const
Definition: weightmatrix.h:104

tesseract::WeightMatrix::ConvertToInt
void ConvertToInt()
Definition: weightmatrix.cpp:183

tesseract::WeightMatrix::AddDeltas
void AddDeltas(const WeightMatrix &other)
Definition: weightmatrix.cpp:486

tesseract::WeightMatrix::RemapOutputs
int RemapOutputs(const std::vector< int > &code_map)
Definition: weightmatrix.cpp:151

tesseract::WeightMatrix::VectorDotMatrix
void VectorDotMatrix(const TFloat *u, TFloat *v) const
Definition: weightmatrix.cpp:419

tesseract::WeightMatrix::MatrixDotVector
void MatrixDotVector(const TFloat *u, TFloat *v) const
Definition: weightmatrix.cpp:388

tesseract::WeightMatrix::DeSerialize
bool DeSerialize(bool training, TFile *fp)
Definition: weightmatrix.cpp:280

tesseract::WeightMatrix::RoundInputs
int RoundInputs(int size) const
Definition: weightmatrix.h:96

tesseract::WeightMatrix::CountAlternators
void CountAlternators(const WeightMatrix &other, TFloat *same, TFloat *changed) const
Definition: weightmatrix.cpp:495