// tesseract v5.3.3.20231005 — lstmtrainer.h (extracted from the generated
// documentation page for this file).
// File:        lstmtrainer.h
// Description: Top-level line trainer class for LSTM-based networks.
// Author:      Ray Smith
//
// (C) Copyright 2013, Google Inc.
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
// http://www.apache.org/licenses/LICENSE-2.0
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
18#ifndef TESSERACT_LSTM_LSTMTRAINER_H_
19#define TESSERACT_LSTM_LSTMTRAINER_H_
20
21#include "export.h"
22
23#include "imagedata.h" // for DocumentCache
24#include "lstmrecognizer.h"
25#include "rect.h"
26
27#include <functional> // for std::function
28#include <sstream> // for std::stringstream
29
30namespace tesseract {
31
32class LSTM;
33class LSTMTester;
34class LSTMTrainer;
35class Parallel;
36class Reversed;
37class Softmax;
38class Series;
39
// Enum for the types of errors that are counted.
enum ErrorTypes {
  ET_RMS,         // RMS activation error.
  ET_DELTA,       // Number of big errors in deltas.
  ET_WORD_RECERR, // Output text string word recall error.
  ET_CHAR_ERROR,  // Output text string total char error.
  ET_SKIP_RATIO,  // Fraction of samples skipped.
  ET_COUNT        // For array sizing.
};
// Enum for the trainability_ flags.
enum Trainability {
  TRAINABLE,        // Non-zero delta error.
  PERFECT,          // Zero delta error.
  UNENCODABLE,      // Not trainable due to coding/alignment trouble.
  HI_PRECISION_ERR, // Hi confidence disagreement.
  NOT_BOXED,        // Early in training and has no character boxes.
};
// Enum to define the amount of data to get serialized.
enum SerializeAmount {
  LIGHT,           // Minimal data for remote training.
  NO_BEST_TRAINER, // Save an empty vector in place of best_trainer_.
  FULL,            // All data including best_trainer_.
};
// Enum to indicate how the sub_trainer_ training went.
enum SubTrainerResult {
  STR_NONE,    // Did nothing as not good enough.
  STR_UPDATED, // Subtrainer was updated, but didn't replace *this.
  STR_REPLACED // Subtrainer replaced *this.
};
72
73class LSTMTrainer;
74// Function to compute and record error rates on some external test set(s).
75// Args are: iteration, mean errors, model, training stage.
76// Returns a string containing logging information about the tests.
77using TestCallback = std::function<std::string(int, const double *,
78 const TessdataManager &, int)>;
79
80// Trainer class for LSTM networks. Most of the effort is in creating the
81// ideal target outputs from the transcription. A box file is used if it is
82// available, otherwise estimates of the char widths from the unicharset are
83// used to guide a DP search for the best fit to the transcription.
84class TESS_UNICHARSET_TRAINING_API LSTMTrainer : public LSTMRecognizer {
85public:
87 LSTMTrainer(const char *model_base, const char *checkpoint_name,
88 int debug_interval, int64_t max_memory);
89 virtual ~LSTMTrainer();
90
91 // Tries to deserialize a trainer from the given file and silently returns
92 // false in case of failure. If old_traineddata is not null, then it is
93 // assumed that the character set is to be re-mapped from old_traineddata to
94 // the new, with consequent change in weight matrices etc.
95 bool TryLoadingCheckpoint(const char *filename, const char *old_traineddata);
96
97 // Initializes the character set encode/decode mechanism directly from a
98 // previously setup traineddata containing dawgs, UNICHARSET and
99 // UnicharCompress. Note: Call before InitNetwork!
100 bool InitCharSet(const std::string &traineddata_path) {
101 bool success = mgr_.Init(traineddata_path.c_str());
102 if (success) {
103 InitCharSet();
104 }
105 return success;
106 }
107 void InitCharSet(const TessdataManager &mgr) {
108 mgr_ = mgr;
109 InitCharSet();
110 }
111
112 // Initializes the trainer with a network_spec in the network description
113 // net_flags control network behavior according to the NetworkFlags enum.
114 // There isn't really much difference between them - only where the effects
115 // are implemented.
116 // For other args see NetworkBuilder::InitNetwork.
117 // Note: Be sure to call InitCharSet before InitNetwork!
118 bool InitNetwork(const char *network_spec, int append_index, int net_flags,
119 float weight_range, float learning_rate, float momentum,
120 float adam_beta);
121 // Initializes a trainer from a serialized TFNetworkModel proto.
122 // Returns the global step of TensorFlow graph or 0 if failed.
123 // Building a compatible TF graph: See tfnetwork.proto.
124 int InitTensorFlowNetwork(const std::string &tf_proto);
125 // Resets all the iteration counters for fine tuning or training a head,
126 // where we want the error reporting to reset.
127 void InitIterations();
128
129 // Accessors.
130 double ActivationError() const {
131 return error_rates_[ET_DELTA];
132 }
133 double CharError() const {
134 return error_rates_[ET_CHAR_ERROR];
135 }
136 const double *error_rates() const {
137 return error_rates_;
138 }
139 double best_error_rate() const {
140 return best_error_rate_;
141 }
142 int best_iteration() const {
143 return best_iteration_;
144 }
145 int learning_iteration() const {
146 return learning_iteration_;
147 }
148 int32_t improvement_steps() const {
149 return improvement_steps_;
150 }
151 void set_perfect_delay(int delay) {
152 perfect_delay_ = delay;
153 }
154 const std::vector<char> &best_trainer() const {
155 return best_trainer_;
156 }
157 // Returns the error that was just calculated by PrepareForBackward.
159 return error_buffers_[type][training_iteration() % kRollingBufferSize_];
160 }
161 // Returns the error that was just calculated by TrainOnLine. Since
162 // TrainOnLine rolls the error buffers, this is one further back than
163 // NewSingleError.
165 return error_buffers_[type]
166 [(training_iteration() + kRollingBufferSize_ - 1) %
167 kRollingBufferSize_];
168 }
170 return training_data_;
171 }
173 return &training_data_;
174 }
175
176 // If the training sample is usable, grid searches for the optimal
177 // dict_ratio/cert_offset, and returns the results in a string of space-
178 // separated triplets of ratio,offset=worderr.
179 Trainability GridSearchDictParams(
180 const ImageData *trainingdata, int iteration, double min_dict_ratio,
181 double dict_ratio_step, double max_dict_ratio, double min_cert_offset,
182 double cert_offset_step, double max_cert_offset, std::string &results);
183
184 // Provides output on the distribution of weight values.
185 void DebugNetwork();
186
187 // Loads a set of lstmf files that were created using the lstm.train config to
188 // tesseract into memory ready for training. Returns false if nothing was
189 // loaded.
190 bool LoadAllTrainingData(const std::vector<std::string> &filenames,
191 CachingStrategy cache_strategy,
192 bool randomly_rotate);
193
194 // Keeps track of best and locally worst error rate, using internally computed
195 // values. See MaintainCheckpointsSpecific for more detail.
196 bool MaintainCheckpoints(const TestCallback &tester, std::stringstream &log_msg);
197 // Keeps track of best and locally worst error_rate (whatever it is) and
198 // launches tests using rec_model, when a new min or max is reached.
199 // Writes checkpoints using train_model at appropriate times and builds and
200 // returns a log message to indicate progress. Returns false if nothing
201 // interesting happened.
202 bool MaintainCheckpointsSpecific(int iteration,
203 const std::vector<char> *train_model,
204 const std::vector<char> *rec_model,
205 TestCallback tester, std::stringstream &log_msg);
206 // Builds a progress message with current error rates.
207 void PrepareLogMsg(std::stringstream &log_msg) const;
208 // Appends <intro_str> iteration learning_iteration()/training_iteration()/
209 // sample_iteration() to the log_msg.
210 void LogIterations(const char *intro_str, std::stringstream &log_msg) const;
211
212 // TODO(rays) Add curriculum learning.
213 // Returns true and increments the training_stage_ if the error rate has just
214 // passed through the given threshold for the first time.
215 bool TransitionTrainingStage(float error_threshold);
216 // Returns the current training stage.
218 return training_stage_;
219 }
220
221 // Writes to the given file. Returns false in case of error.
222 bool Serialize(SerializeAmount serialize_amount, const TessdataManager *mgr,
223 TFile *fp) const;
224 // Reads from the given file. Returns false in case of error.
225 bool DeSerialize(const TessdataManager *mgr, TFile *fp);
226
227 // De-serializes the saved best_trainer_ into sub_trainer_, and adjusts the
228 // learning rates (by scaling reduction, or layer specific, according to
229 // NF_LAYER_SPECIFIC_LR).
230 void StartSubtrainer(std::stringstream &log_msg);
231 // While the sub_trainer_ is behind the current training iteration and its
232 // training error is at least kSubTrainerMarginFraction better than the
233 // current training error, trains the sub_trainer_, and returns STR_UPDATED if
234 // it did anything. If it catches up, and has a better error rate than the
235 // current best, as well as a margin over the current error rate, then the
236 // trainer in *this is replaced with sub_trainer_, and STR_REPLACED is
237 // returned. STR_NONE is returned if the subtrainer wasn't good enough to
238 // receive any training iterations.
239 SubTrainerResult UpdateSubtrainer(std::stringstream &log_msg);
240 // Reduces network learning rates, either for everything, or for layers
241 // independently, according to NF_LAYER_SPECIFIC_LR.
242 void ReduceLearningRates(LSTMTrainer *samples_trainer, std::stringstream &log_msg);
243 // Considers reducing the learning rate independently for each layer down by
244 // factor(<1), or leaving it the same, by double-training the given number of
245 // samples and minimizing the amount of changing of sign of weight updates.
246 // Even if it looks like all weights should remain the same, an adjustment
247 // will be made to guarantee a different result when reverting to an old best.
248 // Returns the number of layer learning rates that were reduced.
249 int ReduceLayerLearningRates(TFloat factor, int num_samples,
250 LSTMTrainer *samples_trainer);
251
252 // Converts the string to integer class labels, with appropriate null_char_s
253 // in between if not in SimpleTextOutput mode. Returns false on failure.
254 bool EncodeString(const std::string &str, std::vector<int> *labels) const {
255 return EncodeString(str, GetUnicharset(),
256 IsRecoding() ? &recoder_ : nullptr, SimpleTextOutput(),
257 null_char_, labels);
258 }
259 // Static version operates on supplied unicharset, encoder, simple_text.
260 static bool EncodeString(const std::string &str, const UNICHARSET &unicharset,
261 const UnicharCompress *recoder, bool simple_text,
262 int null_char, std::vector<int> *labels);
263
264 // Performs forward-backward on the given trainingdata.
265 // Returns the sample that was used or nullptr if the next sample was deemed
266 // unusable. samples_trainer could be this or an alternative trainer that
267 // holds the training samples.
268 const ImageData *TrainOnLine(LSTMTrainer *samples_trainer, bool batch) {
269 int sample_index = sample_iteration();
270 const ImageData *image =
271 samples_trainer->training_data_.GetPageBySerial(sample_index);
272 if (image != nullptr) {
273 Trainability trainable = TrainOnLine(image, batch);
274 if (trainable == UNENCODABLE || trainable == NOT_BOXED) {
275 return nullptr; // Sample was unusable.
276 }
277 } else {
278 ++sample_iteration_;
279 }
280 return image;
281 }
282 Trainability TrainOnLine(const ImageData *trainingdata, bool batch);
283
284 // Prepares the ground truth, runs forward, and prepares the targets.
285 // Returns a Trainability enum to indicate the suitability of the sample.
286 Trainability PrepareForBackward(const ImageData *trainingdata,
287 NetworkIO *fwd_outputs, NetworkIO *targets);
288
289 // Writes the trainer to memory, so that the current training state can be
290 // restored. *this must always be the master trainer that retains the only
291 // copy of the training data and language model. trainer is the model that is
292 // actually serialized.
293 bool SaveTrainingDump(SerializeAmount serialize_amount,
294 const LSTMTrainer &trainer,
295 std::vector<char> *data) const;
296
297 // Reads previously saved trainer from memory. *this must always be the
298 // master trainer that retains the only copy of the training data and
299 // language model. trainer is the model that is restored.
300 bool ReadTrainingDump(const std::vector<char> &data,
301 LSTMTrainer &trainer) const {
302 if (data.empty()) {
303 return false;
304 }
305 return ReadSizedTrainingDump(&data[0], data.size(), trainer);
306 }
307 bool ReadSizedTrainingDump(const char *data, int size,
308 LSTMTrainer &trainer) const {
309 return trainer.ReadLocalTrainingDump(&mgr_, data, size);
310 }
311 // Restores the model to *this.
312 bool ReadLocalTrainingDump(const TessdataManager *mgr, const char *data,
313 int size);
314
315 // Sets up the data for MaintainCheckpoints from a light ReadTrainingDump.
317
318 // Writes the full recognition traineddata to the given filename.
319 bool SaveTraineddata(const char *filename);
320
321 // Writes the recognizer to memory, so that it can be used for testing later.
322 void SaveRecognitionDump(std::vector<char> *data) const;
323
324 // Returns a suitable filename for a training dump, based on the model_base_,
325 // the iteration and the error rates.
326 std::string DumpFilename() const;
327
328 // Fills the whole error buffer of the given type with the given value.
329 void FillErrorBuffer(double new_error, ErrorTypes type);
330 // Helper generates a map from each current recoder_ code (ie softmax index)
331 // to the corresponding old_recoder code, or -1 if there isn't one.
332 std::vector<int> MapRecoder(const UNICHARSET &old_chset,
333 const UnicharCompress &old_recoder) const;
334
335protected:
336 // Private version of InitCharSet above finishes the job after initializing
337 // the mgr_ data member.
338 void InitCharSet();
339 // Helper computes and sets the null_char_.
340 void SetNullChar();
341
342 // Factored sub-constructor sets up reasonable default values.
343 void EmptyConstructor();
344
345 // Outputs the string and periodically displays the given network inputs
346 // as an image in the given window, and the corresponding labels at the
347 // corresponding x_starts.
348 // Returns false if the truth string is empty.
349 bool DebugLSTMTraining(const NetworkIO &inputs, const ImageData &trainingdata,
350 const NetworkIO &fwd_outputs,
351 const std::vector<int> &truth_labels,
352 const NetworkIO &outputs);
353 // Displays the network targets as line a line graph.
354 void DisplayTargets(const NetworkIO &targets, const char *window_name,
355 ScrollView **window);
356
357 // Builds a no-compromises target where the first positions should be the
358 // truth labels and the rest is padded with the null_char_.
359 bool ComputeTextTargets(const NetworkIO &outputs,
360 const std::vector<int> &truth_labels,
361 NetworkIO *targets);
362
363 // Builds a target using standard CTC. truth_labels should be pre-padded with
364 // nulls wherever desired. They don't have to be between all labels.
365 // outputs is input-output, as it gets clipped to minimum probability.
366 bool ComputeCTCTargets(const std::vector<int> &truth_labels,
367 NetworkIO *outputs, NetworkIO *targets);
368
369 // Computes network errors, and stores the results in the rolling buffers,
370 // along with the supplied text_error.
371 // Returns the delta error of the current sample (not running average.)
372 double ComputeErrorRates(const NetworkIO &deltas, double char_error,
373 double word_error);
374
375 // Computes the network activation RMS error rate.
376 double ComputeRMSError(const NetworkIO &deltas);
377
378 // Computes network activation winner error rate. (Number of values that are
379 // in error by >= 0.5 divided by number of time-steps.) More closely related
380 // to final character error than RMS, but still directly calculable from
381 // just the deltas. Because of the binary nature of the targets, zero winner
382 // error is a sufficient but not necessary condition for zero char error.
383 double ComputeWinnerError(const NetworkIO &deltas);
384
385 // Computes a very simple bag of chars char error rate.
386 double ComputeCharError(const std::vector<int> &truth_str,
387 const std::vector<int> &ocr_str);
388 // Computes a very simple bag of words word recall error rate.
389 // NOTE that this is destructive on both input strings.
390 double ComputeWordError(std::string *truth_str, std::string *ocr_str);
391
392 // Updates the error buffer and corresponding mean of the given type with
393 // the new_error.
394 void UpdateErrorBuffer(double new_error, ErrorTypes type);
395
396 // Rolls error buffers and reports the current means.
397 void RollErrorBuffers();
398
399 // Given that error_rate is either a new min or max, updates the best/worst
400 // error rates, and record of progress.
401 std::string UpdateErrorGraph(int iteration, double error_rate,
402 const std::vector<char> &model_data,
403 const TestCallback &tester);
404
405protected:
406#ifndef GRAPHICS_DISABLED
407 // Alignment display window.
409 // CTC target display window.
411 // CTC output display window.
413 // Reconstructed image window.
415#endif
416 // How often to display a debug image.
418 // Iteration at which the last checkpoint was dumped.
420 // Basename of files to save best models to.
421 std::string model_base_;
422 // Checkpoint filename.
423 std::string checkpoint_name_;
424 // Training data.
427 // Name to use when saving best_trainer_.
428 std::string best_model_name_;
429 // Number of available training stages.
431
432 // ===Serialized data to ensure that a restart produces the same results.===
433 // These members are only serialized when serialize_amount != LIGHT.
434 // Best error rate so far.
436 // Snapshot of all error rates at best_iteration_.
437 double best_error_rates_[ET_COUNT];
438 // Iteration of best_error_rate_.
440 // Worst error rate since best_error_rate_.
442 // Snapshot of all error rates at worst_iteration_.
443 double worst_error_rates_[ET_COUNT];
444 // Iteration of worst_error_rate_.
446 // Iteration at which the process will be thought stalled.
448 // Saved recognition models for computing test error for graph points.
449 std::vector<char> best_model_data_;
450 std::vector<char> worst_model_data_;
451 // Saved trainer for reverting back to last known best.
452 std::vector<char> best_trainer_;
453 // A subsidiary trainer running with a different learning rate until either
454 // *this or sub_trainer_ hits a new best.
455 std::unique_ptr<LSTMTrainer> sub_trainer_;
456 // Error rate at which last best model was dumped.
458 // Current stage of training.
460 // History of best error rate against iteration. Used for computing the
461 // number of steps to each 2% improvement.
462 std::vector<double> best_error_history_;
463 std::vector<int32_t> best_error_iterations_;
464 // Number of iterations since the best_error_rate_ was 2% more than it is now.
466 // Number of iterations that yielded a non-zero delta error and thus provided
467 // significant learning. learning_iteration_ <= training_iteration_.
468 // learning_iteration_ is used to measure rate of learning progress.
470 // Saved value of sample_iteration_ before looking for the next sample.
472 // How often to include a PERFECT training sample in backprop.
473 // A PERFECT training sample is used if the current
474 // training_iteration_ > last_perfect_training_iteration_ + perfect_delay_,
475 // so with perfect_delay_ == 0, all samples are used, and with
476 // perfect_delay_ == 4, at most 1 in 5 samples will be perfect.
478 // Value of training_iteration_ at which the last PERFECT training sample
479 // was used in back prop.
481 // Rolling buffers storing recent training errors are indexed by
482 // training_iteration % kRollingBufferSize_.
483 static const int kRollingBufferSize_ = 1000;
484 std::vector<double> error_buffers_[ET_COUNT];
485 // Rounded mean percent trailing training errors in the buffers.
486 double error_rates_[ET_COUNT]; // RMS training error.
487 // Traineddata file with optional dawgs + UNICHARSET and recoder.
489};
490
491} // namespace tesseract.
492
493#endif // TESSERACT_LSTM_LSTMTRAINER_H_
@ ET_WORD_RECERR
Definition: lstmtrainer.h:44
@ ET_SKIP_RATIO
Definition: lstmtrainer.h:46
@ ET_CHAR_ERROR
Definition: lstmtrainer.h:45
@ HI_PRECISION_ERR
Definition: lstmtrainer.h:55
@ STR_REPLACED
Definition: lstmtrainer.h:70
bool DeSerialize(bool swap, FILE *fp, std::vector< T > &data)
Definition: helpers.h:205
bool Serialize(FILE *fp, const std::vector< T > &data)
Definition: helpers.h:236
std::function< std::string(int, const double *, const TessdataManager &, int)> TestCallback
Definition: lstmtrainer.h:78
double TFloat
Definition: tesstypes.h:39
CachingStrategy
Definition: imagedata.h:42
@ NO_BEST_TRAINER
Definition: lstmtrainer.h:62
type
Definition: upload.py:458
const ImageData * GetPageBySerial(int serial)
Definition: imagedata.h:317
std::vector< int32_t > best_error_iterations_
Definition: lstmtrainer.h:463
bool MaintainCheckpointsSpecific(int iteration, const std::vector< char > *train_model, const std::vector< char > *rec_model, TestCallback tester, std::stringstream &log_msg)
std::vector< char > worst_model_data_
Definition: lstmtrainer.h:450
bool ReadLocalTrainingDump(const TessdataManager *mgr, const char *data, int size)
ScrollView * target_win_
Definition: lstmtrainer.h:410
bool EncodeString(const std::string &str, std::vector< int > *labels) const
Definition: lstmtrainer.h:254
const double * error_rates() const
Definition: lstmtrainer.h:136
bool InitCharSet(const std::string &traineddata_path)
Definition: lstmtrainer.h:100
int InitTensorFlowNetwork(const std::string &tf_proto)
std::string model_base_
Definition: lstmtrainer.h:421
std::string best_model_name_
Definition: lstmtrainer.h:428
double NewSingleError(ErrorTypes type) const
Definition: lstmtrainer.h:158
double CharError() const
Definition: lstmtrainer.h:133
std::vector< char > best_trainer_
Definition: lstmtrainer.h:452
double best_error_rate() const
Definition: lstmtrainer.h:139
double LastSingleError(ErrorTypes type) const
Definition: lstmtrainer.h:164
DocumentCache * mutable_training_data()
Definition: lstmtrainer.h:172
const std::vector< char > & best_trainer() const
Definition: lstmtrainer.h:154
float error_rate_of_last_saved_best_
Definition: lstmtrainer.h:457
ScrollView * recon_win_
Definition: lstmtrainer.h:414
int learning_iteration() const
Definition: lstmtrainer.h:145
void set_perfect_delay(int delay)
Definition: lstmtrainer.h:151
std::string checkpoint_name_
Definition: lstmtrainer.h:423
ScrollView * ctc_win_
Definition: lstmtrainer.h:412
int CurrentTrainingStage() const
Definition: lstmtrainer.h:217
double ActivationError() const
Definition: lstmtrainer.h:130
std::vector< char > best_model_data_
Definition: lstmtrainer.h:449
bool ReadSizedTrainingDump(const char *data, int size, LSTMTrainer &trainer) const
Definition: lstmtrainer.h:307
void InitCharSet(const TessdataManager &mgr)
Definition: lstmtrainer.h:107
DocumentCache training_data_
Definition: lstmtrainer.h:426
std::unique_ptr< LSTMTrainer > sub_trainer_
Definition: lstmtrainer.h:455
const DocumentCache & training_data() const
Definition: lstmtrainer.h:169
bool ReadTrainingDump(const std::vector< char > &data, LSTMTrainer &trainer) const
Definition: lstmtrainer.h:300
int32_t improvement_steps() const
Definition: lstmtrainer.h:148
const ImageData * TrainOnLine(LSTMTrainer *samples_trainer, bool batch)
Definition: lstmtrainer.h:268
std::vector< double > best_error_history_
Definition: lstmtrainer.h:462
int best_iteration() const
Definition: lstmtrainer.h:142
TessdataManager mgr_
Definition: lstmtrainer.h:488
ScrollView * align_win_
Definition: lstmtrainer.h:408