tesseract v5.3.3.20231005
params_model.h
Go to the documentation of this file.
1
2// File: params_model.h
3// Description: Trained feature serialization for language parameter training.
4// Author: David Eger
5//
6// (C) Copyright 2011, Google Inc.
7// Licensed under the Apache License, Version 2.0 (the "License");
8// you may not use this file except in compliance with the License.
9// You may obtain a copy of the License at
10// http://www.apache.org/licenses/LICENSE-2.0
11// Unless required by applicable law or agreed to in writing, software
12// distributed under the License is distributed on an "AS IS" BASIS,
13// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14// See the License for the specific language governing permissions and
15// limitations under the License.
16//
18
19#ifndef TESSERACT_WORDREC_PARAMS_MODEL_H_
20#define TESSERACT_WORDREC_PARAMS_MODEL_H_
21
22#include <tesseract/export.h> // for TESS_API
23#include "params_training_featdef.h" // for PTRAIN_NUM_FEATURE_TYPES
24
25namespace tesseract {
26
27class TFile;
28
29// Represents the learned weights for a given language.
31public:
32 // Enum for expressing OCR pass.
33 enum PassEnum {
36
37 PTRAIN_NUM_PASSES
38 };
39
40 ParamsModel() : pass_(PTRAIN_PASS1) {}
41 ParamsModel(const char *lang, const std::vector<float> &weights)
42 : lang_(lang), pass_(PTRAIN_PASS1) {
43 weights_vec_[pass_] = weights;
44 }
45 inline bool Initialized() {
46 return weights_vec_[pass_].size() == PTRAIN_NUM_FEATURE_TYPES;
47 }
48 // Prints out feature weights.
49 void Print();
50 // Clears weights for all passes.
51 void Clear() {
52 for (auto &p : weights_vec_) {
53 p.clear();
54 }
55 }
56 // Copies the weights of the given params model.
57 void Copy(const ParamsModel &other_model);
58 // Applies params model weights to the given features.
59 // Assumes that features is an array of size PTRAIN_NUM_FEATURE_TYPES.
60 float ComputeCost(const float features[]) const;
61 bool Equivalent(const ParamsModel &that) const;
62
63 // Returns true on success.
64 bool SaveToFile(const char *full_path) const;
65
66 // Returns true on success.
67 bool LoadFromFp(const char *lang, TFile *fp);
68
69 const std::vector<float> &weights() const {
70 return weights_vec_[pass_];
71 }
72 const std::vector<float> &weights_for_pass(PassEnum pass) const {
73 return weights_vec_[pass];
74 }
75 void SetPass(PassEnum pass) {
76 pass_ = pass;
77 }
78
79private:
80 bool ParseLine(char *line, char **key, float *val);
81
82 std::string lang_;
83 // Set to the current pass type and used to determine which set of weights
84 // should be used for ComputeCost() and other functions.
85 PassEnum pass_;
86 // Several sets of weights for various OCR passes (e.g. pass1 with adaption,
87 // pass2 without adaption, etc).
88 std::vector<float> weights_vec_[PTRAIN_NUM_PASSES];
89};
90
91} // namespace tesseract
92
93#endif // TESSERACT_WORDREC_PARAMS_MODEL_H_
const char * p
std::string Print(const T &value)
const std::vector< float > & weights() const
Definition: params_model.h:69
void SetPass(PassEnum pass)
Definition: params_model.h:75
const std::vector< float > & weights_for_pass(PassEnum pass) const
Definition: params_model.h:72
ParamsModel(const char *lang, const std::vector< float > &weights)
Definition: params_model.h:41
#define TESS_API
Definition: export.h:32