tesseract v5.3.3.20231005
tessclassifier.cpp
Go to the documentation of this file.
1
2// File: tessclassifier.cpp
3// Description: Tesseract implementation of a ShapeClassifier.
4// Author: Ray Smith
5//
6// (C) Copyright 2011, Google Inc.
7// Licensed under the Apache License, Version 2.0 (the "License");
8// you may not use this file except in compliance with the License.
9// You may obtain a copy of the License at
10// http://www.apache.org/licenses/LICENSE-2.0
11// Unless required by applicable law or agreed to in writing, software
12// distributed under the License is distributed on an "AS IS" BASIS,
13// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14// See the License for the specific language governing permissions and
15// limitations under the License.
16//
18
19#include "tessclassifier.h"
20
21#include "classify.h"
22#include "trainingsample.h"
23
24namespace tesseract {
25
26// Classifies the given [training] sample, writing to results.
27// See ShapeClassifier for a full description.
28int TessClassifier::UnicharClassifySample(const TrainingSample &sample, Image page_pix, int debug,
29 UNICHAR_ID keep_this,
30 std::vector<UnicharRating> *results) {
31 const int old_matcher_level = classify_->matcher_debug_level;
32 const int old_matcher_flags = classify_->matcher_debug_flags;
33 const int old_classify_level = classify_->classify_debug_level;
34 if (debug) {
35 // Explicitly set values of various control parameters to generate debug
36 // output if required, restoring the old values after classifying.
37 classify_->matcher_debug_level.set_value(2);
38 classify_->matcher_debug_flags.set_value(25);
39 classify_->classify_debug_level.set_value(3);
40 }
41 classify_->CharNormTrainingSample(pruner_only_, keep_this, sample, results);
42 if (debug) {
43 classify_->matcher_debug_level.set_value(old_matcher_level);
44 classify_->matcher_debug_flags.set_value(old_matcher_flags);
45 classify_->classify_debug_level.set_value(old_classify_level);
46 }
47 return results->size();
48}
49
50// Provides access to the ShapeTable that this classifier works with.
52 return classify_->shape_table();
53}
54// Provides access to the UNICHARSET that this classifier works with.
55// Only needs to be overridden if GetShapeTable() can return nullptr.
57 return classify_->unicharset;
58}
59
60// Displays classification as the given shape_id. Creates as many windows
61// as it feels fit, using index as a guide for placement. Adds any created
62// windows to the windows output and returns a new index that may be used
63// by any subsequent classifiers. Caller waits for the user to view and
64// then destroys the windows by clearing the vector.
65int TessClassifier::DisplayClassifyAs(const TrainingSample &sample, Image page_pix, int unichar_id,
66 int index, std::vector<ScrollView *> &windows) {
67 int shape_id = unichar_id;
68 // TODO(rays) Fix this so it works with both flat and real shapetables.
69 // if (GetShapeTable() != nullptr)
70 // shape_id = BestShapeForUnichar(sample, page_pix, unichar_id, nullptr);
71 if (shape_id < 0) {
72 return index;
73 }
74 if (UnusedClassIdIn(classify_->PreTrainedTemplates, shape_id)) {
75 tprintf("No built-in templates for class/shape %d\n", shape_id);
76 return index;
77 }
78#ifndef GRAPHICS_DISABLED
79 classify_->ShowBestMatchFor(shape_id, sample.features(), sample.num_features());
80#endif
81 return index;
82}
83
84} // namespace tesseract
#define UnusedClassIdIn(T, c)
Definition: intproto.h:155
void tprintf(const char *format,...)
Definition: tprintf.cpp:41
int UNICHAR_ID
Definition: unichar.h:34
UNICHARSET unicharset
Definition: ccutil.h:61
const ShapeTable * shape_table() const
Definition: classify.h:102
void ShowBestMatchFor(int shape_id, const INT_FEATURE_STRUCT *features, int num_features)
INT_TEMPLATES_STRUCT * PreTrainedTemplates
Definition: classify.h:419
int CharNormTrainingSample(bool pruner_only, int keep_this, const TrainingSample &sample, std::vector< UnicharRating > *results)
const ShapeTable * GetShapeTable() const override
const UNICHARSET & GetUnicharset() const override
int UnicharClassifySample(const TrainingSample &sample, Image page_pix, int debug, UNICHAR_ID keep_this, std::vector< UnicharRating > *results) override
int DisplayClassifyAs(const TrainingSample &sample, Image page_pix, int unichar_id, int index, std::vector< ScrollView * > &windows) override
const INT_FEATURE_STRUCT * features() const
uint32_t num_features() const