tesseract v5.3.3.20231005
wordseg.cpp File Reference
#include "wordseg.h"
#include <cmath>
#include "blobbox.h"
#include "cjkpitch.h"
#include "drawtord.h"
#include "fpchop.h"
#include "makerow.h"
#include "pitsync1.h"
#include "statistc.h"
#include "textord.h"
#include "topitch.h"
#include "tovars.h"

Go to the source code of this file.

Namespaces

namespace  tesseract
 

Macros

#define BLOCK_STATS_CLUSTERS   10
 

Functions

make_single_word

For each row, arrange all of its blobs into a single word. No fixed-pitch detection is performed.

void tesseract::make_single_word (bool one_blob, TO_ROW_LIST *rows, ROW_LIST *real_rows)
 
void tesseract::make_words (tesseract::Textord *textord, ICOORD page_tr, float gradient, BLOCK_LIST *blocks, TO_BLOCK_LIST *port_blocks)
 
set_row_spaces

Set the min_space and max_nonspace members of the row so that the blobs can be arranged into words.

void tesseract::set_row_spaces (TO_BLOCK *block, FCOORD rotation, bool testing_on)
 
row_words

Compute the max nonspace and min space for the row.

int32_t tesseract::row_words (TO_BLOCK *block, TO_ROW *row, int32_t maxwidth, FCOORD rotation, bool testing_on)
 
row_words2

Compute the max nonspace and min space for the row.

int32_t tesseract::row_words2 (TO_BLOCK *block, TO_ROW *row, int32_t maxwidth, FCOORD rotation, bool testing_on)
 
make_real_words

Convert a TO_BLOCK to a BLOCK.

void tesseract::make_real_words (tesseract::Textord *textord, TO_BLOCK *block, FCOORD rotation)
 
make_rep_words

Fabricate a real row from only the repeated-blob words. The xheight is taken from the block, as it may be more meaningful.

ROW * tesseract::make_rep_words (TO_ROW *row, TO_BLOCK *block)
 
make_real_word

Construct a WERD from a given number of adjacent entries in a list of BLOBNBOXs.

WERD * tesseract::make_real_word (BLOBNBOX_IT *box_it, int32_t blobcount, bool bol, uint8_t blanks)
 

Variables

bool tesseract::textord_force_make_prop_words = false
 
bool tesseract::textord_chopper_test = false
 

Macro Definition Documentation

◆ BLOCK_STATS_CLUSTERS

#define BLOCK_STATS_CLUSTERS   10

Definition at line 44 of file wordseg.cpp.