#include <cstdlib>
#include <filesystem>
#include "boxread.h"
#include "commandlineflags.h"
#include "commontraining.h"
#include "lang_model_helpers.h"
#include "normstrngs.h"
#include "unicharset.h"
#include "unicharset_training_utils.h"
Go to the source code of this file.

int main (int argc, char **argv)

◆ main()
int main(int argc, char **argv)

Definition at line 103 of file unicharset_extractor.cpp.
103 {
104 tesseract::CheckSharedLibraryVersion();
105 if (argc > 1) {
106 tesseract::ParseCommandLineFlags(argv[0], &argc, &argv, true);
107 }
108 if (argc < 2) {
109 tprintf(
110 "Usage: %s [--output_unicharset filename] [--norm_mode mode]"
111 " box_or_text_file [...]\n",
112 argv[0]);
113 tprintf("Where mode means:\n");
114 tprintf(" 1=combine graphemes (use for Latin and other simple scripts)\n");
115 tprintf(" 2=split graphemes (use for Indic/Khmer/Myanmar)\n");
116 tprintf(" 3=pure unicode (use for Arabic/Hebrew/Thai/Tibetan)\n");
117 tprintf("Reads box or plain text files to extract the unicharset.\n");
118 return EXIT_FAILURE;
119 }
120 return tesseract::Main(argc, argv);
121 }
void ParseCommandLineFlags(const char *usage, int *argc, char ***argv, const bool remove_flags)
void tprintf(const char *format,...)