19 #include "config_auto.h" 34 const char* extension)
35 : file_extension_(extension),
36 title_(
""), imagenum_(-1),
40 if (strcmp(outputbase,
"-") && strcmp(outputbase,
"stdout")) {
42 fout_ = fopen(outfile.
string(),
"wb");
50 if (fout_ !=
nullptr) {
60 if (next == NULL)
return;
65 while (next->next_ != NULL) {
68 next->next_ = remainder;
73 if (!happy_)
return false;
84 if (!happy_)
return false;
94 if (!happy_)
return false;
107 int n = fwrite(s, 1, len, fout_);
108 if (n != len) happy_ =
false;
128 const std::unique_ptr<const char[]> utf8(api->
GetUTF8Text());
136 if (pageSeparator !=
nullptr && *pageSeparator !=
'\0') {
153 font_info_ = font_info;
158 "<?xml version=\"1.0\" encoding=\"UTF-8\"?>\n" 159 "<!DOCTYPE html PUBLIC \"-//W3C//DTD XHTML 1.0 Transitional//EN\"\n" 160 " \"http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd\">\n" 161 "<html xmlns=\"http://www.w3.org/1999/xhtml\" xml:lang=\"en\" " 162 "lang=\"en\">\n <head>\n <title>");
166 "<meta http-equiv=\"Content-Type\" content=\"text/html;" 167 "charset=utf-8\" />\n" 170 " <meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par" 171 " ocr_line ocrx_word");
174 " ocrp_lang ocrp_dir ocrp_font ocrp_fsize ocrp_wconf");
177 "</head>\n<body>\n");
190 if (hocr == NULL)
return false;
207 font_info_ = font_info;
213 "level\tpage_num\tblock_num\tpar_num\tline_num\tword_" 214 "num\tleft\ttop\twidth\theight\tconf\ttext\n");
222 if (tsv == NULL)
return false;
237 const std::unique_ptr<const char[]> unlv(api->
GetUNLVText());
238 if (unlv == NULL)
return false;
254 if (text == NULL)
return false;
269 if (osd == NULL)
return false;
bool AddImage(TessBaseAPI *api)
virtual bool EndDocumentHandler()
TessHOcrRenderer(const char *outputbase, bool font_info)
virtual bool BeginDocumentHandler()
char * GetTSVText(int page_number)
virtual bool EndDocumentHandler()
TessOsdRenderer(const char *outputbase)
TessTextRenderer(const char *outputbase)
char * GetBoxText(int page_number)
virtual bool AddImageHandler(TessBaseAPI *api)
virtual bool AddImageHandler(TessBaseAPI *api)
TessBoxTextRenderer(const char *outputbase)
TessUnlvRenderer(const char *outputbase)
const char * string() const
virtual bool AddImageHandler(TessBaseAPI *api)
virtual bool AddImageHandler(TessBaseAPI *api)
TessResultRenderer(const char *outputbase, const char *extension)
const char * title() const
void insert(TessResultRenderer *next)
virtual bool BeginDocumentHandler()
bool BeginDocument(const char *title)
char * GetOsdText(int page_number)
TessTsvRenderer(const char *outputbase, bool font_info)
const char * GetStringVariable(const char *name) const
virtual bool EndDocumentHandler()
virtual bool AddImageHandler(TessBaseAPI *api)
virtual bool BeginDocumentHandler()
virtual ~TessResultRenderer()
void AppendString(const char *s)
virtual bool AddImageHandler(TessBaseAPI *api)
void AppendData(const char *s, int len)
TessResultRenderer * next()
char * GetHOCRText(ETEXT_DESC *monitor, int page_number)
#define TESSERACT_VERSION_STR
virtual bool AddImageHandler(TessBaseAPI *api)=0