tesseract v5.3.3.20231005
normstrngs_test.cc File Reference
#include "normstrngs.h"
#include <tesseract/unichar.h>
#include "include_gunit.h"
#include "normstrngs_test.h"

Go to the source code of this file.

Namespaces

namespace tesseract
 

Functions

 tesseract::TEST (NormstrngsTest, BasicText)
 
 tesseract::TEST (NormstrngsTest, LigatureText)
 
 tesseract::TEST (NormstrngsTest, OcrSpecificNormalization)
 
 tesseract::TEST (NormstrngsTest, DetectsCorrectText)
 
 tesseract::TEST (NormstrngsTest, DetectsIncorrectText)
 
 tesseract::TEST (NormstrngsTest, NonIndicTextDoesntBreakIndicRules)
 
 tesseract::TEST (NormstrngsTest, NoLonelyJoiners)
 
 tesseract::TEST (NormstrngsTest, NoLonelyJoinersPlus)
 
 tesseract::TEST (NormstrngsTest, NoLonelyJoinersNonAlpha)
 
 tesseract::TEST (NormstrngsTest, JoinersStayInArabic)
 
 tesseract::TEST (NormstrngsTest, DigitOK)
 
 tesseract::TEST (NormstrngsTest, DandaOK)
 
 tesseract::TEST (NormstrngsTest, AllScriptsRegtest)
 
 tesseract::TEST (NormstrngsTest, IsWhitespace)
 
 tesseract::TEST (NormstrngsTest, SpanUTF8Whitespace)
 
 tesseract::TEST (NormstrngsTest, SpanUTF8NotWhitespace)
 
 tesseract::TEST (NormstrngsTest, IsInterchangeValid)
 
 tesseract::TEST (NormstrngsTest, IsInterchangeValid7BitAscii)
 
 tesseract::TEST (NormstrngsTest, FullwidthToHalfwidth)
 

Variables

const char tesseract::kEngText [] = "the quick brown fox jumps over the lazy dog"
 
const char tesseract::kHinText [] = "पिताने विवाह की | हो गई उद्विग्न वह सोचा"
 
const char tesseract::kKorText [] = "이는 것으로"
 
const char * tesseract::kBadlyFormedHinWords [] = {"उपयोक्ताो", "नहीें", "प्रंात", "कहीअे", "पत्रिाका", "छह्णाीस"}
 
const char * tesseract::kBadlyFormedThaiWords [] = {"ฤิ", "กา้ํ", "กิำ", "นำ้", "เเก"}