12#ifndef TESSERACT_UNITTEST_NORMSTRNGS_TEST_H_
13#define TESSERACT_UNITTEST_NORMSTRNGS_TEST_H_
23 std::stringstream result;
24 int total_chars = str32.size();
26 for (
int i = 0;
i < total_chars; ++
i) {
27 result <<
"[" << str32[
i] <<
"]";
41 for (
const auto &s : glyphs) {
49 int unicode_count,
int glyph_count,
int grapheme_count,
50 const std::string &target_str) {
51 std::vector<std::string> glyphs;
56 for (
auto &glyph : glyphs) {
61 true, str.c_str(), &glyphs));
64 for (
auto &glyph : glyphs) {
69 true, str.c_str(), &glyphs));
72 for (
auto &glyph : glyphs) {
77 true, str.c_str(), &glyphs));
#define EXPECT_EQ(val1, val2)
#define EXPECT_TRUE(condition)
std::string PrintString32WithUnicodes(const std::string &str)
void ExpectGraphemeModeResults(const std::string &str, UnicodeNormMode u_mode, int unicode_count, int glyph_count, int grapheme_count, const std::string &target_str)
std::string PrintStringVectorWithUnicodes(const std::vector< std::string > &glyphs)
bool NormalizeCleanAndSegmentUTF8(UnicodeNormMode u_mode, OCRNorm ocr_normalize, GraphemeNormMode g_mode, bool report_errors, const char *str8, std::vector< std::string > *graphemes)
bool NormalizeUTF8String(UnicodeNormMode u_mode, OCRNorm ocr_normalize, GraphemeNorm grapheme_normalize, const char *str8, std::string *normalized)
std::string CodepointList(const std::vector< char32 > &str32)
static std::vector< char32 > UTF8ToUTF32(const char *utf8_str)