tesseract-ocr.github.io/5.3.3/a01556_source.html

#include <allheaders.h>

#include <tesseract/baseapi.h>

#include <tesseract/resultiterator.h>

#include <string>

#include "scrollview.h"


#include "include_gunit.h"

#include "log.h" // for LOG


namespace tesseract {


// DEFINE_string(tess_config, "", "config file for tesseract");

// DEFINE_bool(visual_test, false, "Runs a visual test using scrollview");


// The fixture for testing Tesseract.

class ResultIteratorTest : public testing::Test {

protected:

  std::string TestDataNameToPath(const std::string &name) {

    return file::JoinPath(TESTING_DIR, name);

  }

  std::string TessdataPath() {

    return file::JoinPath(TESSDATA_DIR, "");

  }

  std::string OutputNameToPath(const std::string &name) {

    file::MakeTmpdir();

    return file::JoinPath(FLAGS_test_tmpdir, name);

  }


  ResultIteratorTest() {

    src_pix_ = nullptr;

  }

  ~ResultIteratorTest() override = default;


  void SetImage(const char *filename) {

    src_pix_ = pixRead(TestDataNameToPath(filename).c_str());

    api_.Init(TessdataPath().c_str(), "eng", tesseract::OEM_TESSERACT_ONLY);

    //    if (!FLAGS_tess_config.empty())

    //      api_.ReadConfigFile(FLAGS_tess_config.c_str());

    api_.SetPageSegMode(tesseract::PSM_AUTO);

    api_.SetImage(src_pix_);

    src_pix_.destroy();

    src_pix_ = api_.GetInputImage();

  }


  // Rebuilds the image using the binary images at the given level, and

  // EXPECTs that the number of pixels in the xor of the rebuilt image with

  // the original is at most max_diff.

  void VerifyRebuild(int max_diff, PageIteratorLevel level, PageIterator *it) {

    it->Begin();

    int width = pixGetWidth(src_pix_);

    int height = pixGetHeight(src_pix_);

    int depth = pixGetDepth(src_pix_);

    Image pix = pixCreate(width, height, depth);

    EXPECT_TRUE(depth == 1 || depth == 8);

    if (depth == 8) {

      pixSetAll(pix);

    }

    do {

      int left, top, right, bottom;

      PageIteratorLevel im_level = level;

      // If the return is false, it is a non-text block so get the block image.

      if (!it->BoundingBox(level, &left, &top, &right, &bottom)) {

        im_level = tesseract::RIL_BLOCK;

        EXPECT_TRUE(it->BoundingBox(im_level, &left, &top, &right, &bottom));

      }

      LOG(INFO) << "BBox: [L:" << left << ", T:" << top << ", R:" << right << ", B:" << bottom

                << "]"

                << "\n";

      Image block_pix;

      if (depth == 1) {

        block_pix = it->GetBinaryImage(im_level);

        pixRasterop(pix, left, top, right - left, bottom - top, PIX_SRC ^ PIX_DST, block_pix, 0, 0);

      } else {

        block_pix = it->GetImage(im_level, 2, src_pix_, &left, &top);

        pixRasterop(pix, left, top, pixGetWidth(block_pix), pixGetHeight(block_pix),

                    PIX_SRC & PIX_DST, block_pix, 0, 0);

      }

      CHECK(block_pix != nullptr);

      block_pix.destroy();

    } while (it->Next(level));

    //    if (base::GetFlag(FLAGS_v) >= 1)

    //      pixWrite(OutputNameToPath("rebuilt.png").c_str(), pix, IFF_PNG);

    pixRasterop(pix, 0, 0, width, height, PIX_SRC ^ PIX_DST, src_pix_, 0, 0);

    if (depth == 8) {

      Image binary_pix = pixThresholdToBinary(pix, 128);

      pix.destroy();

      pixInvert(binary_pix, binary_pix);

      pix = binary_pix;

    }

    //    if (base::GetFlag(FLAGS_v) >= 1)

    //      pixWrite(OutputNameToPath("rebuiltxor.png").c_str(), pix, IFF_PNG);

    l_int32 pixcount;

    pixCountPixels(pix, &pixcount, nullptr);

    if (pixcount > max_diff) {

      std::string outfile = OutputNameToPath("failedxor.png");

      LOG(INFO) << "outfile = " << outfile << "\n";

      pixWrite(outfile.c_str(), pix, IFF_PNG);

    }

    pix.destroy();

    LOG(INFO) << "At level " << level << ": pix diff = " << pixcount << "\n";

    EXPECT_LE(pixcount, max_diff);

    //    if (base::GetFlag(FLAGS_v) > 1) CHECK_LE(pixcount, max_diff);

  }


  // Rebuilds the text from the iterator strings at the given level, and

  // EXPECTs that the rebuild string exactly matches the truth string.

  void VerifyIteratorText(const std::string &truth, PageIteratorLevel level, ResultIterator *it) {

    LOG(INFO) << "Text Test Level " << level << "\n";

    it->Begin();

    std::string result;

    do {

      char *text = it->GetUTF8Text(level);

      result += text;

      delete[] text;

      if ((level == tesseract::RIL_WORD || level == tesseract::RIL_SYMBOL) &&

          it->IsAtFinalElement(tesseract::RIL_WORD, level)) {

        if (it->IsAtFinalElement(tesseract::RIL_TEXTLINE, level)) {

          result += '\n';

        } else {

          result += ' ';

        }

        if (it->IsAtFinalElement(tesseract::RIL_PARA, level) &&

            !(it->IsAtFinalElement(tesseract::RIL_BLOCK, level))) {

          result += '\n';

        }

      }

    } while (it->Next(level));

    EXPECT_STREQ(truth.c_str(), result.c_str()) << "Rebuild failed at Text Level " << level;

  }


  void VerifyRebuilds(int block_limit, int para_limit, int line_limit, int word_limit,

                      int symbol_limit, PageIterator *it, PageIteratorLevel maxlevel=tesseract::RIL_SYMBOL) {

    VerifyRebuild(block_limit, tesseract::RIL_BLOCK, it);

    VerifyRebuild(para_limit, tesseract::RIL_PARA, it);

    VerifyRebuild(line_limit, tesseract::RIL_TEXTLINE, it);

    VerifyRebuild(word_limit, tesseract::RIL_WORD, it);

    if (maxlevel == tesseract::RIL_SYMBOL) {

      VerifyRebuild(symbol_limit, maxlevel, it);

    }

  }


  void VerifyAllText(const std::string &truth, ResultIterator *it) {

    VerifyIteratorText(truth, tesseract::RIL_BLOCK, it);

    VerifyIteratorText(truth, tesseract::RIL_PARA, it);

    VerifyIteratorText(truth, tesseract::RIL_TEXTLINE, it);

    VerifyIteratorText(truth, tesseract::RIL_WORD, it);

    VerifyIteratorText(truth, tesseract::RIL_SYMBOL, it);

  }


  // Verifies that ResultIterator::CalculateTextlineOrder() produces the right

  // results given an array of word directions (word_dirs[num_words]), an

  // expected output reading order

  // (expected_reading_order[num_reading_order_entries]) and a given reading

  // context (ltr or rtl).

  void ExpectTextlineReadingOrder(bool in_ltr_context, const StrongScriptDirection *word_dirs,

                                  int num_words, int *expected_reading_order,

                                  int num_reading_order_entries) const {

    std::vector<StrongScriptDirection> gv_word_dirs;

    for (int i = 0; i < num_words; i++) {

      gv_word_dirs.push_back(word_dirs[i]);

    }


    std::vector<int> calculated_order;

    ResultIterator::CalculateTextlineOrder(in_ltr_context, gv_word_dirs, &calculated_order);

    // STL vector can be used with EXPECT_EQ, so convert...

    std::vector<int> correct_order(expected_reading_order,

                                   expected_reading_order + num_reading_order_entries);

    EXPECT_EQ(correct_order, calculated_order);

  }


  // Verify that ResultIterator::CalculateTextlineOrder() produces sane output

  // for a given array of word_dirs[num_words] in ltr or rtl context.

  // Sane means that the output contains some permutation of the indices

  // 0..[num_words - 1] interspersed optionally with negative (marker) values.

  void VerifySaneTextlineOrder(bool in_ltr_context, const StrongScriptDirection *word_dirs,

                               int num_words) const {

    std::vector<StrongScriptDirection> gv_word_dirs;

    for (int i = 0; i < num_words; i++) {

      gv_word_dirs.push_back(word_dirs[i]);

    }


    std::vector<int> output;

    ResultIterator::CalculateTextlineOrder(in_ltr_context, gv_word_dirs, &output);

    ASSERT_GE(output.size(), num_words);

    std::vector<int> output_copy(output);

    std::sort(output_copy.begin(), output_copy.end());

    bool sane = true;

    unsigned j = 0;

    while (j < output_copy.size() && output_copy[j] < 0) {

      j++;

    }

    for (int i = 0; i < num_words; i++, j++) {

      if (output_copy[j] != i) {

        sane = false;

        break;

      }

    }

    if (j != output_copy.size()) {

      sane = false;

    }

    if (!sane) {

      std::vector<int> empty;

      EXPECT_EQ(output, empty) << " permutation of 0.." << num_words - 1 << " not found in "

                               << (in_ltr_context ? "ltr" : "rtl") << " context.";

    }

  }


  // Objects declared here can be used by all tests in the test case for Foo.

  Image src_pix_; // Borrowed from api_. Do not destroy.

  std::string ocr_text_;

  tesseract::TessBaseAPI api_;

};


// Tests layout analysis output (and scrollview) on the UNLV page numbered

// 8087_054.3G.tif. (Dubrovnik), but only if --visual_test is true.

//

// TEST_F(ResultIteratorTest, VisualTest) {

//  if (!FLAGS_visual_test) return;

//  const char* kIms[] = {"8087_054.3G.tif", "8071_093.3B.tif", nullptr};

//  for (int i = 0; kIms[i] != nullptr; ++i) {

//    SetImage(kIms[i]);

//    // Just run layout analysis.

//    PageIterator* it = api_.AnalyseLayout();

//    EXPECT_FALSE(it == nullptr);

//    // Make a scrollview window for the display.

//    int width = pixGetWidth(src_pix_);

//    int height = pixGetHeight(src_pix_);

//    ScrollView* win =

//        new ScrollView(kIms[i], 100, 100, width / 2, height / 2, width, height);

//    win->Image(src_pix_, 0, 0);

//    it->Begin();

//    ScrollView::Color color = ScrollView::RED;

//    win->Brush(ScrollView::NONE);

//    do {

//      Pta* pts = it->BlockPolygon();

//      if (pts != nullptr) {

//        win->Pen(color);

//        int num_pts = ptaGetCount(pts);

//        l_float32 x, y;

//        ptaGetPt(pts, num_pts - 1, &x, &y);

//        win->SetCursor(static_cast<int>(x), static_cast<int>(y));

//        for (int p = 0; p < num_pts; ++p) {

//          ptaGetPt(pts, p, &x, &y);

//          win->DrawTo(static_cast<int>(x), static_cast<int>(y));

//        }

//      }

//      ptaDestroy(&pts);

//    } while (it->Next(tesseract::RIL_BLOCK));

//    win->Update();

//    delete win->AwaitEvent(SVET_DESTROY);

//    delete win;

//    delete it;

//  }

//}


// Tests that Tesseract gets exactly the right answer on phototest.
// Checks layout analysis, image and text rebuilds, the baseline of the first
// textline and (with the legacy engine) the font attributes of every word.
TEST_F(ResultIteratorTest, EasyTest) {
  SetImage("phototest.tif");
  // Just run layout analysis.
  PageIterator *p_it = api_.AnalyseLayout();
  // Fatal: everything below dereferences the iterator.
  ASSERT_TRUE(p_it != nullptr);
  // Check iterator position.
  EXPECT_TRUE(p_it->IsAtBeginningOf(tesseract::RIL_BLOCK));
  // This should be a single block.
  EXPECT_FALSE(p_it->Next(tesseract::RIL_BLOCK));
  EXPECT_FALSE(p_it->IsAtBeginningOf(tesseract::RIL_BLOCK));

  // The images should rebuild almost perfectly.
  LOG(INFO) << "Verifying image rebuilds 1 (pageiterator)"
            << "\n";
  VerifyRebuilds(10, 10, 0, 0, 0, p_it);
  delete p_it;

  char *result = api_.GetUTF8Text();
  // Assigning a null char* to a std::string is undefined behaviour.
  ASSERT_TRUE(result != nullptr);
  ocr_text_ = result;
  delete[] result;
  ResultIterator *r_it = api_.GetIterator();
  ASSERT_TRUE(r_it != nullptr);
  // The images should rebuild almost perfectly.
  LOG(INFO) << "Verifying image rebuilds 2a (resultiterator)"
            << "\n";
  VerifyRebuilds(8, 8, 0, 0, 40, r_it, tesseract::RIL_WORD);
  // Test the text.
  LOG(INFO) << "Verifying text rebuilds 1 (resultiterator)"
            << "\n";
  VerifyAllText(ocr_text_, r_it);

  // The images should rebuild almost perfectly.
  LOG(INFO) << "Verifying image rebuilds 2b (resultiterator)"
            << "\n";
  VerifyRebuilds(8, 8, 0, 0, 40, r_it, tesseract::RIL_WORD);

  r_it->Begin();
  // Test baseline of the first line.
  // Zero-initialized so a failing Baseline() cannot leave them undefined.
  int x1 = 0;
  int y1 = 0;
  int x2 = 0;
  int y2 = 0;
  EXPECT_TRUE(r_it->Baseline(tesseract::RIL_TEXTLINE, &x1, &y1, &x2, &y2));
  LOG(INFO) << "Baseline ("
     << x1 << ',' << y1 << ")->(" << x2 << ',' << y2 << ")\n";
  // Make sure we have a decent vector.
  EXPECT_GE(x2, x1 + 400);
  // The point 200,116 should be very close to the baseline.
  // (x3,y3) is the vector from (x1,y1) to (200,116)
  int x3 = 200 - x1;
  int y3 = 116 - y1;
  // Turn (x2,y2) into the baseline direction vector.
  x2 -= x1;
  y2 -= y1;
  // The cross product (x2,y2)x(x3,y3) should be small.
  int product = x2 * y3 - x3 * y2;
  EXPECT_LE(abs(product), x2);

  // Test font attributes for each word.
  do {
    float confidence = r_it->Confidence(tesseract::RIL_WORD);
#ifndef DISABLED_LEGACY_ENGINE
    int pointsize, font_id;
    bool bold, italic, underlined, monospace, serif, smallcaps;
    const char *font = r_it->WordFontAttributes(&bold, &italic, &underlined, &monospace, &serif,
                                                &smallcaps, &pointsize, &font_id);
    EXPECT_GE(confidence, 80.0f);
#endif
    char *word_str = r_it->GetUTF8Text(tesseract::RIL_WORD);
    // Streaming a null char* is undefined behaviour, so log a placeholder.
    const char *word_for_log = word_str != nullptr ? word_str : "(null)";

#ifdef DISABLED_LEGACY_ENGINE
    LOG(INFO) << "Word " << word_for_log << ", conf " << confidence << "\n";
#else
    LOG(INFO) << "Word " << word_for_log << " in font " << (font != nullptr ? font : "(null)")
      << ", id " << font_id << ", size " << pointsize
      << ", conf " << confidence << "\n";
#endif // def DISABLED_LEGACY_ENGINE
    delete[] word_str;
#ifndef DISABLED_LEGACY_ENGINE
    EXPECT_FALSE(bold);
    EXPECT_FALSE(italic);
    EXPECT_FALSE(underlined);
    EXPECT_FALSE(monospace);
    EXPECT_FALSE(serif);
    // The text is about 31 pixels high.  Above we say the source is 200 ppi,
    // which translates to:
    // 31 pixels / textline * (72 pts / inch) / (200 pixels / inch) = 11.16 pts
    EXPECT_GE(pointsize, 11.16 - 1.50);
    EXPECT_LE(pointsize, 11.16 + 1.50);
#endif // def DISABLED_LEGACY_ENGINE
  } while (r_it->Next(tesseract::RIL_WORD));
  delete r_it;
}


// Tests image rebuild on the UNLV page numbered 8087_054.3B.tif. (Dubrovnik)
TEST_F(ResultIteratorTest, ComplexTest) {
  SetImage("8087_054.3B.tif");
  // Just run layout analysis.
  PageIterator *it = api_.AnalyseLayout();
  // Fatal: VerifyRebuilds() dereferences the iterator.
  ASSERT_TRUE(it != nullptr);
  // The images should rebuild almost perfectly.
  VerifyRebuilds(2073, 2073, 2080, 2081, 2090, it);
  delete it;
}


// Tests image rebuild on the UNLV page numbered 8087_054.3G.tif. (Dubrovnik)
TEST_F(ResultIteratorTest, GreyTest) {
  SetImage("8087_054.3G.tif");
  // Just run layout analysis.
  PageIterator *it = api_.AnalyseLayout();
  // Fatal: VerifyRebuilds() dereferences the iterator.
  ASSERT_TRUE(it != nullptr);
  // The images should rebuild almost perfectly.
  VerifyRebuilds(600, 600, 600, 600, 600, it);
  delete it;
}


// Tests that Tesseract gets smallcaps and dropcaps.
// Walks every word of 8071_093.3B.tif, counting dropcap words, expected
// smallcaps words and smallcaps false positives, and checks that no symbol
// after the first of a word is reported as dropcap.
TEST_F(ResultIteratorTest, SmallCapDropCapTest) {
#ifdef DISABLED_LEGACY_ENGINE
  // Skip test as LSTM mode does not recognize smallcaps & dropcaps attributes.
  GTEST_SKIP();
#else
  SetImage("8071_093.3B.tif");
  // Force recognition; the text itself is not needed.
  char *result = api_.GetUTF8Text();
  delete[] result;
  ResultIterator *r_it = api_.GetIterator();
  // Fatal: the loop below dereferences the iterator.
  ASSERT_TRUE(r_it != nullptr);
  // Iterate over the words.
  int found_dropcaps = 0;
  int found_smallcaps = 0;
  int false_positives = 0;
  do {
    bool bold, italic, underlined, monospace, serif, smallcaps;
    int pointsize, font_id;
    r_it->WordFontAttributes(&bold, &italic, &underlined, &monospace, &serif, &smallcaps,
                             &pointsize, &font_id);
    char *word_str = r_it->GetUTF8Text(tesseract::RIL_WORD);
    if (word_str != nullptr) {
      LOG(INFO) << "Word " << word_str
        << " is " << (smallcaps ? "SMALLCAPS" : "Normal") << "\n";
      if (r_it->SymbolIsDropcap()) {
        ++found_dropcaps;
      }
      if (strcmp(word_str, "SHE") == 0 || strcmp(word_str, "MOPED") == 0 ||
          strcmp(word_str, "RALPH") == 0 || strcmp(word_str, "KINNEY") == 0 || // Not working yet.
          strcmp(word_str, "BENNETT") == 0) {
        EXPECT_TRUE(smallcaps) << word_str;
        ++found_smallcaps;
      } else {
        if (smallcaps) {
          ++false_positives;
        }
      }
      // No symbol other than the first of any word should be dropcap.
      ResultIterator s_it(*r_it);
      while (s_it.Next(tesseract::RIL_SYMBOL) && !s_it.IsAtBeginningOf(tesseract::RIL_WORD)) {
        if (s_it.SymbolIsDropcap()) {
          char *sym_str = s_it.GetUTF8Text(tesseract::RIL_SYMBOL);
          LOG(ERROR) << "Symbol " << sym_str << " of word " << word_str << " is dropcap";
          delete[] sym_str;
        }
        EXPECT_FALSE(s_it.SymbolIsDropcap());
      }
      delete[] word_str;
    }
  } while (r_it->Next(tesseract::RIL_WORD));
  delete r_it;
  EXPECT_EQ(1, found_dropcaps);
  // NOTE(review): as written this asserts found_smallcaps <= 4; confirm
  // whether "at least 4" (EXPECT_GE(found_smallcaps, 4)) was intended.
  EXPECT_GE(4, found_smallcaps);
  EXPECT_LE(false_positives, 3);
#endif // DISABLED_LEGACY_ENGINE
}


#if 0

// TODO(rays) uncomment on the next change to layout analysis.

// CL 22736106 breaks it, but it is fixed in the change when

// the textline finders start to collapse.


// Tests that Tesseract gets subscript and superscript.
// TODO(rays) This test is a bit feeble, due to bad textline finding on this
// image, so beef up the test a bit when we get less false positive subs.
TEST_F(ResultIteratorTest, SubSuperTest) {
  SetImage("0146_281.3B.tif");
  // Force recognition; the page text itself is discarded.
  delete[] api_.GetUTF8Text();
  ResultIterator *r_it = api_.GetIterator();
  // Accuracy isn't great, so only tally the symbol kinds and expect a decent
  // count of each.
  const char kAllowedSupers[] = "O0123456789-";
  int found_subs = 0;
  int found_supers = 0;
  int found_normal = 0;
  do {
    if (r_it->SymbolIsSubscript()) {
      ++found_subs;
      continue;
    }
    if (!r_it->SymbolIsSuperscript()) {
      ++found_normal;
      continue;
    }
    // Superscript: its first character must be one of the allowed ones.
    char *result = r_it->GetUTF8Text(tesseract::RIL_SYMBOL);
    if (strchr(kAllowedSupers, result[0]) == nullptr) {
      char *word = r_it->GetUTF8Text(tesseract::RIL_WORD);
      LOG(ERROR) << "Char " << result << " in word " << word << " is unexpected super!";
      delete[] word;
      EXPECT_TRUE(strchr(kAllowedSupers, result[0]) != nullptr);
    }
    delete[] result;
    ++found_supers;
  } while (r_it->Next(tesseract::RIL_SYMBOL));
  delete r_it;
  LOG(INFO) << "Subs = " << found_subs << ", supers= " << found_supers
    << ", normal = " << found_normal << "\n";
  EXPECT_GE(found_subs, 25);
  EXPECT_GE(found_supers, 25);
  EXPECT_GE(found_normal, 1350);
}

#endif


// Short aliases for the word directions used by the textline-order tests.
static constexpr StrongScriptDirection dL = DIR_LEFT_TO_RIGHT;
static constexpr StrongScriptDirection dR = DIR_RIGHT_TO_LEFT;
static constexpr StrongScriptDirection dN = DIR_NEUTRAL;


// A line that starts with left-to-right words on the left and ends with
// right-to-left words on the right can be read from either side; check that
// the paragraph context decides which run is the main one.
TEST_F(ResultIteratorTest, DualStartTextlineOrderTest) {
  const StrongScriptDirection dirs[] = {dL, dL, dN, dL, dN, dR, dR, dR};

  // LTR paragraph: the trailing RTL words form the minor run.
  int ltr_expected[] = {
      0, 1, 2, 3, 4, ResultIterator::kMinorRunStart, 7, 6, 5, ResultIterator::kMinorRunEnd};
  ExpectTextlineReadingOrder(true, dirs, countof(dirs), ltr_expected, countof(ltr_expected));

  // RTL paragraph: the leading LTR words form the minor run.
  int rtl_expected[] = {7, 6, 5, 4, ResultIterator::kMinorRunStart,
                        0, 1, 2, 3, ResultIterator::kMinorRunEnd};
  ExpectTextlineReadingOrder(false, dirs, countof(dirs), rtl_expected, countof(rtl_expected));
}


// Text made only of left-to-right and neutral words must come out strictly
// left to right, whatever the paragraph context.
TEST_F(ResultIteratorTest, LeftwardTextlineOrderTest) {
  const StrongScriptDirection dirs[] = {dL, dL, dN, dL, dN, dN, dL, dL};

  // Plain left-to-right order in an LTR paragraph.
  int ltr_expected[] = {0, 1, 2, 3, 4, 5, 6, 7};
  ExpectTextlineReadingOrder(true, dirs, countof(dirs), ltr_expected, countof(ltr_expected));

  // Should this line show up in an RTL paragraph, the whole of it is still
  // treated as one LTR run, wrapped in minor-run markers.
  int rtl_expected[] = {ResultIterator::kMinorRunStart, 0, 1, 2, 3, 4, 5, 6, 7,
                        ResultIterator::kMinorRunEnd};
  ExpectTextlineReadingOrder(false, dirs, countof(dirs), rtl_expected, countof(rtl_expected));
}


// Text made only of right-to-left and neutral words must come out strictly
// right to left in a right-to-left context.
TEST_F(ResultIteratorTest, RightwardTextlineOrderTest) {
  const StrongScriptDirection dirs[] = {dR, dR, dN, dR, dN, dN, dR, dR};
  // Simply the word indices in reverse.
  int rtl_expected[] = {7, 6, 5, 4, 3, 2, 1, 0};
  ExpectTextlineReadingOrder(false, dirs, countof(dirs), rtl_expected, countof(rtl_expected));
}


// Exhaustively checks CalculateTextlineOrder() on every 7-word sequence of
// direction values 0..3: in both contexts the output must contain each of
// the indices 0..6 exactly once.
TEST_F(ResultIteratorTest, TextlineOrderSanityCheck) {
  constexpr int kNumWords = 7;
  constexpr int kNumCombos = 1 << (2 * kNumWords); // 4 ^ 7 combinations
  StrongScriptDirection word_dirs[kNumWords];
  for (int combo = 0; combo < kNumCombos; ++combo) {
    // Decode the combination number as kNumWords base-4 digits, one per word.
    int digits = combo;
    for (int w = 0; w < kNumWords; ++w) {
      word_dirs[w] = static_cast<StrongScriptDirection>(digits % 4);
      digits /= 4;
    }
    VerifySaneTextlineOrder(true, word_dirs, kNumWords);
    VerifySaneTextlineOrder(false, word_dirs, kNumWords);
  }
}


// TODO: Missing image
// Checks that every character choice of every symbol of every word has
// non-null text.
TEST_F(ResultIteratorTest, DISABLED_NonNullChoicesTest) {
  SetImage("5318c4b679264.jpg");
  // Force recognition; the text itself is not needed.
  char *result = api_.GetUTF8Text();
  delete[] result;
  ResultIterator *r_it = api_.GetIterator();
  // Fatal: the loop below dereferences the iterator.
  ASSERT_TRUE(r_it != nullptr);
  // Iterate over the words.
  do {
    char *word_str = r_it->GetUTF8Text(tesseract::RIL_WORD);
    if (word_str != nullptr) {
      LOG(INFO) << "Word " << word_str << ":\n";
      // Walk the symbols of this word on a copy so r_it stays on the word.
      ResultIterator s_it = *r_it;
      do {
        tesseract::ChoiceIterator c_it(s_it);
        do {
          const char *char_str = c_it.GetUTF8Text();
          if (char_str == nullptr) {
            LOG(INFO) << "Null char choice"
                      << "\n";
          } else {
            LOG(INFO) << "Char choice " << char_str << "\n";
          }
          CHECK(char_str != nullptr);
        } while (c_it.Next());
      } while (!s_it.IsAtFinalElement(tesseract::RIL_WORD, tesseract::RIL_SYMBOL) &&
               s_it.Next(tesseract::RIL_SYMBOL));
      delete[] word_str;
    }
  } while (r_it->Next(tesseract::RIL_WORD));
  delete r_it;
}


// TODO: Missing image (presumably line6.tiff, which is commented out below;
// trainingitalline.tif is used instead - confirm).
// Checks that every word with text is non-empty at word and symbol level and
// that every one of its symbols has non-null text.
TEST_F(ResultIteratorTest, NonNullConfidencesTest) {
  //  SetImage("line6.tiff");
  SetImage("trainingitalline.tif");
  api_.SetPageSegMode(tesseract::PSM_SINGLE_BLOCK);
  // Force recognition so we can use the result iterator.
  // We don't care about the return from GetUTF8Text.
  char *result = api_.GetUTF8Text();
  delete[] result;
  ResultIterator *r_it = api_.GetIterator();
  // Fatal: the loop below dereferences the iterator.
  ASSERT_TRUE(r_it != nullptr);
  // Iterate over the words.
  do {
    char *word_str = r_it->GetUTF8Text(tesseract::RIL_WORD);
    if (word_str != nullptr) {
      EXPECT_FALSE(r_it->Empty(tesseract::RIL_WORD));
      EXPECT_FALSE(r_it->Empty(tesseract::RIL_SYMBOL));
      // Walk the symbols of this word on a copy so r_it stays on the word.
      ResultIterator s_it = *r_it;
      do {
        const char *char_str = s_it.GetUTF8Text(tesseract::RIL_SYMBOL);
        CHECK(char_str != nullptr);
        float confidence = s_it.Confidence(tesseract::RIL_SYMBOL);
        LOG(INFO) << "Char " << char_str << " has confidence " << confidence << "\n";
        delete[] char_str;
      } while (!s_it.IsAtFinalElement(tesseract::RIL_WORD, tesseract::RIL_SYMBOL) &&
               s_it.Next(tesseract::RIL_SYMBOL));
      delete[] word_str;
    } else {
      LOG(INFO) << "Empty word found"
                << "\n";
    }
  } while (r_it->Next(tesseract::RIL_WORD));
  delete r_it;
}


} // namespace tesseract

baseapi.h

resultiterator.h

scrollview.h

LOG
@ LOG
Definition: cleanapi_test.cc:19

log.h

ERROR
@ ERROR
Definition: log.h:28

INFO
@ INFO
Definition: log.h:28

i
int i
Definition: gmock-matchers_test.cc:718

GTEST_SKIP
#define GTEST_SKIP()
Definition: gtest.h:1889

EXPECT_EQ
#define EXPECT_EQ(val1, val2)
Definition: gtest.h:2043

EXPECT_GE
#define EXPECT_GE(val1, val2)
Definition: gtest.h:2051

EXPECT_TRUE
#define EXPECT_TRUE(condition)
Definition: gtest.h:1982

EXPECT_STREQ
#define EXPECT_STREQ(s1, s2)
Definition: gtest.h:2112

EXPECT_LE
#define EXPECT_LE(val1, val2)
Definition: gtest.h:2047

EXPECT_FALSE
#define EXPECT_FALSE(condition)
Definition: gtest.h:1986

ASSERT_GE
#define ASSERT_GE(val1, val2)
Definition: gtest.h:2089

include_gunit.h

CHECK
#define CHECK(condition)
Definition: include_gunit.h:76

tesseract
Definition: baseapi.h:39

tesseract::OEM_TESSERACT_ONLY
@ OEM_TESSERACT_ONLY
Definition: publictypes.h:264

tesseract::PSM_AUTO
@ PSM_AUTO
Fully automatic page segmentation, but no OSD.
Definition: publictypes.h:162

tesseract::PSM_SINGLE_BLOCK
@ PSM_SINGLE_BLOCK
Assume a single uniform block of text. (Default.)
Definition: publictypes.h:166

tesseract::StrongScriptDirection
StrongScriptDirection
Definition: unichar.h:41

tesseract::DIR_LEFT_TO_RIGHT
@ DIR_LEFT_TO_RIGHT
Definition: unichar.h:43

tesseract::DIR_RIGHT_TO_LEFT
@ DIR_RIGHT_TO_LEFT
Definition: unichar.h:44

tesseract::DIR_NEUTRAL
@ DIR_NEUTRAL
Definition: unichar.h:42

tesseract::countof
constexpr size_t countof(T const (&)[N]) noexcept
Definition: serialis.h:34

tesseract::PageIteratorLevel
PageIteratorLevel
Definition: publictypes.h:214

tesseract::RIL_BLOCK
@ RIL_BLOCK
Definition: publictypes.h:215

tesseract::RIL_PARA
@ RIL_PARA
Definition: publictypes.h:216

tesseract::RIL_TEXTLINE
@ RIL_TEXTLINE
Definition: publictypes.h:217

tesseract::RIL_SYMBOL
@ RIL_SYMBOL
Definition: publictypes.h:219

tesseract::RIL_WORD
@ RIL_WORD
Definition: publictypes.h:218

tesseract::TEST_F
TEST_F(EuroText, FastLatinOCR)
Definition: apiexample_test.cc:105

gmock_output_test.output
output
Definition: gmock_output_test.py:175

tesseract::TessBaseAPI
Definition: baseapi.h:76

tesseract::TessBaseAPI::SetPageSegMode
void SetPageSegMode(PageSegMode mode)
Definition: baseapi.cpp:511

tesseract::TessBaseAPI::Init
int Init(const char *datapath, const char *language, OcrEngineMode mode, char **configs, int configs_size, const std::vector< std::string > *vars_vec, const std::vector< std::string > *vars_values, bool set_only_non_debug_params)
Definition: baseapi.cpp:368

tesseract::TessBaseAPI::SetImage
void SetImage(const unsigned char *imagedata, int width, int height, int bytes_per_pixel, int bytes_per_line)
Definition: baseapi.cpp:576

tesseract::TessBaseAPI::GetInputImage
Pix * GetInputImage()
Definition: baseapi.cpp:924

tesseract::LTRResultIterator::WordFontAttributes
const char * WordFontAttributes(bool *is_bold, bool *is_italic, bool *is_underlined, bool *is_monospace, bool *is_serif, bool *is_smallcaps, int *pointsize, int *font_id) const
Definition: ltrresultiterator.cpp:158

tesseract::LTRResultIterator::SymbolIsDropcap
bool SymbolIsDropcap() const
Definition: ltrresultiterator.cpp:375

tesseract::LTRResultIterator::Confidence
float Confidence(PageIteratorLevel level) const
Definition: ltrresultiterator.cpp:97

tesseract::ChoiceIterator
Definition: ltrresultiterator.h:180

tesseract::ChoiceIterator::Next
bool Next()
Definition: ltrresultiterator.cpp:425

tesseract::ChoiceIterator::GetUTF8Text
const char * GetUTF8Text() const
Definition: ltrresultiterator.cpp:445

tesseract::PageIterator
Definition: pageiterator.h:50

tesseract::PageIterator::Next
virtual bool Next(PageIteratorLevel level)
Definition: pageiterator.cpp:149

tesseract::PageIterator::IsAtBeginningOf
virtual bool IsAtBeginningOf(PageIteratorLevel level) const
Definition: pageiterator.cpp:194

tesseract::PageIterator::Begin
virtual void Begin()
Definition: pageiterator.cpp:105

tesseract::PageIterator::GetImage
Pix * GetImage(PageIteratorLevel level, int padding, Pix *original_img, int *left, int *top) const
Definition: pageiterator.cpp:488

tesseract::PageIterator::Empty
bool Empty(PageIteratorLevel level) const
Definition: pageiterator.cpp:373

tesseract::PageIterator::Baseline
bool Baseline(PageIteratorLevel level, int *x1, int *y1, int *x2, int *y2) const
Definition: pageiterator.cpp:534

tesseract::PageIterator::GetBinaryImage
Pix * GetBinaryImage(PageIteratorLevel level) const
Definition: pageiterator.cpp:450

tesseract::PageIterator::BoundingBox
bool BoundingBox(PageIteratorLevel level, int *left, int *top, int *right, int *bottom) const
Definition: pageiterator.cpp:349

tesseract::ResultIterator
Definition: resultiterator.h:32

tesseract::ResultIterator::CalculateTextlineOrder
static void CalculateTextlineOrder(bool paragraph_is_ltr, const std::vector< StrongScriptDirection > &word_dirs, std::vector< int > *reading_order)
Definition: resultiterator.cpp:285

tesseract::ResultIterator::IsAtFinalElement
bool IsAtFinalElement(PageIteratorLevel level, PageIteratorLevel element) const override
Definition: resultiterator.cpp:614

tesseract::ResultIterator::kMinorRunEnd
static const int kMinorRunEnd
Definition: resultiterator.h:135

tesseract::ResultIterator::kMinorRunStart
static const int kMinorRunStart
Definition: resultiterator.h:134

tesseract::ResultIterator::GetUTF8Text
virtual char * GetUTF8Text(PageIteratorLevel level) const
Definition: resultiterator.cpp:650

tesseract::ResultIterator::IsAtBeginningOf
bool IsAtBeginningOf(PageIteratorLevel level) const override
Definition: resultiterator.cpp:565

tesseract::ResultIterator::Next
bool Next(PageIteratorLevel level) override
Definition: resultiterator.cpp:482

tesseract::ResultIterator::Begin
void Begin() override
Definition: resultiterator.cpp:474

tesseract::Image
Definition: image.h:25

tesseract::Image::destroy
void destroy()
Definition: image.cpp:32

file::MakeTmpdir
static void MakeTmpdir()
Definition: include_gunit.h:38

file::JoinPath
static std::string JoinPath(const std::string &s1, const std::string &s2)
Definition: include_gunit.h:65

tesseract::ResultIteratorTest
Definition: resultiterator_test.cc:17

tesseract::ResultIteratorTest::ocr_text_
std::string ocr_text_
Definition: resultiterator_test.cc:211

tesseract::ResultIteratorTest::api_
tesseract::TessBaseAPI api_
Definition: resultiterator_test.cc:212

tesseract::ResultIteratorTest::VerifyAllText
void VerifyAllText(const std::string &truth, ResultIterator *it)
Definition: resultiterator_test.cc:143

tesseract::ResultIteratorTest::OutputNameToPath
std::string OutputNameToPath(const std::string &name)
Definition: resultiterator_test.cc:25

tesseract::ResultIteratorTest::TessdataPath
std::string TessdataPath()
Definition: resultiterator_test.cc:22

tesseract::ResultIteratorTest::VerifyIteratorText
void VerifyIteratorText(const std::string &truth, PageIteratorLevel level, ResultIterator *it)
Definition: resultiterator_test.cc:108

tesseract::ResultIteratorTest::TestDataNameToPath
std::string TestDataNameToPath(const std::string &name)
Definition: resultiterator_test.cc:19

tesseract::ResultIteratorTest::VerifyRebuild
void VerifyRebuild(int max_diff, PageIteratorLevel level, PageIterator *it)
Definition: resultiterator_test.cc:49

tesseract::ResultIteratorTest::ExpectTextlineReadingOrder
void ExpectTextlineReadingOrder(bool in_ltr_context, const StrongScriptDirection *word_dirs, int num_words, int *expected_reading_order, int num_reading_order_entries) const
Definition: resultiterator_test.cc:156

tesseract::ResultIteratorTest::VerifyRebuilds
void VerifyRebuilds(int block_limit, int para_limit, int line_limit, int word_limit, int symbol_limit, PageIterator *it, PageIteratorLevel maxlevel=tesseract::RIL_SYMBOL)
Definition: resultiterator_test.cc:132

tesseract::ResultIteratorTest::VerifySaneTextlineOrder
void VerifySaneTextlineOrder(bool in_ltr_context, const StrongScriptDirection *word_dirs, int num_words) const
Definition: resultiterator_test.cc:176

tesseract::ResultIteratorTest::~ResultIteratorTest
~ResultIteratorTest() override=default

tesseract::ResultIteratorTest::ResultIteratorTest
ResultIteratorTest()
Definition: resultiterator_test.cc:30

tesseract::ResultIteratorTest::SetImage
void SetImage(const char *filename)
Definition: resultiterator_test.cc:35

tesseract::ResultIteratorTest::src_pix_
Image src_pix_
Definition: resultiterator_test.cc:210

testing::Test
Definition: gtest.h:414