42 return ConsumeConsonantHeadIfValid() && ConsumeConsonantTailIfValid();
45 return ConsumeVowelIfValid();
59 tprintf(
"Invalid start of grapheme sequence:%c=0x%x\n",
74bool ValidateJavanese::ConsumeViramaIfValid(IndicPair joiner,
bool post_matra) {
75 const unsigned num_codes =
codes_.size();
82 tprintf(
"ZWJ after a post-matra virama!!\n");
102 tprintf(
"Virama ZWJ ZWNJ in non-Sinhala: base=0x%x!\n",
static_cast<int>(
script_));
127 tprintf(
"Invalid pre-virama joiner with no 2nd consonant!!\n");
146bool ValidateJavanese::ConsumeConsonantHeadIfValid() {
147 const unsigned num_codes =
codes_.size();
152 int index =
output_.size() - 3;
158 bool have_nukta =
false;
164 index =
output_.size() - 2 - have_nukta;
177 tprintf(
"Skipping ending joiner: 0x%x 0x%x\n",
output_.back(), joiner.second);
182 output_.push_back(joiner.second);
185 tprintf(
"Skipping unnecessary joiner: 0x%x 0x%x 0x%x\n",
output_.back(), joiner.second,
192 if (!ConsumeViramaIfValid(joiner,
false)) {
207bool ValidateJavanese::ConsumeConsonantTailIfValid() {
258bool ValidateJavanese::ConsumeVowelIfValid() {
void tprintf(const char *format,...)
bool ConsumeGraphemeIfValid() override
Validator::CharClass UnicodeToCharClass(char32 ch) const override
static const char32 kZeroWidthNonJoiner
std::vector< char32 > output_
bool UseMultiCode(unsigned length)
void MultiCodePart(unsigned length)
static bool IsVirama(char32 unicode)
static const int kIndicCodePageSize
std::pair< CharClass, char32 > IndicPair
bool IsSubscriptScript() const
std::vector< IndicPair > codes_
static const char32 kZeroWidthJoiner