Remove test for Word started with a combiner

This commit is contained in:
Shree 2019-02-25 18:47:42 +00:00
parent 8e83b209c6
commit 449f1cd4ba

View File

@ -15,11 +15,12 @@ bool ValidateGrapheme::ConsumeGraphemeIfValid() {
char32 ch = codes_[codes_used_].second;
const bool is_combiner =
cc == CharClass::kCombiner || cc == CharClass::kVirama;
// Reject easily detected badly formed sequences.
if (prev_cc == CharClass::kWhitespace && is_combiner) {
if (report_errors_) tprintf("Word started with a combiner:0x%x\n", ch);
return false;
}
// TODO: Reject easily detected badly formed sequences.
// https://github.com/tesseract-ocr/tesseract/pull/2266#issuecomment-467114751
// if (prev_cc == CharClass::kWhitespace && is_combiner) {
// if (report_errors_) tprintf("Word started with a combiner:0x%x\n", ch);
// return false;
//}
if (prev_cc == CharClass::kVirama && cc == CharClass::kVirama) {
if (report_errors_)
tprintf("Two grapheme links in a row:0x%x 0x%x\n", prev_ch, ch);