mirror of
https://github.com/tesseract-ocr/tesseract.git
synced 2024-12-18 11:28:51 +08:00
Merge pull request #2268 from Shreeshrii/grapheme
Remove test for Word started with a combiner
This commit is contained in:
commit
9ddf267907
@ -15,11 +15,12 @@ bool ValidateGrapheme::ConsumeGraphemeIfValid() {
|
||||
char32 ch = codes_[codes_used_].second;
|
||||
const bool is_combiner =
|
||||
cc == CharClass::kCombiner || cc == CharClass::kVirama;
|
||||
// Reject easily detected badly formed sequences.
|
||||
if (prev_cc == CharClass::kWhitespace && is_combiner) {
|
||||
if (report_errors_) tprintf("Word started with a combiner:0x%x\n", ch);
|
||||
return false;
|
||||
}
|
||||
// TODO: Reject easily detected badly formed sequences.
|
||||
// https://github.com/tesseract-ocr/tesseract/pull/2266#issuecomment-467114751
|
||||
// if (prev_cc == CharClass::kWhitespace && is_combiner) {
|
||||
// if (report_errors_) tprintf("Word started with a combiner:0x%x\n", ch);
|
||||
// return false;
|
||||
//}
|
||||
if (prev_cc == CharClass::kVirama && cc == CharClass::kVirama) {
|
||||
if (report_errors_)
|
||||
tprintf("Two grapheme links in a row:0x%x 0x%x\n", prev_ch, ch);
|
||||
|
Loading…
Reference in New Issue
Block a user