diff --git a/unittest/README.md b/unittest/README.md index 0a5591f2..bf4f83fe 100644 --- a/unittest/README.md +++ b/unittest/README.md @@ -1,5 +1,82 @@ -Unit Testing for Tesseract ----------- +# Unit Testing for Tesseract + + +## Requirements + +### Files and structure +``` + +├── langdata_lstm +│   ├── common.punc +│   ├── common.unicharambigs +│   ├── desired_bigrams.txt +│   ├── eng +│   │   ├── desired_characters +│   │   ├── eng.config +│   │   ├── eng.numbers +│   │   ├── eng.punc +│   │   ├── eng.singles_text +│   │   ├── eng.training_text +│   │   ├── eng.unicharambigs +│   │   ├── eng.wordlist +│   │   └── okfonts.txt +│   ├── extended +│   │   └── extended.config +│   ├── extendedhin +│   │   └── extendedhin.config +│   ├── font_properties +│   ├── forbidden_characters_default +│   ├── hin +│   │   ├── hin.config +│   │   ├── hin.numbers +│   │   ├── hin.punc +│   │   └── hin.wordlist +│   ├── kan +│   │   └── kan.config +│   ├── kor +│   │   └── kor.config +│   ├── osd +│   │   └── osd.unicharset +│   └── radical-stroke.txt +├── tessdata +│   ├── ara.traineddata +│   ├── chi_tra.traineddata +│   ├── eng.traineddata +│   ├── heb.traineddata +│   ├── hin.traineddata +│   ├── jpn.traineddata +│   ├── kmr.traineddata +│   ├── osd.traineddata +│   └── vie.traineddata +├── tessdata_best +│   ├── eng.traineddata +│   ├── fra.traineddata +│   ├── kmr.traineddata +│   └── osd.traineddata +├── tessdata_fast +│   ├── eng.traineddata +│   ├── kmr.traineddata +│   ├── osd.traineddata +│   └── script +│   └── Latin.traineddata +└── tesseract + ├── abseil + ... + ├── test + ├── unittest + └── VERSION +``` + +### Fonts + +* Microsoft fonts: arialbi.ttf, times.ttf, verdana.ttf - [instalation guide](https://www.makeuseof.com/tag/how-to-install-microsoft-core-fonts-in-ubuntu-linux/) +* [ae_Arab.ttf](https://www.wfonts.com/download/data/2014/12/03/ae-arab/ae-arab.zip) +* dejavu-fonts: [DejaVuSans-ExtraLight.ttf](https://dejavu-fonts.github.io/Download.html) +* [Lohit-Hindi.ttf](https://raw.githubusercontent.com/pratul/packageofpractices/master/assets/fonts/Lohit-Hindi.ttf) +* [UnBatang.ttf](https://raw.githubusercontent.com/byrongibson/fonts/master/backup/truetype.original/unfonts-core/UnBatang.ttf) + + +## Run tests To run the tests, do the following in tesseract folder