mirror of
https://github.com/tesseract-ocr/tesseract.git
synced 2025-01-18 14:41:36 +08:00
add commas to language list
This commit is contained in:
parent
035325dfd0
commit
44588a3c7c
@@ -119,124 +119,124 @@ The currently available traineddata files for tesseract 4.00
|
||||
for the following languages are in
|
||||
(in https://github.com/tesseract-ocr/tessdata_fast):
|
||||
|
||||
*afr* (Afrikaans)
|
||||
*amh* (Amharic)
|
||||
*ara* (Arabic)
|
||||
*asm* (Assamese)
|
||||
*aze* (Azerbaijani)
|
||||
*aze_cyrl* (Azerbaijani - Cyrillic)
|
||||
*bel* (Belarusian)
|
||||
*ben* (Bengali)
|
||||
*bod* (Tibetan)
|
||||
*bos* (Bosnian)
|
||||
*bul* (Bulgarian)
|
||||
*cat* (Catalan; Valencian)
|
||||
*ceb* (Cebuano)
|
||||
*ces* (Czech)
|
||||
*chi_sim* (Chinese - Simplified)
|
||||
*chi_tra* (Chinese - Traditional)
|
||||
*chr* (Cherokee)
|
||||
*cym* (Welsh)
|
||||
*dan* (Danish)
|
||||
*dan_frak* (Danish - Fraktur)
|
||||
*deu* (German)
|
||||
*deu_frak* (German - Fraktur)
|
||||
*dzo* (Dzongkha)
|
||||
*ell* (Greek, Modern (1453-))
|
||||
*eng* (English)
|
||||
*enm* (English, Middle (1100-1500))
|
||||
*epo* (Esperanto)
|
||||
*equ* (Math / equation detection module)
|
||||
*est* (Estonian)
|
||||
*eus* (Basque)
|
||||
*fas* (Persian)
|
||||
*fin* (Finnish)
|
||||
*fra* (French)
|
||||
*frk* (Frankish)
|
||||
*frm* (French, Middle (ca.1400-1600))
|
||||
*gle* (Irish)
|
||||
*glg* (Galician)
|
||||
*grc* (Greek, Ancient (to 1453))
|
||||
*guj* (Gujarati)
|
||||
*hat* (Haitian; Haitian Creole)
|
||||
*heb* (Hebrew)
|
||||
*hin* (Hindi)
|
||||
*hrv* (Croatian)
|
||||
*hun* (Hungarian)
|
||||
*iku* (Inuktitut)
|
||||
*ind* (Indonesian)
|
||||
*isl* (Icelandic)
|
||||
*ita* (Italian)
|
||||
*ita_old* (Italian - Old)
|
||||
*jav* (Javanese)
|
||||
*jpn* (Japanese)
|
||||
*kan* (Kannada)
|
||||
*kat* (Georgian)
|
||||
*kat_old* (Georgian - Old)
|
||||
*kaz* (Kazakh)
|
||||
*khm* (Central Khmer)
|
||||
*kir* (Kirghiz; Kyrgyz)
|
||||
*kor* (Korean)
|
||||
*kor_vert* (Korean (vertical))
|
||||
*kur* (Kurdish)
|
||||
*kur_ara* (Kurdish (Arabic))
|
||||
*lao* (Lao)
|
||||
*lat* (Latin)
|
||||
*lav* (Latvian)
|
||||
*lit* (Lithuanian)
|
||||
*ltz* (Luxembourgish)
|
||||
*mal* (Malayalam)
|
||||
*mar* (Marathi)
|
||||
*mkd* (Macedonian)
|
||||
*mlt* (Maltese)
|
||||
*mon* (Mongolian)
|
||||
*mri* (Maori)
|
||||
*msa* (Malay)
|
||||
*mya* (Burmese)
|
||||
*nep* (Nepali)
|
||||
*nld* (Dutch; Flemish)
|
||||
*nor* (Norwegian)
|
||||
*oci* (Occitan (post 1500))
|
||||
*ori* (Oriya)
|
||||
*osd* (Orientation and script detection module)
|
||||
*pan* (Panjabi; Punjabi)
|
||||
*pol* (Polish)
|
||||
*por* (Portuguese)
|
||||
*pus* (Pushto; Pashto)
|
||||
*que* (Quechua)
|
||||
*ron* (Romanian; Moldavian; Moldovan)
|
||||
*rus* (Russian)
|
||||
*san* (Sanskrit)
|
||||
*sin* (Sinhala; Sinhalese)
|
||||
*slk* (Slovak)
|
||||
*slk_frak* (Slovak - Fraktur)
|
||||
*slv* (Slovenian)
|
||||
*snd* (Sindhi)
|
||||
*spa* (Spanish; Castilian)
|
||||
*spa_old* (Spanish; Castilian - Old)
|
||||
*sqi* (Albanian)
|
||||
*srp* (Serbian)
|
||||
*srp_latn* (Serbian - Latin)
|
||||
*sun* (Sundanese)
|
||||
*swa* (Swahili)
|
||||
*swe* (Swedish)
|
||||
*syr* (Syriac)
|
||||
*tam* (Tamil)
|
||||
*tat* (Tatar)
|
||||
*tel* (Telugu)
|
||||
*tgk* (Tajik)
|
||||
*tgl* (Tagalog)
|
||||
*tha* (Thai)
|
||||
*tir* (Tigrinya)
|
||||
*ton* (Tonga)
|
||||
*tur* (Turkish)
|
||||
*uig* (Uighur; Uyghur)
|
||||
*ukr* (Ukrainian)
|
||||
*urd* (Urdu)
|
||||
*uzb* (Uzbek)
|
||||
*uzb_cyrl* (Uzbek - Cyrillic)
|
||||
*vie* (Vietnamese)
|
||||
*yid* (Yiddish)
|
||||
*afr* (Afrikaans),
|
||||
*amh* (Amharic),
|
||||
*ara* (Arabic),
|
||||
*asm* (Assamese),
|
||||
*aze* (Azerbaijani),
|
||||
*aze_cyrl* (Azerbaijani - Cyrillic),
|
||||
*bel* (Belarusian),
|
||||
*ben* (Bengali),
|
||||
*bod* (Tibetan),
|
||||
*bos* (Bosnian),
|
||||
*bul* (Bulgarian),
|
||||
*cat* (Catalan; Valencian),
|
||||
*ceb* (Cebuano),
|
||||
*ces* (Czech),
|
||||
*chi_sim* (Chinese - Simplified),
|
||||
*chi_tra* (Chinese - Traditional),
|
||||
*chr* (Cherokee),
|
||||
*cym* (Welsh),
|
||||
*dan* (Danish),
|
||||
*dan_frak* (Danish - Fraktur),
|
||||
*deu* (German),
|
||||
*deu_frak* (German - Fraktur),
|
||||
*dzo* (Dzongkha),
|
||||
*ell* (Greek, Modern (1453-)),
|
||||
*eng* (English),
|
||||
*enm* (English, Middle (1100-1500)),
|
||||
*epo* (Esperanto),
|
||||
*equ* (Math / equation detection module),
|
||||
*est* (Estonian),
|
||||
*eus* (Basque),
|
||||
*fas* (Persian),
|
||||
*fin* (Finnish),
|
||||
*fra* (French),
|
||||
*frk* (Frankish),
|
||||
*frm* (French, Middle (ca.1400-1600)),
|
||||
*gle* (Irish),
|
||||
*glg* (Galician),
|
||||
*grc* (Greek, Ancient (to 1453)),
|
||||
*guj* (Gujarati),
|
||||
*hat* (Haitian; Haitian Creole),
|
||||
*heb* (Hebrew),
|
||||
*hin* (Hindi),
|
||||
*hrv* (Croatian),
|
||||
*hun* (Hungarian),
|
||||
*iku* (Inuktitut),
|
||||
*ind* (Indonesian),
|
||||
*isl* (Icelandic),
|
||||
*ita* (Italian),
|
||||
*ita_old* (Italian - Old),
|
||||
*jav* (Javanese),
|
||||
*jpn* (Japanese),
|
||||
*kan* (Kannada),
|
||||
*kat* (Georgian),
|
||||
*kat_old* (Georgian - Old),
|
||||
*kaz* (Kazakh),
|
||||
*khm* (Central Khmer),
|
||||
*kir* (Kirghiz; Kyrgyz),
|
||||
*kor* (Korean),
|
||||
*kor_vert* (Korean (vertical)),
|
||||
*kur* (Kurdish),
|
||||
*kur_ara* (Kurdish (Arabic)),
|
||||
*lao* (Lao),
|
||||
*lat* (Latin),
|
||||
*lav* (Latvian),
|
||||
*lit* (Lithuanian),
|
||||
*ltz* (Luxembourgish),
|
||||
*mal* (Malayalam),
|
||||
*mar* (Marathi),
|
||||
*mkd* (Macedonian),
|
||||
*mlt* (Maltese),
|
||||
*mon* (Mongolian),
|
||||
*mri* (Maori),
|
||||
*msa* (Malay),
|
||||
*mya* (Burmese),
|
||||
*nep* (Nepali),
|
||||
*nld* (Dutch; Flemish),
|
||||
*nor* (Norwegian),
|
||||
*oci* (Occitan (post 1500)),
|
||||
*ori* (Oriya),
|
||||
*osd* (Orientation and script detection module),
|
||||
*pan* (Panjabi; Punjabi),
|
||||
*pol* (Polish),
|
||||
*por* (Portuguese),
|
||||
*pus* (Pushto; Pashto),
|
||||
*que* (Quechua),
|
||||
*ron* (Romanian; Moldavian; Moldovan),
|
||||
*rus* (Russian),
|
||||
*san* (Sanskrit),
|
||||
*sin* (Sinhala; Sinhalese),
|
||||
*slk* (Slovak),
|
||||
*slk_frak* (Slovak - Fraktur),
|
||||
*slv* (Slovenian),
|
||||
*snd* (Sindhi),
|
||||
*spa* (Spanish; Castilian),
|
||||
*spa_old* (Spanish; Castilian - Old),
|
||||
*sqi* (Albanian),
|
||||
*srp* (Serbian),
|
||||
*srp_latn* (Serbian - Latin),
|
||||
*sun* (Sundanese),
|
||||
*swa* (Swahili),
|
||||
*swe* (Swedish),
|
||||
*syr* (Syriac),
|
||||
*tam* (Tamil),
|
||||
*tat* (Tatar),
|
||||
*tel* (Telugu),
|
||||
*tgk* (Tajik),
|
||||
*tgl* (Tagalog),
|
||||
*tha* (Thai),
|
||||
*tir* (Tigrinya),
|
||||
*ton* (Tonga),
|
||||
*tur* (Turkish),
|
||||
*uig* (Uighur; Uyghur),
|
||||
*ukr* (Ukrainian),
|
||||
*urd* (Urdu),
|
||||
*uzb* (Uzbek),
|
||||
*uzb_cyrl* (Uzbek - Cyrillic),
|
||||
*vie* (Vietnamese),
|
||||
*yid* (Yiddish),
|
||||
*yor* (Yoruba)
|
||||
|
||||
To use a non-standard language pack named *foo.traineddata*, set the
|
||||
|
Loading…
Reference in New Issue
Block a user