diff --git a/doc/tesseract.1.asc b/doc/tesseract.1.asc index 489584c555..053fca8da7 100644 --- a/doc/tesseract.1.asc +++ b/doc/tesseract.1.asc @@ -119,124 +119,124 @@ The currently available traineddata files for tesseract 4.00 for the following languages are in (in https://github.com/tesseract-ocr/tessdata_fast): -*afr* (Afrikaans) -*amh* (Amharic) -*ara* (Arabic) -*asm* (Assamese) -*aze* (Azerbaijani) -*aze_cyrl* (Azerbaijani - Cyrilic) -*bel* (Belarusian) -*ben* (Bengali) -*bod* (Tibetan) -*bos* (Bosnian) -*bul* (Bulgarian) -*cat* (Catalan; Valencian) -*ceb* (Cebuano) -*ces* (Czech) -*chi_sim* (Chinese - Simplified) -*chi_tra* (Chinese - Traditional) -*chr* (Cherokee) -*cym* (Welsh) -*dan* (Danish) -*dan_frak* (Danish - Fraktur) -*deu* (German) -*deu_frak* (German - Fraktur) -*dzo* (Dzongkha) -*ell* (Greek, Modern (1453-)) -*eng* (English) -*enm* (English, Middle (1100-1500)) -*epo* (Esperanto) -*equ* (Math / equation detection module) -*est* (Estonian) -*eus* (Basque) -*fas* (Persian) -*fin* (Finnish) -*fra* (French) -*frk* (Frankish) -*frm* (French, Middle (ca.1400-1600)) -*gle* (Irish) -*glg* (Galician) -*grc* (Greek, Ancient (to 1453)) -*guj* (Gujarati) -*hat* (Haitian; Haitian Creole) -*heb* (Hebrew) -*hin* (Hindi) -*hrv* (Croatian) -*hun* (Hungarian) -*iku* (Inuktitut) -*ind* (Indonesian) -*isl* (Icelandic) -*ita* (Italian) -*ita_old* (Italian - Old) -*jav* (Javanese) -*jpn* (Japanese) -*kan* (Kannada) -*kat* (Georgian) -*kat_old* (Georgian - Old) -*kaz* (Kazakh) -*khm* (Central Khmer) -*kir* (Kirghiz; Kyrgyz) -*kor* (Korean) -*kor_vert* (Korean (vertical)) -*kur* (Kurdish) -*kur_ara* (Kurdish (Arabic)) -*lao* (Lao) -*lat* (Latin) -*lav* (Latvian) -*lit* (Lithuanian) -*ltz* (Luxembourgish) -*mal* (Malayalam) -*mar* (Marathi) -*mkd* (Macedonian) -*mlt* (Maltese) -*mon* (Mongolian) -*mri* (Maori) -*msa* (Malay) -*mya* (Burmese) -*nep* (Nepali) -*nld* (Dutch; Flemish) -*nor* (Norwegian) -*oci* (Occitan (post 1500)) -*ori* (Oriya) -*osd* (Orientation and 
script detection module) -*pan* (Panjabi; Punjabi) -*pol* (Polish) -*por* (Portuguese) -*pus* (Pushto; Pashto) -*que* (Quechua) -*ron* (Romanian; Moldavian; Moldovan) -*rus* (Russian) -*san* (Sanskrit) -*sin* (Sinhala; Sinhalese) -*slk* (Slovak) -*slk_frak* (Slovak - Fraktur) -*slv* (Slovenian) -*snd* (Sindhi) -*spa* (Spanish; Castilian) -*spa_old* (Spanish; Castilian - Old) -*sqi* (Albanian) -*srp* (Serbian) -*srp_latn* (Serbian - Latin) -*sun* (Sundanese) -*swa* (Swahili) -*swe* (Swedish) -*syr* (Syriac) -*tam* (Tamil) -*tat* (Tatar) -*tel* (Telugu) -*tgk* (Tajik) -*tgl* (Tagalog) -*tha* (Thai) -*tir* (Tigrinya) -*ton* (Tonga) -*tur* (Turkish) -*uig* (Uighur; Uyghur) -*ukr* (Ukrainian) -*urd* (Urdu) -*uzb* (Uzbek) -*uzb_cyrl* (Uzbek - Cyrilic) -*vie* (Vietnamese) -*yid* (Yiddish) +*afr* (Afrikaans), +*amh* (Amharic), +*ara* (Arabic), +*asm* (Assamese), +*aze* (Azerbaijani), +*aze_cyrl* (Azerbaijani - Cyrillic), +*bel* (Belarusian), +*ben* (Bengali), +*bod* (Tibetan), +*bos* (Bosnian), +*bul* (Bulgarian), +*cat* (Catalan; Valencian), +*ceb* (Cebuano), +*ces* (Czech), +*chi_sim* (Chinese - Simplified), +*chi_tra* (Chinese - Traditional), +*chr* (Cherokee), +*cym* (Welsh), +*dan* (Danish), +*dan_frak* (Danish - Fraktur), +*deu* (German), +*deu_frak* (German - Fraktur), +*dzo* (Dzongkha), +*ell* (Greek, Modern (1453-)), +*eng* (English), +*enm* (English, Middle (1100-1500)), +*epo* (Esperanto), +*equ* (Math / equation detection module), +*est* (Estonian), +*eus* (Basque), +*fas* (Persian), +*fin* (Finnish), +*fra* (French), +*frk* (Frankish), +*frm* (French, Middle (ca.1400-1600)), +*gle* (Irish), +*glg* (Galician), +*grc* (Greek, Ancient (to 1453)), +*guj* (Gujarati), +*hat* (Haitian; Haitian Creole), +*heb* (Hebrew), +*hin* (Hindi), +*hrv* (Croatian), +*hun* (Hungarian), +*iku* (Inuktitut), +*ind* (Indonesian), +*isl* (Icelandic), +*ita* (Italian), +*ita_old* (Italian - Old), +*jav* (Javanese), +*jpn* (Japanese), +*kan* (Kannada), +*kat* (Georgian), +*kat_old* 
(Georgian - Old), +*kaz* (Kazakh), +*khm* (Central Khmer), +*kir* (Kirghiz; Kyrgyz), +*kor* (Korean), +*kor_vert* (Korean (vertical)), +*kur* (Kurdish), +*kur_ara* (Kurdish (Arabic)), +*lao* (Lao), +*lat* (Latin), +*lav* (Latvian), +*lit* (Lithuanian), +*ltz* (Luxembourgish), +*mal* (Malayalam), +*mar* (Marathi), +*mkd* (Macedonian), +*mlt* (Maltese), +*mon* (Mongolian), +*mri* (Maori), +*msa* (Malay), +*mya* (Burmese), +*nep* (Nepali), +*nld* (Dutch; Flemish), +*nor* (Norwegian), +*oci* (Occitan (post 1500)), +*ori* (Oriya), +*osd* (Orientation and script detection module), +*pan* (Panjabi; Punjabi), +*pol* (Polish), +*por* (Portuguese), +*pus* (Pushto; Pashto), +*que* (Quechua), +*ron* (Romanian; Moldavian; Moldovan), +*rus* (Russian), +*san* (Sanskrit), +*sin* (Sinhala; Sinhalese), +*slk* (Slovak), +*slk_frak* (Slovak - Fraktur), +*slv* (Slovenian), +*snd* (Sindhi), +*spa* (Spanish; Castilian), +*spa_old* (Spanish; Castilian - Old), +*sqi* (Albanian), +*srp* (Serbian), +*srp_latn* (Serbian - Latin), +*sun* (Sundanese), +*swa* (Swahili), +*swe* (Swedish), +*syr* (Syriac), +*tam* (Tamil), +*tat* (Tatar), +*tel* (Telugu), +*tgk* (Tajik), +*tgl* (Tagalog), +*tha* (Thai), +*tir* (Tigrinya), +*ton* (Tonga), +*tur* (Turkish), +*uig* (Uighur; Uyghur), +*ukr* (Ukrainian), +*urd* (Urdu), +*uzb* (Uzbek), +*uzb_cyrl* (Uzbek - Cyrillic), +*vie* (Vietnamese), +*yid* (Yiddish), *yor* (Yoruba) To use a non-standard language pack named *foo.traineddata*, set the