@@ -119,124 +119,124 @@ The currently available traineddata files for tesseract 4.00
119
119
for the following languages are in
120
120
https://github.com/tesseract-ocr/tessdata_fast:
121
121
122
- *afr* (Afrikaans)
123
- *amh* (Amharic)
124
- *ara* (Arabic)
125
- *asm* (Assamese)
126
- *aze* (Azerbaijani)
127
- *aze_cyrl* (Azerbaijani - Cyrillic)
128
- *bel* (Belarusian)
129
- *ben* (Bengali)
130
- *bod* (Tibetan)
131
- *bos* (Bosnian)
132
- *bul* (Bulgarian)
133
- *cat* (Catalan; Valencian)
134
- *ceb* (Cebuano)
135
- *ces* (Czech)
136
- *chi_sim* (Chinese - Simplified)
137
- *chi_tra* (Chinese - Traditional)
138
- *chr* (Cherokee)
139
- *cym* (Welsh)
140
- *dan* (Danish)
141
- *dan_frak* (Danish - Fraktur)
142
- *deu* (German)
143
- *deu_frak* (German - Fraktur)
144
- *dzo* (Dzongkha)
145
- *ell* (Greek, Modern (1453-))
146
- *eng* (English)
147
- *enm* (English, Middle (1100-1500))
148
- *epo* (Esperanto)
149
- *equ* (Math / equation detection module)
150
- *est* (Estonian)
151
- *eus* (Basque)
152
- *fas* (Persian)
153
- *fin* (Finnish)
154
- *fra* (French)
155
- *frk* (Frankish)
156
- *frm* (French, Middle (ca.1400-1600))
157
- *gle* (Irish)
158
- *glg* (Galician)
159
- *grc* (Greek, Ancient (to 1453))
160
- *guj* (Gujarati)
161
- *hat* (Haitian; Haitian Creole)
162
- *heb* (Hebrew)
163
- *hin* (Hindi)
164
- *hrv* (Croatian)
165
- *hun* (Hungarian)
166
- *iku* (Inuktitut)
167
- *ind* (Indonesian)
168
- *isl* (Icelandic)
169
- *ita* (Italian)
170
- *ita_old* (Italian - Old)
171
- *jav* (Javanese)
172
- *jpn* (Japanese)
173
- *kan* (Kannada)
174
- *kat* (Georgian)
175
- *kat_old* (Georgian - Old)
176
- *kaz* (Kazakh)
177
- *khm* (Central Khmer)
178
- *kir* (Kirghiz; Kyrgyz)
179
- *kor* (Korean)
180
- *kor_vert* (Korean (vertical))
181
- *kur* (Kurdish)
182
- *kur_ara* (Kurdish (Arabic))
183
- *lao* (Lao)
184
- *lat* (Latin)
185
- *lav* (Latvian)
186
- *lit* (Lithuanian)
187
- *ltz* (Luxembourgish)
188
- *mal* (Malayalam)
189
- *mar* (Marathi)
190
- *mkd* (Macedonian)
191
- *mlt* (Maltese)
192
- *mon* (Mongolian)
193
- *mri* (Maori)
194
- *msa* (Malay)
195
- *mya* (Burmese)
196
- *nep* (Nepali)
197
- *nld* (Dutch; Flemish)
198
- *nor* (Norwegian)
199
- *oci* (Occitan (post 1500))
200
- *ori* (Oriya)
201
- *osd* (Orientation and script detection module)
202
- *pan* (Panjabi; Punjabi)
203
- *pol* (Polish)
204
- *por* (Portuguese)
205
- *pus* (Pushto; Pashto)
206
- *que* (Quechua)
207
- *ron* (Romanian; Moldavian; Moldovan)
208
- *rus* (Russian)
209
- *san* (Sanskrit)
210
- *sin* (Sinhala; Sinhalese)
211
- *slk* (Slovak)
212
- *slk_frak* (Slovak - Fraktur)
213
- *slv* (Slovenian)
214
- *snd* (Sindhi)
215
- *spa* (Spanish; Castilian)
216
- *spa_old* (Spanish; Castilian - Old)
217
- *sqi* (Albanian)
218
- *srp* (Serbian)
219
- *srp_latn* (Serbian - Latin)
220
- *sun* (Sundanese)
221
- *swa* (Swahili)
222
- *swe* (Swedish)
223
- *syr* (Syriac)
224
- *tam* (Tamil)
225
- *tat* (Tatar)
226
- *tel* (Telugu)
227
- *tgk* (Tajik)
228
- *tgl* (Tagalog)
229
- *tha* (Thai)
230
- *tir* (Tigrinya)
231
- *ton* (Tonga)
232
- *tur* (Turkish)
233
- *uig* (Uighur; Uyghur)
234
- *ukr* (Ukrainian)
235
- *urd* (Urdu)
236
- *uzb* (Uzbek)
237
- *uzb_cyrl* (Uzbek - Cyrillic)
238
- *vie* (Vietnamese)
239
- *yid* (Yiddish)
122
+ *afr* (Afrikaans),
123
+ *amh* (Amharic),
124
+ *ara* (Arabic),
125
+ *asm* (Assamese),
126
+ *aze* (Azerbaijani),
127
+ *aze_cyrl* (Azerbaijani - Cyrillic),
128
+ *bel* (Belarusian),
129
+ *ben* (Bengali),
130
+ *bod* (Tibetan),
131
+ *bos* (Bosnian),
132
+ *bul* (Bulgarian),
133
+ *cat* (Catalan; Valencian),
134
+ *ceb* (Cebuano),
135
+ *ces* (Czech),
136
+ *chi_sim* (Chinese - Simplified),
137
+ *chi_tra* (Chinese - Traditional),
138
+ *chr* (Cherokee),
139
+ *cym* (Welsh),
140
+ *dan* (Danish),
141
+ *dan_frak* (Danish - Fraktur),
142
+ *deu* (German),
143
+ *deu_frak* (German - Fraktur),
144
+ *dzo* (Dzongkha),
145
+ *ell* (Greek, Modern (1453-)),
146
+ *eng* (English),
147
+ *enm* (English, Middle (1100-1500)),
148
+ *epo* (Esperanto),
149
+ *equ* (Math / equation detection module),
150
+ *est* (Estonian),
151
+ *eus* (Basque),
152
+ *fas* (Persian),
153
+ *fin* (Finnish),
154
+ *fra* (French),
155
+ *frk* (Frankish),
156
+ *frm* (French, Middle (ca.1400-1600)),
157
+ *gle* (Irish),
158
+ *glg* (Galician),
159
+ *grc* (Greek, Ancient (to 1453)),
160
+ *guj* (Gujarati),
161
+ *hat* (Haitian; Haitian Creole),
162
+ *heb* (Hebrew),
163
+ *hin* (Hindi),
164
+ *hrv* (Croatian),
165
+ *hun* (Hungarian),
166
+ *iku* (Inuktitut),
167
+ *ind* (Indonesian),
168
+ *isl* (Icelandic),
169
+ *ita* (Italian),
170
+ *ita_old* (Italian - Old),
171
+ *jav* (Javanese),
172
+ *jpn* (Japanese),
173
+ *kan* (Kannada),
174
+ *kat* (Georgian),
175
+ *kat_old* (Georgian - Old),
176
+ *kaz* (Kazakh),
177
+ *khm* (Central Khmer),
178
+ *kir* (Kirghiz; Kyrgyz),
179
+ *kor* (Korean),
180
+ *kor_vert* (Korean (vertical)),
181
+ *kur* (Kurdish),
182
+ *kur_ara* (Kurdish (Arabic)),
183
+ *lao* (Lao),
184
+ *lat* (Latin),
185
+ *lav* (Latvian),
186
+ *lit* (Lithuanian),
187
+ *ltz* (Luxembourgish),
188
+ *mal* (Malayalam),
189
+ *mar* (Marathi),
190
+ *mkd* (Macedonian),
191
+ *mlt* (Maltese),
192
+ *mon* (Mongolian),
193
+ *mri* (Maori),
194
+ *msa* (Malay),
195
+ *mya* (Burmese),
196
+ *nep* (Nepali),
197
+ *nld* (Dutch; Flemish),
198
+ *nor* (Norwegian),
199
+ *oci* (Occitan (post 1500)),
200
+ *ori* (Oriya),
201
+ *osd* (Orientation and script detection module),
202
+ *pan* (Panjabi; Punjabi),
203
+ *pol* (Polish),
204
+ *por* (Portuguese),
205
+ *pus* (Pushto; Pashto),
206
+ *que* (Quechua),
207
+ *ron* (Romanian; Moldavian; Moldovan),
208
+ *rus* (Russian),
209
+ *san* (Sanskrit),
210
+ *sin* (Sinhala; Sinhalese),
211
+ *slk* (Slovak),
212
+ *slk_frak* (Slovak - Fraktur),
213
+ *slv* (Slovenian),
214
+ *snd* (Sindhi),
215
+ *spa* (Spanish; Castilian),
216
+ *spa_old* (Spanish; Castilian - Old),
217
+ *sqi* (Albanian),
218
+ *srp* (Serbian),
219
+ *srp_latn* (Serbian - Latin),
220
+ *sun* (Sundanese),
221
+ *swa* (Swahili),
222
+ *swe* (Swedish),
223
+ *syr* (Syriac),
224
+ *tam* (Tamil),
225
+ *tat* (Tatar),
226
+ *tel* (Telugu),
227
+ *tgk* (Tajik),
228
+ *tgl* (Tagalog),
229
+ *tha* (Thai),
230
+ *tir* (Tigrinya),
231
+ *ton* (Tonga),
232
+ *tur* (Turkish),
233
+ *uig* (Uighur; Uyghur),
234
+ *ukr* (Ukrainian),
235
+ *urd* (Urdu),
236
+ *uzb* (Uzbek),
237
+ *uzb_cyrl* (Uzbek - Cyrillic),
238
+ *vie* (Vietnamese),
239
+ *yid* (Yiddish),
240
240
*yor* (Yoruba)
241
241
242
242
To use a non-standard language pack named *foo.traineddata*, set the
0 commit comments