Restore the OCR languages

Restore the OCR languages to the state they were in as of commit
66d3c40163, with some minor changes. We can now do so because we
download all the trained models, not just the ones that Alpine Linux
offers.
This commit is contained in:
Alex Pyrgiotis 2023-05-18 23:54:43 +03:00
parent a0d6f0d719
commit 35e439f9e8
No known key found for this signature in database
GPG key ID: B6C15EBA0357C9AA

View file

@@ -1,66 +1,130 @@
{ {
"Afrikaans": "arf", "Afrikaans": "afr",
"Amharic": "amh",
"Arabic": "ara", "Arabic": "ara",
"Assamese": "asm", "Assamese": "asm",
"Azerbaijani": "aze", "Azerbaijani": "aze",
"Azerbaijani (Cyrillic)": "aze_cyrl",
"Belarusian": "bel", "Belarusian": "bel",
"Bengali": "ben", "Bengali": "ben",
"Tibetan Standard": "bod",
"Bosnian": "bos",
"Breton": "bre",
"Bulgarian": "bul", "Bulgarian": "bul",
"Catalan": "cat", "Catalan": "cat",
"Cebuano": "ceb",
"Czech": "ces", "Czech": "ces",
"Chinese - Simplified": "chi_sim", "Chinese - Simplified": "chi_sim",
"Chinese - Simplified (vertical)": "chi_sim_vert",
"Chinese - Traditional": "chi_tra", "Chinese - Traditional": "chi_tra",
"Chinese - Traditional (vertical)": "chi_tra_vert",
"Cherokee": "chr", "Cherokee": "chr",
"Corsican": "cos",
"Welsh": "cym",
"Danish": "dan", "Danish": "dan",
"Danish - Fraktur": "dan_frak",
"German": "deu", "German": "deu",
"German - Fraktur": "deu_frak",
"Divehi": "div",
"Dzongkha": "dzo",
"Greek": "ell", "Greek": "ell",
"English": "eng", "English": "eng",
"English, Middle (1100-1500)": "enm", "English, Middle (1100-1500)": "enm",
"Esperanto": "epo", "Esperanto": "epo",
"Estonian": "est", "Estonian": "est",
"Basque": "eus", "Basque": "eus",
"Faroese": "fao",
"Persian": "fas",
"Filipino": "fil",
"Finnish": "fin", "Finnish": "fin",
"French": "fra", "French": "fra",
"Frankish": "frk", "Frankish": "frk",
"French, Middle (ca.1400-1600)": "frm", "French, Middle (ca.1400-1600)": "frm",
"Frisian (Western)": "fry",
"Gaelic (Scots)": "gla",
"Irish": "gle",
"Galician": "glg", "Galician": "glg",
"Greek, Ancient, to 1453": "grc", "Greek, Ancient (to 1453)": "grc",
"Gujarati": "guj",
"Haitian": "hat",
"Hebrew": "heb", "Hebrew": "heb",
"Hindi": "hin", "Hindi": "hin",
"Croatian": "hrv", "Croatian": "hrv",
"Hungarian": "hun", "Hungarian": "hun",
"Armenian": "hye",
"Inuktitut": "iku",
"Indonesian": "ind", "Indonesian": "ind",
"Icelandic": "isl", "Icelandic": "isl",
"Italian": "ita", "Italian": "ita",
"Italian - Old": "ita_old", "Italian - Old": "ita_old",
"Javanese": "jav",
"Japanese": "jpn", "Japanese": "jpn",
"Japanese (vertical)": "jpn_vert",
"Kannada": "kan", "Kannada": "kan",
"Georgian": "kat", "Georgian": "kat",
"Old Georgian": "kat_old",
"Kazakh": "kaz",
"Khmer": "khm",
"Kyrgyz": "kir",
"Kurmanji (Kurdish - Latin Script)": "kmr",
"Korean": "kor", "Korean": "kor",
"Korean (vertical)": "kor_vert",
"Kurdish (Arabic)": "kur_ara",
"Lao": "lao",
"Latin": "lat",
"Latvian": "lav", "Latvian": "lav",
"Lithuanian": "lit", "Lithuanian": "lit",
"Luxembourgish": "ltz",
"Malayalam": "mal", "Malayalam": "mal",
"Marathi": "mar",
"Macedonian": "mkd", "Macedonian": "mkd",
"Maltese": "mlt", "Maltese": "mlt",
"Mongolian": "mon",
"Maori": "mri",
"Malay": "msa", "Malay": "msa",
"Burmese": "mya",
"Nepali": "nep",
"Dutch": "nld", "Dutch": "nld",
"Norwegian": "nor", "Norwegian": "nor",
"Occitan (post 1500)": "oci",
"Oriya": "ori",
"Punjabi": "pan",
"Polish": "pol", "Polish": "pol",
"Portuguese": "por", "Portuguese": "por",
"Pashto": "pus",
"Quechua": "que",
"Romanian": "ron", "Romanian": "ron",
"Russian": "rus", "Russian": "rus",
"Sanskrit": "san",
"Sinhala": "sin",
"Slovakian": "slk", "Slovakian": "slk",
"Slovak - Fraktur": "slk_frak",
"Slovenian": "slv",
"Sindhi": "snd",
"Spanish": "spa", "Spanish": "spa",
"Spanish; Castilian - Old": "spa_old", "Spanish; Castilian - Old": "spa_old",
"Albanian": "sqi", "Albanian": "sqi",
"Serbian": "srp", "Serbian": "srp",
"Serbian (Latin)": "srp_latn",
"Sundanese": "sun",
"Swahili": "swa", "Swahili": "swa",
"Swedish": "swe", "Swedish": "swe",
"Syriac": "syr",
"Tamil": "tam", "Tamil": "tam",
"Tatar": "tat",
"Telugu": "tel", "Telugu": "tel",
"Filipino": "tgl", "Tajik": "tgk",
"Tagalog (new - Filipino)": "tgl",
"Thai": "tha", "Thai": "tha",
"Tigrinya": "tir",
"Tonga": "ton",
"Turkish": "tur", "Turkish": "tur",
"Uyghur": "uig",
"Ukrainian": "ukr", "Ukrainian": "ukr",
"Vietnamese": "vie" "Urdu": "urd",
"Uzbek": "uzb",
"Uzbek (Cyrillic)": "uzb_cyrl",
"Vietnamese": "vie",
"Yiddish": "yid",
"Yoruba": "yor"
} }