mirror of
https://github.com/freedomofpress/dangerzone.git
synced 2025-04-28 18:02:38 +02:00
tesseract: add new languages and others
Tagalog was replaced with Filipino [1] in newer tesseract versions, so it
makes sense for us to use the new name and map it to the old
"tgl" name (Tagalog) under the hood.
Language names obtained from tesseract's man page [2].
[1]: 58f7a72f00
[2]: https://github.com/tesseract-ocr/tesseract/blob/main/doc/tesseract.1.asc
This commit is contained in:
parent
d8d83ff036
commit
58332fdd6e
1 changed files with 6 additions and 3 deletions
|
@ -24,6 +24,7 @@
|
||||||
"Frankish": "frk",
|
"Frankish": "frk",
|
||||||
"French, Middle (ca.1400-1600)": "frm",
|
"French, Middle (ca.1400-1600)": "frm",
|
||||||
"Galician": "glg",
|
"Galician": "glg",
|
||||||
|
"Greek, Ancient, to 1453": "grc",
|
||||||
"Hebrew": "heb",
|
"Hebrew": "heb",
|
||||||
"Hindi": "hin",
|
"Hindi": "hin",
|
||||||
"Croatian": "hrv",
|
"Croatian": "hrv",
|
||||||
|
@ -50,14 +51,16 @@
|
||||||
"Russian": "rus",
|
"Russian": "rus",
|
||||||
"Slovakian": "slk",
|
"Slovakian": "slk",
|
||||||
"Spanish": "spa",
|
"Spanish": "spa",
|
||||||
"Spanish": "spa_old",
|
"Spanish; Castilian - Old": "spa_old",
|
||||||
"Albanian": "sqi",
|
"Albanian": "sqi",
|
||||||
"Serbian": "srp",
|
"Serbian": "srp",
|
||||||
"Swahili": "swa",
|
"Swahili": "swa",
|
||||||
"Swedish": "swe",
|
"Swedish": "swe",
|
||||||
"Tamil": "tam",
|
"Tamil": "tam",
|
||||||
"Telugu": "tel",
|
"Telugu": "tel",
|
||||||
|
"Filipino": "tgl",
|
||||||
"Thai": "tha",
|
"Thai": "tha",
|
||||||
"Turkish": "tur",
|
"Turkish": "tur",
|
||||||
"Ukrainian": "ukr"
|
"Ukrainian": "ukr",
|
||||||
}
|
"Vietnamese": "vie"
|
||||||
|
}
|
||||||
|
|
Loading…
Reference in a new issue