mirror of
https://github.com/TheAnachronism/docspell.git
synced 2025-06-22 02:18:26 +00:00
Updating Stanford CoreNLP to 4.3.2; adding more languages
NLP models for Spanish are available and have now been added. Hungarian has also been added to the list of supported languages (mainly for Tesseract; there are no NLP models for it).
This commit is contained in:
@ -30,7 +30,7 @@ object Language {
|
||||
override val allowsNLP = true
|
||||
}
|
||||
object NLPLanguage {
|
||||
val all: NonEmptyList[NLPLanguage] = NonEmptyList.of(German, English, French)
|
||||
val all: NonEmptyList[NLPLanguage] = NonEmptyList.of(German, English, French, Spanish)
|
||||
}
|
||||
|
||||
case object German extends NLPLanguage {
|
||||
@ -53,11 +53,16 @@ object Language {
|
||||
val iso3 = "ita"
|
||||
}
|
||||
|
||||
case object Spanish extends Language {
|
||||
case object Spanish extends NLPLanguage {
|
||||
val iso2 = "es"
|
||||
val iso3 = "spa"
|
||||
}
|
||||
|
||||
case object Hungarian extends Language {
|
||||
val iso2 = "hu"
|
||||
val iso3 = "hun"
|
||||
}
|
||||
|
||||
case object Portuguese extends Language {
|
||||
val iso2 = "pt"
|
||||
val iso3 = "por"
|
||||
@ -125,6 +130,7 @@ object Language {
|
||||
French,
|
||||
Italian,
|
||||
Spanish,
|
||||
Hungarian,
|
||||
Dutch,
|
||||
Portuguese,
|
||||
Czech,
|
||||
|
Reference in New Issue
Block a user