Separate ner from classification

This commit is contained in:
Eike Kettner
2021-01-13 21:41:51 +01:00
parent f02f15e5bd
commit a699e87304
12 changed files with 25 additions and 28 deletions

View File

@@ -1,4 +1,4 @@
-package docspell.analysis.nlp
+package docspell.analysis.classifier
import minitest._
import cats.effect._

View File

@@ -13,7 +13,7 @@ object TextAnalyserSuite extends SimpleTestSuite {
test("find english ner labels") {
val labels =
-StanfordNerClassifier.runClassifier(englishClassifier, TestFiles.letterENText)
+StanfordNerAnnotator.nerAnnotate(englishClassifier, TestFiles.letterENText)
val expect = Vector(
NerLabel("Derek", NerTag.Person, 0, 5),
NerLabel("Jeter", NerTag.Person, 6, 11),
@@ -49,7 +49,7 @@ object TextAnalyserSuite extends SimpleTestSuite {
test("find german ner labels") {
val labels =
-StanfordNerClassifier.runClassifier(germanClassifier, TestFiles.letterDEText)
+StanfordNerAnnotator.nerAnnotate(germanClassifier, TestFiles.letterDEText)
val expect = Vector(
NerLabel("Max", NerTag.Person, 0, 3),
NerLabel("Mustermann", NerTag.Person, 4, 14),