diff --git a/modules/joex/src/main/resources/reference.conf b/modules/joex/src/main/resources/reference.conf
index 059e6d05..bd0de234 100644
--- a/modules/joex/src/main/resources/reference.conf
+++ b/modules/joex/src/main/resources/reference.conf
@@ -169,7 +169,7 @@ docspell.joex {
     # below, OCR is run afterwards. Then both extracted texts are
     # compared and the longer will be used.
     pdf {
-      min-text-len = 10
+      min-text-len = 500
     }

     # Extracting text using OCR works for image and pdf files. It will