diff --git a/modules/joex/src/main/scala/docspell/joex/process/ConvertPdf.scala b/modules/joex/src/main/scala/docspell/joex/process/ConvertPdf.scala index 57292563..84828e19 100644 --- a/modules/joex/src/main/scala/docspell/joex/process/ConvertPdf.scala +++ b/modules/joex/src/main/scala/docspell/joex/process/ConvertPdf.scala @@ -40,14 +40,14 @@ object ConvertPdf { Task { ctx => def convert(ra: RAttachment): F[(RAttachment, Option[RAttachmentMeta])] = isConverted(ctx)(ra).flatMap { - case true => + case true if ctx.args.isNormalProcessing => ctx.logger.info( s"Conversion to pdf already done for attachment ${ra.name}." ) *> ctx.store .transact(RAttachmentMeta.findById(ra.id)) .map(rmOpt => (ra, rmOpt)) - case false => + case _ => findMime(ctx)(ra).flatMap(m => convertSafe(cfg, JsoupSanitizer.clean, ctx, item)(ra, m) ) diff --git a/modules/joex/src/main/scala/docspell/joex/process/TextExtraction.scala b/modules/joex/src/main/scala/docspell/joex/process/TextExtraction.scala index fcdd6f98..2dcc4d31 100644 --- a/modules/joex/src/main/scala/docspell/joex/process/TextExtraction.scala +++ b/modules/joex/src/main/scala/docspell/joex/process/TextExtraction.scala @@ -84,10 +84,10 @@ object TextExtraction { val rm = item.findOrCreate(ra.id, lang) rm.content match { - case Some(_) => + case Some(_) if ctx.args.isNormalProcessing => ctx.logger.info("TextExtraction skipped, since text is already available.") *> makeTextData((rm, Nil)).pure[F] - case None => + case _ => extractTextToMeta[F](ctx, cfg, lang, item)(ra) .map(makeTextData) }