mirror of
https://github.com/TheAnachronism/docspell.git
synced 2025-02-22 14:03:26 +00:00
commit
216f69c322
@ -14,6 +14,7 @@ import fs2.Stream
|
||||
import docspell.backend.ops.OItemSearch._
|
||||
import docspell.common._
|
||||
import docspell.store._
|
||||
import docspell.store.file.FileMetadata
|
||||
import docspell.store.queries.{QAttachment, QItem}
|
||||
import docspell.store.records._
|
||||
|
||||
@ -89,18 +90,21 @@ object OItemSearch {
|
||||
trait BinaryData[F[_]] {
|
||||
def data: Stream[F, Byte]
|
||||
def name: Option[String]
|
||||
def meta: RFileMeta
|
||||
def fileId: Ident
|
||||
def meta: FileMetadata
|
||||
def fileId: FileKey
|
||||
}
|
||||
case class AttachmentData[F[_]](ra: RAttachment, meta: RFileMeta, data: Stream[F, Byte])
|
||||
extends BinaryData[F] {
|
||||
case class AttachmentData[F[_]](
|
||||
ra: RAttachment,
|
||||
meta: FileMetadata,
|
||||
data: Stream[F, Byte]
|
||||
) extends BinaryData[F] {
|
||||
val name = ra.name
|
||||
val fileId = ra.fileId
|
||||
}
|
||||
|
||||
case class AttachmentSourceData[F[_]](
|
||||
rs: RAttachmentSource,
|
||||
meta: RFileMeta,
|
||||
meta: FileMetadata,
|
||||
data: Stream[F, Byte]
|
||||
) extends BinaryData[F] {
|
||||
val name = rs.name
|
||||
@ -109,7 +113,7 @@ object OItemSearch {
|
||||
|
||||
case class AttachmentPreviewData[F[_]](
|
||||
rs: RAttachmentPreview,
|
||||
meta: RFileMeta,
|
||||
meta: FileMetadata,
|
||||
data: Stream[F, Byte]
|
||||
) extends BinaryData[F] {
|
||||
val name = rs.name
|
||||
@ -118,7 +122,7 @@ object OItemSearch {
|
||||
|
||||
case class AttachmentArchiveData[F[_]](
|
||||
rs: RAttachmentArchive,
|
||||
meta: RFileMeta,
|
||||
meta: FileMetadata,
|
||||
data: Stream[F, Byte]
|
||||
) extends BinaryData[F] {
|
||||
val name = rs.name
|
||||
@ -188,7 +192,7 @@ object OItemSearch {
|
||||
AttachmentData[F](
|
||||
ra,
|
||||
m,
|
||||
store.fileStore.getBytes(m.id)
|
||||
store.fileRepo.getBytes(m.id)
|
||||
)
|
||||
}
|
||||
|
||||
@ -208,7 +212,7 @@ object OItemSearch {
|
||||
AttachmentSourceData[F](
|
||||
ra,
|
||||
m,
|
||||
store.fileStore.getBytes(m.id)
|
||||
store.fileRepo.getBytes(m.id)
|
||||
)
|
||||
}
|
||||
|
||||
@ -228,7 +232,7 @@ object OItemSearch {
|
||||
AttachmentPreviewData[F](
|
||||
ra,
|
||||
m,
|
||||
store.fileStore.getBytes(m.id)
|
||||
store.fileRepo.getBytes(m.id)
|
||||
)
|
||||
}
|
||||
|
||||
@ -248,7 +252,7 @@ object OItemSearch {
|
||||
AttachmentPreviewData[F](
|
||||
ra,
|
||||
m,
|
||||
store.fileStore.getBytes(m.id)
|
||||
store.fileRepo.getBytes(m.id)
|
||||
)
|
||||
}
|
||||
|
||||
@ -268,7 +272,7 @@ object OItemSearch {
|
||||
AttachmentArchiveData[F](
|
||||
ra,
|
||||
m,
|
||||
store.fileStore.getBytes(m.id)
|
||||
store.fileRepo.getBytes(m.id)
|
||||
)
|
||||
}
|
||||
|
||||
@ -276,9 +280,11 @@ object OItemSearch {
|
||||
(None: Option[AttachmentArchiveData[F]]).pure[F]
|
||||
}
|
||||
|
||||
private def makeBinaryData[A](fileId: Ident)(f: RFileMeta => A): F[Option[A]] =
|
||||
store.fileStore
|
||||
.findMeta(fileId)
|
||||
private def makeBinaryData[A](fileId: FileKey)(f: FileMetadata => A): F[Option[A]] =
|
||||
OptionT(
|
||||
store.fileRepo
|
||||
.findMeta(fileId)
|
||||
)
|
||||
.map(fm => f(fm))
|
||||
.value
|
||||
|
||||
|
@ -249,7 +249,7 @@ object OMail {
|
||||
} yield {
|
||||
val addAttach = m.attach.filter(ras).map { a =>
|
||||
Attach[F](
|
||||
store.fileStore.getBytes(a._2.id)
|
||||
store.fileRepo.getBytes(a._2.id)
|
||||
).withFilename(a._1.name)
|
||||
.withLength(a._2.length.bytes)
|
||||
.withMimeType(a._2.mimetype.toEmil)
|
||||
|
@ -126,7 +126,7 @@ object OUpload {
|
||||
): F[OUpload.UploadResult] =
|
||||
(for {
|
||||
_ <- checkExistingItem(itemId, account.collective)
|
||||
files <- right(data.files.traverse(saveFile).map(_.flatten))
|
||||
files <- right(data.files.traverse(saveFile(account)).map(_.flatten))
|
||||
_ <- checkFileList(files)
|
||||
lang <- data.meta.language match {
|
||||
case Some(lang) => right(lang.pure[F])
|
||||
@ -200,10 +200,18 @@ object OUpload {
|
||||
} yield UploadResult.Success
|
||||
|
||||
/** Saves the file into the database. */
|
||||
private def saveFile(file: File[F]): F[Option[ProcessItemArgs.File]] =
|
||||
private def saveFile(
|
||||
accountId: AccountId
|
||||
)(file: File[F]): F[Option[ProcessItemArgs.File]] =
|
||||
logger.finfo(s"Receiving file $file") *>
|
||||
file.data
|
||||
.through(store.fileStore.save(MimeTypeHint(file.name, None)))
|
||||
.through(
|
||||
store.fileRepo.save(
|
||||
accountId.collective,
|
||||
FileCategory.AttachmentSource,
|
||||
MimeTypeHint(file.name, None)
|
||||
)
|
||||
)
|
||||
.compile
|
||||
.lastOrError
|
||||
.attempt
|
||||
|
@ -0,0 +1,46 @@
|
||||
/*
|
||||
* Copyright 2020 Eike K. & Contributors
|
||||
*
|
||||
* SPDX-License-Identifier: AGPL-3.0-or-later
|
||||
*/
|
||||
|
||||
package docspell.common
|
||||
|
||||
import cats.data.NonEmptyList
|
||||
|
||||
import docspell.common
|
||||
|
||||
import io.circe.{Decoder, Encoder}
|
||||
|
||||
/** This is used to have a rough idea for what a file is used in the system. It is part of
|
||||
* the file-key to identify a file, backends could ignore it, since the file-id (the last
|
||||
* part of the file-key) should be globally unique anyways.
|
||||
*/
|
||||
sealed trait FileCategory { self: Product =>
|
||||
final def id: Ident =
|
||||
Ident.unsafe(self.productPrefix.toLowerCase)
|
||||
|
||||
def toFileKey(collective: Ident, fileId: Ident): FileKey =
|
||||
common.FileKey(collective, this, fileId)
|
||||
}
|
||||
|
||||
object FileCategory {
|
||||
// Impl note: Changing constants here requires a database migration!
|
||||
|
||||
case object AttachmentSource extends FileCategory
|
||||
case object AttachmentConvert extends FileCategory
|
||||
case object PreviewImage extends FileCategory
|
||||
case object Classifier extends FileCategory
|
||||
|
||||
val all: NonEmptyList[FileCategory] =
|
||||
NonEmptyList.of(AttachmentSource, AttachmentConvert, PreviewImage, Classifier)
|
||||
|
||||
def fromString(str: String): Either[String, FileCategory] =
|
||||
all.find(_.id.id == str).toRight(s"Unknown category: $str")
|
||||
|
||||
implicit val jsonDecoder: Decoder[FileCategory] =
|
||||
Decoder[String].emap(fromString)
|
||||
|
||||
implicit val jsonEncoder: Encoder[FileCategory] =
|
||||
Encoder[String].contramap(_.id.id)
|
||||
}
|
21
modules/common/src/main/scala/docspell/common/FileKey.scala
Normal file
21
modules/common/src/main/scala/docspell/common/FileKey.scala
Normal file
@ -0,0 +1,21 @@
|
||||
/*
|
||||
* Copyright 2020 Eike K. & Contributors
|
||||
*
|
||||
* SPDX-License-Identifier: AGPL-3.0-or-later
|
||||
*/
|
||||
|
||||
package docspell.common
|
||||
|
||||
import io.circe.generic.semiauto.{deriveDecoder, deriveEncoder}
|
||||
import io.circe.{Decoder, Encoder}
|
||||
|
||||
case class FileKey(collective: Ident, category: FileCategory, id: Ident)
|
||||
|
||||
object FileKey {
|
||||
|
||||
implicit val jsonDecoder: Decoder[FileKey] =
|
||||
deriveDecoder[FileKey]
|
||||
|
||||
implicit val jsonEncoder: Encoder[FileKey] =
|
||||
deriveEncoder[FileKey]
|
||||
}
|
@ -25,13 +25,15 @@ case class Ident(id: String) {
|
||||
!isEmpty
|
||||
|
||||
def /(next: Ident): Ident =
|
||||
new Ident(id + "." + next.id)
|
||||
new Ident(id + Ident.concatChar + next.id)
|
||||
}
|
||||
|
||||
object Ident {
|
||||
private val concatChar = '.'
|
||||
implicit val identEq: Eq[Ident] =
|
||||
Eq.by(_.id)
|
||||
|
||||
// Note, the slash *must not* be part of valid characters
|
||||
val chars: Set[Char] = (('A' to 'Z') ++ ('a' to 'z') ++ ('0' to '9') ++ "-_.@").toSet
|
||||
|
||||
def randomUUID[F[_]: Sync]: F[Ident] =
|
||||
@ -75,5 +77,4 @@ object Ident {
|
||||
|
||||
implicit val order: Order[Ident] =
|
||||
Order.by(_.id)
|
||||
|
||||
}
|
||||
|
@ -60,7 +60,7 @@ object ProcessItemArgs {
|
||||
implicit val jsonDecoder: Decoder[ProcessMeta] = deriveDecoder[ProcessMeta]
|
||||
}
|
||||
|
||||
case class File(name: Option[String], fileMetaId: Ident)
|
||||
case class File(name: Option[String], fileMetaId: FileKey)
|
||||
object File {
|
||||
implicit val jsonEncoder: Encoder[File] = deriveEncoder[File]
|
||||
implicit val jsonDecoder: Decoder[File] = deriveDecoder[File]
|
||||
|
@ -31,7 +31,7 @@ object Classify {
|
||||
_ <- OptionT.liftF(logger.info(s"Guessing label for ${cname.name} …"))
|
||||
model <- OptionT(store.transact(RClassifierModel.findByName(coll, cname.name)))
|
||||
.flatTapNone(logger.debug("No classifier model found."))
|
||||
modelData = store.fileStore.getBytes(model.fileId)
|
||||
modelData = store.fileRepo.getBytes(model.fileId)
|
||||
cls <- OptionT(File.withTempDir(workingDir, "classify").use { dir =>
|
||||
val modelFile = dir.resolve("model.ser.gz")
|
||||
modelData
|
||||
|
@ -91,7 +91,7 @@ object LearnClassifierTask {
|
||||
n <- ctx.store.transact(RClassifierModel.deleteAll(list.map(_.id)))
|
||||
_ <- list
|
||||
.map(_.fileId)
|
||||
.traverse(id => ctx.store.fileStore.delete(id))
|
||||
.traverse(id => ctx.store.fileRepo.delete(id))
|
||||
_ <- ctx.logger.debug(s"Deleted $n model files.")
|
||||
} yield ()
|
||||
|
||||
|
@ -42,7 +42,12 @@ object StoreClassifierModel {
|
||||
_ <- logger.debug(s"Storing new trained model for: ${modelName.name}")
|
||||
fileData = Files[F].readAll(trainedModel.model)
|
||||
newFileId <-
|
||||
fileData.through(store.fileStore.save(MimeTypeHint.none)).compile.lastOrError
|
||||
fileData
|
||||
.through(
|
||||
store.fileRepo.save(collective, FileCategory.Classifier, MimeTypeHint.none)
|
||||
)
|
||||
.compile
|
||||
.lastOrError
|
||||
_ <- store.transact(
|
||||
RClassifierModel.updateFile(collective, modelName.name, newFileId)
|
||||
)
|
||||
@ -50,7 +55,7 @@ object StoreClassifierModel {
|
||||
_ <- oldFile match {
|
||||
case Some(fid) =>
|
||||
logger.debug(s"Deleting old model file ${fid.id}") *>
|
||||
store.fileStore.delete(fid)
|
||||
store.fileRepo.delete(fid)
|
||||
case None => ().pure[F]
|
||||
}
|
||||
} yield ()
|
||||
|
@ -92,7 +92,7 @@ object PdfConvTask {
|
||||
ctx: Context[F, Args],
|
||||
in: RFileMeta
|
||||
): F[Unit] = {
|
||||
val fs = ctx.store.fileStore
|
||||
val fs = ctx.store.fileRepo
|
||||
val data = fs.getBytes(in.id)
|
||||
|
||||
val storeResult: ConversionResult.Handler[F, Unit] =
|
||||
@ -141,11 +141,15 @@ object PdfConvTask {
|
||||
newFile: Stream[F, Byte]
|
||||
): F[Unit] = {
|
||||
val mimeHint = MimeTypeHint.advertised(meta.mimetype)
|
||||
val collective = meta.id.collective
|
||||
val cat = FileCategory.AttachmentConvert
|
||||
for {
|
||||
fid <-
|
||||
newFile.through(ctx.store.fileStore.save(mimeHint)).compile.lastOrError
|
||||
newFile
|
||||
.through(ctx.store.fileRepo.save(collective, cat, mimeHint))
|
||||
.compile
|
||||
.lastOrError
|
||||
_ <- ctx.store.transact(RAttachment.updateFileId(ctx.args.attachId, fid))
|
||||
} yield ()
|
||||
}
|
||||
|
||||
}
|
||||
|
@ -100,5 +100,5 @@ object AttachmentPageCount {
|
||||
.getOrElse(MimeType.octetStream)
|
||||
|
||||
def loadFile[F[_]](ctx: Context[F, _])(ra: RAttachment): Stream[F, Byte] =
|
||||
ctx.store.fileStore.getBytes(ra.fileId)
|
||||
ctx.store.fileRepo.getBytes(ra.fileId)
|
||||
}
|
||||
|
@ -59,7 +59,7 @@ object AttachmentPreview {
|
||||
preview.previewPNG(loadFile(ctx)(ra)).flatMap {
|
||||
case Some(out) =>
|
||||
ctx.logger.debug("Preview generated, saving to database…") *>
|
||||
createRecord(ctx, out, ra).map(_.some)
|
||||
createRecord(ctx, ra.fileId.collective, out, ra).map(_.some)
|
||||
case None =>
|
||||
ctx.logger
|
||||
.info(s"Preview could not be generated. Maybe the pdf has no pages?") *>
|
||||
@ -73,6 +73,7 @@ object AttachmentPreview {
|
||||
|
||||
private def createRecord[F[_]: Sync](
|
||||
ctx: Context[F, _],
|
||||
collective: Ident,
|
||||
png: Stream[F, Byte],
|
||||
ra: RAttachment
|
||||
): F[RAttachmentPreview] = {
|
||||
@ -82,7 +83,11 @@ object AttachmentPreview {
|
||||
for {
|
||||
fileId <- png
|
||||
.through(
|
||||
ctx.store.fileStore.save(MimeTypeHint(name.map(_.fullName), Some("image/png")))
|
||||
ctx.store.fileRepo.save(
|
||||
collective,
|
||||
FileCategory.PreviewImage,
|
||||
MimeTypeHint(name.map(_.fullName), Some("image/png"))
|
||||
)
|
||||
)
|
||||
.compile
|
||||
.lastOrError
|
||||
@ -99,5 +104,5 @@ object AttachmentPreview {
|
||||
.getOrElse(MimeType.octetStream)
|
||||
|
||||
def loadFile[F[_]](ctx: Context[F, _])(ra: RAttachment): Stream[F, Byte] =
|
||||
ctx.store.fileStore.getBytes(ra.fileId)
|
||||
ctx.store.fileRepo.getBytes(ra.fileId)
|
||||
}
|
||||
|
@ -32,11 +32,12 @@ import docspell.store.records._
|
||||
* This step assumes an existing premature item, it traverses its attachments.
|
||||
*/
|
||||
object ConvertPdf {
|
||||
type Args = ProcessItemArgs
|
||||
|
||||
def apply[F[_]: Async](
|
||||
cfg: ConvertConfig,
|
||||
item: ItemData
|
||||
): Task[F, ProcessItemArgs, ItemData] =
|
||||
): Task[F, Args, ItemData] =
|
||||
Task { ctx =>
|
||||
def convert(ra: RAttachment): F[(RAttachment, Option[RAttachmentMeta])] =
|
||||
isConverted(ctx)(ra).flatMap {
|
||||
@ -61,7 +62,7 @@ object ConvertPdf {
|
||||
|
||||
}
|
||||
|
||||
def isConverted[F[_]](ctx: Context[F, ProcessItemArgs])(
|
||||
def isConverted[F[_]](ctx: Context[F, Args])(
|
||||
ra: RAttachment
|
||||
): F[Boolean] =
|
||||
ctx.store.transact(RAttachmentSource.isConverted(ra.id))
|
||||
@ -74,14 +75,14 @@ object ConvertPdf {
|
||||
def convertSafe[F[_]: Async](
|
||||
cfg: ConvertConfig,
|
||||
sanitizeHtml: SanitizeHtml,
|
||||
ctx: Context[F, ProcessItemArgs],
|
||||
ctx: Context[F, Args],
|
||||
item: ItemData
|
||||
)(ra: RAttachment, mime: MimeType): F[(RAttachment, Option[RAttachmentMeta])] =
|
||||
loadCollectivePasswords(ctx).flatMap(collPass =>
|
||||
Conversion.create[F](cfg, sanitizeHtml, collPass, ctx.logger).use { conv =>
|
||||
mime match {
|
||||
case mt =>
|
||||
val data = ctx.store.fileStore.getBytes(ra.fileId)
|
||||
val data = ctx.store.fileRepo.getBytes(ra.fileId)
|
||||
val handler = conversionHandler[F](ctx, cfg, ra, item)
|
||||
ctx.logger
|
||||
.info(s"Converting file ${ra.name} (${mime.asString}) into a PDF") *>
|
||||
@ -93,14 +94,14 @@ object ConvertPdf {
|
||||
)
|
||||
|
||||
private def loadCollectivePasswords[F[_]: Async](
|
||||
ctx: Context[F, ProcessItemArgs]
|
||||
ctx: Context[F, Args]
|
||||
): F[List[Password]] =
|
||||
ctx.store
|
||||
.transact(RCollectivePassword.findAll(ctx.args.meta.collective))
|
||||
.map(_.map(_.password).distinct)
|
||||
|
||||
private def conversionHandler[F[_]: Sync](
|
||||
ctx: Context[F, ProcessItemArgs],
|
||||
ctx: Context[F, Args],
|
||||
cfg: ConvertConfig,
|
||||
ra: RAttachment,
|
||||
item: ItemData
|
||||
@ -146,7 +147,7 @@ object ConvertPdf {
|
||||
}
|
||||
|
||||
private def storePDF[F[_]: Sync](
|
||||
ctx: Context[F, ProcessItemArgs],
|
||||
ctx: Context[F, Args],
|
||||
cfg: ConvertConfig,
|
||||
ra: RAttachment,
|
||||
pdf: Stream[F, Byte]
|
||||
@ -160,7 +161,13 @@ object ConvertPdf {
|
||||
.map(_.fullName)
|
||||
|
||||
pdf
|
||||
.through(ctx.store.fileStore.save(MimeTypeHint(hint.filename, hint.advertised)))
|
||||
.through(
|
||||
ctx.store.fileRepo.save(
|
||||
ctx.args.meta.collective,
|
||||
FileCategory.AttachmentConvert,
|
||||
MimeTypeHint(hint.filename, hint.advertised)
|
||||
)
|
||||
)
|
||||
.compile
|
||||
.lastOrError
|
||||
.flatMap(fmId => updateAttachment[F](ctx, ra, fmId, newName).map(_ => fmId))
|
||||
@ -170,7 +177,7 @@ object ConvertPdf {
|
||||
private def updateAttachment[F[_]: Sync](
|
||||
ctx: Context[F, _],
|
||||
ra: RAttachment,
|
||||
fmId: Ident,
|
||||
fmId: FileKey,
|
||||
newName: Option[String]
|
||||
): F[Unit] =
|
||||
for {
|
||||
@ -188,7 +195,7 @@ object ConvertPdf {
|
||||
if (sameFile) ().pure[F]
|
||||
else
|
||||
ctx.logger.info("Deleting previous attachment file") *>
|
||||
ctx.store.fileStore
|
||||
ctx.store.fileRepo
|
||||
.delete(raPrev.fileId)
|
||||
.attempt
|
||||
.flatMap {
|
||||
|
@ -14,6 +14,7 @@ import fs2.Stream
|
||||
|
||||
import docspell.common._
|
||||
import docspell.joex.scheduler.{Context, Task}
|
||||
import docspell.store.file.FileMetadata
|
||||
import docspell.store.queries.QItem
|
||||
import docspell.store.records._
|
||||
|
||||
@ -28,7 +29,7 @@ object CreateItem {
|
||||
|
||||
def createNew[F[_]: Sync]: Task[F, ProcessItemArgs, ItemData] =
|
||||
Task { ctx =>
|
||||
def isValidFile(fm: RFileMeta) =
|
||||
def isValidFile(fm: FileMetadata) =
|
||||
ctx.args.meta.validFileTypes.isEmpty ||
|
||||
ctx.args.meta.validFileTypes.toSet
|
||||
.contains(fm.mimetype)
|
||||
@ -39,9 +40,7 @@ object CreateItem {
|
||||
.flatMap { offset =>
|
||||
Stream
|
||||
.emits(ctx.args.files)
|
||||
.evalMap(f =>
|
||||
ctx.store.fileStore.findMeta(f.fileMetaId).value.map(fm => (f, fm))
|
||||
)
|
||||
.evalMap(f => ctx.store.fileRepo.findMeta(f.fileMetaId).map(fm => (f, fm)))
|
||||
.collect { case (f, Some(fm)) if isValidFile(fm) => f }
|
||||
.zipWithIndex
|
||||
.evalMap { case (f, index) =>
|
||||
@ -198,6 +197,6 @@ object CreateItem {
|
||||
// TODO if no source is present, it must be saved!
|
||||
private def originFileTuple(
|
||||
t: (RAttachment, Option[RAttachmentSource])
|
||||
): (Ident, Ident) =
|
||||
): (Ident, FileKey) =
|
||||
t._2.map(s => s.id -> s.fileId).getOrElse(t._1.id -> t._1.fileId)
|
||||
}
|
||||
|
@ -51,7 +51,7 @@ object DuplicateCheck {
|
||||
val fname = ctx.args.files.find(_.fileMetaId == fd.fm.id).flatMap(_.name)
|
||||
if (fd.exists)
|
||||
ctx.logger
|
||||
.info(s"Deleting duplicate file $fname!") *> ctx.store.fileStore
|
||||
.info(s"Deleting duplicate file $fname!") *> ctx.store.fileRepo
|
||||
.delete(fd.fm.id)
|
||||
else ().pure[F]
|
||||
}
|
||||
|
@ -32,16 +32,17 @@ import emil.Mail
|
||||
* This step assumes an existing premature item, it traverses its attachments.
|
||||
*/
|
||||
object ExtractArchive {
|
||||
type Args = ProcessItemArgs
|
||||
|
||||
def apply[F[_]: Async](
|
||||
item: ItemData
|
||||
): Task[F, ProcessItemArgs, ItemData] =
|
||||
): Task[F, Args, ItemData] =
|
||||
multiPass(item, None).map(_._2)
|
||||
|
||||
def multiPass[F[_]: Async](
|
||||
item: ItemData,
|
||||
archive: Option[RAttachmentArchive]
|
||||
): Task[F, ProcessItemArgs, (Option[RAttachmentArchive], ItemData)] =
|
||||
): Task[F, Args, (Option[RAttachmentArchive], ItemData)] =
|
||||
singlePass(item, archive).flatMap { t =>
|
||||
if (t._1.isEmpty) Task.pure(t)
|
||||
else multiPass(t._2, t._1)
|
||||
@ -50,7 +51,7 @@ object ExtractArchive {
|
||||
def singlePass[F[_]: Async](
|
||||
item: ItemData,
|
||||
archive: Option[RAttachmentArchive]
|
||||
): Task[F, ProcessItemArgs, (Option[RAttachmentArchive], ItemData)] =
|
||||
): Task[F, Args, (Option[RAttachmentArchive], ItemData)] =
|
||||
Task { ctx =>
|
||||
def extract(ra: RAttachment, pos: Int): F[Extracted] =
|
||||
findMime(ctx)(ra).flatMap(m => extractSafe(ctx, archive)(ra, pos, m))
|
||||
@ -88,7 +89,7 @@ object ExtractArchive {
|
||||
.getOrElse(MimeType.octetStream)
|
||||
|
||||
def extractSafe[F[_]: Async](
|
||||
ctx: Context[F, ProcessItemArgs],
|
||||
ctx: Context[F, Args],
|
||||
archive: Option[RAttachmentArchive]
|
||||
)(ra: RAttachment, pos: Int, mime: MimeType): F[Extracted] =
|
||||
mime match {
|
||||
@ -120,7 +121,7 @@ object ExtractArchive {
|
||||
)
|
||||
_ <- ctx.store.transact(RAttachmentArchive.delete(ra.id))
|
||||
_ <- ctx.store.transact(RAttachment.delete(ra.id))
|
||||
_ <- ctx.store.fileStore.delete(ra.fileId)
|
||||
_ <- ctx.store.fileRepo.delete(ra.fileId)
|
||||
} yield extracted
|
||||
case None =>
|
||||
for {
|
||||
@ -132,10 +133,10 @@ object ExtractArchive {
|
||||
}
|
||||
|
||||
def extractZip[F[_]: Async](
|
||||
ctx: Context[F, ProcessItemArgs],
|
||||
ctx: Context[F, Args],
|
||||
archive: Option[RAttachmentArchive]
|
||||
)(ra: RAttachment, pos: Int): F[Extracted] = {
|
||||
val zipData = ctx.store.fileStore.getBytes(ra.fileId)
|
||||
val zipData = ctx.store.fileRepo.getBytes(ra.fileId)
|
||||
val glob = ctx.args.meta.fileFilter.getOrElse(Glob.all)
|
||||
ctx.logger.debug(s"Filtering zip entries with '${glob.asString}'") *>
|
||||
zipData
|
||||
@ -148,10 +149,10 @@ object ExtractArchive {
|
||||
}
|
||||
|
||||
def extractMail[F[_]: Async](
|
||||
ctx: Context[F, ProcessItemArgs],
|
||||
ctx: Context[F, Args],
|
||||
archive: Option[RAttachmentArchive]
|
||||
)(ra: RAttachment, pos: Int): F[Extracted] = {
|
||||
val email: Stream[F, Byte] = ctx.store.fileStore.getBytes(ra.fileId)
|
||||
val email: Stream[F, Byte] = ctx.store.fileRepo.getBytes(ra.fileId)
|
||||
|
||||
val glob = ctx.args.meta.fileFilter.getOrElse(Glob.all)
|
||||
val attachOnly = ctx.args.meta.attachmentsOnly.getOrElse(false)
|
||||
@ -183,7 +184,7 @@ object ExtractArchive {
|
||||
.getOrElse(Extracted.empty)
|
||||
|
||||
def handleEntry[F[_]: Sync](
|
||||
ctx: Context[F, _],
|
||||
ctx: Context[F, Args],
|
||||
ra: RAttachment,
|
||||
pos: Int,
|
||||
archive: Option[RAttachmentArchive],
|
||||
@ -193,7 +194,10 @@ object ExtractArchive {
|
||||
): Stream[F, Extracted] = {
|
||||
val (entry, subPos) = tentry
|
||||
val mimeHint = MimeTypeHint.filename(entry.name).withAdvertised(entry.mime.asString)
|
||||
val fileId = entry.data.through(ctx.store.fileStore.save(mimeHint))
|
||||
val fileId = entry.data.through(
|
||||
ctx.store.fileRepo
|
||||
.save(ctx.args.meta.collective, FileCategory.AttachmentSource, mimeHint)
|
||||
)
|
||||
|
||||
Stream.eval(ctx.logger.debug(s"Extracted ${entry.name}. Storing as attachment.")) >>
|
||||
fileId.evalMap { fid =>
|
||||
|
@ -38,7 +38,7 @@ case class ItemData(
|
||||
attachments: Vector[RAttachment],
|
||||
metas: Vector[RAttachmentMeta],
|
||||
dateLabels: Vector[AttachmentDates],
|
||||
originFile: Map[Ident, Ident], // maps RAttachment.id -> FileMeta.id
|
||||
originFile: Map[Ident, FileKey], // maps RAttachment.id -> FileMeta.id
|
||||
givenMeta: MetaProposalList, // given meta data not associated to a specific attachment
|
||||
// a list of tags (names or ids) attached to the item if they exist
|
||||
tags: List[String],
|
||||
|
@ -133,7 +133,7 @@ object ItemHandler {
|
||||
ctx.logger.info("Deleting input files …") *>
|
||||
Stream
|
||||
.emits(ctx.args.files.map(_.fileMetaId))
|
||||
.evalMap(id => ctx.store.fileStore.delete(id).attempt)
|
||||
.evalMap(id => ctx.store.fileRepo.delete(id).attempt)
|
||||
.compile
|
||||
.drain
|
||||
)
|
||||
|
@ -126,11 +126,11 @@ object TextExtraction {
|
||||
ctx: Context[F, _],
|
||||
extr: Extraction[F],
|
||||
lang: Language
|
||||
)(fileId: Ident): F[ExtractResult] = {
|
||||
val data = ctx.store.fileStore.getBytes(fileId)
|
||||
)(fileId: FileKey): F[ExtractResult] = {
|
||||
val data = ctx.store.fileRepo.getBytes(fileId)
|
||||
|
||||
def findMime: F[MimeType] =
|
||||
OptionT(ctx.store.transact(RFileMeta.findById(fileId)))
|
||||
OptionT(ctx.store.fileRepo.findMeta(fileId))
|
||||
.map(_.mimetype)
|
||||
.getOrElse(MimeType.octetStream)
|
||||
|
||||
@ -143,7 +143,7 @@ object TextExtraction {
|
||||
cfg: ExtractConfig,
|
||||
ra: RAttachment,
|
||||
lang: Language
|
||||
)(fileIds: List[Ident]): F[Option[ExtractResult.Success]] =
|
||||
)(fileIds: List[FileKey]): F[Option[ExtractResult.Success]] =
|
||||
fileIds match {
|
||||
case Nil =>
|
||||
ctx.logger.error(s"Cannot extract text").map(_ => None)
|
||||
@ -179,7 +179,7 @@ object TextExtraction {
|
||||
private def filesToExtract[F[_]: Sync](ctx: Context[F, _])(
|
||||
item: ItemData,
|
||||
ra: RAttachment
|
||||
): F[List[Ident]] =
|
||||
): F[List[FileKey]] =
|
||||
item.originFile.get(ra.id) match {
|
||||
case Some(sid) =>
|
||||
ctx.store.transact(RFileMeta.findMime(sid)).map {
|
||||
|
@ -15,7 +15,7 @@ import docspell.backend.ops.OItemSearch.{AttachmentData, AttachmentPreviewData}
|
||||
import docspell.backend.ops._
|
||||
import docspell.restapi.model.BasicResult
|
||||
import docspell.restserver.http4s.{QueryParam => QP}
|
||||
import docspell.store.records.RFileMeta
|
||||
import docspell.store.file.FileMetadata
|
||||
|
||||
import org.http4s._
|
||||
import org.http4s.circe.CirceEntityEncoder._
|
||||
@ -117,7 +117,7 @@ object BinaryUtil {
|
||||
}
|
||||
|
||||
def matchETag[F[_]](
|
||||
fileData: Option[RFileMeta],
|
||||
fileData: Option[FileMetadata],
|
||||
noneMatch: Option[NonEmptyList[EntityTag]]
|
||||
): Boolean =
|
||||
(fileData, noneMatch) match {
|
||||
|
@ -0,0 +1,150 @@
|
||||
drop table if exists file_migration_temp;
|
||||
create table file_migration_temp (
|
||||
id bigserial primary key,
|
||||
original_file varchar(254) not null unique,
|
||||
cid varchar(254) not null,
|
||||
category varchar(254) not null,
|
||||
new_file varchar(254) not null unique
|
||||
);
|
||||
|
||||
-- Source files
|
||||
insert into file_migration_temp (original_file, cid, category, new_file)
|
||||
select
|
||||
rs.file_id as original_file,
|
||||
i.cid,
|
||||
'attachmentsource' as category,
|
||||
i.cid || '/attachmentsource/' || rs.file_id as new_file
|
||||
from attachment_source rs
|
||||
inner join attachment ra on rs.id = ra.attachid
|
||||
inner join item i on ra.itemid = i.itemid
|
||||
;
|
||||
|
||||
-- Archive files
|
||||
insert into file_migration_temp (original_file, cid, category, new_file)
|
||||
select distinct
|
||||
rs.file_id as original_file,
|
||||
i.cid,
|
||||
'attachmentsource' as category,
|
||||
i.cid || '/attachmentsource/' || rs.file_id as new_file
|
||||
from attachment_archive rs
|
||||
inner join attachment ra on rs.id = ra.attachid
|
||||
inner join item i on ra.itemid = i.itemid
|
||||
;
|
||||
|
||||
-- Converted files
|
||||
insert into file_migration_temp (original_file, cid, category, new_file)
|
||||
select
|
||||
ra.filemetaid as original_file,
|
||||
i.cid,
|
||||
'attachmentconvert' as category,
|
||||
i.cid || '/attachmentconvert/' || ra.filemetaid as new_file
|
||||
from attachment_source rs
|
||||
inner join attachment ra on rs.id = ra.attachid
|
||||
inner join item i on ra.itemid = i.itemid
|
||||
where rs.file_id <> ra.filemetaid
|
||||
;
|
||||
|
||||
-- Preview image
|
||||
insert into file_migration_temp (original_file, cid, category, new_file)
|
||||
select
|
||||
ap.file_id as original_file,
|
||||
i.cid,
|
||||
'previewimage' as category,
|
||||
i.cid || '/previewimage/' || ap.file_id as new_file
|
||||
from attachment_preview ap
|
||||
inner join attachment ra on ra.attachid = ap.id
|
||||
inner join item i on i.itemid = ra.itemid
|
||||
order by id
|
||||
;
|
||||
|
||||
-- classifier
|
||||
insert into file_migration_temp (original_file, cid, category, new_file)
|
||||
select
|
||||
file_id as original_file,
|
||||
cid,
|
||||
'classifier' as category,
|
||||
cid || '/classifier/' || file_id as new_file
|
||||
from classifier_model
|
||||
;
|
||||
|
||||
|
||||
-- save obsolete/orphaned files
|
||||
drop table if exists obsolete_files;
|
||||
create table obsolete_files(
|
||||
file_id varchar(254) not null,
|
||||
mimetype varchar(254) not null,
|
||||
length bigint not null,
|
||||
checksum varchar(254) not null,
|
||||
created timestamp not null
|
||||
);
|
||||
|
||||
with
|
||||
missing_ids as (
|
||||
select file_id from filemeta
|
||||
except
|
||||
select original_file as file_id from file_migration_temp)
|
||||
insert into obsolete_files (file_id, mimetype, length, checksum, created)
|
||||
select file_id, mimetype, length, checksum, created from filemeta
|
||||
where file_id in (select file_id from missing_ids)
|
||||
;
|
||||
|
||||
|
||||
-- duplicate each filemeta with the new id
|
||||
insert into filemeta (file_id, mimetype, length, checksum, created)
|
||||
select mm.new_file, fm.mimetype, fm.length, fm.checksum, fm.created
|
||||
from file_migration_temp mm
|
||||
inner join filemeta fm on fm.file_id = mm.original_file
|
||||
;
|
||||
|
||||
|
||||
-- update each reference to the new id
|
||||
update attachment_source
|
||||
set file_id = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = file_id and attachment_source.id is not null)
|
||||
;
|
||||
|
||||
update attachment
|
||||
set filemetaid = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = filemetaid and attachment.attachid is not null)
|
||||
;
|
||||
|
||||
update attachment_archive
|
||||
set file_id = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = file_id and attachment_archive.id is not null)
|
||||
;
|
||||
|
||||
update attachment_preview
|
||||
set file_id = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = file_id and attachment_preview.id is not null)
|
||||
;
|
||||
|
||||
update classifier_model
|
||||
set file_id = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = file_id and classifier_model.id is not null)
|
||||
;
|
||||
|
||||
-- delete old filemeta and filechunk rows
|
||||
delete from filemeta
|
||||
where file_id in (select original_file from file_migration_temp);
|
||||
|
||||
delete from filemeta
|
||||
where file_id in (select file_id from obsolete_files);
|
||||
|
||||
delete from filechunk
|
||||
where file_id in (select file_id from obsolete_files);
|
||||
|
||||
-- update chunks
|
||||
update filechunk
|
||||
set file_id = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = file_id and filechunk.file_id is not null)
|
||||
;
|
||||
|
||||
-- drop temp table
|
||||
drop table file_migration_temp;
|
||||
drop table obsolete_files;
|
@ -0,0 +1,148 @@
|
||||
drop table if exists file_migration_temp;
|
||||
create table file_migration_temp (
|
||||
id bigint auto_increment primary key,
|
||||
original_file varchar(254) not null unique,
|
||||
cid varchar(254) not null,
|
||||
category varchar(254) not null,
|
||||
new_file varchar(254) not null unique
|
||||
);
|
||||
|
||||
-- Source files
|
||||
insert into file_migration_temp (original_file, cid, category, new_file)
|
||||
select
|
||||
rs.file_id as original_file,
|
||||
i.cid,
|
||||
'attachmentsource' as category,
|
||||
concat(i.cid, '/attachmentsource/', rs.file_id) as new_file
|
||||
from attachment_source rs
|
||||
inner join attachment ra on rs.id = ra.attachid
|
||||
inner join item i on ra.itemid = i.itemid
|
||||
;
|
||||
|
||||
-- Archive files
|
||||
insert into file_migration_temp (original_file, cid, category, new_file)
|
||||
select distinct
|
||||
rs.file_id as original_file,
|
||||
i.cid,
|
||||
'attachmentsource' as category,
|
||||
concat(i.cid, '/attachmentsource/', rs.file_id) as new_file
|
||||
from attachment_archive rs
|
||||
inner join attachment ra on rs.id = ra.attachid
|
||||
inner join item i on ra.itemid = i.itemid
|
||||
;
|
||||
|
||||
-- Converted files
|
||||
insert into file_migration_temp (original_file, cid, category, new_file)
|
||||
select
|
||||
ra.filemetaid as original_file,
|
||||
i.cid,
|
||||
'attachmentconvert' as category,
|
||||
concat(i.cid, '/attachmentconvert/', ra.filemetaid) as new_file
|
||||
from attachment_source rs
|
||||
inner join attachment ra on rs.id = ra.attachid
|
||||
inner join item i on ra.itemid = i.itemid
|
||||
where rs.file_id <> ra.filemetaid
|
||||
;
|
||||
|
||||
-- Preview image
|
||||
insert into file_migration_temp (original_file, cid, category, new_file)
|
||||
select
|
||||
ap.file_id as original_file,
|
||||
i.cid,
|
||||
'previewimage' as category,
|
||||
concat(i.cid, '/previewimage/', ap.file_id) as new_file
|
||||
from attachment_preview ap
|
||||
inner join attachment ra on ra.attachid = ap.id
|
||||
inner join item i on i.itemid = ra.itemid
|
||||
order by id
|
||||
;
|
||||
|
||||
-- classifier
|
||||
insert into file_migration_temp (original_file, cid, category, new_file)
|
||||
select
|
||||
file_id as original_file,
|
||||
cid,
|
||||
'classifier' as category,
|
||||
concat(cid, '/classifier/', file_id) as new_file
|
||||
from classifier_model
|
||||
;
|
||||
|
||||
|
||||
-- save obsolete/orphaned files
|
||||
drop table if exists obsolete_files;
|
||||
create table obsolete_files(
|
||||
file_id varchar(254) not null,
|
||||
mimetype varchar(254) not null,
|
||||
length bigint not null,
|
||||
checksum varchar(254) not null,
|
||||
created timestamp not null
|
||||
);
|
||||
|
||||
insert into obsolete_files (file_id, mimetype, length, checksum, created)
|
||||
select file_id, mimetype, length, checksum, created from filemeta
|
||||
where file_id in (
|
||||
select file_id from filemeta
|
||||
except
|
||||
select original_file as file_id from file_migration_temp
|
||||
);
|
||||
|
||||
|
||||
-- duplicate each filemeta with the new id
|
||||
insert into filemeta (file_id, mimetype, length, checksum, created)
|
||||
select mm.new_file, fm.mimetype, fm.length, fm.checksum, fm.created
|
||||
from file_migration_temp mm
|
||||
inner join filemeta fm on fm.file_id = mm.original_file
|
||||
;
|
||||
|
||||
|
||||
-- update each reference to the new id
|
||||
update attachment_source
|
||||
set file_id = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = file_id and attachment_source.id is not null)
|
||||
;
|
||||
|
||||
update attachment
|
||||
set filemetaid = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = filemetaid and attachment.attachid is not null)
|
||||
;
|
||||
|
||||
update attachment_archive
|
||||
set file_id = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = file_id and attachment_archive.id is not null)
|
||||
;
|
||||
|
||||
update attachment_preview
|
||||
set file_id = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = file_id and attachment_preview.id is not null)
|
||||
;
|
||||
|
||||
update classifier_model
|
||||
set file_id = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = file_id and classifier_model.id is not null)
|
||||
;
|
||||
|
||||
-- delete old filemeta and filechunk rows
|
||||
delete from filemeta
|
||||
where file_id in (select original_file from file_migration_temp);
|
||||
|
||||
delete from filemeta
|
||||
where file_id in (select file_id from obsolete_files);
|
||||
|
||||
delete from filechunk
|
||||
where file_id in (select file_id from obsolete_files);
|
||||
|
||||
-- update chunks
|
||||
update filechunk
|
||||
set file_id = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = file_id and filechunk.file_id is not null)
|
||||
;
|
||||
|
||||
-- drop temp table
|
||||
drop table file_migration_temp;
|
||||
drop table obsolete_files;
|
@ -0,0 +1,150 @@
|
||||
drop table if exists file_migration_temp;
|
||||
create table file_migration_temp (
|
||||
id bigserial primary key,
|
||||
original_file varchar(254) not null unique,
|
||||
cid varchar(254) not null,
|
||||
category varchar(254) not null,
|
||||
new_file varchar(254) not null unique
|
||||
);
|
||||
|
||||
-- Source files
|
||||
insert into file_migration_temp (original_file, cid, category, new_file)
|
||||
select
|
||||
rs.file_id as original_file,
|
||||
i.cid,
|
||||
'attachmentsource' as category,
|
||||
i.cid || '/attachmentsource/' || rs.file_id as new_file
|
||||
from attachment_source rs
|
||||
inner join attachment ra on rs.id = ra.attachid
|
||||
inner join item i on ra.itemid = i.itemid
|
||||
;
|
||||
|
||||
-- Archive files
|
||||
insert into file_migration_temp (original_file, cid, category, new_file)
|
||||
select distinct
|
||||
rs.file_id as original_file,
|
||||
i.cid,
|
||||
'attachmentsource' as category,
|
||||
i.cid || '/attachmentsource/' || rs.file_id as new_file
|
||||
from attachment_archive rs
|
||||
inner join attachment ra on rs.id = ra.attachid
|
||||
inner join item i on ra.itemid = i.itemid
|
||||
;
|
||||
|
||||
-- Converted files
|
||||
insert into file_migration_temp (original_file, cid, category, new_file)
|
||||
select
|
||||
ra.filemetaid as original_file,
|
||||
i.cid,
|
||||
'attachmentconvert' as category,
|
||||
i.cid || '/attachmentconvert/' || ra.filemetaid as new_file
|
||||
from attachment_source rs
|
||||
inner join attachment ra on rs.id = ra.attachid
|
||||
inner join item i on ra.itemid = i.itemid
|
||||
where rs.file_id <> ra.filemetaid
|
||||
;
|
||||
|
||||
-- Preview image
|
||||
insert into file_migration_temp (original_file, cid, category, new_file)
|
||||
select
|
||||
ap.file_id as original_file,
|
||||
i.cid,
|
||||
'previewimage' as category,
|
||||
i.cid || '/previewimage/' || ap.file_id as new_file
|
||||
from attachment_preview ap
|
||||
inner join attachment ra on ra.attachid = ap.id
|
||||
inner join item i on i.itemid = ra.itemid
|
||||
order by id
|
||||
;
|
||||
|
||||
-- classifier
|
||||
insert into file_migration_temp (original_file, cid, category, new_file)
|
||||
select
|
||||
file_id as original_file,
|
||||
cid,
|
||||
'classifier' as category,
|
||||
cid || '/classifier/' || file_id as new_file
|
||||
from classifier_model
|
||||
;
|
||||
|
||||
|
||||
-- save obsolete/orphaned files
|
||||
drop table if exists obsolete_files;
|
||||
create table obsolete_files(
|
||||
file_id varchar(254) not null,
|
||||
mimetype varchar(254) not null,
|
||||
length bigint not null,
|
||||
checksum varchar(254) not null,
|
||||
created timestamp not null
|
||||
);
|
||||
|
||||
with
|
||||
missing_ids as (
|
||||
select file_id from filemeta
|
||||
except
|
||||
select original_file as file_id from file_migration_temp)
|
||||
insert into obsolete_files (file_id, mimetype, length, checksum, created)
|
||||
select file_id, mimetype, length, checksum, created from filemeta
|
||||
where file_id in (select file_id from missing_ids)
|
||||
;
|
||||
|
||||
|
||||
-- duplicate each filemeta with the new id
|
||||
insert into filemeta (file_id, mimetype, length, checksum, created)
|
||||
select mm.new_file, fm.mimetype, fm.length, fm.checksum, fm.created
|
||||
from file_migration_temp mm
|
||||
inner join filemeta fm on fm.file_id = mm.original_file
|
||||
;
|
||||
|
||||
|
||||
-- update each reference to the new id
|
||||
update attachment_source
|
||||
set file_id = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = file_id and attachment_source.id is not null)
|
||||
;
|
||||
|
||||
update attachment
|
||||
set filemetaid = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = filemetaid and attachment.attachid is not null)
|
||||
;
|
||||
|
||||
update attachment_archive
|
||||
set file_id = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = file_id and attachment_archive.id is not null)
|
||||
;
|
||||
|
||||
update attachment_preview
|
||||
set file_id = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = file_id and attachment_preview.id is not null)
|
||||
;
|
||||
|
||||
update classifier_model
|
||||
set file_id = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = file_id and classifier_model.id is not null)
|
||||
;
|
||||
|
||||
-- delete old filemeta and filechunk rows
|
||||
delete from filemeta
|
||||
where file_id in (select original_file from file_migration_temp);
|
||||
|
||||
delete from filemeta
|
||||
where file_id in (select file_id from obsolete_files);
|
||||
|
||||
delete from filechunk
|
||||
where file_id in (select file_id from obsolete_files);
|
||||
|
||||
-- update chunks
|
||||
update filechunk
|
||||
set file_id = (select new_file
|
||||
from file_migration_temp
|
||||
where original_file = file_id and filechunk.file_id is not null)
|
||||
;
|
||||
|
||||
-- drop temp table
|
||||
drop table file_migration_temp;
|
||||
drop table obsolete_files;
|
@ -12,7 +12,7 @@ import cats.effect._
|
||||
import cats.~>
|
||||
import fs2._
|
||||
|
||||
import docspell.store.file.FileStore
|
||||
import docspell.store.file.FileRepository
|
||||
import docspell.store.impl.StoreImpl
|
||||
|
||||
import com.zaxxer.hikari.HikariDataSource
|
||||
@ -26,7 +26,7 @@ trait Store[F[_]] {
|
||||
|
||||
def transact[A](prg: Stream[ConnectionIO, A]): Stream[F, A]
|
||||
|
||||
def fileStore: FileStore[F]
|
||||
def fileRepo: FileRepository[F]
|
||||
|
||||
def add(insert: ConnectionIO[Int], exists: ConnectionIO[Boolean]): F[AddResult]
|
||||
}
|
||||
@ -50,8 +50,8 @@ object Store {
|
||||
ds.setDriverClassName(jdbc.driverClass)
|
||||
}
|
||||
xa = HikariTransactor(ds, connectEC)
|
||||
fs = FileStore[F](xa, ds, chunkSize)
|
||||
st = new StoreImpl[F](fs, jdbc, xa)
|
||||
fr = FileRepository.genericJDBC(xa, ds, chunkSize)
|
||||
st = new StoreImpl[F](fr, jdbc, xa)
|
||||
_ <- Resource.eval(st.migrate)
|
||||
} yield st
|
||||
}
|
||||
|
@ -23,8 +23,9 @@ final private[file] class AttributeStore[F[_]: Sync](xa: Transactor[F])
|
||||
for {
|
||||
now <- Timestamp.current[F]
|
||||
a <- attrs
|
||||
fileKey <- makeFileKey(id)
|
||||
fm = RFileMeta(
|
||||
Ident.unsafe(id.id),
|
||||
fileKey,
|
||||
now,
|
||||
MimeType.parse(a.contentType.contentType).getOrElse(MimeType.octetStream),
|
||||
ByteSize(a.length),
|
||||
@ -34,7 +35,7 @@ final private[file] class AttributeStore[F[_]: Sync](xa: Transactor[F])
|
||||
} yield ()
|
||||
|
||||
def deleteAttr(id: BinaryId): F[Boolean] =
|
||||
RFileMeta.delete(Ident.unsafe(id.id)).transact(xa).map(_ > 0)
|
||||
makeFileKey(id).flatMap(fileKey => RFileMeta.delete(fileKey).transact(xa).map(_ > 0))
|
||||
|
||||
def findAttr(id: BinaryId): OptionT[F, BinaryAttributes] =
|
||||
findMeta(id).map(fm =>
|
||||
@ -46,5 +47,10 @@ final private[file] class AttributeStore[F[_]: Sync](xa: Transactor[F])
|
||||
)
|
||||
|
||||
def findMeta(id: BinaryId): OptionT[F, RFileMeta] =
|
||||
OptionT(RFileMeta.findById(Ident.unsafe(id.id)).transact(xa))
|
||||
OptionT(makeFileKey(id).flatMap(fileKey => RFileMeta.findById(fileKey).transact(xa)))
|
||||
|
||||
private def makeFileKey(binaryId: BinaryId): F[FileKey] =
|
||||
Sync[F]
|
||||
.pure(BinnyUtils.binaryIdToFileKey(binaryId).left.map(new IllegalStateException(_)))
|
||||
.rethrow
|
||||
}
|
||||
|
@ -0,0 +1,59 @@
|
||||
/*
|
||||
* Copyright 2020 Eike K. & Contributors
|
||||
*
|
||||
* SPDX-License-Identifier: AGPL-3.0-or-later
|
||||
*/
|
||||
|
||||
package docspell.store.file
|
||||
|
||||
import docspell.common
|
||||
import docspell.common._
|
||||
import docspell.files.TikaMimetype
|
||||
|
||||
import binny._
|
||||
import scodec.bits.ByteVector
|
||||
|
||||
private[store] object BinnyUtils {
|
||||
|
||||
def fileKeyToBinaryId(fk: FileKey): BinaryId =
|
||||
BinaryId(s"${fk.collective.id}/${fk.category.id.id}/${fk.id.id}")
|
||||
|
||||
def binaryIdToFileKey(bid: BinaryId): Either[String, FileKey] =
|
||||
bid.id.split('/').toList match {
|
||||
case cId :: catId :: fId :: Nil =>
|
||||
for {
|
||||
coll <- Ident.fromString(cId)
|
||||
cat <- FileCategory.fromString(catId)
|
||||
file <- Ident.fromString(fId)
|
||||
} yield common.FileKey(coll, cat, file)
|
||||
case _ =>
|
||||
Left(s"Invalid format for file-key: $bid")
|
||||
}
|
||||
|
||||
def unsafeBinaryIdToFileKey(bid: BinaryId): FileKey =
|
||||
binaryIdToFileKey(bid).fold(
|
||||
err => throw new IllegalStateException(err),
|
||||
identity
|
||||
)
|
||||
|
||||
object LoggerAdapter {
|
||||
def apply[F[_]](log: Logger[F]): binny.util.Logger[F] =
|
||||
new binny.util.Logger[F] {
|
||||
override def trace(msg: => String): F[Unit] = log.trace(msg)
|
||||
override def debug(msg: => String): F[Unit] = log.debug(msg)
|
||||
override def info(msg: => String): F[Unit] = log.info(msg)
|
||||
override def warn(msg: => String): F[Unit] = log.warn(msg)
|
||||
override def error(msg: => String): F[Unit] = log.error(msg)
|
||||
override def error(ex: Throwable)(msg: => String): F[Unit] = log.error(ex)(msg)
|
||||
}
|
||||
}
|
||||
|
||||
object TikaContentTypeDetect extends ContentTypeDetect {
|
||||
override def detect(data: ByteVector, hint: Hint): SimpleContentType =
|
||||
SimpleContentType(
|
||||
TikaMimetype
|
||||
.detect(data, MimeTypeHint(hint.filename, hint.advertisedType))
|
||||
.asString
|
||||
)
|
||||
}
|
||||
}
|
@ -0,0 +1,19 @@
|
||||
/*
|
||||
* Copyright 2020 Eike K. & Contributors
|
||||
*
|
||||
* SPDX-License-Identifier: AGPL-3.0-or-later
|
||||
*/
|
||||
|
||||
package docspell.store.file
|
||||
|
||||
import docspell.common._
|
||||
|
||||
import scodec.bits.ByteVector
|
||||
|
||||
final case class FileMetadata(
|
||||
id: FileKey,
|
||||
created: Timestamp,
|
||||
mimetype: MimeType,
|
||||
length: ByteSize,
|
||||
checksum: ByteVector
|
||||
)
|
@ -0,0 +1,50 @@
|
||||
/*
|
||||
* Copyright 2020 Eike K. & Contributors
|
||||
*
|
||||
* SPDX-License-Identifier: AGPL-3.0-or-later
|
||||
*/
|
||||
|
||||
package docspell.store.file
|
||||
|
||||
import javax.sql.DataSource
|
||||
|
||||
import cats.effect._
|
||||
import fs2._
|
||||
|
||||
import docspell.common._
|
||||
|
||||
import binny.BinaryId
|
||||
import binny.jdbc.{GenericJdbcStore, JdbcStoreConfig}
|
||||
import doobie.Transactor
|
||||
|
||||
trait FileRepository[F[_]] {
|
||||
def getBytes(key: FileKey): Stream[F, Byte]
|
||||
|
||||
def findMeta(key: FileKey): F[Option[FileMetadata]]
|
||||
|
||||
def delete(key: FileKey): F[Unit]
|
||||
|
||||
def save(
|
||||
collective: Ident,
|
||||
category: FileCategory,
|
||||
hint: MimeTypeHint
|
||||
): Pipe[F, Byte, FileKey]
|
||||
}
|
||||
|
||||
object FileRepository {
|
||||
private[this] val logger = org.log4s.getLogger
|
||||
|
||||
def genericJDBC[F[_]: Sync](
|
||||
xa: Transactor[F],
|
||||
ds: DataSource,
|
||||
chunkSize: Int
|
||||
): FileRepository[F] = {
|
||||
val attrStore = new AttributeStore[F](xa)
|
||||
val cfg = JdbcStoreConfig("filechunk", chunkSize, BinnyUtils.TikaContentTypeDetect)
|
||||
val log = Logger.log4s[F](logger)
|
||||
val binStore = GenericJdbcStore[F](ds, BinnyUtils.LoggerAdapter(log), cfg, attrStore)
|
||||
val keyFun: FileKey => BinaryId = BinnyUtils.fileKeyToBinaryId
|
||||
|
||||
new FileRepositoryImpl[F](binStore, attrStore, keyFun)
|
||||
}
|
||||
}
|
@ -0,0 +1,60 @@
|
||||
/*
|
||||
* Copyright 2020 Eike K. & Contributors
|
||||
*
|
||||
* SPDX-License-Identifier: AGPL-3.0-or-later
|
||||
*/
|
||||
|
||||
package docspell.store.file
|
||||
|
||||
import cats.data.OptionT
|
||||
import cats.effect.Sync
|
||||
import cats.implicits._
|
||||
import fs2.{Pipe, Stream}
|
||||
|
||||
import docspell.common._
|
||||
|
||||
import binny._
|
||||
|
||||
final class FileRepositoryImpl[F[_]: Sync](
|
||||
bs: BinaryStore[F],
|
||||
attrStore: AttributeStore[F],
|
||||
keyFun: FileKey => BinaryId
|
||||
) extends FileRepository[F] {
|
||||
|
||||
def find(key: FileKey): OptionT[F, Stream[F, Byte]] =
|
||||
bs.findBinary(keyFun(key), ByteRange.All)
|
||||
|
||||
def getBytes(key: FileKey): Stream[F, Byte] =
|
||||
Stream.eval(find(key).value).unNoneTerminate.flatMap(identity)
|
||||
|
||||
def findMeta(key: FileKey): F[Option[FileMetadata]] =
|
||||
attrStore
|
||||
.findMeta(keyFun(key))
|
||||
.map(rfm =>
|
||||
FileMetadata(rfm.id, rfm.created, rfm.mimetype, rfm.length, rfm.checksum)
|
||||
)
|
||||
.value
|
||||
|
||||
def delete(key: FileKey): F[Unit] =
|
||||
bs.delete(keyFun(key))
|
||||
|
||||
def save(
|
||||
collective: Ident,
|
||||
category: FileCategory,
|
||||
hint: MimeTypeHint
|
||||
): Pipe[F, Byte, FileKey] = {
|
||||
val fhint = Hint(hint.filename, hint.advertised)
|
||||
in =>
|
||||
Stream
|
||||
.eval(randomKey(collective, category))
|
||||
.flatMap(fkey =>
|
||||
in.through(bs.insertWith(keyFun(fkey), fhint)) ++ Stream.emit(fkey)
|
||||
)
|
||||
}
|
||||
|
||||
def randomKey(
|
||||
collective: Ident,
|
||||
category: FileCategory
|
||||
): F[FileKey] =
|
||||
BinaryId.random[F].map(bid => FileKey(collective, category, Ident.unsafe(bid.id)))
|
||||
}
|
@ -1,91 +0,0 @@
|
||||
/*
|
||||
* Copyright 2020 Eike K. & Contributors
|
||||
*
|
||||
* SPDX-License-Identifier: AGPL-3.0-or-later
|
||||
*/
|
||||
|
||||
package docspell.store.file
|
||||
|
||||
import javax.sql.DataSource
|
||||
|
||||
import cats.data.OptionT
|
||||
import cats.effect._
|
||||
import fs2.{Pipe, Stream}
|
||||
|
||||
import docspell.common._
|
||||
import docspell.files.TikaMimetype
|
||||
import docspell.store.records.RFileMeta
|
||||
|
||||
import binny._
|
||||
import binny.jdbc.{GenericJdbcStore, JdbcStoreConfig}
|
||||
import doobie._
|
||||
import scodec.bits.ByteVector
|
||||
|
||||
trait FileStore[F[_]] {
|
||||
|
||||
def find(id: Ident): OptionT[F, Stream[F, Byte]]
|
||||
|
||||
def getBytes(id: Ident): Stream[F, Byte]
|
||||
|
||||
def findMeta(id: Ident): OptionT[F, RFileMeta]
|
||||
|
||||
def delete(id: Ident): F[Unit]
|
||||
|
||||
def save(hint: MimeTypeHint): Pipe[F, Byte, Ident]
|
||||
}
|
||||
|
||||
object FileStore {
|
||||
private[this] val logger = org.log4s.getLogger
|
||||
|
||||
def apply[F[_]: Sync](
|
||||
xa: Transactor[F],
|
||||
ds: DataSource,
|
||||
chunkSize: Int
|
||||
): FileStore[F] = {
|
||||
val attrStore = new AttributeStore[F](xa)
|
||||
val cfg = JdbcStoreConfig("filechunk", chunkSize, TikaContentTypeDetect)
|
||||
val log = Logger.log4s[F](logger)
|
||||
val binStore = GenericJdbcStore[F](ds, LoggerAdapter(log), cfg, attrStore)
|
||||
new Impl[F](binStore, attrStore)
|
||||
}
|
||||
|
||||
final private class Impl[F[_]](bs: BinaryStore[F], attrStore: AttributeStore[F])
|
||||
extends FileStore[F] {
|
||||
def find(id: Ident): OptionT[F, Stream[F, Byte]] =
|
||||
bs.findBinary(BinaryId(id.id), ByteRange.All)
|
||||
|
||||
def getBytes(id: Ident): Stream[F, Byte] =
|
||||
Stream.eval(find(id).value).unNoneTerminate.flatMap(identity)
|
||||
|
||||
def findMeta(id: Ident): OptionT[F, RFileMeta] =
|
||||
attrStore.findMeta(BinaryId(id.id))
|
||||
|
||||
def delete(id: Ident): F[Unit] =
|
||||
bs.delete(BinaryId(id.id))
|
||||
|
||||
def save(hint: MimeTypeHint): Pipe[F, Byte, Ident] =
|
||||
bs.insert(Hint(hint.filename, hint.advertised))
|
||||
.andThen(_.map(bid => Ident.unsafe(bid.id)))
|
||||
}
|
||||
|
||||
private object LoggerAdapter {
|
||||
def apply[F[_]](log: Logger[F]): binny.util.Logger[F] =
|
||||
new binny.util.Logger[F] {
|
||||
override def trace(msg: => String): F[Unit] = log.trace(msg)
|
||||
override def debug(msg: => String): F[Unit] = log.debug(msg)
|
||||
override def info(msg: => String): F[Unit] = log.info(msg)
|
||||
override def warn(msg: => String): F[Unit] = log.warn(msg)
|
||||
override def error(msg: => String): F[Unit] = log.error(msg)
|
||||
override def error(ex: Throwable)(msg: => String): F[Unit] = log.error(ex)(msg)
|
||||
}
|
||||
}
|
||||
|
||||
private object TikaContentTypeDetect extends ContentTypeDetect {
|
||||
override def detect(data: ByteVector, hint: Hint): SimpleContentType =
|
||||
SimpleContentType(
|
||||
TikaMimetype
|
||||
.detect(data, MimeTypeHint(hint.filename, hint.advertisedType))
|
||||
.asString
|
||||
)
|
||||
}
|
||||
}
|
@ -14,8 +14,10 @@ import docspell.common.syntax.all._
|
||||
import docspell.jsonminiq.JsonMiniQuery
|
||||
import docspell.notification.api.{ChannelType, EventType}
|
||||
import docspell.query.{ItemQuery, ItemQueryParser}
|
||||
import docspell.store.file.BinnyUtils
|
||||
import docspell.totp.Key
|
||||
|
||||
import binny.BinaryId
|
||||
import com.github.eikek.calev.CalEvent
|
||||
import doobie._
|
||||
import doobie.implicits.legacy.instant._
|
||||
@ -27,7 +29,7 @@ import scodec.bits.ByteVector
|
||||
|
||||
trait DoobieMeta extends EmilDoobieMeta {
|
||||
|
||||
implicit val sqlLogging = LogHandler {
|
||||
implicit val sqlLogging: LogHandler = LogHandler {
|
||||
case e @ Success(_, _, _, _) =>
|
||||
DoobieMeta.logger.trace("SQL " + e)
|
||||
case e =>
|
||||
@ -39,58 +41,64 @@ trait DoobieMeta extends EmilDoobieMeta {
|
||||
e.apply(a).noSpaces
|
||||
)
|
||||
|
||||
implicit val metaBinaryId: Meta[BinaryId] =
|
||||
Meta[String].timap(BinaryId.apply)(_.id)
|
||||
|
||||
implicit val metaFileKey: Meta[FileKey] =
|
||||
Meta[BinaryId].timap(BinnyUtils.unsafeBinaryIdToFileKey)(BinnyUtils.fileKeyToBinaryId)
|
||||
|
||||
implicit val metaAccountSource: Meta[AccountSource] =
|
||||
Meta[String].imap(AccountSource.unsafeFromString)(_.name)
|
||||
Meta[String].timap(AccountSource.unsafeFromString)(_.name)
|
||||
|
||||
implicit val metaDuration: Meta[Duration] =
|
||||
Meta[Long].imap(Duration.millis)(_.millis)
|
||||
Meta[Long].timap(Duration.millis)(_.millis)
|
||||
|
||||
implicit val metaCollectiveState: Meta[CollectiveState] =
|
||||
Meta[String].imap(CollectiveState.unsafe)(CollectiveState.asString)
|
||||
Meta[String].timap(CollectiveState.unsafe)(CollectiveState.asString)
|
||||
|
||||
implicit val metaUserState: Meta[UserState] =
|
||||
Meta[String].imap(UserState.unsafe)(UserState.asString)
|
||||
Meta[String].timap(UserState.unsafe)(UserState.asString)
|
||||
|
||||
implicit val metaPassword: Meta[Password] =
|
||||
Meta[String].imap(Password(_))(_.pass)
|
||||
Meta[String].timap(Password(_))(_.pass)
|
||||
|
||||
implicit val metaIdent: Meta[Ident] =
|
||||
Meta[String].imap(Ident.unsafe)(_.id)
|
||||
Meta[String].timap(Ident.unsafe)(_.id)
|
||||
|
||||
implicit val metaContactKind: Meta[ContactKind] =
|
||||
Meta[String].imap(ContactKind.unsafe)(_.asString)
|
||||
Meta[String].timap(ContactKind.unsafe)(_.asString)
|
||||
|
||||
implicit val metaTimestamp: Meta[Timestamp] =
|
||||
Meta[Instant].imap(Timestamp(_))(_.value)
|
||||
Meta[Instant].timap(Timestamp(_))(_.value)
|
||||
|
||||
implicit val metaJobState: Meta[JobState] =
|
||||
Meta[String].imap(JobState.unsafe)(_.name)
|
||||
Meta[String].timap(JobState.unsafe)(_.name)
|
||||
|
||||
implicit val metaDirection: Meta[Direction] =
|
||||
Meta[Boolean].imap(flag =>
|
||||
Meta[Boolean].timap(flag =>
|
||||
if (flag) Direction.Incoming: Direction else Direction.Outgoing: Direction
|
||||
)(d => Direction.isIncoming(d))
|
||||
|
||||
implicit val metaPriority: Meta[Priority] =
|
||||
Meta[Int].imap(Priority.fromInt)(Priority.toInt)
|
||||
Meta[Int].timap(Priority.fromInt)(Priority.toInt)
|
||||
|
||||
implicit val metaLogLevel: Meta[LogLevel] =
|
||||
Meta[String].imap(LogLevel.unsafeString)(_.name)
|
||||
Meta[String].timap(LogLevel.unsafeString)(_.name)
|
||||
|
||||
implicit val metaLenientUri: Meta[LenientUri] =
|
||||
Meta[String].imap(LenientUri.unsafe)(_.asString)
|
||||
Meta[String].timap(LenientUri.unsafe)(_.asString)
|
||||
|
||||
implicit val metaNodeType: Meta[NodeType] =
|
||||
Meta[String].imap(NodeType.unsafe)(_.name)
|
||||
Meta[String].timap(NodeType.unsafe)(_.name)
|
||||
|
||||
implicit val metaLocalDate: Meta[LocalDate] =
|
||||
Meta[String].imap(str => LocalDate.parse(str))(_.format(DateTimeFormatter.ISO_DATE))
|
||||
Meta[String].timap(str => LocalDate.parse(str))(_.format(DateTimeFormatter.ISO_DATE))
|
||||
|
||||
implicit val metaItemState: Meta[ItemState] =
|
||||
Meta[String].imap(ItemState.unsafe)(_.name)
|
||||
Meta[String].timap(ItemState.unsafe)(_.name)
|
||||
|
||||
implicit val metNerTag: Meta[NerTag] =
|
||||
Meta[String].imap(NerTag.unsafe)(_.name)
|
||||
Meta[String].timap(NerTag.unsafe)(_.name)
|
||||
|
||||
implicit val metaNerLabel: Meta[NerLabel] =
|
||||
jsonMeta[NerLabel]
|
||||
@ -108,7 +116,7 @@ trait DoobieMeta extends EmilDoobieMeta {
|
||||
jsonMeta[List[IdRef]]
|
||||
|
||||
implicit val metaLanguage: Meta[Language] =
|
||||
Meta[String].imap(Language.unsafe)(_.iso3)
|
||||
Meta[String].timap(Language.unsafe)(_.iso3)
|
||||
|
||||
implicit val metaCalEvent: Meta[CalEvent] =
|
||||
Meta[String].timap(CalEvent.unsafe)(_.asString)
|
||||
|
@ -11,7 +11,7 @@ import cats.effect.Async
|
||||
import cats.implicits._
|
||||
import cats.~>
|
||||
|
||||
import docspell.store.file.FileStore
|
||||
import docspell.store.file.FileRepository
|
||||
import docspell.store.migrate.FlywayMigrate
|
||||
import docspell.store.{AddResult, JdbcConfig, Store}
|
||||
|
||||
@ -19,7 +19,7 @@ import doobie._
|
||||
import doobie.implicits._
|
||||
|
||||
final class StoreImpl[F[_]: Async](
|
||||
val fileStore: FileStore[F],
|
||||
val fileRepo: FileRepository[F],
|
||||
jdbc: JdbcConfig,
|
||||
xa: Transactor[F]
|
||||
) extends Store[F] {
|
||||
@ -30,10 +30,10 @@ final class StoreImpl[F[_]: Async](
|
||||
def migrate: F[Int] =
|
||||
FlywayMigrate.run[F](jdbc).map(_.migrationsExecuted)
|
||||
|
||||
def transact[A](prg: doobie.ConnectionIO[A]): F[A] =
|
||||
def transact[A](prg: ConnectionIO[A]): F[A] =
|
||||
prg.transact(xa)
|
||||
|
||||
def transact[A](prg: fs2.Stream[doobie.ConnectionIO, A]): fs2.Stream[F, A] =
|
||||
def transact[A](prg: fs2.Stream[ConnectionIO, A]): fs2.Stream[F, A] =
|
||||
prg.transact(xa)
|
||||
|
||||
def add(insert: ConnectionIO[Int], exists: ConnectionIO[Boolean]): F[AddResult] =
|
||||
|
@ -40,7 +40,7 @@ object QAttachment {
|
||||
.evalSeq(store.transact(findPreview))
|
||||
.map(_.fileId)
|
||||
.evalTap(_ => store.transact(RAttachmentPreview.delete(attachId)))
|
||||
.evalMap(store.fileStore.delete)
|
||||
.evalMap(store.fileRepo.delete)
|
||||
.map(_ => 1)
|
||||
.compile
|
||||
.foldMonoid
|
||||
@ -68,7 +68,7 @@ object QAttachment {
|
||||
f <-
|
||||
Stream
|
||||
.emits(files._1)
|
||||
.evalMap(store.fileStore.delete)
|
||||
.evalMap(store.fileRepo.delete)
|
||||
.map(_ => 1)
|
||||
.compile
|
||||
.foldMonoid
|
||||
@ -91,7 +91,7 @@ object QAttachment {
|
||||
f <-
|
||||
Stream
|
||||
.emits(ra.fileId +: (s.map(_.fileId).toSeq ++ p.map(_.fileId).toSeq))
|
||||
.evalMap(store.fileStore.delete)
|
||||
.evalMap(store.fileRepo.delete)
|
||||
.map(_ => 1)
|
||||
.compile
|
||||
.foldMonoid
|
||||
@ -104,7 +104,7 @@ object QAttachment {
|
||||
_ <- OptionT.liftF(
|
||||
Stream
|
||||
.emit(aa.fileId)
|
||||
.evalMap(store.fileStore.delete)
|
||||
.evalMap(store.fileRepo.delete)
|
||||
.compile
|
||||
.drain
|
||||
)
|
||||
|
@ -15,7 +15,7 @@ import cats.implicits._
|
||||
import fs2.Stream
|
||||
|
||||
import docspell.common.syntax.all._
|
||||
import docspell.common.{IdRef, _}
|
||||
import docspell.common.{FileKey, IdRef, _}
|
||||
import docspell.query.ItemQuery
|
||||
import docspell.store.Store
|
||||
import docspell.store.qb.DSL._
|
||||
@ -470,7 +470,7 @@ object QItem {
|
||||
} yield tn + rn + n + mn + cf + im
|
||||
|
||||
private def findByFileIdsQuery(
|
||||
fileMetaIds: Nel[Ident],
|
||||
fileMetaIds: Nel[FileKey],
|
||||
states: Option[Nel[ItemState]]
|
||||
): Select.SimpleSelect = {
|
||||
val i = RItem.as("i")
|
||||
@ -490,7 +490,7 @@ object QItem {
|
||||
).distinct
|
||||
}
|
||||
|
||||
def findOneByFileIds(fileMetaIds: Seq[Ident]): ConnectionIO[Option[RItem]] =
|
||||
def findOneByFileIds(fileMetaIds: Seq[FileKey]): ConnectionIO[Option[RItem]] =
|
||||
Nel.fromList(fileMetaIds.toList) match {
|
||||
case Some(nel) =>
|
||||
findByFileIdsQuery(nel, None).limit(1).build.query[RItem].option
|
||||
@ -499,7 +499,7 @@ object QItem {
|
||||
}
|
||||
|
||||
def findByFileIds(
|
||||
fileMetaIds: Seq[Ident],
|
||||
fileMetaIds: Seq[FileKey],
|
||||
states: Nel[ItemState]
|
||||
): ConnectionIO[Vector[RItem]] =
|
||||
Nel.fromList(fileMetaIds.toList) match {
|
||||
@ -512,7 +512,7 @@ object QItem {
|
||||
def findByChecksum(
|
||||
checksum: String,
|
||||
collective: Ident,
|
||||
excludeFileMeta: Set[Ident]
|
||||
excludeFileMeta: Set[FileKey]
|
||||
): ConnectionIO[Vector[RItem]] = {
|
||||
val qq = findByChecksumQuery(checksum, collective, excludeFileMeta).build
|
||||
logger.debug(s"FindByChecksum: $qq")
|
||||
@ -522,7 +522,7 @@ object QItem {
|
||||
def findByChecksumQuery(
|
||||
checksum: String,
|
||||
collective: Ident,
|
||||
excludeFileMeta: Set[Ident]
|
||||
excludeFileMeta: Set[FileKey]
|
||||
): Select = {
|
||||
val m1 = RFileMeta.as("m1")
|
||||
val m2 = RFileMeta.as("m2")
|
||||
|
@ -10,7 +10,7 @@ import cats.data.NonEmptyList
|
||||
import cats.implicits._
|
||||
import fs2.Stream
|
||||
|
||||
import docspell.common._
|
||||
import docspell.common.{FileKey, _}
|
||||
import docspell.store.qb.DSL._
|
||||
import docspell.store.qb._
|
||||
|
||||
@ -20,7 +20,7 @@ import doobie.implicits._
|
||||
case class RAttachment(
|
||||
id: Ident,
|
||||
itemId: Ident,
|
||||
fileId: Ident,
|
||||
fileId: FileKey,
|
||||
position: Int,
|
||||
created: Timestamp,
|
||||
name: Option[String]
|
||||
@ -32,7 +32,7 @@ object RAttachment {
|
||||
|
||||
val id = Column[Ident]("attachid", this)
|
||||
val itemId = Column[Ident]("itemid", this)
|
||||
val fileId = Column[Ident]("filemetaid", this)
|
||||
val fileId = Column[FileKey]("filemetaid", this)
|
||||
val position = Column[Int]("position", this)
|
||||
val created = Column[Timestamp]("created", this)
|
||||
val name = Column[String]("name", this)
|
||||
@ -47,7 +47,7 @@ object RAttachment {
|
||||
DML.insert(
|
||||
T,
|
||||
T.all,
|
||||
fr"${v.id},${v.itemId},${v.fileId.id},${v.position},${v.created},${v.name}"
|
||||
fr"${v.id},${v.itemId},${v.fileId},${v.position},${v.created},${v.name}"
|
||||
)
|
||||
|
||||
def decPositions(iId: Ident, lowerBound: Int, upperBound: Int): ConnectionIO[Int] =
|
||||
@ -77,7 +77,7 @@ object RAttachment {
|
||||
|
||||
def updateFileIdAndName(
|
||||
attachId: Ident,
|
||||
fId: Ident,
|
||||
fId: FileKey,
|
||||
fname: Option[String]
|
||||
): ConnectionIO[Int] =
|
||||
DML.update(
|
||||
@ -88,7 +88,7 @@ object RAttachment {
|
||||
|
||||
def updateFileId(
|
||||
attachId: Ident,
|
||||
fId: Ident
|
||||
fId: FileKey
|
||||
): ConnectionIO[Int] =
|
||||
DML.update(
|
||||
T,
|
||||
@ -182,7 +182,7 @@ object RAttachment {
|
||||
def findByItemCollectiveSource(
|
||||
id: Ident,
|
||||
coll: Ident,
|
||||
fileIds: NonEmptyList[Ident]
|
||||
fileIds: NonEmptyList[FileKey]
|
||||
): ConnectionIO[Vector[RAttachment]] = {
|
||||
val i = RItem.as("i")
|
||||
val a = RAttachment.as("a")
|
||||
|
@ -8,7 +8,7 @@ package docspell.store.records
|
||||
|
||||
import cats.data.NonEmptyList
|
||||
|
||||
import docspell.common._
|
||||
import docspell.common.{FileKey, _}
|
||||
import docspell.store.qb.DSL._
|
||||
import docspell.store.qb.TableDef
|
||||
import docspell.store.qb._
|
||||
@ -21,7 +21,7 @@ import doobie.implicits._
|
||||
*/
|
||||
case class RAttachmentArchive(
|
||||
id: Ident, // same as RAttachment.id
|
||||
fileId: Ident,
|
||||
fileId: FileKey,
|
||||
name: Option[String],
|
||||
messageId: Option[String],
|
||||
created: Timestamp
|
||||
@ -32,7 +32,7 @@ object RAttachmentArchive {
|
||||
val tableName = "attachment_archive"
|
||||
|
||||
val id = Column[Ident]("id", this)
|
||||
val fileId = Column[Ident]("file_id", this)
|
||||
val fileId = Column[FileKey]("file_id", this)
|
||||
val name = Column[String]("filename", this)
|
||||
val messageId = Column[String]("message_id", this)
|
||||
val created = Column[Timestamp]("created", this)
|
||||
@ -59,7 +59,7 @@ object RAttachmentArchive {
|
||||
def delete(attachId: Ident): ConnectionIO[Int] =
|
||||
DML.delete(T, T.id === attachId)
|
||||
|
||||
def deleteAll(fId: Ident): ConnectionIO[Int] =
|
||||
def deleteAll(fId: FileKey): ConnectionIO[Int] =
|
||||
DML.delete(T, T.fileId === fId)
|
||||
|
||||
def findByIdAndCollective(
|
||||
|
@ -8,7 +8,7 @@ package docspell.store.records
|
||||
|
||||
import cats.data.NonEmptyList
|
||||
|
||||
import docspell.common._
|
||||
import docspell.common.{FileKey, _}
|
||||
import docspell.store.qb.DSL._
|
||||
import docspell.store.qb._
|
||||
|
||||
@ -20,7 +20,7 @@ import doobie.implicits._
|
||||
*/
|
||||
case class RAttachmentPreview(
|
||||
id: Ident, // same as RAttachment.id
|
||||
fileId: Ident,
|
||||
fileId: FileKey,
|
||||
name: Option[String],
|
||||
created: Timestamp
|
||||
)
|
||||
@ -30,7 +30,7 @@ object RAttachmentPreview {
|
||||
val tableName = "attachment_preview"
|
||||
|
||||
val id = Column[Ident]("id", this)
|
||||
val fileId = Column[Ident]("file_id", this)
|
||||
val fileId = Column[FileKey]("file_id", this)
|
||||
val name = Column[String]("filename", this)
|
||||
val created = Column[Timestamp]("created", this)
|
||||
|
||||
|
@ -8,7 +8,7 @@ package docspell.store.records
|
||||
|
||||
import cats.data.NonEmptyList
|
||||
|
||||
import docspell.common._
|
||||
import docspell.common.{FileKey, _}
|
||||
import docspell.store.qb.DSL._
|
||||
import docspell.store.qb._
|
||||
|
||||
@ -20,7 +20,7 @@ import doobie.implicits._
|
||||
*/
|
||||
case class RAttachmentSource(
|
||||
id: Ident, // same as RAttachment.id
|
||||
fileId: Ident,
|
||||
fileId: FileKey,
|
||||
name: Option[String],
|
||||
created: Timestamp
|
||||
)
|
||||
@ -30,7 +30,7 @@ object RAttachmentSource {
|
||||
val tableName = "attachment_source"
|
||||
|
||||
val id = Column[Ident]("id", this)
|
||||
val fileId = Column[Ident]("file_id", this)
|
||||
val fileId = Column[FileKey]("file_id", this)
|
||||
val name = Column[String]("filename", this)
|
||||
val created = Column[Timestamp]("created", this)
|
||||
|
||||
@ -50,7 +50,7 @@ object RAttachmentSource {
|
||||
def findById(attachId: Ident): ConnectionIO[Option[RAttachmentSource]] =
|
||||
run(select(T.all), from(T), T.id === attachId).query[RAttachmentSource].option
|
||||
|
||||
def isSameFile(attachId: Ident, file: Ident): ConnectionIO[Boolean] =
|
||||
def isSameFile(attachId: Ident, file: FileKey): ConnectionIO[Boolean] =
|
||||
Select(count(T.id).s, from(T), T.id === attachId && T.fileId === file).build
|
||||
.query[Int]
|
||||
.unique
|
||||
|
@ -21,7 +21,7 @@ final case class RClassifierModel(
|
||||
id: Ident,
|
||||
cid: Ident,
|
||||
name: String,
|
||||
fileId: Ident,
|
||||
fileId: FileKey,
|
||||
created: Timestamp
|
||||
) {}
|
||||
|
||||
@ -30,7 +30,7 @@ object RClassifierModel {
|
||||
def createNew[F[_]: Sync](
|
||||
cid: Ident,
|
||||
name: String,
|
||||
fileId: Ident
|
||||
fileId: FileKey
|
||||
): F[RClassifierModel] =
|
||||
for {
|
||||
id <- Ident.randomId[F]
|
||||
@ -43,7 +43,7 @@ object RClassifierModel {
|
||||
val id = Column[Ident]("id", this)
|
||||
val cid = Column[Ident]("cid", this)
|
||||
val name = Column[String]("name", this)
|
||||
val fileId = Column[Ident]("file_id", this)
|
||||
val fileId = Column[FileKey]("file_id", this)
|
||||
val created = Column[Timestamp]("created", this)
|
||||
|
||||
val all = NonEmptyList.of[Column[_]](id, cid, name, fileId, created)
|
||||
@ -61,7 +61,7 @@ object RClassifierModel {
|
||||
fr"${v.id},${v.cid},${v.name},${v.fileId},${v.created}"
|
||||
)
|
||||
|
||||
def updateFile(coll: Ident, name: String, fid: Ident): ConnectionIO[Int] =
|
||||
def updateFile(coll: Ident, name: String, fid: FileKey): ConnectionIO[Int] =
|
||||
for {
|
||||
now <- Timestamp.current[ConnectionIO]
|
||||
n <- DML.update(
|
||||
|
@ -9,7 +9,7 @@ package docspell.store.records
|
||||
import cats.data.NonEmptyList
|
||||
import cats.implicits._
|
||||
|
||||
import docspell.common._
|
||||
import docspell.common.{FileKey, _}
|
||||
import docspell.store.qb.DSL._
|
||||
import docspell.store.qb._
|
||||
|
||||
@ -18,7 +18,7 @@ import doobie.implicits._
|
||||
import scodec.bits.ByteVector
|
||||
|
||||
final case class RFileMeta(
|
||||
id: Ident,
|
||||
id: FileKey,
|
||||
created: Timestamp,
|
||||
mimetype: MimeType,
|
||||
length: ByteSize,
|
||||
@ -29,7 +29,7 @@ object RFileMeta {
|
||||
final case class Table(alias: Option[String]) extends TableDef {
|
||||
val tableName = "filemeta"
|
||||
|
||||
val id = Column[Ident]("file_id", this)
|
||||
val id = Column[FileKey]("file_id", this)
|
||||
val timestamp = Column[Timestamp]("created", this)
|
||||
val mimetype = Column[MimeType]("mimetype", this)
|
||||
val length = Column[ByteSize]("length", this)
|
||||
@ -47,10 +47,10 @@ object RFileMeta {
|
||||
def insert(r: RFileMeta): ConnectionIO[Int] =
|
||||
DML.insert(T, T.all, fr"${r.id},${r.created},${r.mimetype},${r.length},${r.checksum}")
|
||||
|
||||
def findById(fid: Ident): ConnectionIO[Option[RFileMeta]] =
|
||||
def findById(fid: FileKey): ConnectionIO[Option[RFileMeta]] =
|
||||
run(select(T.all), from(T), T.id === fid).query[RFileMeta].option
|
||||
|
||||
def findByIds(ids: List[Ident]): ConnectionIO[Vector[RFileMeta]] =
|
||||
def findByIds(ids: List[FileKey]): ConnectionIO[Vector[RFileMeta]] =
|
||||
NonEmptyList.fromList(ids) match {
|
||||
case Some(nel) =>
|
||||
run(select(T.all), from(T), T.id.in(nel)).query[RFileMeta].to[Vector]
|
||||
@ -58,11 +58,11 @@ object RFileMeta {
|
||||
Vector.empty[RFileMeta].pure[ConnectionIO]
|
||||
}
|
||||
|
||||
def findMime(fid: Ident): ConnectionIO[Option[MimeType]] =
|
||||
def findMime(fid: FileKey): ConnectionIO[Option[MimeType]] =
|
||||
run(select(T.mimetype), from(T), T.id === fid)
|
||||
.query[MimeType]
|
||||
.option
|
||||
|
||||
def delete(id: Ident): ConnectionIO[Int] =
|
||||
def delete(id: FileKey): ConnectionIO[Int] =
|
||||
DML.delete(T, T.id === id)
|
||||
}
|
||||
|
@ -11,7 +11,7 @@ import javax.sql.DataSource
|
||||
import cats.effect._
|
||||
|
||||
import docspell.common.LenientUri
|
||||
import docspell.store.file.FileStore
|
||||
import docspell.store.file.FileRepository
|
||||
import docspell.store.impl.StoreImpl
|
||||
import docspell.store.migrate.FlywayMigrate
|
||||
|
||||
@ -67,7 +67,8 @@ object StoreFixture {
|
||||
for {
|
||||
ds <- dataSource(jdbc)
|
||||
xa <- makeXA(ds)
|
||||
store = new StoreImpl[IO](FileStore[IO](xa, ds, 64 * 1024), jdbc, xa)
|
||||
fr = FileRepository.genericJDBC[IO](xa, ds, 64 * 1024)
|
||||
store = new StoreImpl[IO](fr, jdbc, xa)
|
||||
_ <- Resource.eval(store.migrate)
|
||||
} yield store
|
||||
}
|
||||
|
@ -282,7 +282,8 @@ object Dependencies {
|
||||
|
||||
val binny = Seq(
|
||||
"com.github.eikek" %% "binny-core" % BinnyVersion,
|
||||
"com.github.eikek" %% "binny-jdbc" % BinnyVersion
|
||||
"com.github.eikek" %% "binny-jdbc" % BinnyVersion,
|
||||
"com.github.eikek" %% "binny-minio" % BinnyVersion
|
||||
)
|
||||
|
||||
// https://github.com/flyway/flyway
|
||||
|
Loading…
Reference in New Issue
Block a user