mirror of
https://github.com/TheAnachronism/docspell.git
synced 2025-04-05 10:59:33 +00:00
Use fs2 Files api
This commit is contained in:
parent
bd791b4593
commit
02b8078f01
@ -1,91 +1,47 @@
|
|||||||
package docspell.common
|
package docspell.common
|
||||||
|
|
||||||
import java.io.IOException
|
import java.nio.file.Path
|
||||||
import java.nio.file.attribute.BasicFileAttributes
|
|
||||||
import java.nio.file.{Files => JFiles, _}
|
|
||||||
import java.util.concurrent.atomic.AtomicInteger
|
|
||||||
|
|
||||||
import scala.jdk.CollectionConverters._
|
|
||||||
|
|
||||||
|
import cats.FlatMap
|
||||||
|
import cats.Monad
|
||||||
import cats.effect._
|
import cats.effect._
|
||||||
import cats.implicits._
|
import cats.implicits._
|
||||||
|
import fs2.Stream
|
||||||
import fs2.io.file.Files
|
import fs2.io.file.Files
|
||||||
import fs2.{Chunk, Stream}
|
|
||||||
|
|
||||||
import docspell.common.syntax.all._
|
import docspell.common.syntax.all._
|
||||||
|
|
||||||
import io.circe.Decoder
|
import io.circe.Decoder
|
||||||
import scodec.bits.ByteVector
|
|
||||||
//TODO use io.fs2.files.Files api
|
|
||||||
object File {
|
object File {
|
||||||
|
|
||||||
def mkDir[F[_]: Sync](dir: Path): F[Path] =
|
def mkDir[F[_]: Files](dir: Path): F[Path] =
|
||||||
Sync[F].blocking(JFiles.createDirectories(dir))
|
Files[F].createDirectories(dir)
|
||||||
|
|
||||||
def mkTempDir[F[_]: Sync](parent: Path, prefix: String): F[Path] =
|
def exists[F[_]: Files](file: Path): F[Boolean] =
|
||||||
mkDir(parent).map(p => JFiles.createTempDirectory(p, prefix))
|
Files[F].exists(file)
|
||||||
|
|
||||||
def mkTempFile[F[_]: Sync](
|
def size[F[_]: Files](file: Path): F[Long] =
|
||||||
parent: Path,
|
Files[F].size(file)
|
||||||
prefix: String,
|
|
||||||
suffix: Option[String] = None
|
|
||||||
): F[Path] =
|
|
||||||
mkDir(parent).map(p => JFiles.createTempFile(p, prefix, suffix.orNull))
|
|
||||||
|
|
||||||
def deleteDirectory[F[_]: Sync](dir: Path): F[Int] =
|
def existsNonEmpty[F[_]: Files: Monad](file: Path, minSize: Long = 0): F[Boolean] =
|
||||||
Sync[F].delay {
|
exists[F](file).flatMap(b => if (b) size[F](file).map(_ > minSize) else false.pure[F])
|
||||||
val count = new AtomicInteger(0)
|
|
||||||
JFiles.walkFileTree(
|
|
||||||
dir,
|
|
||||||
new SimpleFileVisitor[Path]() {
|
|
||||||
override def visitFile(
|
|
||||||
file: Path,
|
|
||||||
attrs: BasicFileAttributes
|
|
||||||
): FileVisitResult = {
|
|
||||||
JFiles.deleteIfExists(file)
|
|
||||||
count.incrementAndGet()
|
|
||||||
FileVisitResult.CONTINUE
|
|
||||||
}
|
|
||||||
override def postVisitDirectory(dir: Path, e: IOException): FileVisitResult =
|
|
||||||
Option(e) match {
|
|
||||||
case Some(ex) => throw ex
|
|
||||||
case None =>
|
|
||||||
JFiles.deleteIfExists(dir)
|
|
||||||
FileVisitResult.CONTINUE
|
|
||||||
}
|
|
||||||
}
|
|
||||||
)
|
|
||||||
count.get
|
|
||||||
}
|
|
||||||
|
|
||||||
def exists[F[_]: Sync](file: Path): F[Boolean] =
|
def delete[F[_]: Files: FlatMap](path: Path): F[Unit] =
|
||||||
Sync[F].delay(JFiles.exists(file))
|
for {
|
||||||
|
isDir <- Files[F].isDirectory(path)
|
||||||
|
_ <-
|
||||||
|
if (isDir) Files[F].deleteDirectoryRecursively(path)
|
||||||
|
else Files[F].deleteIfExists(path)
|
||||||
|
} yield ()
|
||||||
|
|
||||||
def size[F[_]: Sync](file: Path): F[Long] =
|
def withTempDir[F[_]: Files](parent: Path, prefix: String): Resource[F, Path] =
|
||||||
Sync[F].delay(JFiles.size(file))
|
Resource
|
||||||
|
.eval(mkDir[F](parent))
|
||||||
|
.flatMap(_ => Files[F].tempDirectory(parent.some, prefix))
|
||||||
|
|
||||||
def existsNonEmpty[F[_]: Sync](file: Path, minSize: Long = 0): F[Boolean] =
|
def listFiles[F[_]: Files](pred: Path => Boolean, dir: Path): Stream[F, Path] =
|
||||||
Sync[F].delay(JFiles.exists(file) && JFiles.size(file) > minSize)
|
Files[F].directoryStream(dir, pred)
|
||||||
|
|
||||||
def deleteFile[F[_]: Sync](file: Path): F[Unit] =
|
|
||||||
Sync[F].delay(JFiles.deleteIfExists(file)).map(_ => ())
|
|
||||||
|
|
||||||
def delete[F[_]: Sync](path: Path): F[Int] =
|
|
||||||
if (JFiles.isDirectory(path)) deleteDirectory(path)
|
|
||||||
else deleteFile(path).map(_ => 1)
|
|
||||||
|
|
||||||
def withTempDir[F[_]: Sync](parent: Path, prefix: String): Resource[F, Path] =
|
|
||||||
Resource.make(mkTempDir(parent, prefix))(p => delete(p).map(_ => ()))
|
|
||||||
|
|
||||||
def listJFiles[F[_]: Sync](pred: Path => Boolean, dir: Path): F[List[Path]] =
|
|
||||||
Sync[F].delay {
|
|
||||||
val javaList =
|
|
||||||
JFiles
|
|
||||||
.list(dir)
|
|
||||||
.filter(p => pred(p))
|
|
||||||
.collect(java.util.stream.Collectors.toList())
|
|
||||||
javaList.asScala.toList.sortBy(_.getFileName.toString)
|
|
||||||
}
|
|
||||||
|
|
||||||
def readAll[F[_]: Files](
|
def readAll[F[_]: Files](
|
||||||
file: Path,
|
file: Path,
|
||||||
@ -97,17 +53,13 @@ object File {
|
|||||||
readAll[F](file, 8192).through(fs2.text.utf8Decode).compile.foldMonoid
|
readAll[F](file, 8192).through(fs2.text.utf8Decode).compile.foldMonoid
|
||||||
|
|
||||||
def writeString[F[_]: Files: Concurrent](file: Path, content: String): F[Path] =
|
def writeString[F[_]: Files: Concurrent](file: Path, content: String): F[Path] =
|
||||||
ByteVector.encodeUtf8(content) match {
|
Stream
|
||||||
case Right(bv) =>
|
.emit(content)
|
||||||
Stream
|
.through(fs2.text.utf8Encode)
|
||||||
.chunk(Chunk.byteVector(bv))
|
.through(Files[F].writeAll(file))
|
||||||
.through(Files[F].writeAll(file))
|
.compile
|
||||||
.compile
|
.drain
|
||||||
.drain
|
.map(_ => file)
|
||||||
.map(_ => file)
|
|
||||||
case Left(ex) =>
|
|
||||||
Concurrent[F].raiseError(ex)
|
|
||||||
}
|
|
||||||
|
|
||||||
def readJson[F[_]: Async, A](file: Path)(implicit d: Decoder[A]): F[A] =
|
def readJson[F[_]: Async, A](file: Path)(implicit d: Decoder[A]): F[A] =
|
||||||
readText[F](file).map(_.parseJsonAs[A]).rethrow
|
readText[F](file).map(_.parseJsonAs[A]).rethrow
|
||||||
|
@ -80,8 +80,7 @@ object Ocr {
|
|||||||
)
|
)
|
||||||
SystemCommand
|
SystemCommand
|
||||||
.execSuccess(cmd, logger, wd = Some(wd), stdin = pdf)
|
.execSuccess(cmd, logger, wd = Some(wd), stdin = pdf)
|
||||||
.evalMap(_ => File.listJFiles(pathEndsWith(".tif"), wd))
|
.flatMap(_ => File.listFiles(pathEndsWith(".tif"), wd))
|
||||||
.flatMap(fs => Stream.emits(fs))
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/** Run ghostscript to extract all pdf pages into tiff files. The
|
/** Run ghostscript to extract all pdf pages into tiff files. The
|
||||||
@ -101,8 +100,7 @@ object Ocr {
|
|||||||
)
|
)
|
||||||
SystemCommand
|
SystemCommand
|
||||||
.execSuccess[F](cmd, logger, wd = Some(wd))
|
.execSuccess[F](cmd, logger, wd = Some(wd))
|
||||||
.evalMap(_ => File.listJFiles(pathEndsWith(".tif"), wd))
|
.flatMap(_ => File.listFiles(pathEndsWith(".tif"), wd))
|
||||||
.flatMap(fs => Stream.emits(fs))
|
|
||||||
}
|
}
|
||||||
|
|
||||||
private def pathEndsWith(ext: String): Path => Boolean =
|
private def pathEndsWith(ext: String): Path => Boolean =
|
||||||
|
Loading…
x
Reference in New Issue
Block a user