#!/usr/bin/env bash # This script watches a directory for new files and uploads them to # docspell. Or it uploads all files currently in the directory. # # It requires inotifywait, curl and sha256sum if the `-m' option is # used. # saner programming env: these switches turn some bugs into errors set -o errexit -o pipefail -o noclobber -o nounset CURL_CMD="curl" INOTIFY_CMD="inotifywait" SHA256_CMD="sha256sum" MKTEMP_CMD="mktemp" ! getopt --test > /dev/null if [[ ${PIPESTATUS[0]} -ne 4 ]]; then echo 'I’m sorry, `getopt --test` failed in this environment.' exit 1 fi OPTIONS=omhdp:vr LONGOPTS=once,distinct,help,delete,path:,verbose,recursive,dry ! PARSED=$(getopt --options=$OPTIONS --longoptions=$LONGOPTS --name "$0" -- "$@") if [[ ${PIPESTATUS[0]} -ne 0 ]]; then # e.g. return value is 1 # then getopt has complained about wrong arguments to stdout exit 2 fi # read getopt’s output this way to handle the quoting right: eval set -- "$PARSED" declare -a watchdir help=n verbose=n delete=n once=n distinct=n recursive=n dryrun=n while true; do case "$1" in -h|--help) help=y shift ;; -v|--verbose) verbose=y shift ;; -d|--delete) delete=y shift ;; -o|--once) once=y shift ;; -p|--path) watchdir+=("$2") shift 2 ;; -m|--distinct) distinct=y shift ;; -r|--recursive) recursive=y shift ;; --dry) dryrun=y shift ;; --) shift break ;; *) echo "Programming error" exit 3 ;; esac done showUsage() { echo "Upload files in a directory" echo "" echo "Usage: $0 [options] url url ..." echo echo "Options:" echo " -v | --verbose Print more to stdout. (value: $verbose)" echo " -d | --delete Delete the file if successfully uploaded. (value: $delete)" echo " -p | --path The directories to watch. This is required. (value: ${watchdir[@]})" echo " -h | --help Prints this help text. (value: $help)" echo " -m | --distinct Optional. Upload only if the file doesn't already exist. (value: $distinct)" echo " -o | --once Instead of watching, upload all files in that dir. (value: $once)" echo " -r | --recursive Traverse the directory(ies) recursively (value: $recursive)" echo " --dry Do a 'dry run', not uploading anything only printing to stdout (value: $dryrun)" echo "" echo "Arguments:" echo " A list of URLs to upload the files to." echo "" echo "Example: Watch directory" echo "$0 --path ~/Downloads -m -dv http://localhost:7880/api/v1/open/upload/item/abcde-12345-abcde-12345" echo "" echo "Example: Upload all files in a directory" echo "$0 --path ~/Downloads -m -dv --once http://localhost:7880/api/v1/open/upload/item/abcde-12345-abcde-12345" echo "" } if [ "$help" = "y" ]; then showUsage exit 0 fi # handle non-option arguments if [[ $# -eq 0 ]]; then echo "$0: No upload URLs given." exit 4 fi urls=$@ if [ ! -d "$watchdir" ]; then echo "The path '$watchdir' is not a directory." exit 4 fi trace() { if [ "$verbose" = "y" ]; then echo "$1" fi } info() { echo $1 } upload() { if [ "$dryrun" = "y" ]; then info "Not uploading (dry-run) $1 to $2" else tf=$($MKTEMP_CMD) rc=0 $CURL_CMD -# -o "$tf" --stderr "$tf" -w "%{http_code}" -XPOST -F file=@"$1" "$2" | (2>&1 1>/dev/null grep 200) rc=$(expr $rc + $?) cat $tf | (2>&1 1>/dev/null grep '{"success":true') rc=$(expr $rc + $?) if [ $rc -ne 0 ]; then info "Upload failed. Exit code: $rc" cat "$tf" echo "" rm "$tf" return $rc else rm "$tf" return 0 fi fi } checksum() { $SHA256_CMD "$1" | cut -d' ' -f1 | xargs } checkFile() { local url=$(echo "$1" | sed 's,upload/item,checkfile,g') local file="$2" trace "Check file: $url/$(checksum "$file")" $CURL_CMD -XGET -s "$url/$(checksum "$file")" | (2>&1 1>/dev/null grep '"exists":true') } process() { file="$1" info "---- Processing $file ----------" declare -i curlrc=0 set +e for url in $urls; do if [ "$distinct" = "y" ]; then trace "- Checking if $file has been uploaded to $url already" checkFile "$url" "$file" if [ $? -eq 0 ]; then info "- Skipping file '$file' because it has been uploaded in the past." continue fi fi trace "- Uploading '$file' to '$url'." upload "$file" "$url" rc=$? curlrc=$(expr $curlrc + $rc) if [ $rc -ne 0 ]; then trace "Upload to '$url' failed!" fi done set -e if [ $curlrc -ne 0 ]; then info "-> Some uploads failed." else trace "= File processed for all URLs" if [ "$delete" = "y" ]; then info "- Deleting file '$file'" set +e rm "$file" if [ $? -ne 0 ]; then info "- Deleting failed!" fi set -e fi fi } if [ "$once" = "y" ]; then info "Uploading all files in '$watchdir'." MD="-maxdepth 1" if [ "$recursive" = "y" ]; then MD="" fi for dir in "${watchdir[@]}"; do find "$dir" $MD -type f -print0 | while IFS= read -d '' -r file; do process "$file" done done else REC="" if [ "$recursive" = "y" ]; then REC="-r" fi $INOTIFY_CMD $REC -m "${watchdir[@]}" -e close_write -e moved_to | while read path action file; do trace "The file '$file' appeared in directory '$path' via '$action'" sleep 1 process "$path$file" done fi