You cannot select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

100 lines
2.3 KiB
Bash

#!/bin/bash
set -euo pipefail
help_message="$(cat <<END
usage: $(basename "$0") [OPTIONS...] INPUT_PDF OUTPUT_PDF
Converts a PDF file to a series of JPEG images using convert to reduce the quality
and then merges back the result in a single pdf
Options:
-q, --quality Set the JPEG quality (default: 75)
-v, --verbose Enable verbose output, also shows an estimate of remaining time
-h, --help Display this help message
END
)"
function show_usage() {
echo "$help_message"
exit 1
}
quality=75
verbose=false
while [[ $# -gt 0 ]]
do
key="$1"
case $key in
-q|--quality)
quality="$2"
shift # past argument
shift # past value
;;
-v|--verbose)
verbose=true
shift # past argument
;;
-h|--help)
show_usage
;;
-*)
echo "Unknown option: $key"
show_usage
;;
*)
break
;;
esac
done
if [ -z "$1" ] || [ -z "$2" ]; then
show_usage
fi
input_file="$1"
output_file="$2"
temp_pages_dir="$(mktemp -d)"
function logf {
if [ "$verbose" = true ]; then
printf "$@"
fi
}
logf "Converting \"$input_file\" to \"$output_file\"\n"
page_count=$(pdfinfo "$input_file" | grep Pages | awk '{print $2}')
logf "Processing $page_count pages\n"
start=$(date +%s.%N)
for i in $(seq 0 $((page_count-1))); do
iter_start=$(date +%s.%N)
# convert -density 300 -quality "$quality" "${input_file}[$i]" "$temp_pages_dir/$i.jpg"
# Equivalent "gs" command that avoids convert's security policies
gs -sDEVICE=jpeg -o "$temp_pages_dir/$i.jpg" -dFirstPage="$i" -dLastPage="$i" -dJPEGQ="$quality" -r300x300 "$input_file"
# Compute estimated remaining time
end=$(date +%s.%N)
elapsed=$(echo "$end - $start" | bc)
iter_elapsed=$(echo "$end - $iter_start" | bc)
remaining=$(echo "($elapsed / ($i + 1)) * ($page_count - $i)" | bc)
remaining_fmt=$(printf "%02d:%02d:%02d" $((remaining/3600)) $((remaining/60)) $((remaining%60)))
logf "Compressed page $((i+1)) in $(printf '%.2f' "$iter_elapsed")s (estimated remaining time $remaining_fmt)\n"
done
logf "Merging compressed pages to a single PDF\n"
convert "$temp_pages_dir"/*.jpg "$output_file"
rm -r "$temp_pages_dir"
logf "Done\n"