From dcc57688685a4f75e4dec7caf5c2322f9137d35d Mon Sep 17 00:00:00 2001
From: Jan Jambor
Date: Wed, 12 Mar 2025 16:21:43 +0100
Subject: [PATCH] new: add ocr.bash script to streamline ocr file creation.

---
 resources/scripts/ocr.bash | 39 +++++++++++++++++++++++++++++++++++++++
 1 file changed, 39 insertions(+)
 create mode 100755 resources/scripts/ocr.bash

diff --git a/resources/scripts/ocr.bash b/resources/scripts/ocr.bash
new file mode 100755
index 0000000..e1cfa2b
--- /dev/null
+++ b/resources/scripts/ocr.bash
@@ -0,0 +1,39 @@
+#!/usr/bin/env bash
+
+# OCR one or more PDFs with ocrmypdf.
+#
+# Usage: ocr.bash input.pdf [more.pdf ...]
+#
+# For each argument ending in .pdf, writes <name>-ocr.pdf next to the
+# input. Arguments without a .pdf suffix are skipped. Exits non-zero if
+# no arguments are given or if ocrmypdf fails for any file.
+
+if [ $# -eq 0 ]; then
+  echo "Usage: $(basename "$0") input.pdf [more.pdf ...]" >&2
+  exit 1
+fi
+
+status=0
+
+for f in "$@"; do
+  # Make sure it's a PDF
+  if [[ "$f" == *.pdf ]]; then
+    dir=$(dirname -- "$f")
+    base=$(basename -- "$f" .pdf)
+    out="${dir}/${base}-ocr.pdf"
+
+    echo "Processing $f -> $out"
+    # Only report success when ocrmypdf actually succeeded; keep going
+    # with the remaining files and remember the failure for the exit code.
+    if ocrmypdf --redo-ocr -- "$f" "$out"; then
+      echo "Created: $out"
+    else
+      echo "Failed: $f" >&2
+      status=1
+    fi
+  else
+    echo "Skipping non-PDF file: $f"
+  fi
+done
+
+exit "$status"