Remove --force-ocr so that only scanned documents are OCRed
This commit is contained in:
parent
e1d64e8bbc
commit
f52bd317a1
1 changed file with 1 addition and 1 deletion
|
@@ -4,7 +4,7 @@ DOKUMENT_DIR=/home/simono41/data1/Dokumente
|
|||
|
||||
find ${DOKUMENT_DIR} -path ${DOKUMENT_DIR}/.stversions -prune -type f -o -name "*.pdf" ! -name '*-ocr.pdf' -print | while read file; do
|
||||
if ! [ -f "${file%.*}-ocr.pdf" ]; then
|
||||
ocrmypdf -l deu --force-ocr --jbig2-lossy "${file}" "${file%.*}-ocr.pdf"
|
||||
ocrmypdf -l deu+eng -c --jbig2-lossy --tesseract-timeout 60 "${file}" "${file%.*}-ocr.pdf"
|
||||
sleep 1
|
||||
else
|
||||
echo "Datei wurde bereits verarbeitet"
|
||||
|
|
Loading…
Reference in a new issue