Files
myscripts/pdt2txt.sh
stubbfel 1aa14e5344 init
2013-06-30 21:56:23 +02:00

13 lines
271 B
Bash
Executable File

#!/bin/bash
#
# OCR one or more PDF files into plain text.
#
# Usage: pdt2txt.sh FILE.pdf...
#
# Every FILE is split into single-page PDFs (pdfseparate), each page is
# rasterised to a PNG (ImageMagick convert) and recognised with tesseract
# using the English and German language data. The per-page text is
# concatenated in page order into "FILE.txt".

#######################################
# OCR a single PDF into "<pdf>.txt".
# The body runs in a subshell so the EXIT trap can remove the scratch
# directory on every exit path without touching the caller's traps.
# Arguments: $1 - path to the PDF
# Outputs:   writes "<pdf>.txt"; diagnostics go to stderr
# Returns:   0 if every page was converted, 1 otherwise
#######################################
ocr_pdf() (
  pdf=$1
  # A leading '-' would be taken for an option by the tools called below.
  [[ $pdf == -* ]] && pdf=./$pdf

  # Private scratch directory: intermediate files never collide with (or
  # delete) anything in the current directory.
  workdir=$(mktemp -d) || exit 1
  trap 'rm -rf -- "$workdir"' EXIT

  pdfseparate "$pdf" "$workdir/page-%d.pdf" || exit 1

  status=0
  texts=()
  page=1
  # Walk the pages by number instead of by glob: glob expansion sorts
  # lexically (1, 10, 11, 2, ...) and would scramble documents that have
  # ten or more pages.
  while [[ -f "$workdir/page-$page.pdf" ]]; do
    page_pdf="$workdir/page-$page.pdf"
    if convert -monochrome -normalize -density 300 "$page_pdf" "$page_pdf.png" \
      && tesseract "$page_pdf.png" "$page_pdf" -l eng+deu; then
      # tesseract appends ".txt" to the output base name it is given.
      texts+=("$page_pdf.txt")
    else
      printf 'warning: page %d of %s could not be converted, skipping\n' \
        "$page" "$pdf" >&2
      status=1
    fi
    page=$((page + 1))
  done

  # Do not create (or truncate) the output when nothing was recognised.
  (( ${#texts[@]} > 0 )) || exit 1

  cat -- "${texts[@]}" > "$pdf.txt" || exit 1
  exit "$status"
)

#######################################
# Convert every PDF given on the command line.
# Arguments: $@ - paths of the PDFs to convert
# Returns:   0 if all files were converted, 1 if any of them failed
#######################################
main() {
  local pdf status=0

  for pdf in "$@"; do
    if ! ocr_pdf "$pdf"; then
      printf 'error: conversion of %s failed or was incomplete\n' "$pdf" >&2
      status=1
    fi
  done

  return "$status"
}

main "$@"