diff options
Diffstat (limited to 'ocr-scan')
-rwxr-xr-x | ocr-scan | 20 |
1 file changed, 20 insertions, 0 deletions
#!/bin/bash
#
# ocr-scan - batch-scan pages, OCR each one and keep a compressed JPEG copy.
#
# Usage: ocr-scan [--pdf]
#   --pdf   additionally bundle this run's JPEGs into <timestamp>.pdf and
#           delete the individual JPEGs once the PDF has been written.
#
# Uses scanimage, unpaper, tesseract and ImageMagick's convert. All files are
# read from and written to the current directory. Per page the script
# produces <timestamp>_NNN.txt (OCR text) and <timestamp>_NNN.jpg.
#
# NOTE: strict mode (set -e) is deliberately not enabled; the exit status of
# scanimage at the end of a batch is not relied upon, the script simply
# processes whatever out<N>.pnm files exist afterwards.

# JPEG settings shared by the per-page images and the optional PDF.
jpeg_quality=70
jpeg_size=1500x1500

#######################################
# OCR one scanned page and convert it to JPEG.
# Globals:   jpeg_size, jpeg_quality (read)
# Arguments: $1 - scanned image file (e.g. out1.pnm)
#            $2 - output base name, without extension
# Returns:   status of the JPEG conversion / cleanup step
#######################################
process_page() {
  local img=$1 base=$2
  local cleaned="unpaper-$img"
  local ocr_input=$cleaned

  # Drop any leftover from an earlier, failed run so the OCR step can never
  # pick up a stale cleaned-up page instead of the one just scanned.
  rm -f -- "$cleaned"

  if ! unpaper "$img" "$cleaned"; then
    printf 'ocr-scan: unpaper failed on %s; running OCR on the raw scan\n' \
      "$img" >&2
    ocr_input=$img
  fi

  # tesseract takes an output *base* and appends ".txt" itself; passing
  # "$base.txt" here would produce "$base.txt.txt".
  tesseract "$ocr_input" "$base"

  # Only remove the scan and the intermediate file once the JPEG exists.
  convert "$img" -normalize -resize "$jpeg_size" -quality "$jpeg_quality" \
    "$base.jpg" \
    && rm -f -- "$img" "$cleaned"
}

#######################################
# Scan a batch of pages, process each one, optionally build a PDF.
# Arguments: $1 - optional "--pdf"
# Returns:   non-zero if --pdf was requested but no page images exist,
#            or if building the PDF failed
#######################################
main() {
  local stamp i img base f
  local -a pages=()

  stamp=$(date +%Y-%m-%d_%H%M%S)

  # Batch mode (-b): the loop below expects the pages as out1.pnm, out2.pnm, ...
  scanimage --resolution 300 -b -x 215 -y 297

  i=1
  while [[ -e "out$i.pnm" ]]; do
    img="out$i.pnm"
    base=$(printf '%s_%03d' "$stamp" "$i")
    process_page "$img" "$base"
    ((i++))
  done

  if [[ $1 == "--pdf" ]]; then
    # Collect this run's JPEGs explicitly so an unmatched glob is never
    # handed to convert as a literal file name.
    for f in "${stamp}"_*.jpg; do
      [[ -e $f ]] && pages+=("$f")
    done

    if ((${#pages[@]} == 0)); then
      printf 'ocr-scan: no page images found; not creating %s.pdf\n' \
        "$stamp" >&2
      return 1
    fi

    # 595x842 is the A4 page size in points at 72 dpi.
    convert "${pages[@]}" -resize "$jpeg_size" -compress jpeg \
      -quality "$jpeg_quality" -density 72x72 -repage 595x842 \
      "${stamp}.pdf" \
      && rm -- "${pages[@]}"
  fi
}

main "$@"