summaryrefslogtreecommitdiffstats
path: root/pdf2txt
blob: e8632be33dbc06662cf0ad6776edc7bb1fa78071 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
#! /bin/sh
#
# pdf2txt - OCR a PDF file into text.
#
# Usage: pdf2txt pdffile
#
# Renders the PDF to an intermediate TIFF with Ghostscript (gs) at 300x300
# dpi, hands that TIFF to tesseract, then removes the TIFF. Both the TIFF and
# the tesseract output base are named after the PDF's basename with ".pdf"
# stripped, so they are created relative to the current directory.
#
# Environment:
#   TIFF_FMT  Ghostscript output device to use (default: tiffgray).
#
# Exit status: 0 on success, 2 on usage error, 1 if gs or tesseract fails.

set -u

# Print an error message to stderr and abort.
die() {
    printf '%s\n' "$*" >&2
    exit 1
}

if [ $# -eq 0 ]; then
    echo "usage $0 : pdffile" >&2
    # Stop here: without an input file every later step would run on an
    # empty argument.
    exit 2
fi

# Guard against a path that starts with '-' being parsed as an option by gs.
SRC=$1
case $SRC in
    -*) SRC=./$SRC ;;
esac

OUTF=$(basename -- "$1" .pdf) || die "cannot derive output name from: $1"
# Same guard for the derived names, which are passed to tesseract and rm.
case $OUTF in
    -*) OUTF=./$OUTF ;;
esac
TIFF=$OUTF.tif

FMT=${TIFF_FMT:-"tiffgray"} # alternative device noted by the author: tiff24nc

# Remove the intermediate TIFF on every exit path, including failures.
cleanup() {
    rm -f -- "$TIFF"
}
trap cleanup EXIT
# Turn common signals into a normal exit so the EXIT trap also runs in
# shells that do not fire it on signal death.
trap 'exit 1' HUP INT TERM

gs -r300x300 -sDEVICE="${FMT}" -sOutputFile="$TIFF" -dBATCH -dNOPAUSE "$SRC" \
    || die "gs failed to render: $1"
tesseract "$TIFF" "$OUTF" \
    || die "tesseract failed on: $TIFF"

# OUTF is the output *base* given to tesseract; per the tesseract manual the
# tool appends its own extension (e.g. ".txt") to this base.
echo "output : ${OUTF}"