summaryrefslogtreecommitdiffstats
path: root/pdf2txt
blob: 65590fc25345071334a902d8db3b632918f9f127 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
#! /bin/sh
#
# pdf2txt - OCR a PDF file: render it to a TIFF image with Ghostscript (gs),
# then run tesseract on that image.
#
# usage: pdf2txt pdffile
#
# Environment:
#   TIFF_FMT  Ghostscript output device to render with
#             (default: tiffgray; tiff24nc is an alternative).
#
# Files (both created in the current directory, where <name> is the
# basename of pdffile with a trailing ".pdf" removed):
#   <name>.tif  intermediate image, removed when the script exits
#   <name>      output base name handed to tesseract
#
# Exit status: 0 on success, 1 on a usage error or if gs/tesseract fails.

if [ $# -eq 0 ]; then
    echo "usage $0 : pdffile" >&2
    # Stop here: without an argument every command below would run with
    # empty operands.
    exit 1
fi

OUTF=$(basename "$1" .pdf)
TIFF=${OUTF}.tif

FMT=${TIFF_FMT:-"tiffgray"} #tiff24nc

# Remove the intermediate image on every exit path (success, failure of
# either tool, or an interrupting signal).
trap 'rm -f "$TIFF"' EXIT
trap 'exit 1' HUP INT TERM

if ! gs -r300x300 -sDEVICE="${FMT}" -sOutputFile="$TIFF" -dBATCH -dNOPAUSE "$1"; then
    echo "$0: gs failed to render $1" >&2
    exit 1
fi
#convert -monochrome -density 200 $1 $TIFF

if ! tesseract "$TIFF" "$OUTF"; then
    echo "$0: tesseract failed on $TIFF" >&2
    exit 1
fi

echo "output : ${OUTF}"