summary | refs | log | tree | commit | diff | stats
path: root/pdf2txt
diff options
context:
space:
mode:
Diffstat (limited to 'pdf2txt')
-rwxr-xr-x pdf2txt 15
1 files changed, 15 insertions, 0 deletions
diff --git a/pdf2txt b/pdf2txt
new file mode 100755
index 0000000..e8632be
--- /dev/null
+++ b/pdf2txt
@@ -0,0 +1,15 @@
+#! /bin/sh
+# Usage: pdf2txt pdffile -- render the PDF to a TIFF with gs, then OCR it with tesseract.
+if [ $# -eq 0 ]; then
+ echo "usage $0 : pdffile" >&2
+ exit 1 # do not fall through to the conversion with no input file
+fi
+OUTF=$(basename "$1" .pdf)
+TIFF=$OUTF.tif
+# Ghostscript output device; override through TIFF_FMT (e.g. tiff24nc).
+FMT=${TIFF_FMT:-"tiffgray"}
+# Stop if rendering fails so tesseract is not run on a missing TIFF.
+gs -r300x300 -sDEVICE="${FMT}" -sOutputFile="$TIFF" -dBATCH -dNOPAUSE "$1" || exit 1
+tesseract "$TIFF" "$OUTF"
+rm "$TIFF"
+echo "output : ${OUTF}"