Sergey Matveev's repositories - dotfiles.git/commitdiff
Multipaged pdftotext
author Sergey Matveev <stargrave@stargrave.org>
Thu, 16 Dec 2021 14:09:54 +0000 (17:09 +0300)
committer Sergey Matveev <stargrave@stargrave.org>
Thu, 27 Jan 2022 11:35:14 +0000 (14:35 +0300)
recoll/bin/pdftotext.sh

index f2fa3b3df92133c9e1b9509a902c2af59de8eaa6..1775278068da0b9d1b844a82888b8b1a0b8088f9 100755 (executable)
@@ -2,5 +2,9 @@
 
 tmp=`mktemp`
 trap "rm -f $tmp" HUP PIPE INT QUIT TERM EXIT
-mutool convert -F text -o $tmp "$1"
-cat $tmp
+pages=`mutool info "$1" | sed -n 's/Pages: //p'`
+for page in `seq $pages` ; do
+    mutool convert -F text -o $tmp "$1" $page 2>/dev/null
+    cat $tmp
+    printf '\14\n' # ^L
+done