diff options
Diffstat (limited to 'pdf_dump_first_page.sh')
| -rw-r--r-- | pdf_dump_first_page.sh | 8 |
1 files changed, 8 insertions, 0 deletions
#!/bin/bash
#
# pdf_dump_first_page.sh
#
# Runs `pdf2txt.py -p 1` (page 1, per this script's name) on every PDF that
# matches datasets/s2/pdf/*/*/*.pdf and writes the extracted text next to the
# PDF, with the file extension replaced by .txt.
#
# Output:
#   stdout - path of each .txt file written successfully, one per line
#   stderr - a warning for each PDF on which pdf2txt.py exited non-zero
#
# Usage: run from the directory that contains datasets/.
# Requires: pdf2txt.py on PATH.

for pdf in datasets/s2/pdf/*/*/*.pdf; do
  # When nothing matches, bash leaves the glob pattern as a literal string;
  # skip it instead of handing a non-existent path to pdf2txt.py.
  [[ -e "$pdf" ]] || continue

  # Strip the final extension and append .txt (foo/bar.pdf -> foo/bar.txt).
  out_txt="${pdf%.*}.txt"

  # Quote both paths so names with spaces or glob characters stay intact.
  if pdf2txt.py -p 1 "$pdf" > "$out_txt"; then
    printf '%s\n' "$out_txt"
  else
    # Keep going with the remaining PDFs. The redirect has already created
    # the .txt file, so it is left in place (possibly empty or partial).
    printf 'warning: pdf2txt.py failed for %s\n' "$pdf" >&2
  fi
done
\ No newline at end of file |
