diff options
| -rw-r--r-- | pdf_dump_first_page.sh | 9 |
1 file changed, 6 insertions, 3 deletions
diff --git a/pdf_dump_first_page.sh b/pdf_dump_first_page.sh
index dd67c87d..d1610b50 100644
--- a/pdf_dump_first_page.sh
+++ b/pdf_dump_first_page.sh
@@ -3,6 +3,9 @@
 for i in datasets/s2/pdf/*/*/*.pdf
 do
   OUTPUT="${i%.*}.txt"
-  pdf2txt.py -p 1 $i > $OUTPUT
-  echo $OUTPUT
-done
\ No newline at end of file
+  if [ ! -e $OUTPUT ]
+  then
+    pdf2txt.py -p 1 $i > $OUTPUT
+    echo $OUTPUT
+  fi
+done
