#!/bin/bash
#
# For every PDF matching datasets/s2/pdf/*/*/*.pdf, produce a sibling .txt
# file by running `pdf2txt.py -p 1` on it, unless that .txt already exists.
# A .txt that ends up empty (or could not be created) is deleted, so it does
# not count as "already exists" on a later run.
#
# Output (stdout), one line per PDF:
#   found <txt>      the text file exists and is non-empty
#   rm empty <txt>   the text file was empty/missing and has been removed

#######################################
# Convert one PDF to text (if not already done) and validate the result.
# Arguments: $1 - path to the PDF file
# Outputs:   "found <txt>" or "rm empty <txt>" on stdout
#######################################
convert_pdf() {
  local pdf=$1
  # Same directory and base name, with the last extension replaced by .txt.
  local output="${pdf%.*}.txt"

  if [[ ! -e "$output" ]]; then
    # `-p 1` is passed through unchanged from the original script
    # (page selection in pdfminer's pdf2txt.py - confirm for your version).
    # The exit status is deliberately not checked: a failed conversion leaves
    # an empty or missing file, which the check below cleans up.
    pdf2txt.py -p 1 "$pdf" > "$output"
  fi

  if [[ -s "$output" ]]; then
    echo "found $output"
  else
    echo "rm empty $output"
    rm -f -- "$output"
  fi
}

for i in datasets/s2/pdf/*/*/*.pdf; do
  # When nothing matches, bash leaves the pattern as a literal string; skip it
  # instead of trying to convert a file that does not exist.
  [[ -e "$i" ]] || continue
  convert_pdf "$i"
done