#!/bin/bash
#
# Convert every PDF matching datasets/s2/pdf/*/*/*.pdf (relative to the
# current directory) into a sibling .txt file using pdf2txt.py.
#
# For each PDF "<name>.pdf" the target is "<name>.txt":
#   * target missing          -> run pdf2txt.py and print the target path
#   * target exists, non-empty -> print "found <target>" and leave it alone
#   * target exists, empty     -> print "rm empty <target>" and delete it, so
#                                 that a later run converts the PDF again
#
# Requires pdf2txt.py to be on PATH.

# Without nullglob an unmatched pattern would be passed to pdf2txt.py
# literally, producing a junk "*.txt" file.
shopt -s nullglob

#######################################
# Convert a single PDF, or report/clean up its existing text file.
# Arguments: $1 - path to the PDF
# Outputs:   status line on stdout; conversion failures on stderr
# Returns:   0 on success, 1 if pdf2txt.py failed
#######################################
convert_pdf() {
  local pdf=$1
  local output="${pdf%.*}.txt"

  if [[ ! -e "$output" ]]; then
    # "-p 1" restricts which pages are extracted (presumably only the first
    # page -- confirm against the installed pdfminer version).
    if pdf2txt.py -p 1 "$pdf" > "$output"; then
      printf '%s\n' "$output"
    else
      # Drop the partial output so it is not mistaken for a finished
      # conversion ("found ...") on the next run.
      printf 'pdf2txt.py failed for %s\n' "$pdf" >&2
      rm -f -- "$output"
      return 1
    fi
  elif [[ -s "$output" ]]; then
    printf 'found %s\n' "$output"
  else
    printf 'rm empty %s\n' "$output"
    rm -f -- "$output"
  fi
}

#######################################
# Walk the dataset tree and process every PDF.
# Returns: 0 always; per-file failures are reported but do not stop the run.
#######################################
main() {
  local pdf
  for pdf in datasets/s2/pdf/*/*/*.pdf; do
    # Best effort: one broken PDF must not abort the whole batch.
    convert_pdf "$pdf" || :
  done
  return 0
}

main "$@"