#!/bin/bash
#
# Convert every PDF matching datasets/s2/pdf/*/*/*.pdf to text with pdf2txt.py.
#
# For each input, the output path is the input path with its extension
# replaced by .txt and the first occurrence of "pdf" in the path replaced by
# "txt" (e.g. datasets/s2/pdf/a/b/x.pdf -> datasets/s2/txt/a/b/x.txt).
# Inputs whose output path already exists are skipped, so the script can be
# re-run to pick up where it left off. An output that is missing or empty
# after conversion is removed, so a later run will try that input again.
#
# Paths are relative: run from the directory that contains datasets/.
# `set -e` is deliberately not used: one failed conversion must not stop the
# remaining files from being processed.

#######################################
# Convert all matching PDFs that do not yet have a text output.
# Arguments: none
# Outputs:   "found <path>" for each non-empty result and
#            "rm empty <path>" for each empty/missing result, on stdout;
#            directory-creation failures on stderr.
#######################################
main() {
  local pdf out out_dir

  for pdf in datasets/s2/pdf/*/*/*.pdf; do
    # When nothing matches, bash leaves the pattern as a literal string;
    # skip it instead of handing a non-existent file to pdf2txt.py.
    [[ -e "$pdf" ]] || continue

    out="${pdf%.*}.txt"      # swap the extension
    out="${out/pdf/txt}"     # first "pdf" in the path -> "txt"
    out_dir="${out%/*}"      # directory part; the path always contains "/"

    # Already converted on a previous run.
    [[ -e "$out" ]] && continue

    # pdf2txt.py is given a path inside out_dir, so make sure it exists.
    if ! mkdir -p -- "$out_dir"; then
      printf 'cannot create directory %s\n' "$out_dir" >&2
      continue
    fi

    # -o: text output file. -O: output directory argument.
    # NOTE(review): in pdfminer's pdf2txt.py -O is the directory for
    # extracted images -- confirm against the installed version.
    pdf2txt.py -o "$out" -O "$out_dir" "$pdf"

    if [[ -s "$out" ]]; then
      printf '%s\n' "found $out"
    else
      # Empty or missing result: remove it so a re-run retries this input.
      printf '%s\n' "rm empty $out"
      rm -f -- "$out"
    fi
  done
}

main "$@"