Monday, November 17, 2008

Script to extract a string from each PDF in a folder and copy the file under a new name built from that string

for pdf_name in `ls *.pdf`;
do
# echo pdf_name
pdftotext $pdf_name
txt_name=`echo $pdf_name | sed 's/\.pdf$/.txt/'`
# echo $txt_name
new_pdf_name=`sed -n '7p' $new_txt_name | cut -d":" -f2 | cut -d" " -f2`
# echo $new_pdf_name
cp $i $new_pdf_name.pdf;
# rm $txt_name;
done

No comments: