Spaces:
Paused
Paused
# pdftk thesis.pdf burst | |
#using pdf2text, extract text for each page in assets/pdfs and store in asssets/txts with similar basename | |
for pdf in assets/pdfs/*.pdf | |
do | |
echo | |
#pdftotext $pdf assets/txts/$(basename $pdf .pdf).txt | |
#pdf2txt.py -o assets/txts/$(basename $pdf .pdf).txt $pdf | |
done | |
for pdf in assets/pdfs/*.pdf | |
do | |
convert -density 100 -quality 100 -colorspace RGB -alpha remove -alpha off $pdf assets/pngs/$(basename $pdf .pdf).png | |
done | |