1
0
mirror of https://github.com/kanzure/pdfparanoia.git synced 2024-12-04 23:15:52 +01:00

Check PDF is from the RSC before cleaning

This commit is contained in:
Donncha O'Cearbhaill 2013-05-13 21:01:52 +01:00
parent 18140d838d
commit c673d77ec6

View File

@@ -35,6 +35,9 @@ class RoyalSocietyOfChemistry(Plugin):
#"Table of Contents for this issue",
]
# Confirm the PDF is from the RSC
if "pubs.rsc.org" in content:
# parse the pdf into a pdfminer document
pdf = parse_content(content)