diff options
| author | jvoisin | 2011-07-30 20:43:45 +0200 |
|---|---|---|
| committer | jvoisin | 2011-07-30 20:43:45 +0200 |
| commit | b2e623d78db9e4c8da14fa44f830697f1a4eb739 (patch) | |
| tree | 174a0610a0c36e83114a0bff3b11d045f047c80d /lib/office.py | |
| parent | f9707e24e66e521300d297dcc35ff6f64008f6ae (diff) | |
Tests for pdf (all green btw)
Diffstat (limited to '')
| -rw-r--r-- | lib/office.py | 8 |
1 files changed, 5 insertions, 3 deletions
diff --git a/lib/office.py b/lib/office.py index 5d05e76..ec08cfb 100644 --- a/lib/office.py +++ b/lib/office.py | |||
| @@ -120,7 +120,7 @@ class PdfStripper(parser.GenericParser): | |||
| 120 | def __init__(self, filename, parser, mime, backup, add2archive): | 120 | def __init__(self, filename, parser, mime, backup, add2archive): |
| 121 | super(PdfStripper, self).__init__(filename, parser, mime, backup, | 121 | super(PdfStripper, self).__init__(filename, parser, mime, backup, |
| 122 | add2archive) | 122 | add2archive) |
| 123 | uri = 'file://' + self.filename | 123 | uri = 'file://' + os.path.abspath(self.filename) |
| 124 | self.password = None | 124 | self.password = None |
| 125 | self.document = poppler.document_new_from_file(uri, self.password) | 125 | self.document = poppler.document_new_from_file(uri, self.password) |
| 126 | self.meta_list = ('title', 'author', 'subject', 'keywords', 'creator', | 126 | self.meta_list = ('title', 'author', 'subject', 'keywords', 'creator', |
| @@ -131,11 +131,12 @@ class PdfStripper(parser.GenericParser): | |||
| 131 | Check if the file is clean from harmful metadatas | 131 | Check if the file is clean from harmful metadatas |
| 132 | ''' | 132 | ''' |
| 133 | for key in self.meta_list: | 133 | for key in self.meta_list: |
| 134 | if key == 'creation-date' and key == 'mod-date': | 134 | if key == 'creation-date' or key == 'mod-date': |
| 135 | if self.document.get_property(key) != -1: | 135 | if self.document.get_property(key) != -1: |
| 136 | return False | 136 | return False |
| 137 | else: | 137 | else: |
| 138 | if self.document.get_property(key) is not None: | 138 | if self.document.get_property(key) is not None and \ |
| 139 | self.document.get_property(key) != '': | ||
| 139 | return False | 140 | return False |
| 140 | return True | 141 | return True |
| 141 | 142 | ||
| @@ -179,4 +180,5 @@ class PdfStripper(parser.GenericParser): | |||
| 179 | if self.document.get_property(key) is not None and \ | 180 | if self.document.get_property(key) is not None and \ |
| 180 | self.document.get_property(key) != '': | 181 | self.document.get_property(key) != '': |
| 181 | metadata[key] = self.document.get_property(key) | 182 | metadata[key] = self.document.get_property(key) |
| 183 | print metadata | ||
| 182 | return metadata | 184 | return metadata |
