summaryrefslogtreecommitdiff
path: root/main.py
blob: e4157e68a80277096f99da86fc6dae9b8432f850 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
import sys
from shutil import copyfile
import argparse

from src.parsers import pdf


def create_arg_parser():
    parser = argparse.ArgumentParser(description='Metadata anonymisation toolkit 2')
    parser.add_argument('files', nargs='*')

    info = parser.add_argument_group('Information')
    info.add_argument('-c', '--check', action='store_true',
                      help='check if a file is free of harmful metadatas')
    info.add_argument('-l', '--list', action='store_true',
                      help='list all supported fileformats')
    info.add_argument('-s', '--show', action='store_true',
                      help='list all the harmful metadata of a file without removing them')
    return parser

def show_meta(file_name:str):
    p = pdf.PDFParser(file_name)
    for k,v in p.get_meta().items():
        print("%s: %s" % (k, v))

def main():
    argparser = create_arg_parser()
    args = argparser.parse_args()

    if args.show:
        for f in args.files:
            show_meta(f)
        return 0
    elif not args.files:
        return parser.show_help()

    copyfile(sys.argv[1] + '.bak', sys.argv[1])
    p = pdf.PDFParser(sys.argv[1])
    p.remove_all()
    p = pdf.PDFParser('OUT_clean.pdf')
    print("ok")


if __name__ == '__main__':

    main()