Skip to content
Snippets Groups Projects
main.py 3.66 KiB
Newer Older
  • Learn to ignore specific revisions
  • #!/usr/bin/python3
    
    import os
    
    import mimetypes
    
    Julien (jvoisin) Voisin's avatar
    Julien (jvoisin) Voisin committed
    import argparse
    
    from threading import Thread
    import multiprocessing
    from queue import Queue
    
    from src import parser_factory
    
    def __check_file(filename:str, mode:int = os.R_OK) -> bool:
    
        if not os.path.isfile(filename):
            print("[-] %s is not a regular file." % filename)
            return False
        elif not os.access(filename, mode):
            print("[-] %s is not readable and writeable." % filename)
            return False
        return True
    
    Julien (jvoisin) Voisin's avatar
    Julien (jvoisin) Voisin committed
    def create_arg_parser():
        parser = argparse.ArgumentParser(description='Metadata anonymisation toolkit 2')
        parser.add_argument('files', nargs='*')
    
        info = parser.add_argument_group('Information')
        info.add_argument('-c', '--check', action='store_true',
                          help='check if a file is free of harmful metadatas')
        info.add_argument('-l', '--list', action='store_true',
                          help='list all supported fileformats')
        info.add_argument('-s', '--show', action='store_true',
                          help='list all the harmful metadata of a file without removing them')
    
        info.add_argument('-L', '--lightweight', action='store_true',
                          help='remove SOME metadata')
    
    Julien (jvoisin) Voisin's avatar
    Julien (jvoisin) Voisin committed
        return parser
    
    
    def show_meta(filename:str):
    
        if not __check_file(filename):
            return
    
    
        p, mtype = parser_factory.get_parser(filename)
    
        if p is None:
    
            print("[-] %s's format (%s) is not supported" % (filename, mtype))
    
        print("[+] Metadata for %s:" % filename)
    
    Julien (jvoisin) Voisin's avatar
    Julien (jvoisin) Voisin committed
        for k,v in p.get_meta().items():
    
    Julien (jvoisin) Voisin's avatar
    Julien (jvoisin) Voisin committed
            try:  # FIXME this is ugly.
                print("  %s: %s" % (k, v))
            except UnicodeEncodeError:
                print("  %s: harmful content" % k)
    
    def clean_meta(filename:str, is_lightweigth:bool):
    
        if not __check_file(filename, os.R_OK|os.W_OK):
            return
    
    
        p, mtype = parser_factory.get_parser(filename)
    
        if p is None:
            print("[-] %s's format (%s) is not supported" % (filename, mtype))
            return
    
        if is_lightweigth:
            p.remove_all_lightweight()
        else:
            p.remove_all()
    
    def show_parsers():
        print('[+] Supported formats:')
        for parser in parser_factory._get_parsers():
            for mtype in parser.mimetypes:
                extensions = ', '.join(mimetypes.guess_all_extensions(mtype))
                print('  - %s (%s)' % (mtype, extensions))
    
    
    def __get_files_recursively(files):
        for f in files:
            if os.path.isfile(f):
                yield f
            else:
                for path, _, _files in os.walk(f):
                    for _f in _files:
                        yield os.path.join(path, _f)
    
    
    def __do_clean_async(is_lightweigth, q):
    
        while True:
            f = q.get()
            if f is None:  # nothing more to process
                return
    
            clean_meta(f, is_lightweigth)
    
    Julien (jvoisin) Voisin's avatar
    Julien (jvoisin) Voisin committed
    def main():
    
        arg_parser = create_arg_parser()
        args = arg_parser.parse_args()
    
        if not args.files:
            if not args.list:
                return arg_parser.print_help()
            show_parsers()
            return
    
    
        elif args.show:
    
            for f in __get_files_recursively(args.files):
    
    Julien (jvoisin) Voisin's avatar
    Julien (jvoisin) Voisin committed
                show_meta(f)
    
            return
    
        else:  # Thread the cleaning
    
            mode = (args.lightweight is True)
    
            q = Queue(maxsize=0)
            threads = list()
    
            for f in __get_files_recursively(args.files):
    
                q.put(f)
    
            for _ in range(multiprocessing.cpu_count()):
    
                worker = Thread(target=__do_clean_async, args=(mode, q))
    
                worker.start()
                threads.append(worker)
    
            for _ in range(multiprocessing.cpu_count()):
                q.put(None)  # stop the threads
    
            for worker in threads:
                worker.join()
    
    Julien (jvoisin) Voisin's avatar
    Julien (jvoisin) Voisin committed
    
    
    if __name__ == '__main__':
        main()