aboutsummaryrefslogtreecommitdiffstats
path: root/cli.py
blob: c03ffd104029126a1fcf642491490bb25088b01e (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
import argparse
import json
from obfuscator.csv_reader import CSVReader
from obfuscator.obfuscate import obfuscate
from obfuscator.logger import get_logger
from obfuscator.csv_writer import create_byte_stream


def main():
    parser = argparse.ArgumentParser(
        prog="GDPR-Obfuscator",
        description="Obfuscate sensitive data stored locally or in an AWS environment",
    )

    parser.add_argument(
        "-v", "--verbose", action="store_true", help="Enable verbose logging"
    )

    loc = parser.add_mutually_exclusive_group(required=True)
    loc.add_argument("-l", "--local", help="Local path to file")
    loc.add_argument("-s", "--s3", help="URI path to file stored in S3")

    parser.add_argument(
        "-p",
        "--pii",
        nargs="+",
        required=True,
        help="List of PII fields to obfuscate, separated by spaces",
    )

    args = parser.parse_args()

    log_level = "DEBUG" if args.verbose else "INFO"

    logger = get_logger("CLI", log_level)

    reader = CSVReader(log_level)

    if args.local and not args.s3:
        logger.debug("User chose to read CSV from local path")
        data = reader.read_local(args.local)
        logger.debug("Contents: " + str(data))
    else:
        logger.debug("User chose to read CSV from S3")

        data = reader.read_s3(args.s3)
        logger.debug("Contents: " + str(data))

    obfuscated_data = obfuscate(data, args.pii)
    logger.debug("Obfuscated data (JSON): " + json.dumps(obfuscated_data, indent=4))
    return create_byte_stream(obfuscated_data)


if __name__ == "__main__":
    main()
git.ajschof.me — hosted by ajschofield — powered by cgit