aboutsummaryrefslogtreecommitdiffstats
path: root/test/test_csv_reader.py
blob: 27abea06a21795dcc99b214c324c0ae43c128da7 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
# test_csv_reader.py - tests for obfuscator.csv_reader.CSVReader
# Author: Alex Schofield

import boto3
from moto import mock_aws
from obfuscator.csv_reader import CSVReader
import pytest

# Single CSVReader instance shared by the tests below (constructed with no
# arguments at import time).
reader = CSVReader()

# CSVREADER: READ_STRING TESTS

# Check if the function can read a CSV string with no content and return
# an empty list


def test_empty_csv_should_return_no_content():
    """An empty CSV string must be parsed into an empty list."""
    rows = reader.read_string("")
    assert rows == []


# Check if the function can read a CSV string with only a header and return
# an empty list


def test_csv_with_header_only_should_return_no_content():
    """A CSV string holding only the header line must yield no records."""
    header_only = "student_id,name,course\n"
    assert reader.read_string(header_only) == []


# Check if the function can read a CSV string with valid data and return
# a list of dictionaries


def test_csv_with_valid_data():
    """Each data row must come back as a dict keyed by the header names."""
    columns = ("student_id", "name", "course")
    records = (
        ("1234", "Student 1", "Course 1"),
        ("5678", "Student 2", "Course 2"),
    )
    # Build the expected dictionaries by pairing every record with the header.
    wanted = [dict(zip(columns, record)) for record in records]

    csv_text = (
        "student_id,name,course\n"
        "1234,Student 1,Course 1\n"
        "5678,Student 2,Course 2\n"
    )
    parsed = reader.read_string(csv_text)

    assert parsed == wanted


# Check if the function can read a CSV string with quoted fields and return
# a list of dictionaries whose values have the surrounding quotes removed


def test_csv_with_quoted_fields_should_run_as_expected():
    """Double-quoted fields must be returned without their enclosing quotes."""
    wanted = [
        {"student_id": "1234", "name": "Student 1", "course": "Course 1"},
        {"student_id": "5678", "name": "Student 2", "course": "Course 2"},
    ]
    quoted_csv = (
        "student_id,name,course\n"
        '1234,"Student 1","Course 1"\n'
        '5678,"Student 2","Course 2"\n'
    )

    parsed = reader.read_string(quoted_csv)

    assert parsed == wanted


# CSVREADER: READ_S3 TESTS


def setup_s3(s3_client, bucket: str, key: str, content: str):
    """Create a bucket and upload a single object into it.

    Args:
        s3_client: S3 client exposing ``create_bucket`` and ``put_object``
            (the tests pass a ``boto3.client("s3")`` instance).
        bucket: Name of the bucket to create and upload into.
        key: Object key under which ``content`` is stored.
        content: Body of the object to upload.
    """
    # Create the bucket that was asked for; previously the name was hard-coded
    # to "test-bucket", so any other ``bucket`` value made the upload below
    # target a bucket that had never been created.
    s3_client.create_bucket(
        Bucket=bucket,
        CreateBucketConfiguration={"LocationConstraint": "eu-west-2"},
    )
    s3_client.put_object(Bucket=bucket, Key=key, Body=content)


@pytest.fixture(autouse=True)
def s3_client():
    """Yield an S3 client for eu-west-2 created inside a ``mock_aws`` context.

    The fixture is ``autouse``, so the mock context is active for every test
    in this module and is torn down once the test finishes.
    """
    with mock_aws():
        client = boto3.client("s3", region_name="eu-west-2")
        yield client


def test_read_s3_valid_csv_returns_expected():
    """Reading a valid CSV object via its s3:// path returns one dict per row."""
    bucket, key = "test-bucket", "data/mock.csv"
    csv_content = (
        "student_id,name,course\n"
        "1234,Student 1,Course 1\n"
        "5678,Student 2,Course 2\n"
    )
    expected = [
        {"student_id": "1234", "name": "Student 1", "course": "Course 1"},
        {"student_id": "5678", "name": "Student 2", "course": "Course 2"},
    ]

    with mock_aws():
        # Upload the CSV to the mocked bucket, then read it back by path.
        client = boto3.client("s3", region_name="eu-west-2")
        setup_s3(client, bucket, key, csv_content)

        data = reader.read_s3(f"s3://{bucket}/{key}")

        assert data == expected
git.ajschof.me — hosted by ajschofield — powered by cgit