diff options
Diffstat (limited to 'src')
| -rw-r--r-- | src/transform_lambda.py | 38 |
1 files changed, 26 insertions, 12 deletions
diff --git a/src/transform_lambda.py b/src/transform_lambda.py index 2a97931..900bf4b 100644 --- a/src/transform_lambda.py +++ b/src/transform_lambda.py @@ -17,17 +17,17 @@ s3_resource = boto3.resource('s3') ##need this for a way of reuploading data aft def lambda_handler(event, context): s3_client = boto3.client('s3') - # tables = ['sales_order', - # 'transaction', - # 'payment', - # 'counterparty', - # 'address', - # 'staff', - # 'purchase_order', - # 'department', - # 'currency', - # 'design', - # 'payment_type'] + tables = ['sales_order', + 'transaction', + 'payment', + 'counterparty', + 'address', + 'staff', + 'purchase_order', + 'department', + 'currency', + 'design', + 'payment_type'] try: s3_bucket_name = event["Records"][0]["s3"]["bucket"]["name"] s3_file_name = event["Records"][0]["s3"]["object"]["key"] @@ -40,4 +40,18 @@ def lambda_handler(event, context): body = object['Body'] csv_string = body.read().decode('utf-8') dataframe = pd.read_csv(StringIO(csv_string)) ##this is the streaming body -
\ No newline at end of file + + print(dataframe.head(3)) + + except Exception as err: + print(err) + + # TODO implement + return { + 'statusCode': 200, + 'body': json.dumps('') + } + +## each csv file must be converted into a pandas df +## done via read_csv, where StringIO creates a file-like object from a string - it treats the string like a file, as the data is not physically stored in a file +## each file needs its own pandas df (?) to be normalised
\ No newline at end of file |
