aboutsummaryrefslogtreecommitdiffstats
path: root/src/fact-sales-order.py
blob: a14388932dc66f1076f86448e8f2c8c927d747e2 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
import pandas as pd
from src.transform_lambda import get_dataframes

dict_of_df = get_dataframes()  # {"design": "design dataframe", "address": "address dataframe", ....}


# iterates through each dataframe in the list of dataframes and assigns them to a variable
df_design = dict_of_df[design]
df_currency = dict_of_df[currency]
df_address = dict_of_df[address]
df_staff = dict_of_df[staff]
df_department = dict_of_df[department]
df_counterparty = dict_of_df[counterparty]


# creates the dim_design dataframe
dim_design = df_design["design_id", "design_name", "file_name", "file_location"]

# creates the dim_staff dataframe
staff_department = pd.merge(df_staff, df_department, on='department_id', how="outer")
dim_staff = staff_department['staff_id', 'first_name', 'last_name', 'department_name', 'location', 'email_address']

# creates the dim_currency dataframe
# currency names currently hardcoded and not taken from database, is this viable/how else to do this? 
d = {"currency_id": [1, 2, 3], "currency_code": ["GBP", "USD", "EUR"], "currency_name": ["Pound", "US Dollar", "Euro"]}
currency_names = pd.DataFrame(data=d)
join_currency = pd.merge(df_currency, currency_names, on="currency_name", how="outer")
dim_currency = join_currency["currency_id", "currency_code", "currency_name"]

# creates the dim_location dataframe
# need to change address id to location id 
"dim_location dataframe: (location_id, address_line_1, address_line_2, district, city, postal code, country, phone)"
dim_location = df_address["address_id", "address_line_1", "address_line_2", "district", "city", "postal_code" "country", "phone"]









# creates the dim_counterparty dataframe
# counterparty_address = pd.merge(df_counterparty, df_address, left_on="legal_address_id", right_on='address_id', how="outer")

# dim_counterparty = df_counterparty["counterparty_id", "counterparty_legal_name", "counterparty_legal_address_line_1",
#                                    "counterparty_legal_address_line_2", "counterparty_legal_district", "counterpart_legal_city",
#                                    "counterparty_legal_postal_code", "counterparty_legal_country", "counterparty_legal_phone_number"]


# TO DO:
# dim_location
# dim_date
# fact_sales_order
git.ajschof.me — hosted by ajschofield — powered by cgit