diff options
| author | T-Aji <tolujbd2@gmail.com> | 2024-08-22 12:30:34 +0100 |
|---|---|---|
| committer | T-Aji <tolujbd2@gmail.com> | 2024-08-22 12:30:34 +0100 |
| commit | 85c38d9cf43204b1af597fa2762f658e202ac371 (patch) | |
| tree | 5f425bfda9e6fabb313b4a442e2fb5ce810d95aa /src/fact-sales-order.py | |
| parent | fe5a5ac472e90f1994b6f974429327ba9007ced3 (diff) | |
| download | de-project-bentley-85c38d9cf43204b1af597fa2762f658e202ac371.tar.gz de-project-bentley-85c38d9cf43204b1af597fa2762f658e202ac371.zip | |
add fact table
Diffstat (limited to 'src/fact-sales-order.py')
| -rw-r--r-- | src/fact-sales-order.py | 50 |
1 files changed, 0 insertions, 50 deletions
diff --git a/src/fact-sales-order.py b/src/fact-sales-order.py deleted file mode 100644 index 7921047..0000000 --- a/src/fact-sales-order.py +++ /dev/null @@ -1,50 +0,0 @@ -import pandas as pd - - -def create_dim_design(dict_of_df): - df_design = dict_of_df["design"] - dim_design = df_design.loc[:, ["design_id", "design_name", "file_name", "file_location"]] - return dim_design - -def create_dim_staff(dict_of_df): - staff_department = pd.merge(dict_of_df["staff"], dict_of_df["department"], on='department_id', how="outer") - dim_staff = staff_department.loc[:, ['staff_id', 'first_name', 'last_name', 'department_name', 'location', 'email_address']] - return dim_staff - -def create_dim_currency(dict_of_df): - df_currency = dict_of_df["currency"] - dim_currency = df_currency.loc[:, ["currency_id", "currency_code"]] - mappings = { - "GBP": "Pound", - "USD": "US Dollar", - "EUR": "Euro" - } - dim_currency["currency_name"] = dim_currency["currency_code"].map(mappings) - return dim_currency - - -def create_dim_date(dict_of_df): - df_sales = dict_of_df["sales"] - df_sales = df_sales.loc[:, ["agreed_delivery_date"]] - df_sales["agreed_delivery_date"] = pd.to_datetime["agreed_delivery_date"] - df_sales["year"] = df_sales["agreed_delivery_date"].dt.year - df_sales["month"] = df_sales["agreed_delivery_date"].dt.month - df_sales["day"] = df_sales["agreed_delivery_date"].dt.day - df_sales["day_of_week"] = df_sales["agreed_delivery_date"].dt.dayofweek - df_sales["day_name"] = df_sales["agreed_delivery_date"].dt.day_name() - df_sales["month_name"] = df_sales["agreed_delivery_date"].dt.month_name() - df_sales["quarter"] = df_sales["agreed_delivery_date"].dt.quarter() - dim_date = ["date_id", "year", "month", "day", "day_of_week", "day_name", "month_name", "quarter"] #series.dt.quarter() - return dim_date - -# repeat ln 52 - 60 for each column -# merge dataframes into one dataframe -# remove duplicates - - - - - -# TO DO: -# complete dim_date -# fact_sales_order |
