|
2 | 2 | # TABLE CONFIGURATIONS |
3 | 3 | # ============================================================================= |
4 | 4 |
|
| 5 | +# ------------------------------------------------------------ |
| 6 | +# CONFIGURATIONS FOR validate_raw_data.py |
| 7 | +# ------------------------------------------------------------ |
| 8 | + |
5 | 9 | TABLE_CONFIG = { |
6 | 10 | "df_orders": { |
7 | 11 | "role": "event_fact", |
|
81 | 85 | "order_delivered_timestamp": "%Y-%m-%d %H:%M:%S", |
82 | 86 | "order_estimated_delivery_date": "%Y-%m-%d", |
83 | 87 | } |
| 88 | + |
| 89 | + |
| 90 | +# ------------------------------------------------------------ |
| 91 | +# CONFIGURATIONS FOR assemble_validate_events.py |
| 92 | +# ------------------------------------------------------------ |
| 93 | + |
| 94 | +# Assemble events enforced schema and dtypes |
# Ordered list of column names for the assembled events table.
# Companion to ASSEMBLE_ENFORCED_DTYPES, which maps column names to dtypes.
# NOTE(review): presumably used by assemble_validate_events.py to select and
# order columns — confirm against that script.
ASSEMBLE_ENFORCED_SCHEMA = [
    "order_id",
    "order_revenue",
    "seller_id",
    "product_id",
    "order_status",
    "order_purchase_timestamp",
    "order_approved_at",
    "order_delivered_timestamp",
    "lead_time_days",
    "approval_lag_days",
    "delivery_delay_days",
    "order_date",
    "order_year",
    "order_year_week",
    "run_id",
]
| 112 | + |
# Column name -> dtype string for the assembled events table, listed in the
# same order as the enforced schema for that table.
# "order_year_week" and "run_id" are typed "string" here, matching how the
# seller dimension/fact dtype maps in this module type those same columns, so
# that every enforced schema column has a dtype entry.
# NOTE(review): the dtype strings look like pandas dtype aliases — confirm how
# assemble_validate_events.py applies them.
# NOTE(review): plain "int64" cannot hold missing values in pandas; if any
# *_days column can be null (e.g. orders without a delivery timestamp),
# consider the nullable "Int64" dtype — verify against the data.
ASSEMBLE_ENFORCED_DTYPES = {
    "order_id": "string",
    "order_revenue": "float64",
    "seller_id": "string",
    "product_id": "string",
    "order_status": "string",
    "order_purchase_timestamp": "datetime64[ns]",
    "order_approved_at": "datetime64[ns]",
    "order_delivered_timestamp": "datetime64[ns]",
    "lead_time_days": "int64",
    "approval_lag_days": "int64",
    "delivery_delay_days": "int64",
    "order_date": "datetime64[ns]",
    "order_year": "int64",
    "order_year_week": "string",
    "run_id": "string",
}
| 128 | + |
| 129 | + |
| 130 | +# ------------------------------------------------------------ |
| 131 | +# CONFIGURATIONS FOR build_bi_semantic_layer.py |
| 132 | +# ------------------------------------------------------------ |
| 133 | + |
| 134 | + |
| 135 | +# Seller dimension enforced schema and dtypes |
# Ordered list of column names for the seller dimension table.
# NOTE(review): presumably used by build_bi_semantic_layer.py to select and
# order columns — confirm against that script.
SELLER_DIM_ENFORCED_SCHEMA = [
    "seller_id",
    "first_order_date",
    "first_order_year_week",
    "run_id",
]
| 142 | + |
# Column name -> dtype string for the seller dimension table.
# NOTE(review): the dtype strings look like pandas dtype aliases — confirm how
# build_bi_semantic_layer.py applies them.
SELLER_DIM_ENFORCED_DTYPES = {
    "seller_id": "string",
    "first_order_date": "datetime64[ns]",
    "first_order_year_week": "string",
    "run_id": "string",
}
| 149 | + |
| 150 | + |
| 151 | +# Seller Facts enforced schema and dtypes |
# Ordered list of column names for the seller facts table: four key/metadata
# columns followed by the weekly_* metric columns.
# NOTE(review): presumably used by build_bi_semantic_layer.py to select and
# order columns — confirm against that script.
SELLER_FACT_ENFORCED_SCHEMA = [
    "seller_id",
    "order_year_week",
    "week_start_date",
    "run_id",
    "weekly_order_count",
    "weekly_delivered_orders",
    "weekly_cancelled_orders",
    "weekly_revenue",
    "weekly_avg_lead_time",
    "weekly_total_lead_time",
    "weekly_avg_delivery_delay",
    "weekly_total_delivery_delay",
    "weekly_avg_approval_lag",
]
| 167 | + |
# Column name -> dtype string for the seller facts table.
# Count and total columns are "int64"; revenue and average columns are
# "float64".
# NOTE(review): the dtype strings look like pandas dtype aliases — confirm how
# build_bi_semantic_layer.py applies them.
SELLER_FACT_ENFORCED_DTYPES = {
    "seller_id": "string",
    "order_year_week": "string",
    "week_start_date": "datetime64[ns]",
    "run_id": "string",
    "weekly_order_count": "int64",
    "weekly_delivered_orders": "int64",
    "weekly_cancelled_orders": "int64",
    "weekly_revenue": "float64",
    "weekly_avg_lead_time": "float64",
    "weekly_total_lead_time": "int64",
    "weekly_avg_delivery_delay": "float64",
    "weekly_total_delivery_delay": "int64",
    "weekly_avg_approval_lag": "float64",
}
0 commit comments