1+ {
2+ "metadata" : {
3+ "kernelspec" : {
4+ "display_name" : " Streamlit Notebook" ,
5+ "name" : " streamlit"
6+ },
7+ "lastEditStatus" : {
8+ <<<<<<< HEAD
9+ "notebookId" : " dwcf2fynfosmyghponvw" ,
10+ "authorId" : " 6690310009356" ,
11+ "authorName" : " YOHANMARKOSE" ,
12+ "authorEmail" : " markose.y@northeastern.edu" ,
13+ "sessionId" : " 3abaf741-87a4-40b0-8c7d-dc03d4b7f2a7" ,
14+ "lastEditTime" : 1740739209269
15+ =======
16+ "notebookId" : " eit25xap76vo7ktof4y5" ,
17+ "authorId" : " 6690310009356" ,
18+ "authorName" : " YOHANMARKOSE" ,
19+ "authorEmail" : " markose.y@northeastern.edu" ,
20+ "sessionId" : " cc15f23b-b6c0-4028-a56c-82718000c5b9" ,
21+ "lastEditTime" : 1740718649816
22+ >>>>>>> origin/main
23+ }
24+ },
25+ "nbformat_minor" : 5 ,
26+ "nbformat" : 4 ,
27+ "cells" : [
28+ {
29+ "cell_type" : " code" ,
30+ "execution_count" : null ,
31+ "id" : " 3775908f-ca36-4846-8f38-5adca39217f2" ,
32+ "metadata" : {
33+ "language" : " sql" ,
34+ "name" : " sql_get_context"
35+ },
36+ "outputs" : [],
37+ "source" : [
38+ " SELECT current_database() AS DATABASE_NAME, current_schema() AS SCHEMA_NAME\n "
39+ ]
40+ },
41+ {
42+ "cell_type" : " code" ,
43+ "execution_count" : null ,
44+ "id" : " 9a73e27a-c874-4e9c-a236-67aed79d8fd9" ,
45+ "metadata" : {
46+ "language" : " python" ,
47+ "name" : " cell1"
48+ },
49+ "outputs" : [],
50+ "source" : [
51+ " # Import python packages\n " ,
52+ " import logging\n " ,
53+ " from snowflake.snowpark.context import get_active_session\n " ,
54+ " \n " ,
55+ " logger = logging.getLogger(\" fred_logger\" )\n " ,
56+ " \n " ,
57+ " current_context_df = cells.sql_get_context.to_pandas()\n " ,
58+ " database_name = current_context_df.iloc[0,0]\n " ,
59+ " schema_name = current_context_df.iloc[0,1]\n " ,
60+ " \n " ,
61+ " session = get_active_session()\n " ,
62+ " \n " ,
63+ " logger.info(\" 02_raw_to_harmonized start\" )"
64+ ]
65+ },
66+ {
67+ "cell_type" : " code" ,
68+ "execution_count" : null ,
69+ "id" : " 31927266-930c-4441-8639-6d8cefcfcee4" ,
70+ "metadata" : {
71+ "collapsed" : false ,
72+ "language" : " python" ,
73+ "name" : " cell3"
74+ },
75+ "outputs" : [],
76+ <<<<<<< HEAD
77+ "source": "import snowflake.snowpark.functions as F\n\nenv = schema_name.split('_')[0]\ndef create_fred_table(session):\n raw_fred_10Y = session.table(f\"{database_name}.{env}_RAW_FRED.FRED_DGS10Y\").select(\n F.to_date(F.col('\"date\"')).alias(\"OBSERVATION_DATE\"),\n F.when(F.col('\"value\"') == 0, None)\n .otherwise(F.col('\"value\"'))\n .cast(\"float\")\n .alias(\"10Y_YIELD\")\n )\n \n raw_fred_2Y = session.table(f\"{database_name}.{env}_RAW_FRED.FRED_DGS2Y\").select(\n F.to_date(F.col('\"date\"')).alias(\"OBSERVATION_DATE\"),\n F.when(F.col('\"value\"') == 0, None)\n .otherwise(F.col('\"value\"'))\n .cast(\"float\")\n .alias(\"2Y_YIELD\")\n )\n\n harmonized_data = raw_fred_10Y.join(\n raw_fred_2Y, \n raw_fred_10Y[\"OBSERVATION_DATE\"] == raw_fred_2Y[\"OBSERVATION_DATE\"]\n ).select(\n raw_fred_10Y[\"OBSERVATION_DATE\"].alias(\"OBSERVATION_DATE\"),\n F.col(\"10Y_YIELD\"),\n F.col(\"2Y_YIELD\")\n )\n \n session.use_schema(f\"{database_name}.{schema_name}\")\n harmonized_data.write.mode(\"overwrite\").save_as_table('FRED_FLATTENED')\n\ndef create_fred_table_stream(session):\n _ = session.sql('CREATE OR REPLACE STREAM FRED_STREAM \\\n ON TABLE FRED_FLATTENED \\\n SHOW_INITIAL_ROWS = TRUE').collect()\n \n"
78+ =======
79+ "source": "import snowflake.snowpark.functions as F\n\nenv = schema_name.split('_')[0]\ndef create_fred_table(session):\n raw_fred_10Y = session.table(f\"{database_name}.{env}_RAW_FRED.FRED_DGS10Y\").select(\n F.to_date(F.col('\"date\"')).alias(\"OBSERVATION_DATE\"),\n F.col('\"value\"').cast(\"float\").alias(\"10Y_YIELD\")\n )\n \n raw_fred_2Y = session.table(f\"{database_name}.{env}_RAW_FRED.FRED_DGS2Y\").select(\n F.to_date(F.col('\"date\"')).alias(\"OBSERVATION_DATE\"),\n F.col('\"value\"').cast(\"float\").alias(\"2Y_YIELD\")\n )\n\n harmonized_data = raw_fred_10Y.join(raw_fred_2Y, raw_fred_10Y[\"OBSERVATION_DATE\"] == raw_fred_2Y[\"OBSERVATION_DATE\"]).select(\n raw_fred_10Y[\"OBSERVATION_DATE\"].alias(\"OBSERVATION_DATE\"),\n F.col(\"10Y_YIELD\"),\n F.col(\"2Y_YIELD\")\n )\n\n\n \n session.use_schema(f\"{database_name}.{schema_name}\")\n harmonized_data.write.mode(\"overwrite\").save_as_table('FRED_FLATTENED')\n\ndef create_fred_table_stream(session):\n _ = session.sql('CREATE OR REPLACE STREAM FRED_STREAM \\\n ON TABLE FRED_FLATTENED \\\n SHOW_INITIAL_ROWS = TRUE').collect()\n \n"
80+ >>>>>>> origin/main
81+ },
82+ {
83+ "cell_type" : " code" ,
84+ "execution_count" : null ,
85+ "id" : " 29badd8a-aead-4f7b-bdcb-e12049c0d18b" ,
86+ "metadata" : {
87+ "language" : " python" ,
88+ "name" : " cell4"
89+ },
90+ "outputs" : [],
91+ "source" : " \n create_fred_table(session)\n create_fred_table_stream(session)"
92+ }
93+ ]
94+ }
0 commit comments