Skip to content

Commit 8e44272

Browse files
committed
fix: set LLM_MODEL for Option 1 (cloud endpoints with NVIDIA API key)
- When Option 1 is selected, set LLM_MODEL to nvidia/llama-3.3-nemotron-super-49b-v1
- Previously only Option 2 (Brev) set LLM_MODEL
- Now both options correctly configure the LLM model
- Update summary output to show LLM_MODEL is set for Option 1

Fixes: LLM_MODEL not being set when using cloud endpoints with NVIDIA API key
1 parent f3aa1c3 commit 8e44272

1 file changed

Lines changed: 24 additions & 3 deletions

File tree

notebooks/setup/complete_setup_guide.ipynb

Lines changed: 24 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1469,9 +1469,29 @@
14691469
" # Remove EMBEDDING_API_KEY line if using Option 1 (will use NVIDIA_API_KEY)\n",
14701470
" content = re.sub(r'^EMBEDDING_API_KEY=.*$\\n?', '', content, flags=re.MULTILINE)\n",
14711471
" \n",
1472-
" # Update LLM_MODEL if Brev model is provided (Option 2)\n",
1473-
" if brev_model:\n",
1474-
" # Check if LLM_MODEL exists in content, if not add it\n",
1472+
" # Update LLM_MODEL\n",
1473+
" # Option 1: Use default cloud model (nvidia/llama-3.3-nemotron-super-49b-v1)\n",
1474+
" # Option 2: Use Brev model name if provided\n",
1475+
" if choice == \"1\":\n",
1476+
" # Option 1: Set to default cloud model\n",
1477+
" default_cloud_model = \"nvidia/llama-3.3-nemotron-super-49b-v1\"\n",
1478+
" if re.search(r'^LLM_MODEL=.*$', content, flags=re.MULTILINE):\n",
1479+
" content = re.sub(\n",
1480+
" r'^LLM_MODEL=.*$',\n",
1481+
" f'LLM_MODEL={default_cloud_model}',\n",
1482+
" content,\n",
1483+
" flags=re.MULTILINE\n",
1484+
" )\n",
1485+
" else:\n",
1486+
" # Add LLM_MODEL after NVIDIA_API_KEY if it doesn't exist\n",
1487+
" content = re.sub(\n",
1488+
" r'^(NVIDIA_API_KEY=.*)$',\n",
1489+
" rf'\\1\\nLLM_MODEL={default_cloud_model}',\n",
1490+
" content,\n",
1491+
" flags=re.MULTILINE\n",
1492+
" )\n",
1493+
" elif brev_model:\n",
1494+
" # Option 2: Use Brev model name if provided\n",
14751495
" if re.search(r'^LLM_MODEL=.*$', content, flags=re.MULTILINE):\n",
14761496
" content = re.sub(\n",
14771497
" r'^LLM_MODEL=.*$',\n",
@@ -1572,6 +1592,7 @@
15721592
" print(\"=\" * 60)\n",
15731593
" if choice == \"1\":\n",
15741594
" print(\" • NVIDIA_API_KEY: Set (will be used for all services)\")\n",
1595+
" print(\" • LLM_MODEL: Set (nvidia/llama-3.3-nemotron-super-49b-v1)\")\n",
15751596
" else:\n",
15761597
" print(\" • NVIDIA_API_KEY: Set (Brev API key for LLM)\")\n",
15771598
" print(\" • EMBEDDING_API_KEY: Set (NVIDIA API key for Embedding)\")\n",

0 commit comments

Comments
 (0)