|
1469 | 1469 | " # Remove EMBEDDING_API_KEY line if using Option 1 (will use NVIDIA_API_KEY)\n", |
1470 | 1470 | " content = re.sub(r'^EMBEDDING_API_KEY=.*$\\n?', '', content, flags=re.MULTILINE)\n", |
1471 | 1471 | " \n", |
1472 | | - " # Update LLM_MODEL if Brev model is provided (Option 2)\n", |
1473 | | - " if brev_model:\n", |
1474 | | - " # Check if LLM_MODEL exists in content, if not add it\n", |
| 1472 | + " # Update LLM_MODEL\n", |
| 1473 | + " # Option 1: Use default cloud model (nvidia/llama-3.3-nemotron-super-49b-v1)\n", |
| 1474 | + " # Option 2: Use Brev model name if provided\n", |
| 1475 | + " if choice == \"1\":\n", |
| 1476 | + " # Option 1: Set to default cloud model\n", |
| 1477 | + " default_cloud_model = \"nvidia/llama-3.3-nemotron-super-49b-v1\"\n", |
| 1478 | + " if re.search(r'^LLM_MODEL=.*$', content, flags=re.MULTILINE):\n", |
| 1479 | + " content = re.sub(\n", |
| 1480 | + " r'^LLM_MODEL=.*$',\n", |
| 1481 | + " f'LLM_MODEL={default_cloud_model}',\n", |
| 1482 | + " content,\n", |
| 1483 | + " flags=re.MULTILINE\n", |
| 1484 | + " )\n", |
| 1485 | + " else:\n", |
| 1486 | + " # Add LLM_MODEL after NVIDIA_API_KEY if it doesn't exist\n", |
| 1487 | + " content = re.sub(\n", |
| 1488 | + " r'^(NVIDIA_API_KEY=.*)$',\n", |
| 1489 | + " rf'\\1\\nLLM_MODEL={default_cloud_model}',\n", |
| 1490 | + " content,\n", |
| 1491 | + " flags=re.MULTILINE\n", |
| 1492 | + " )\n", |
| 1493 | + " elif brev_model:\n", |
| 1494 | + " # Option 2: Use Brev model name if provided\n", |
1475 | 1495 | " if re.search(r'^LLM_MODEL=.*$', content, flags=re.MULTILINE):\n", |
1476 | 1496 | " content = re.sub(\n", |
1477 | 1497 | " r'^LLM_MODEL=.*$',\n", |
|
1572 | 1592 | " print(\"=\" * 60)\n", |
1573 | 1593 | " if choice == \"1\":\n", |
1574 | 1594 | " print(\" • NVIDIA_API_KEY: Set (will be used for all services)\")\n", |
| 1595 | + " print(\" • LLM_MODEL: Set (nvidia/llama-3.3-nemotron-super-49b-v1)\")\n", |
1575 | 1596 | " else:\n", |
1576 | 1597 | " print(\" • NVIDIA_API_KEY: Set (Brev API key for LLM)\")\n", |
1577 | 1598 | " print(\" • EMBEDDING_API_KEY: Set (NVIDIA API key for Embedding)\")\n", |
|
0 commit comments