forked from lightspeed-core/lightspeed-stack
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathgemini-run.yaml
More file actions
112 lines (112 loc) · 3.14 KB
/
gemini-run.yaml
File metadata and controls
112 lines (112 loc) · 3.14 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
# Example llama-stack configuration for Google Gemini inference
#
# Contributed by @eranco74 (2025-08). See https://github.com/rh-ecosystem-edge/assisted-chat/blob/main/template.yaml#L282-L386
# This file shows how to integrate Gemini with LCS.
#
# Notes:
# - You will need valid Gemini API credentials to run this.
# - You will need a postgres instance to run this config.
#
version: 2
image_name: gemini-config
apis:
- agents
- datasetio
- eval
- files
- inference
- safety
- scoring
- telemetry
- tool_runtime
- vector_io
providers:
inference:
- provider_id: ${LLAMA_STACK_INFERENCE_PROVIDER}
provider_type: remote::gemini
config:
api_key: ${env.GEMINI_API_KEY}
vector_io: []
files: []
safety: []
agents:
- provider_id: meta-reference
provider_type: inline::meta-reference
config:
persistence_store:
type: postgres
host: ${env.LLAMA_STACK_POSTGRES_HOST}
port: ${env.LLAMA_STACK_POSTGRES_PORT}
db: ${env.LLAMA_STACK_POSTGRES_NAME}
user: ${env.LLAMA_STACK_POSTGRES_USER}
password: ${env.LLAMA_STACK_POSTGRES_PASSWORD}
responses_store:
type: postgres
host: ${env.LLAMA_STACK_POSTGRES_HOST}
port: ${env.LLAMA_STACK_POSTGRES_PORT}
db: ${env.LLAMA_STACK_POSTGRES_NAME}
user: ${env.LLAMA_STACK_POSTGRES_USER}
password: ${env.LLAMA_STACK_POSTGRES_PASSWORD}
telemetry:
- provider_id: meta-reference
provider_type: inline::meta-reference
config:
service_name: "${LLAMA_STACK_OTEL_SERVICE_NAME}"
sinks: ${LLAMA_STACK_TELEMETRY_SINKS}
sqlite_db_path: ${STORAGE_MOUNT_PATH}/sqlite/trace_store.db
eval: []
datasetio: []
scoring:
- provider_id: basic
provider_type: inline::basic
config: {}
- provider_id: llm-as-judge
provider_type: inline::llm-as-judge
config: {}
tool_runtime:
- provider_id: rag-runtime
provider_type: inline::rag-runtime
config: {}
- provider_id: model-context-protocol
provider_type: remote::model-context-protocol
config: {}
metadata_store:
type: sqlite
db_path: ${STORAGE_MOUNT_PATH}/sqlite/registry.db
inference_store:
type: postgres
host: ${env.LLAMA_STACK_POSTGRES_HOST}
port: ${env.LLAMA_STACK_POSTGRES_PORT}
db: ${env.LLAMA_STACK_POSTGRES_NAME}
user: ${env.LLAMA_STACK_POSTGRES_USER}
password: ${env.LLAMA_STACK_POSTGRES_PASSWORD}
models:
- metadata: {}
model_id: ${LLAMA_STACK_2_0_FLASH_MODEL}
provider_id: ${LLAMA_STACK_INFERENCE_PROVIDER}
provider_model_id: ${LLAMA_STACK_2_0_FLASH_MODEL}
model_type: llm
- metadata: {}
model_id: ${LLAMA_STACK_2_5_PRO_MODEL}
provider_id: ${LLAMA_STACK_INFERENCE_PROVIDER}
provider_model_id: ${LLAMA_STACK_2_5_PRO_MODEL}
model_type: llm
- metadata: {}
model_id: ${LLAMA_STACK_2_5_FLASH_MODEL}
provider_id: ${LLAMA_STACK_INFERENCE_PROVIDER}
provider_model_id: ${LLAMA_STACK_2_5_FLASH_MODEL}
model_type: llm
shields: []
vector_dbs: []
datasets: []
scoring_fns: []
benchmarks: []
tool_groups:
- toolgroup_id: builtin::rag
provider_id: rag-runtime
- toolgroup_id: mcp::assisted
provider_id: model-context-protocol
mcp_endpoint:
uri: "${MCP_SERVER_URL}"
server:
port: ${LLAMA_STACK_SERVER_PORT}