@@ -167,29 +167,11 @@ apis:
167167- tool_runtime
168168- safety
169169
170- models:
171- # Your LLM model
172- - model_id: your-llm-model
173- provider_id: openai # or your preferred provider
174- model_type: llm
175- provider_model_id: gpt-4o-mini
176-
177- # Embedding model for BYOK
178- - model_id: sentence-transformers/all-mpnet-base-v2
179- metadata:
180- embedding_dimension: 768
181- model_type: embedding
182- provider_id: sentence-transformers
183- provider_model_id: /path/to/embedding_models/all-mpnet-base-v2
184-
185170providers:
186171 inference:
187- # Embedding model provider
188172 - provider_id: sentence-transformers
189173 provider_type: inline::sentence-transformers
190174 config: {}
191-
192- # LLM provider (example: OpenAI)
193175 - provider_id: openai
194176 provider_type: remote::openai
195177 config:
@@ -199,48 +181,68 @@ providers:
199181 - provider_id: meta-reference
200182 provider_type: inline::meta-reference
201183 config:
202- persistence_store:
203- type: sqlite
204- db_path: .llama/distributions/ollama/agents_store.db
205- responses_store:
206- type: sqlite
207- db_path: .llama/distributions/ollama/responses_store.db
184+ persistence:
185+ agent_state:
186+ namespace: agents_state
187+ backend: kv_default
188+ responses:
189+ table_name: agents_responses
190+ backend: sql_default
208191
209192 safety:
210193 - provider_id: llama-guard
211194 provider_type: inline::llama-guard
212195 config:
213196 excluded_categories: []
214197
215- # Vector database configuration
216198 vector_io:
217199 - provider_id: your-knowledge-base
218- provider_type: inline::faiss # or remote::pgvector
200+ provider_type: inline::faiss
219201 config:
220- kvstore:
221- type: sqlite
222- db_path: /path/to/vector_db/faiss_store.db
223- namespace: null
202+ persistence:
203+ namespace: vector_io::faiss
204+ backend: byok_backend # References storage.backends
224205
225206 tool_runtime:
226207 - provider_id: rag-runtime
227208 provider_type: inline::rag-runtime
228209 config: {}
229210
230- # Enable RAG tools
231- tool_groups:
232- - provider_id: rag-runtime
233- toolgroup_id: builtin::rag
234-
235- # Vector database configuration
236- vector_dbs:
237- - embedding_dimension: 768
238- embedding_model: sentence-transformers/all-mpnet-base-v2
239- provider_id: your-knowledge-base
240- vector_db_id: your-index-id # ID used during index generation
211+ storage:
212+ backends:
213+ kv_default:
214+ type: kv_sqlite
215+ db_path: ~/.llama/storage/kv_store.db
216+ sql_default:
217+ type: sql_sqlite
218+ db_path: ~/.llama/storage/sql_store.db
219+ byok_backend:
220+ type: kv_sqlite
221+ db_path: /path/to/vector_db/faiss_store.db
222+
223+ registered_resources:
224+ models:
225+ - model_id: your-llm-model
226+ provider_id: openai
227+ model_type: llm
228+ provider_model_id: gpt-4o-mini
229+ - model_id: sentence-transformers/all-mpnet-base-v2
230+ model_type: embedding
231+ provider_id: sentence-transformers
232+ provider_model_id: /path/to/embedding_models/all-mpnet-base-v2
233+ metadata:
234+ embedding_dimension: 768
235+ vector_stores:
236+ - vector_store_id: your-index-id # ID used during index generation
237+ provider_id: your-knowledge-base
238+ embedding_model: sentence-transformers/all-mpnet-base-v2
239+ embedding_dimension: 768
240+ tool_groups:
241+ - toolgroup_id: builtin::rag
242+ provider_id: rag-runtime
241243```
242244
243- **⚠️ Important**: The `vector_db_id ` value must exactly match the ID you provided when creating the vector database using the rag-content tool. This identifier links your Llama Stack configuration to the specific vector database index you created.
245+ **⚠️ Important**: The `vector_store_id` value must exactly match the ID you provided when creating the vector database using the rag-content tool. This identifier links your Llama Stack configuration to the specific vector database index you created.
244246
245247### Step 5: Enable RAG Tools
246248
@@ -260,14 +262,20 @@ The configuration above automatically enables the RAG tools. The system will:
260262- **Storage**: SQLite database file
261263
262264```yaml
263- vector_io:
264- - provider_id: faiss-knowledge
265- provider_type: inline::faiss
266- config:
267- kvstore:
268- type: sqlite
265+ providers:
266+ vector_io:
267+ - provider_id: faiss-knowledge
268+ provider_type: inline::faiss
269+ config:
270+ persistence:
271+ namespace: vector_io::faiss
272+ backend: faiss_backend
273+
274+ storage:
275+ backends:
276+ faiss_backend:
277+ type: kv_sqlite
269278 db_path: /path/to/faiss_store.db
270- namespace: null
271279```
272280
273281### 2. pgvector (PostgreSQL)
@@ -314,19 +322,6 @@ apis:
314322- tool_runtime
315323- safety
316324
317- models:
318- - model_id: gpt-4o-mini
319- provider_id: openai
320- model_type: llm
321- provider_model_id: gpt-4o-mini
322-
323- - model_id: sentence-transformers/all-mpnet-base-v2
324- metadata:
325- embedding_dimension: 768
326- model_type: embedding
327- provider_id: sentence-transformers
328- provider_model_id: /home/user/embedding_models/all-mpnet-base-v2
329-
330325providers:
331326 inference:
332327 - provider_id: sentence-transformers
@@ -341,12 +336,13 @@ providers:
341336 - provider_id: meta-reference
342337 provider_type: inline::meta-reference
343338 config:
344- persistence_store:
345- type: sqlite
346- db_path: .llama/distributions/ollama/agents_store.db
347- responses_store:
348- type: sqlite
349- db_path: .llama/distributions/ollama/responses_store.db
339+ persistence:
340+ agent_state:
341+ namespace: agents_state
342+ backend: kv_default
343+ responses:
344+ table_name: agents_responses
345+ backend: sql_default
350346
351347 safety:
352348 - provider_id: llama-guard
@@ -358,25 +354,47 @@ providers:
358354 - provider_id: company-docs
359355 provider_type: inline::faiss
360356 config:
361- kvstore:
362- type: sqlite
363- db_path: /home/user/vector_dbs/company_docs/faiss_store.db
364- namespace: null
357+ persistence:
358+ namespace: vector_io::faiss
359+ backend: company_docs_backend
365360
366361 tool_runtime:
367362 - provider_id: rag-runtime
368363 provider_type: inline::rag-runtime
369364 config: {}
370365
371- tool_groups:
372- - provider_id: rag-runtime
373- toolgroup_id: builtin::rag
374-
375- vector_dbs:
376- - embedding_dimension: 768
377- embedding_model: sentence-transformers/all-mpnet-base-v2
378- provider_id: company-docs
379- vector_db_id: company-knowledge-index
366+ storage:
367+ backends:
368+ kv_default:
369+ type: kv_sqlite
370+ db_path: ~/.llama/storage/kv_store.db
371+ sql_default:
372+ type: sql_sqlite
373+ db_path: ~/.llama/storage/sql_store.db
374+ company_docs_backend:
375+ type: kv_sqlite
376+ db_path: /home/user/vector_dbs/company_docs/faiss_store.db
377+
378+ registered_resources:
379+ models:
380+ - model_id: gpt-4o-mini
381+ provider_id: openai
382+ model_type: llm
383+ provider_model_id: gpt-4o-mini
384+ - model_id: sentence-transformers/all-mpnet-base-v2
385+ model_type: embedding
386+ provider_id: sentence-transformers
387+ provider_model_id: /home/user/embedding_models/all-mpnet-base-v2
388+ metadata:
389+ embedding_dimension: 768
390+ vector_stores:
391+ - vector_store_id: company-knowledge-index
392+ provider_id: company-docs
393+ embedding_model: sentence-transformers/all-mpnet-base-v2
394+ embedding_dimension: 768
395+ tool_groups:
396+ - toolgroup_id: builtin::rag
397+ provider_id: rag-runtime
380398```
381399
382400### Example 2: vLLM + pgvector
@@ -421,12 +439,13 @@ providers:
421439 - provider_id: meta-reference
422440 provider_type: inline::meta-reference
423441 config:
424- persistence_store:
425- type: sqlite
426- db_path: .llama/distributions/ollama/agents_store.db
427- responses_store:
428- type: sqlite
429- db_path: .llama/distributions/ollama/responses_store.db
442+ persistence:
443+ agent_state:
444+ namespace: agents_state
445+ backend: kv_default
446+ responses:
447+ table_name: agents_responses
448+ backend: sql_default
430449
431450 safety:
432451 - provider_id: llama-guard
@@ -458,11 +477,11 @@ tool_groups:
458477 args: null
459478 mcp_endpoint: null
460479
461- vector_dbs :
480+ vector_stores:
462481- embedding_dimension: 768
463482 embedding_model: sentence-transformers/all-mpnet-base-v2
464483 provider_id: enterprise-knowledge
465- vector_db_id : enterprise-docs
484+ vector_store_id: enterprise-docs
466485` ` `
467486
468487---
0 commit comments