|
282 | 282 | }, |
283 | 283 | "db_path": { |
284 | 284 | "description": "Path to RAG database.", |
285 | | - "format": "file-path", |
286 | 285 | "title": "DB path", |
287 | 286 | "type": "string" |
| 287 | + }, |
| 288 | + "score_multiplier": { |
| 289 | + "default": 1.0, |
| 290 | + "description": "Multiplier applied to relevance scores from this vector store. Used to weight results when querying multiple knowledge sources. Values > 1 boost this store's results; values < 1 reduce them.", |
| 291 | + "minimum": 0, |
| 292 | + "title": "Score multiplier", |
| 293 | + "type": "number" |
288 | 294 | } |
289 | 295 | }, |
290 | 296 | "required": [ |
|
467 | 473 | "title": "Deployment environment", |
468 | 474 | "type": "string" |
469 | 475 | }, |
470 | | - "solr": { |
471 | | - "anyOf": [ |
472 | | - { |
473 | | - "$ref": "#/components/schemas/SolrConfiguration" |
474 | | - }, |
475 | | - { |
476 | | - "type": "null" |
477 | | - } |
478 | | - ], |
479 | | - "default": null, |
480 | | - "description": "Configuration for Solr vector search operations.", |
481 | | - "title": "Solr configuration" |
| 476 | + "rag": { |
| 477 | + "$ref": "#/components/schemas/RagConfiguration", |
| 478 | + "description": "Configuration for all RAG strategies (inline and tool-based).", |
| 479 | + "title": "RAG configuration" |
| 480 | + }, |
| 481 | + "okp": { |
| 482 | + "$ref": "#/components/schemas/OkpConfiguration", |
| 483 | + "description": "OKP provider settings. Only used when 'okp' is listed in rag.inline or rag.tool.", |
| 484 | + "title": "OKP configuration" |
482 | 485 | } |
483 | 486 | }, |
484 | 487 | "required": [ |
|
898 | 901 | "title": "ModelContextProtocolServer", |
899 | 902 | "type": "object" |
900 | 903 | }, |
| 904 | + "OkpConfiguration": { |
| 905 | + "additionalProperties": false, |
| 906 | + "description": "OKP (Offline Knowledge Portal) provider configuration.\n\nControls provider-specific behaviour for the OKP vector store.\nOnly relevant when ``\"okp\"`` is listed in ``rag.inline`` or ``rag.tool``.", |
| 907 | + "properties": { |
| 908 | + "offline": { |
| 909 | + "default": true, |
| 910 | + "description": "When True, use parent_id for OKP chunk source URLs. When False, use reference_url for chunk source URLs.", |
| 911 | + "title": "OKP offline mode", |
| 912 | + "type": "boolean" |
| 913 | + }, |
| 914 | + "chunk_filter_query": { |
| 915 | + "default": "is_chunk:true", |
| 916 | + "description": "OKP filter query applied to every OKP search request. Defaults to 'is_chunk:true' to restrict results to chunk documents. To add extra constraints, extend the expression using boolean syntax, e.g. 'is_chunk:true AND product:*openshift*'.", |
| 917 | + "title": "OKP chunk filter query", |
| 918 | + "type": "string" |
| 919 | + } |
| 920 | + }, |
| 921 | + "title": "OkpConfiguration", |
| 922 | + "type": "object" |
| 923 | + }, |
901 | 924 | "PostgreSQLDatabaseConfiguration": { |
902 | 925 | "additionalProperties": false, |
903 | 926 | "description": "PostgreSQL database configuration.\n\nPostgreSQL database is used by Lightspeed Core Stack service for storing\ninformation about conversation IDs. It can also be leveraged to store\nconversation history and information about quota usage.\n\nUseful resources:\n\n- [Psycopg: connection classes](https://www.psycopg.org/psycopg3/docs/api/connections.html)\n- [PostgreSQL connection strings](https://www.connectionstrings.com/postgresql/)\n- [How to Use PostgreSQL in Python](https://www.freecodecamp.org/news/postgresql-in-python/)", |
|
1110 | 1133 | "title": "RHIdentityConfiguration", |
1111 | 1134 | "type": "object" |
1112 | 1135 | }, |
| 1136 | + "RagConfiguration": { |
| 1137 | + "additionalProperties": false, |
| 1138 | + "description": "RAG strategy configuration.\n\nControls which RAG sources are used for inline and tool-based retrieval.\n\nEach strategy lists RAG IDs to include. The special ID ``\"okp\"``, defined in constants,\nactivates the OKP provider; all other IDs refer to entries in ``byok_rag``.\n\nBackward compatibility:\n - ``inline`` defaults to ``[]`` (no inline RAG).\n - ``tool`` defaults to ``[]`` (no tool RAG).\n\nIf no RAG strategy is defined (inline and tool are empty),\nthe RAG tool will register all stores available to llama-stack.",
| 1139 | + "properties": { |
| 1140 | + "inline": { |
| 1141 | + "description": "RAG IDs whose sources are injected as context before the LLM call. Use 'okp' to enable OKP inline RAG. Empty by default (no inline RAG).", |
| 1142 | + "items": { |
| 1143 | + "type": "string" |
| 1144 | + }, |
| 1145 | + "title": "Inline RAG IDs", |
| 1146 | + "type": "array" |
| 1147 | + }, |
| 1148 | + "tool": { |
| 1149 | + "description": "RAG IDs made available to the LLM as a file_search tool. Use 'okp' to include the OKP vector store. When omitted, all registered BYOK vector stores are used (backward compatibility).", |
| 1150 | + "items": { |
| 1151 | + "type": "string" |
| 1152 | + }, |
| 1153 | + "title": "Tool RAG IDs", |
| 1154 | + "type": "array" |
| 1155 | + } |
| 1156 | + }, |
| 1157 | + "title": "RagConfiguration", |
| 1158 | + "type": "object" |
| 1159 | + }, |
1113 | 1160 | "SQLiteDatabaseConfiguration": { |
1114 | 1161 | "additionalProperties": false, |
1115 | 1162 | "description": "SQLite database configuration.", |
|
1195 | 1242 | "title": "ServiceConfiguration", |
1196 | 1243 | "type": "object" |
1197 | 1244 | }, |
1198 | | - "SolrConfiguration": { |
1199 | | - "additionalProperties": false, |
1200 | | - "description": "Solr configuration for vector search queries.\n\nControls whether to use offline or online mode when building document URLs\nfrom vector search results, and enables/disables Solr vector IO functionality.", |
1201 | | - "properties": { |
1202 | | - "enabled": { |
1203 | | - "default": false, |
1204 | | - "description": "When True, enables Solr vector IO functionality for vector search queries. When False, disables Solr vector search processing.", |
1205 | | - "title": "Solr enabled", |
1206 | | - "type": "boolean" |
1207 | | - }, |
1208 | | - "offline": { |
1209 | | - "default": true, |
1210 | | - "description": "When True, use parent_id for chunk source URLs. When False, use reference_url for chunk source URLs.", |
1211 | | - "title": "Offline mode", |
1212 | | - "type": "boolean" |
1213 | | - } |
1214 | | - }, |
1215 | | - "title": "SolrConfiguration", |
1216 | | - "type": "object" |
1217 | | - }, |
1218 | 1245 | "SplunkConfiguration": { |
1219 | 1246 | "additionalProperties": false, |
1220 | 1247 | "description": "Splunk HEC (HTTP Event Collector) configuration.\n\nSplunk HEC allows sending events directly to Splunk over HTTP/HTTPS.\nThis configuration is used to send telemetry events for inference\nrequests to the corporate Splunk deployment.\n\nUseful resources:\n\n - [Splunk HEC Docs](https://docs.splunk.com/Documentation/SplunkCloud)\n - [About HEC](https://docs.splunk.com/Documentation/Splunk/latest/Data)", |
|
0 commit comments