|
3664 | 3664 | "rlsapi-v1" |
3665 | 3665 | ], |
3666 | 3666 | "summary": "Infer Endpoint", |
3667 | | - "description": "Handle rlsapi v1 /infer requests for stateless inference.\n\nThis endpoint serves requests from the RHEL Lightspeed Command Line Assistant (CLA).\n\nAccepts a question with optional context (stdin, attachments, terminal output,\nsystem info) and returns an LLM-generated response.\n\nArgs:\n infer_request: The inference request containing question and context.\n auth: Authentication tuple from the configured auth provider.\n\nReturns:\n RlsapiV1InferResponse containing the generated response text and request ID.\n\nRaises:\n HTTPException: 503 if the LLM service is unavailable.", |
| 3667 | + "description": "Handle rlsapi v1 /infer requests for stateless inference.\n\nThis endpoint serves requests from the RHEL Lightspeed Command Line Assistant (CLA).\n\nAccepts a question with optional context (stdin, attachments, terminal output,\nsystem info) and returns an LLM-generated response.\n\nArgs:\n infer_request: The inference request containing question and context.\n request: The FastAPI request object for accessing headers and state.\n background_tasks: FastAPI background tasks for async Splunk event sending.\n auth: Authentication tuple from the configured auth provider.\n\nReturns:\n RlsapiV1InferResponse containing the generated response text and request ID.\n\nRaises:\n HTTPException: 503 if the LLM service is unavailable.", |
3668 | 3668 | "operationId": "infer_endpoint_v1_infer_post", |
3669 | 3669 | "requestBody": { |
3670 | 3670 | "content": { |
|
4290 | 4290 | ], |
4291 | 4291 | "summary": "Handle A2A Jsonrpc", |
4292 | 4292 | "description": "Handle A2A JSON-RPC requests following the A2A protocol specification.\n\nThis endpoint uses the DefaultRequestHandler from the A2A SDK to handle\nall JSON-RPC requests including message/send, message/stream, etc.\n\nThe A2A SDK application is created per-request to include authentication\ncontext while still leveraging FastAPI's authorization middleware.\n\nAutomatically detects streaming requests (message/stream JSON-RPC method)\nand returns a StreamingResponse to enable real-time chunk delivery.\n\nArgs:\n request: FastAPI request object\n auth: Authentication tuple\n mcp_headers: MCP headers for context propagation\n\nReturns:\n JSON-RPC response or streaming response", |
4293 | | - "operationId": "handle_a2a_jsonrpc_a2a_get", |
| 4293 | + "operationId": "handle_a2a_jsonrpc_a2a_post", |
4294 | 4294 | "responses": { |
4295 | 4295 | "200": { |
4296 | 4296 | "description": "Successful Response", |
|
4308 | 4308 | ], |
4309 | 4309 | "summary": "Handle A2A Jsonrpc", |
4310 | 4310 | "description": "Handle A2A JSON-RPC requests following the A2A protocol specification.\n\nThis endpoint uses the DefaultRequestHandler from the A2A SDK to handle\nall JSON-RPC requests including message/send, message/stream, etc.\n\nThe A2A SDK application is created per-request to include authentication\ncontext while still leveraging FastAPI's authorization middleware.\n\nAutomatically detects streaming requests (message/stream JSON-RPC method)\nand returns a StreamingResponse to enable real-time chunk delivery.\n\nArgs:\n request: FastAPI request object\n auth: Authentication tuple\n mcp_headers: MCP headers for context propagation\n\nReturns:\n JSON-RPC response or streaming response", |
4311 | | - "operationId": "handle_a2a_jsonrpc_a2a_get", |
| 4311 | + "operationId": "handle_a2a_jsonrpc_a2a_post", |
4312 | 4312 | "responses": { |
4313 | 4313 | "200": { |
4314 | 4314 | "description": "Successful Response", |
|
6957 | 6957 | ], |
6958 | 6958 | "title": "Llama Stack configuration path", |
6959 | 6959 | "description": "Path to configuration file used when Llama Stack is run in library mode" |
| 6960 | + }, |
| 6961 | + "timeout": { |
| 6962 | + "type": "integer", |
| 6963 | + "exclusiveMinimum": 0.0, |
| 6964 | + "title": "Request timeout", |
| 6965 | + "description": "Timeout in seconds for requests to Llama Stack service. Default is 180 seconds (3 minutes) to accommodate long-running RAG queries.", |
| 6966 | + "default": 180 |
6960 | 6967 | } |
6961 | 6968 | }, |
6962 | 6969 | "additionalProperties": false, |
|
0 commit comments