55 max_threads : 50 # Maximum number of threads, set to null for Python default. 50 is OK for bigger datasets
66 fail_on_invalid_data : true # If False, don't fail on invalid conversations (e.g. missing context for some metrics)
77 skip_on_failure : false # If True, skip remaining turns when a turn evaluation fails (can be overridden per conversation)
8+ cache_enabled : true # Global cache toggle: if True, LLM-as-a-judge, embedding, and API queries are cached
9+ cache_base_dir : .caches # Global base cache dir; queries are cached separately under /llm (LLM-as-a-judge and embeddings) and /api
810
911# LLM as a judge configuration (Legacy)
1012# Deprecated: top-level llm: (single judge) will be removed — use llm_pool + judge_panel only.
@@ -17,15 +19,11 @@ core:
1719# max_tokens: 512 # Maximum tokens in response
1820# timeout: 300 # Request timeout in seconds
1921# num_retries: 3 # Retry attempts
20- # cache_dir: ".caches/llm_cache" # Directory with LLM cache
21- # cache_enabled: true # Is LLM cache enabled?
2222
2323# Pool of named models (judges reference these IDs)
2424# Default values merge into each model; parameters supports extra provider keys; null removes an inherited parameter.
2525llm_pool :
2626 defaults :
27- cache_enabled : true
28- cache_dir : " .caches/llm_cache"
2927 timeout : 300
3028 num_retries : 3
3129 parameters :
@@ -64,9 +62,6 @@ embedding:
6462 provider : " openai"
6563 model : " text-embedding-3-small"
6664 provider_kwargs : {}
67- cache_dir : " .caches/embedding_cache"
68- cache_enabled : true
69-
7065
7166# Lightspeed-stack API Configuration
7267# To get real time data. Currently it supports lightspeed-stack API.
9085 # Example: extra_request_params:
9186 # mode: troubleshooting
9287 extra_request_params : null
93-
94- cache_dir : " .caches/api_cache" # Directory with lightspeed-stack cache
95- cache_enabled : true # Is lightspeed-stack cache enabled?
9688
9789 # MCP Server Authentication Configuration
9890 mcp_headers :
0 commit comments