# File: docker-compose.agent-eval-llm.yml
# Forked from opensearch-project/observability-stack
# LLM Eval Canary
# Periodically runs LLM-as-judge (Bedrock Claude) on agent traces.
# Requires AWS credentials via AWS_* env vars.
#
# Enable by uncommenting INCLUDE_COMPOSE_AGENT_EVAL_LLM in .env
# Shared logging settings, anchored as &logging so that services can reuse
# them through the *logging alias instead of repeating the mapping.
x-default-logging: &logging
  driver: "json-file"
  options:
    # Options handed to the json-file log driver (size/count caps per container).
    max-size: "5m"
    max-file: "2"
    # Go-template log tag; Docker expands {{.Name}} to the container name.
    tag: "{{.Name}}"

services:
  # LLM-as-judge canary service; the image is built from the local context below.
  example-agent-eval-canary-llm:
    build:
      context: ./docker-compose/agent-eval-canary-llm
      dockerfile: Dockerfile
    container_name: agent-eval-canary-llm
    environment:
      # OpenSearch connection; host, port and credentials are interpolated
      # from the environment / .env with no defaults.
      - OPENSEARCH_HOST=https://${OPENSEARCH_HOST}:${OPENSEARCH_PORT}
      - OPENSEARCH_USER=${OPENSEARCH_USER}
      - OPENSEARCH_PASSWORD=${OPENSEARCH_PASSWORD}
      # NOTE(review): unlike OPENSEARCH_HOST, no URL scheme is prepended here;
      # confirm the canary's OTLP exporter accepts a bare host:port endpoint.
      - OTEL_EXPORTER_OTLP_ENDPOINT=${OTEL_COLLECTOR_HOST}:${OTEL_COLLECTOR_PORT_GRPC}
      # Canary tuning knobs; the value after ":-" is used when the variable
      # is unset or empty. Units are not visible here (interval is presumably
      # seconds; verify against the canary code).
      - EVAL_CANARY_LLM_INTERVAL=${EVAL_CANARY_LLM_INTERVAL:-60}
      - EVAL_CANARY_LLM_LOOKBACK_MINUTES=${EVAL_CANARY_LLM_LOOKBACK_MINUTES:-10}
      - EVAL_CANARY_LLM_MAX_PER_CYCLE=${EVAL_CANARY_LLM_MAX_PER_CYCLE:-20}
      - EVAL_CANARY_LLM_CONCURRENCY=${EVAL_CANARY_LLM_CONCURRENCY:-8}
      - EVAL_JUDGE_MODEL=${EVAL_JUDGE_MODEL:-us.anthropic.claude-sonnet-4-20250514-v1:0}
      # AWS credentials are passed through from the host; the three secrets
      # default to empty strings when unset, the region to us-west-2.
      - AWS_ACCESS_KEY_ID=${AWS_ACCESS_KEY_ID:-}
      - AWS_SECRET_ACCESS_KEY=${AWS_SECRET_ACCESS_KEY:-}
      - AWS_SESSION_TOKEN=${AWS_SESSION_TOKEN:-}
      - AWS_REGION=${AWS_REGION:-us-west-2}
    # These services and the network below are not declared in this file;
    # presumably they come from the main compose file this one is included
    # alongside (verify).
    depends_on:
      - opensearch
      - otel-collector
    networks:
      - observability-stack-network
    restart: unless-stopped
    deploy:
      resources:
        limits:
          memory: 512M
    logging: *logging