@@ -149,25 +149,25 @@ Run evaluators against historical agent traces.
149149
150150``` bash
151151# Project mode — evaluate a project agent
152- agentcore run evals \
152+ agentcore run eval \
153153 --agent MyAgent \
154154 --evaluator ResponseQuality \
155155 --days 7
156156
157157# Standalone mode — evaluate any agent by ARN
158- agentcore run evals \
158+ agentcore run eval \
159159 --agent-arn arn:aws:bedrock-agentcore:us-east-1:123456789012:runtime/abc123 \
160160 --evaluator-arn arn:aws:bedrock-agentcore:us-east-1:123456789012:evaluator/eval123 \
161161 --region us-east-1
162162
163163# Multiple evaluators
164- agentcore run evals \
164+ agentcore run eval \
165165 --agent MyAgent \
166166 --evaluator ResponseQuality Builtin.Faithfulness \
167167 --days 14
168168
169169# Target specific session or trace
170- agentcore run evals \
170+ agentcore run eval \
171171 --agent MyAgent \
172172 --evaluator ResponseQuality \
173173 --session-id abc123 \
@@ -359,7 +359,7 @@ AgentCore provides pre-built evaluators that can be used without creating custom
359359by their `Builtin.*` ID in `--evaluator` flags or in online eval config `evaluators` arrays.
360360
361361``` bash
362- agentcore run evals --agent MyAgent --evaluator Builtin.Faithfulness
362+ agentcore run eval --agent MyAgent --evaluator Builtin.Faithfulness
363363```
364364
365365---
@@ -369,8 +369,8 @@ agentcore run evals --agent MyAgent --evaluator Builtin.Faithfulness
369369### CI/CD Quality Gate
370370
371371``` bash
372- # Run evals and fail pipeline if score < threshold
373- result=$(agentcore run evals --agent MyAgent --evaluator ResponseQuality --days 1 --json)
372+ # Run eval and fail pipeline if score < threshold
373+ result=$(agentcore run eval --agent MyAgent --evaluator ResponseQuality --days 1 --json)
374374score=$(echo "$result" | jq '.run.results[0].aggregateScore')
375375if (( $(echo "$score < 0.7" | bc -l) )); then
376376 echo "Quality gate failed: score $score < 0.7"
@@ -389,7 +389,7 @@ agentcore add evaluator \
389389 --instructions "Evaluate the agent response quality. Context: {context}"
390390
391391# 2. Run on-demand eval to verify
392- agentcore run evals --agent MyAgent --evaluator ResponseQuality --days 7
392+ agentcore run eval --agent MyAgent --evaluator ResponseQuality --days 7
393393
394394# 3. Set up continuous monitoring
395395agentcore add online-eval \
@@ -407,7 +407,7 @@ agentcore deploy
407407Evaluate agents and use evaluators outside of a project directory using ARNs:
408408
409409``` bash
410- agentcore run evals \
410+ agentcore run eval \
411411 --agent-arn arn:aws:bedrock-agentcore:us-east-1:123456789012:runtime/my-agent \
412412 --evaluator-arn arn:aws:bedrock-agentcore:us-east-1:123456789012:evaluator/my-eval \
413413 --region us-east-1 \
0 commit comments