diff --git a/.agentv/targets.yaml b/.agentv/targets.yaml index b552e7809..7586f1a2e 100644 --- a/.agentv/targets.yaml +++ b/.agentv/targets.yaml @@ -32,13 +32,13 @@ targets: provider: copilot-cli model: ${{ COPILOT_MODEL }} grader_target: grader - log_format: json + stream_log: raw - name: copilot-sdk provider: copilot-sdk model: ${{ COPILOT_MODEL }} grader_target: grader - log_format: json + stream_log: raw - name: copilot-sdk-azure provider: copilot-sdk @@ -48,7 +48,7 @@ targets: base_url: ${{ AZURE_OPENAI_ENDPOINT }} api_key: ${{ AZURE_OPENAI_API_KEY }} grader_target: grader - log_format: json + stream_log: raw - name: claude provider: claude-cli @@ -85,12 +85,23 @@ targets: - name: pi-sdk provider: pi-coding-agent - subprovider: openrouter - model: ${{ OPENROUTER_MODEL }} - api_key: ${{ OPENROUTER_API_KEY }} - grader_target: grader - tools: read,bash,edit,write - log_format: json + subprovider: openai + base_url: ${{ OPENAI_ENDPOINT }} + api_key: ${{ OPENAI_API_KEY }} + model: gpt-5.5 + grader_target: openai + thinking: low + stream_log: raw + + - name: pi-sdk-openai + provider: pi-coding-agent + subprovider: openai + base_url: ${{ OPENAI_ENDPOINT }} + api_key: ${{ OPENAI_API_KEY }} + model: gpt-5.5 + grader_target: openai + thinking: low + stream_log: raw - name: pi-azure provider: pi-cli @@ -104,11 +115,11 @@ targets: provider: pi-coding-agent subprovider: azure base_url: ${{ AZURE_OPENAI_ENDPOINT }} - model: ${{ AZURE_DEPLOYMENT_NAME }} + model: gpt-5.5 api_key: ${{ AZURE_OPENAI_API_KEY }} grader_target: grader - tools: read,bash,edit,write - log_format: json + thinking: low + stream_log: raw - name: codex provider: codex diff --git a/apps/cli/src/templates/.agentv/targets.yaml b/apps/cli/src/templates/.agentv/targets.yaml index d0fbd7af9..c95f7decc 100644 --- a/apps/cli/src/templates/.agentv/targets.yaml +++ b/apps/cli/src/templates/.agentv/targets.yaml @@ -24,7 +24,7 @@ targets: # - ${{ CODEX_APPROVAL_PRESET }} cwd: ${{ CODEX_WORKSPACE_DIR }} # Where scratch workspaces are created log_dir: ${{ CODEX_LOG_DIR }} # Optional: where Codex CLI stream logs are stored (defaults to ./.agentv/logs/codex) - log_format: json # Optional: 'summary' (default) or 'json' for raw event logs + stream_log: raw # Optional: 'summary' for consolidated logs or 'raw' for per-event logs # Claude - Anthropic's Claude Agent SDK - name: claude @@ -36,7 +36,7 @@ targets: # max_turns: 50 # Optional: max conversation turns # max_budget_usd: 5.0 # Optional: max cost budget in USD # log_dir: ${{ CLAUDE_LOG_DIR }} # Optional: where stream logs are stored (defaults to ./.agentv/logs/claude) - log_format: json # Optional: 'summary' (default) or 'json' for raw event logs + stream_log: raw # Optional: 'summary' for consolidated logs or 'raw' for per-event logs # system_prompt: optional override (default instructs agent to include code in response) - name: azure-llm diff --git a/packages/core/src/evaluation/validation/targets-validator.ts b/packages/core/src/evaluation/validation/targets-validator.ts index 6e22f4f35..63950aa7b 100644 --- a/packages/core/src/evaluation/validation/targets-validator.ts +++ b/packages/core/src/evaluation/validation/targets-validator.ts @@ -124,6 +124,7 @@ const COPILOT_SDK_SETTINGS = new Set([ 'timeout_seconds', 'log_dir', 'log_format', + 'stream_log', 'system_prompt', 'byok', ]); @@ -140,6 +141,7 @@ const COPILOT_CLI_SETTINGS = new Set([ 'timeout_seconds', 'log_dir', 'log_format', + 'stream_log', 'system_prompt', ]); @@ -173,6 +175,7 @@ const CLAUDE_SETTINGS = new Set([ 'log_directory', 'log_format', 'log_output_format', + 'stream_log', 'system_prompt', 'max_turns', 'max_budget_usd',