Skip to content

Commit 916d46f

Browse files
MrFlounder and claude authored
feat(crab-pf): default to gpt-5 with reasoning low (#36)
## Summary

- Changes default provider from `openai:gpt-4o` to `openai:gpt-5`
- Changes default reasoning effort from none to `low`
- Based on 11/11 test results showing GPT-5 low outperforms GPT-4o across all target apps

## Test plan

- [x] Tested all 11 target apps with GPT-5 + reasoning low (11/11 passed)

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
1 parent 1cc404d commit 916d46f

2 files changed

Lines changed: 4 additions & 4 deletions

File tree

plugins/promptfoo/src/agent/providers.ts

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -266,7 +266,7 @@ export function createProvider(provider: string, options?: { reasoningEffort?: s
266266

267267
switch (type) {
268268
case 'openai':
269-
return new OpenAIProvider({ model: model || 'gpt-4o', reasoningEffort: options?.reasoningEffort });
269+
return new OpenAIProvider({ model: model || 'gpt-5', reasoningEffort: options?.reasoningEffort });
270270
case 'anthropic':
271271
return new AnthropicProvider({ model: model || 'claude-sonnet-4-20250514' });
272272
default:

plugins/promptfoo/src/cli.ts

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -23,11 +23,11 @@ async function main() {
2323
// Parse arguments
2424
const filePath = getArg('--file') || getArg('-f');
2525
const urlArg = getArg('--url');
26-
const providerStr = getArg('--provider') || process.env.DISCOVERY_PROVIDER || 'openai:gpt-4o';
26+
const providerStr = getArg('--provider') || process.env.DISCOVERY_PROVIDER || 'openai:gpt-5';
2727
const outputDir = getArg('--output') || getArg('-o') || '.';
2828
const verbose = args.includes('--verbose') || args.includes('-v');
2929
const maxTurns = parseInt(getArg('--max-turns') || '30', 10);
30-
const reasoningEffort = getArg('--reasoning');
30+
const reasoningEffort = getArg('--reasoning') || 'low';
3131

3232
let context: string;
3333

@@ -133,7 +133,7 @@ Options:
133133
--file, -f <path> Read target specification from file
134134
--url <url> Probe a URL directly
135135
--output, -o <dir> Output directory (default: current dir)
136-
--provider <provider> LLM provider (default: openai:gpt-4o)
136+
--provider <provider> LLM provider (default: openai:gpt-5)
137137
--max-turns <n> Max agent turns (default: 30)
138138
--reasoning <effort> Reasoning effort for GPT-5/o-series (low, medium, high)
139139
--verbose, -v Show detailed output

0 commit comments

Comments
 (0)