We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 2263fa6, commit a609a0f. Copy full SHA for a609a0f
2 files changed
example_comparisons/api_models.yaml
@@ -0,0 +1,26 @@
1
+# Example comparison config: API models on WAA tasks
2
+# Usage:
3
+# python scripts/compare_models.py --config example_comparisons/api_models.yaml
4
+# python scripts/compare_models.py --config example_comparisons/api_models.yaml --manage-vm --setup-tunnels
5
+
6
+name: "API Model Comparison"
7
+description: "Compare GPT-5.4-mini vs GPT-4o-mini as unified desktop agents"
8
9
+tasks:
10
+ - example_tasks/notepad-hello.yaml
11
+ - example_tasks/clear-browsing-data-chrome.yaml
12
13
+models:
14
+ - name: gpt-5.4-mini
15
+ provider: openai
16
+ type: unified
17
18
+ - name: gpt-4o-mini
19
20
21
22
+server_url: http://localhost:5001
23
+max_steps: 10
24
+runs_per_config: 1
25
+save_screenshots: true
26
+output_dir: comparison_results/
0 commit comments