Skip to content

Commit 40c616c

Browse files
committed
v0.9.3: 修复图像生成模式 edit 的分流错误;进一步提升环境安装便利性;新增 GPT Image 2 模型支持
1 parent 310a40b commit 40c616c

63 files changed

Lines changed: 8179 additions & 2690 deletions

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

VERSION

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
0.9.2
1+
0.9.3
Lines changed: 254 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,254 @@
1+
{
2+
"arm_a": {
3+
"label": "BASELINE",
4+
"model": "aws.claude-sonnet-4.6",
5+
"rounds": [
6+
{
7+
"round_num": 1,
8+
"arm": "BASELINE",
9+
"msg_count": 4,
10+
"est_tokens_before_compact": 428,
11+
"est_tokens_after_compact": 428,
12+
"tokens_saved_by_compact": 0,
13+
"prompt_tokens": 1,
14+
"cache_read": 0,
15+
"cache_write": 1500,
16+
"output_tokens": 150,
17+
"elapsed": 0.0,
18+
"status": "SIM",
19+
"error": ""
20+
},
21+
{
22+
"round_num": 2,
23+
"arm": "BASELINE",
24+
"msg_count": 7,
25+
"est_tokens_before_compact": 1067,
26+
"est_tokens_after_compact": 1067,
27+
"tokens_saved_by_compact": 0,
28+
"prompt_tokens": 1,
29+
"cache_read": 0,
30+
"cache_write": 1400,
31+
"output_tokens": 150,
32+
"elapsed": 0.0,
33+
"status": "SIM",
34+
"error": ""
35+
},
36+
{
37+
"round_num": 3,
38+
"arm": "BASELINE",
39+
"msg_count": 10,
40+
"est_tokens_before_compact": 2088,
41+
"est_tokens_after_compact": 2088,
42+
"tokens_saved_by_compact": 0,
43+
"prompt_tokens": 88,
44+
"cache_read": 0,
45+
"cache_write": 1300,
46+
"output_tokens": 150,
47+
"elapsed": 0.0,
48+
"status": "SIM",
49+
"error": ""
50+
},
51+
{
52+
"round_num": 4,
53+
"arm": "BASELINE",
54+
"msg_count": 13,
55+
"est_tokens_before_compact": 2718,
56+
"est_tokens_after_compact": 2464,
57+
"tokens_saved_by_compact": 254,
58+
"prompt_tokens": 464,
59+
"cache_read": 0,
60+
"cache_write": 1200,
61+
"output_tokens": 150,
62+
"elapsed": 0.0,
63+
"status": "SIM",
64+
"error": ""
65+
},
66+
{
67+
"round_num": 5,
68+
"arm": "BASELINE",
69+
"msg_count": 16,
70+
"est_tokens_before_compact": 3070,
71+
"est_tokens_after_compact": 2299,
72+
"tokens_saved_by_compact": 771,
73+
"prompt_tokens": 299,
74+
"cache_read": 0,
75+
"cache_write": 1100,
76+
"output_tokens": 150,
77+
"elapsed": 0.0,
78+
"status": "SIM",
79+
"error": ""
80+
},
81+
{
82+
"round_num": 6,
83+
"arm": "BASELINE",
84+
"msg_count": 19,
85+
"est_tokens_before_compact": 4079,
86+
"est_tokens_after_compact": 2411,
87+
"tokens_saved_by_compact": 1668,
88+
"prompt_tokens": 411,
89+
"cache_read": 0,
90+
"cache_write": 1000,
91+
"output_tokens": 150,
92+
"elapsed": 0.0,
93+
"status": "SIM",
94+
"error": ""
95+
},
96+
{
97+
"round_num": 7,
98+
"arm": "BASELINE",
99+
"msg_count": 22,
100+
"est_tokens_before_compact": 4696,
101+
"est_tokens_after_compact": 2511,
102+
"tokens_saved_by_compact": 2185,
103+
"prompt_tokens": 511,
104+
"cache_read": 0,
105+
"cache_write": 900,
106+
"output_tokens": 150,
107+
"elapsed": 0.0,
108+
"status": "SIM",
109+
"error": ""
110+
},
111+
{
112+
"round_num": 8,
113+
"arm": "BASELINE",
114+
"msg_count": 25,
115+
"est_tokens_before_compact": 5047,
116+
"est_tokens_after_compact": 2609,
117+
"tokens_saved_by_compact": 2438,
118+
"prompt_tokens": 609,
119+
"cache_read": 0,
120+
"cache_write": 800,
121+
"output_tokens": 150,
122+
"elapsed": 0.0,
123+
"status": "SIM",
124+
"error": ""
125+
}
126+
]
127+
},
128+
"arm_b": {
129+
"label": "PAIRED",
130+
"model": "aws.claude-sonnet-4.6",
131+
"rounds": [
132+
{
133+
"round_num": 1,
134+
"arm": "PAIRED",
135+
"msg_count": 4,
136+
"est_tokens_before_compact": 428,
137+
"est_tokens_after_compact": 428,
138+
"tokens_saved_by_compact": 0,
139+
"prompt_tokens": 1,
140+
"cache_read": 0,
141+
"cache_write": 1500,
142+
"output_tokens": 150,
143+
"elapsed": 0.0,
144+
"status": "SIM",
145+
"error": ""
146+
},
147+
{
148+
"round_num": 2,
149+
"arm": "PAIRED",
150+
"msg_count": 7,
151+
"est_tokens_before_compact": 1067,
152+
"est_tokens_after_compact": 1067,
153+
"tokens_saved_by_compact": 0,
154+
"prompt_tokens": 1,
155+
"cache_read": 0,
156+
"cache_write": 1400,
157+
"output_tokens": 150,
158+
"elapsed": 0.0,
159+
"status": "SIM",
160+
"error": ""
161+
},
162+
{
163+
"round_num": 3,
164+
"arm": "PAIRED",
165+
"msg_count": 10,
166+
"est_tokens_before_compact": 2088,
167+
"est_tokens_after_compact": 2088,
168+
"tokens_saved_by_compact": 0,
169+
"prompt_tokens": 88,
170+
"cache_read": 0,
171+
"cache_write": 1300,
172+
"output_tokens": 150,
173+
"elapsed": 0.0,
174+
"status": "SIM",
175+
"error": ""
176+
},
177+
{
178+
"round_num": 4,
179+
"arm": "PAIRED",
180+
"msg_count": 13,
181+
"est_tokens_before_compact": 2718,
182+
"est_tokens_after_compact": 2428,
183+
"tokens_saved_by_compact": 290,
184+
"prompt_tokens": 428,
185+
"cache_read": 0,
186+
"cache_write": 1200,
187+
"output_tokens": 150,
188+
"elapsed": 0.0,
189+
"status": "SIM",
190+
"error": ""
191+
},
192+
{
193+
"round_num": 5,
194+
"arm": "PAIRED",
195+
"msg_count": 16,
196+
"est_tokens_before_compact": 3070,
197+
"est_tokens_after_compact": 2224,
198+
"tokens_saved_by_compact": 846,
199+
"prompt_tokens": 224,
200+
"cache_read": 0,
201+
"cache_write": 1100,
202+
"output_tokens": 150,
203+
"elapsed": 0.0,
204+
"status": "SIM",
205+
"error": ""
206+
},
207+
{
208+
"round_num": 6,
209+
"arm": "PAIRED",
210+
"msg_count": 19,
211+
"est_tokens_before_compact": 4079,
212+
"est_tokens_after_compact": 2305,
213+
"tokens_saved_by_compact": 1774,
214+
"prompt_tokens": 305,
215+
"cache_read": 0,
216+
"cache_write": 1000,
217+
"output_tokens": 150,
218+
"elapsed": 0.0,
219+
"status": "SIM",
220+
"error": ""
221+
},
222+
{
223+
"round_num": 7,
224+
"arm": "PAIRED",
225+
"msg_count": 22,
226+
"est_tokens_before_compact": 4696,
227+
"est_tokens_after_compact": 2376,
228+
"tokens_saved_by_compact": 2320,
229+
"prompt_tokens": 376,
230+
"cache_read": 0,
231+
"cache_write": 900,
232+
"output_tokens": 150,
233+
"elapsed": 0.0,
234+
"status": "SIM",
235+
"error": ""
236+
},
237+
{
238+
"round_num": 8,
239+
"arm": "PAIRED",
240+
"msg_count": 25,
241+
"est_tokens_before_compact": 5047,
242+
"est_tokens_after_compact": 2451,
243+
"tokens_saved_by_compact": 2596,
244+
"prompt_tokens": 451,
245+
"cache_read": 0,
246+
"cache_write": 800,
247+
"output_tokens": 150,
248+
"elapsed": 0.0,
249+
"status": "SIM",
250+
"error": ""
251+
}
252+
]
253+
}
254+
}

0 commit comments

Comments
 (0)