1+ {
2+ "arm_a" : {
3+ "label" : " BASELINE" ,
4+ "model" : " aws.claude-sonnet-4.6" ,
5+ "rounds" : [
6+ {
7+ "round_num" : 1 ,
8+ "arm" : " BASELINE" ,
9+ "msg_count" : 4 ,
10+ "est_tokens_before_compact" : 428 ,
11+ "est_tokens_after_compact" : 428 ,
12+ "tokens_saved_by_compact" : 0 ,
13+ "prompt_tokens" : 1 ,
14+ "cache_read" : 0 ,
15+ "cache_write" : 1500 ,
16+ "output_tokens" : 150 ,
17+ "elapsed" : 0.0 ,
18+ "status" : " SIM" ,
19+ "error" : " "
20+ },
21+ {
22+ "round_num" : 2 ,
23+ "arm" : " BASELINE" ,
24+ "msg_count" : 7 ,
25+ "est_tokens_before_compact" : 1067 ,
26+ "est_tokens_after_compact" : 1067 ,
27+ "tokens_saved_by_compact" : 0 ,
28+ "prompt_tokens" : 1 ,
29+ "cache_read" : 0 ,
30+ "cache_write" : 1400 ,
31+ "output_tokens" : 150 ,
32+ "elapsed" : 0.0 ,
33+ "status" : " SIM" ,
34+ "error" : " "
35+ },
36+ {
37+ "round_num" : 3 ,
38+ "arm" : " BASELINE" ,
39+ "msg_count" : 10 ,
40+ "est_tokens_before_compact" : 2088 ,
41+ "est_tokens_after_compact" : 2088 ,
42+ "tokens_saved_by_compact" : 0 ,
43+ "prompt_tokens" : 88 ,
44+ "cache_read" : 0 ,
45+ "cache_write" : 1300 ,
46+ "output_tokens" : 150 ,
47+ "elapsed" : 0.0 ,
48+ "status" : " SIM" ,
49+ "error" : " "
50+ },
51+ {
52+ "round_num" : 4 ,
53+ "arm" : " BASELINE" ,
54+ "msg_count" : 13 ,
55+ "est_tokens_before_compact" : 2718 ,
56+ "est_tokens_after_compact" : 2464 ,
57+ "tokens_saved_by_compact" : 254 ,
58+ "prompt_tokens" : 464 ,
59+ "cache_read" : 0 ,
60+ "cache_write" : 1200 ,
61+ "output_tokens" : 150 ,
62+ "elapsed" : 0.0 ,
63+ "status" : " SIM" ,
64+ "error" : " "
65+ },
66+ {
67+ "round_num" : 5 ,
68+ "arm" : " BASELINE" ,
69+ "msg_count" : 16 ,
70+ "est_tokens_before_compact" : 3070 ,
71+ "est_tokens_after_compact" : 2299 ,
72+ "tokens_saved_by_compact" : 771 ,
73+ "prompt_tokens" : 299 ,
74+ "cache_read" : 0 ,
75+ "cache_write" : 1100 ,
76+ "output_tokens" : 150 ,
77+ "elapsed" : 0.0 ,
78+ "status" : " SIM" ,
79+ "error" : " "
80+ },
81+ {
82+ "round_num" : 6 ,
83+ "arm" : " BASELINE" ,
84+ "msg_count" : 19 ,
85+ "est_tokens_before_compact" : 4079 ,
86+ "est_tokens_after_compact" : 2411 ,
87+ "tokens_saved_by_compact" : 1668 ,
88+ "prompt_tokens" : 411 ,
89+ "cache_read" : 0 ,
90+ "cache_write" : 1000 ,
91+ "output_tokens" : 150 ,
92+ "elapsed" : 0.0 ,
93+ "status" : " SIM" ,
94+ "error" : " "
95+ },
96+ {
97+ "round_num" : 7 ,
98+ "arm" : " BASELINE" ,
99+ "msg_count" : 22 ,
100+ "est_tokens_before_compact" : 4696 ,
101+ "est_tokens_after_compact" : 2511 ,
102+ "tokens_saved_by_compact" : 2185 ,
103+ "prompt_tokens" : 511 ,
104+ "cache_read" : 0 ,
105+ "cache_write" : 900 ,
106+ "output_tokens" : 150 ,
107+ "elapsed" : 0.0 ,
108+ "status" : " SIM" ,
109+ "error" : " "
110+ },
111+ {
112+ "round_num" : 8 ,
113+ "arm" : " BASELINE" ,
114+ "msg_count" : 25 ,
115+ "est_tokens_before_compact" : 5047 ,
116+ "est_tokens_after_compact" : 2609 ,
117+ "tokens_saved_by_compact" : 2438 ,
118+ "prompt_tokens" : 609 ,
119+ "cache_read" : 0 ,
120+ "cache_write" : 800 ,
121+ "output_tokens" : 150 ,
122+ "elapsed" : 0.0 ,
123+ "status" : " SIM" ,
124+ "error" : " "
125+ }
126+ ]
127+ },
128+ "arm_b" : {
129+ "label" : " PAIRED" ,
130+ "model" : " aws.claude-sonnet-4.6" ,
131+ "rounds" : [
132+ {
133+ "round_num" : 1 ,
134+ "arm" : " PAIRED" ,
135+ "msg_count" : 4 ,
136+ "est_tokens_before_compact" : 428 ,
137+ "est_tokens_after_compact" : 428 ,
138+ "tokens_saved_by_compact" : 0 ,
139+ "prompt_tokens" : 1 ,
140+ "cache_read" : 0 ,
141+ "cache_write" : 1500 ,
142+ "output_tokens" : 150 ,
143+ "elapsed" : 0.0 ,
144+ "status" : " SIM" ,
145+ "error" : " "
146+ },
147+ {
148+ "round_num" : 2 ,
149+ "arm" : " PAIRED" ,
150+ "msg_count" : 7 ,
151+ "est_tokens_before_compact" : 1067 ,
152+ "est_tokens_after_compact" : 1067 ,
153+ "tokens_saved_by_compact" : 0 ,
154+ "prompt_tokens" : 1 ,
155+ "cache_read" : 0 ,
156+ "cache_write" : 1400 ,
157+ "output_tokens" : 150 ,
158+ "elapsed" : 0.0 ,
159+ "status" : " SIM" ,
160+ "error" : " "
161+ },
162+ {
163+ "round_num" : 3 ,
164+ "arm" : " PAIRED" ,
165+ "msg_count" : 10 ,
166+ "est_tokens_before_compact" : 2088 ,
167+ "est_tokens_after_compact" : 2088 ,
168+ "tokens_saved_by_compact" : 0 ,
169+ "prompt_tokens" : 88 ,
170+ "cache_read" : 0 ,
171+ "cache_write" : 1300 ,
172+ "output_tokens" : 150 ,
173+ "elapsed" : 0.0 ,
174+ "status" : " SIM" ,
175+ "error" : " "
176+ },
177+ {
178+ "round_num" : 4 ,
179+ "arm" : " PAIRED" ,
180+ "msg_count" : 13 ,
181+ "est_tokens_before_compact" : 2718 ,
182+ "est_tokens_after_compact" : 2428 ,
183+ "tokens_saved_by_compact" : 290 ,
184+ "prompt_tokens" : 428 ,
185+ "cache_read" : 0 ,
186+ "cache_write" : 1200 ,
187+ "output_tokens" : 150 ,
188+ "elapsed" : 0.0 ,
189+ "status" : " SIM" ,
190+ "error" : " "
191+ },
192+ {
193+ "round_num" : 5 ,
194+ "arm" : " PAIRED" ,
195+ "msg_count" : 16 ,
196+ "est_tokens_before_compact" : 3070 ,
197+ "est_tokens_after_compact" : 2224 ,
198+ "tokens_saved_by_compact" : 846 ,
199+ "prompt_tokens" : 224 ,
200+ "cache_read" : 0 ,
201+ "cache_write" : 1100 ,
202+ "output_tokens" : 150 ,
203+ "elapsed" : 0.0 ,
204+ "status" : " SIM" ,
205+ "error" : " "
206+ },
207+ {
208+ "round_num" : 6 ,
209+ "arm" : " PAIRED" ,
210+ "msg_count" : 19 ,
211+ "est_tokens_before_compact" : 4079 ,
212+ "est_tokens_after_compact" : 2305 ,
213+ "tokens_saved_by_compact" : 1774 ,
214+ "prompt_tokens" : 305 ,
215+ "cache_read" : 0 ,
216+ "cache_write" : 1000 ,
217+ "output_tokens" : 150 ,
218+ "elapsed" : 0.0 ,
219+ "status" : " SIM" ,
220+ "error" : " "
221+ },
222+ {
223+ "round_num" : 7 ,
224+ "arm" : " PAIRED" ,
225+ "msg_count" : 22 ,
226+ "est_tokens_before_compact" : 4696 ,
227+ "est_tokens_after_compact" : 2376 ,
228+ "tokens_saved_by_compact" : 2320 ,
229+ "prompt_tokens" : 376 ,
230+ "cache_read" : 0 ,
231+ "cache_write" : 900 ,
232+ "output_tokens" : 150 ,
233+ "elapsed" : 0.0 ,
234+ "status" : " SIM" ,
235+ "error" : " "
236+ },
237+ {
238+ "round_num" : 8 ,
239+ "arm" : " PAIRED" ,
240+ "msg_count" : 25 ,
241+ "est_tokens_before_compact" : 5047 ,
242+ "est_tokens_after_compact" : 2451 ,
243+ "tokens_saved_by_compact" : 2596 ,
244+ "prompt_tokens" : 451 ,
245+ "cache_read" : 0 ,
246+ "cache_write" : 800 ,
247+ "output_tokens" : 150 ,
248+ "elapsed" : 0.0 ,
249+ "status" : " SIM" ,
250+ "error" : " "
251+ }
252+ ]
253+ }
254+ }
0 commit comments