|
15 | 15 | 'No subselect', 'No visual', 'VLM subselect', |
16 | 16 | 'ViLa', 'ViLa fewshot' |
17 | 17 | ], |
18 | | - 'NUM_SOLVED': [0.00, 8.20, 0.00, 0.00, 0.00, 0.00, 0.00, 0.00, 3.80], |
19 | | - 'NUM_SOLVED_STDDEV': [0.00, 1.17, 0.00, 0.00, 0.00, 0.00, 0.00, 0.00, 0.40] |
| 18 | + 'NUM_SOLVED': [0.00, 8.20, 6.40, 0.00, 0.00, 0.00, 0.00, 0.00, 3.80], |
| 19 | + 'NUM_SOLVED_STDDEV': [0.00, 1.17, 3.38, 0.00, 0.00, 0.00, 0.00, 0.00, 0.40] |
20 | 20 | } |
21 | 21 |
|
22 | 22 | data_fatter_burger = { |
|
25 | 25 | 'No subselect', 'No visual', 'VLM subselect', |
26 | 26 | 'ViLa', 'ViLa fewshot' |
27 | 27 | ], |
28 | | - 'NUM_SOLVED': [0.00, 9.60, 1.20, 0.00, 0.00, 1.20, 3.00, 0.80, 3.80], |
29 | | - 'NUM_SOLVED_STDDEV': [0.00, 0.80, 2.40, 0.00, 0.00, 2.40, 1.41, 0.40, 0.40] |
| 28 | + 'NUM_SOLVED': [0.00, 9.60, 1.80, 0.00, 0.00, 1.20, 3.00, 0.80, 3.80], |
| 29 | + 'NUM_SOLVED_STDDEV': [0.00, 0.80, 3.60, 0.00, 0.00, 2.40, 1.41, 0.40, 0.40] |
30 | 30 | } |
31 | 31 |
|
32 | 32 | data_more_stacks = { |
|
35 | 35 | 'No subselect', 'No visual', 'VLM subselect', |
36 | 36 | 'ViLa', 'ViLa fewshot' |
37 | 37 | ], |
38 | | - 'NUM_SOLVED': [0.00, 9.40, 0.00, 0.00, 0.00, 0.00, 3.60, 0.80, 3.80], |
39 | | - 'NUM_SOLVED_STDDEV': [0.00, 0.80, 0.00, 0.00, 0.00, 0.00, 2.24, 1.17, 0.40] |
| 38 | + 'NUM_SOLVED': [0.00, 9.40, 5.20, 0.00, 0.00, 0.00, 3.60, 0.80, 3.80], |
| 39 | + 'NUM_SOLVED_STDDEV': [0.00, 0.80, 4.31, 0.00, 0.00, 0.00, 2.24, 1.17, 0.40] |
40 | 40 | } |
41 | 41 |
|
42 | 42 | data_kitchen_boil_kettle = { |
|
45 | 45 | 'No subselect', 'No visual', 'VLM subselect', |
46 | 46 | 'ViLa', 'ViLa fewshot' |
47 | 47 | ], |
48 | | - 'NUM_SOLVED': [9.60, 9.80, 9.80, 0.00, 0.00, 9.80, 1.00, 6.60, 10.00], |
49 | | - 'NUM_SOLVED_STDDEV': [0.49, 0.40, 0.40, 0.00, 0.00, 0.40, 2.00, 1.02, 0.00] |
| 48 | + 'NUM_SOLVED': [9.60, 9.80, 3.80, 0.00, 0.00, 9.80, 1.00, 6.60, 10.00], |
| 49 | + 'NUM_SOLVED_STDDEV': [0.49, 0.40, 4.66, 0.00, 0.00, 0.40, 2.00, 1.02, 0.00] |
50 | 50 | } |
51 | 51 |
|
52 | 52 | # Convert each dataset to a DataFrame |
|
0 commit comments