|
1 | 1 | Model,Mean Similarity,Std. Dev.,Time (s),Cost($) |
2 | | -gemini-2.0-flash,0.829,0.102,7.41,0.00048 |
3 | | -gemini-2.0-flash-001,0.814,0.176,6.85,0.000421 |
4 | | -gemini-1.5-flash,0.797,0.143,9.54,0.000238 |
5 | | -gemini-2.0-pro-exp,0.764,0.227,11.95,TBA |
6 | | -AUTO,0.760,0.184,5.14,0.000217 |
7 | | -gemini-2.0-flash-thinking-exp,0.746,0.266,10.46,TBA |
8 | | -gemini-1.5-pro,0.732,0.265,11.44,0.003332 |
9 | | -accounts/fireworks/models/llama4-maverick-instruct-basic (via Fireworks),0.687,0.221,8.07,0.000419 |
10 | | -gpt-4o,0.687,0.247,10.16,0.004736 |
11 | | -accounts/fireworks/models/llama4-scout-instruct-basic (via Fireworks),0.675,0.184,5.98,0.000226 |
12 | | -gpt-4o-mini,0.642,0.213,9.71,0.000275 |
13 | | -gemma-3-27b-it (via OpenRouter),0.628,0.299,18.79,0.000096 |
14 | | -gemini-1.5-flash-8b,0.551,0.223,3.91,0.000055 |
15 | | -Llama-Vision-Free (via Together AI),0.531,0.198,6.93,0 |
16 | | -Llama-3.2-11B-Vision-Instruct-Turbo (via Together AI),0.524,0.192,3.68,0.00006 |
17 | | -qwen/qwen-2.5-vl-7b-instruct (via OpenRouter),0.482,0.209,11.53,0.000052 |
18 | | -Llama-3.2-90B-Vision-Instruct-Turbo (via Together AI),0.461,0.306,19.26,0.000426 |
19 | | -Llama-3.2-11B-Vision-Instruct (via Hugging Face),0.451,0.257,4.54,0 |
20 | | -microsoft/phi-4-multimodal-instruct (via OpenRouter),0.366,0.287,10.8,0.000019 |
| 2 | +AUTO,0.9055321411253106,0.11206803679187702,9.56385833566839,0.0006787363636363636 |
| 3 | +gemini-2.5-flash,0.8946347816279391,0.1482605007689307,54.099135637283325,0.010509618181818182 |
| 4 | +gemini-1.5-flash,0.8640438576932735,0.19414638131679113,15.467159444635564,0.0004385318181818182 |
| 5 | +gemini-2.0-flash,0.8973145898835583,0.1264561140762329,9.905281933871182,0.0007786000000000001 |
| 6 | +gemini-2.5-pro,0.8490041811304497,0.29783800660442017,101.94726826927878,0.018589318181818183 |
| 7 | +gemini-1.5-pro,0.8677550096512131,0.2834151596237667,15.033603364771063,0.006371590909090909 |
| 8 | +meta-llama/Llama-3.2-90B-Vision-Instruct-Turbo,0.5457486292722399,0.23911002078944002,29.259384870529175,0.011025927272727273 |
| 9 | +google/gemma-3-27b-it,0.681351785269864,0.3342178855563382,19.41191567074169,0.00026869090909090914 |
| 10 | +accounts/fireworks/models/llama4-maverick-instruct-basic,0.7677804033672144,0.23377978676593608,12.122042699293656,0.00150424 |
| 11 | +microsoft/phi-4-multimodal-instruct,0.6218563462318033,0.3203799068287538,13.148698221553456,0.0005001727272727273 |
| 12 | +qwen/qwen-2.5-vl-7b-instruct,0.5585216467675268,0.347746697400353,17.708573601462625,0.0008551818181818182 |
| 13 | +claude-opus-4-20250514,0.7722977101059199,0.23820952402930706,20.034648851914838,0.09206590909090909 |
| 14 | +claude-sonnet-4-20250514,0.8042789811996047,0.18950547739236565,19.26913606036793,0.020705454545454548 |
| 15 | +claude-3-7-sonnet-20250219,0.6333232182237497,0.3691448669615299,14.244156620719217,0.01763318181818182 |
| 16 | +claude-3-5-sonnet-20241022,0.8510506363972368,0.20859878148975006,15.994478832591664,0.01757590909090909 |
| 17 | +gpt-4.1,0.6502514117129463,0.3419725663519831,33.72405509515242,0.014434545454545453 |
| 18 | +gpt-4.1-mini,0.7228987200296618,0.2692251738340237,20.910677563060414,0.0035145090909090913 |
| 19 | +gpt-4o,0.747764892526804,0.2839489784158823,26.799152395941995,0.014775909090909091 |
| 20 | +gpt-4o-mini,0.7329809456847031,0.23116793518719836,18.175196842713788,0.006497863636363636 |
0 commit comments