File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change 1010 "kimi-k2.5" : { "input" : " 0.60" , "output" : " 3.00" },
1111 "kimi-k2-thinking" : { "input" : " 0.60" , "output" : " 3.00" },
1212
13+ "gemma-4-31b" : { "input" : " 0.15" , "output" : " 0.40" },
14+ "gemma-4-26b-a4b" : { "input" : " 0.15" , "output" : " 0.40" },
15+
1316 "qwen3-235b" : { "input" : " 0.40" , "output" : " 3.00" },
1417 "qwen-3-235b" : { "input" : " 0.40" , "output" : " 3.00" },
1518 "qwen3-coder-480b-a35b-instruct" : { "input" : " 0.70" , "output" : " 2.80" },
1619 "qwen3-coder-480b-a35b" : { "input" : " 0.70" , "output" : " 2.80" },
1720 "qwen3-next-80b" : { "input" : " 0.15" , "output" : " 1.50" },
21+ "qwen35-35b-a3b" : { "input" : " 0.30" , "output" : " 1.25" },
22+ "qwen35-9b" : { "input" : " 0.05" , "output" : " 0.15" },
23+
24+ "arcee-trinity-large-thinking" : { "input" : " 0.30" , "output" : " 1.00" },
1825
1926 "minimax-m2.5" : { "input" : " 0.30" , "output" : " 1.20" },
2027
Original file line number Diff line number Diff line change 1717 "tpm" : 1000000 ,
1818 "models" : [
1919 " llama-3.2-3b" ,
20- " llama-3.2-3b:web" ,
21- " qwen3-4b" ,
22- " qwen3-4b:web"
20+ " llama-3.2-3b:web"
2321 ],
2422 "priority" : 25 ,
2523 "description" : " Small models with high throughput limits"
3533 " mistral-31-24b:web" ,
3634 " qwen3-next-80b" ,
3735 " qwen3-next-80b:web" ,
36+ " qwen35-35b-a3b" ,
37+ " qwen35-35b-a3b:web" ,
38+ " qwen35-9b" ,
39+ " qwen35-9b:web" ,
3840 " venice-uncensored" ,
3941 " venice-uncensored:web"
4042 ],
5860 " kimi-k2.5:web" ,
5961 " kimi-k2-thinking" ,
6062 " kimi-k2-thinking:web" ,
63+ " gemma-4-31b" ,
64+ " gemma-4-31b:web" ,
65+ " gemma-4-26b-a4b" ,
66+ " gemma-4-26b-a4b:web" ,
67+ " arcee-trinity-large-thinking" ,
68+ " arcee-trinity-large-thinking:web" ,
6169 " qwen3-235b" ,
6270 " qwen3-235b:web" ,
6371 " qwen3-coder-480b-a35b-instruct" ,
You can’t perform that action at this time.
0 commit comments