Skip to content

Commit bced9db

Browse files
authored
Merge pull request #228 from MorpheusAIs/feature/update-pricing
update pricing
2 parents f512b39 + 2575f68 commit bced9db

2 files changed

Lines changed: 18 additions & 3 deletions

File tree

models/prod_model_price.json

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -10,11 +10,18 @@
1010
"kimi-k2.5": { "input": "0.60", "output": "3.00" },
1111
"kimi-k2-thinking": { "input": "0.60", "output": "3.00" },
1212

13+
"gemma-4-31b": { "input": "0.15", "output": "0.40" },
14+
"gemma-4-26b-a4b": { "input": "0.15", "output": "0.40" },
15+
1316
"qwen3-235b": { "input": "0.40", "output": "3.00" },
1417
"qwen-3-235b": { "input": "0.40", "output": "3.00" },
1518
"qwen3-coder-480b-a35b-instruct": { "input": "0.70", "output": "2.80" },
1619
"qwen3-coder-480b-a35b": { "input": "0.70", "output": "2.80" },
1720
"qwen3-next-80b": { "input": "0.15", "output": "1.50" },
21+
"qwen35-35b-a3b": { "input": "0.30", "output": "1.25" },
22+
"qwen35-9b": { "input": "0.05", "output": "0.15" },
23+
24+
"arcee-trinity-large-thinking": { "input": "0.30", "output": "1.00" },
1825

1926
"minimax-m2.5": { "input": "0.30", "output": "1.20" },
2027

models/prod_rate_limit.json

Lines changed: 11 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -17,9 +17,7 @@
1717
"tpm": 1000000,
1818
"models": [
1919
"llama-3.2-3b",
20-
"llama-3.2-3b:web",
21-
"qwen3-4b",
22-
"qwen3-4b:web"
20+
"llama-3.2-3b:web"
2321
],
2422
"priority": 25,
2523
"description": "Small models with high throughput limits"
@@ -35,6 +33,10 @@
3533
"mistral-31-24b:web",
3634
"qwen3-next-80b",
3735
"qwen3-next-80b:web",
36+
"qwen35-35b-a3b",
37+
"qwen35-35b-a3b:web",
38+
"qwen35-9b",
39+
"qwen35-9b:web",
3840
"venice-uncensored",
3941
"venice-uncensored:web"
4042
],
@@ -58,6 +60,12 @@
5860
"kimi-k2.5:web",
5961
"kimi-k2-thinking",
6062
"kimi-k2-thinking:web",
63+
"gemma-4-31b",
64+
"gemma-4-31b:web",
65+
"gemma-4-26b-a4b",
66+
"gemma-4-26b-a4b:web",
67+
"arcee-trinity-large-thinking",
68+
"arcee-trinity-large-thinking:web",
6169
"qwen3-235b",
6270
"qwen3-235b:web",
6371
"qwen3-coder-480b-a35b-instruct",

0 commit comments

Comments
 (0)