Skip to content

Commit 4f1c566

Browse files
authored
Add a number of HF suts from the Big Model List. (#996)
1 parent 29944ad commit 4f1c566

1 file changed

Lines changed: 21 additions & 23 deletions

File tree

plugins/huggingface/modelgauge/suts/huggingface_chat_completion.py

Lines changed: 21 additions & 23 deletions
Original file line number | Diff line number | Diff line change
@@ -165,39 +165,37 @@ def translate_text_prompt(self, prompt: TextPrompt, options: SUTOptions) -> Hugg
165165

166166
HF_SECRET = InjectSecret(HuggingFaceInferenceToken)
167167

168-
SUTS.register(
169-
HuggingFaceChatCompletionDedicatedSUT,
170-
"gemma-2-9b-it-hf",
171-
"gemma-2-9b-it-plf",
172-
HF_SECRET,
173-
)
174-
175-
SUTS.register(
176-
HuggingFaceChatCompletionDedicatedSUT,
177-
"mistral-nemo-instruct-2407-hf",
178-
"mistral-nemo-instruct-2407-mgt",
179-
HF_SECRET,
180-
)
181-
182168
SUTS.register(
183169
HuggingFaceChatCompletionDedicatedSUT,
184170
"nvidia-llama-3-1-nemotron-nano-8b-v1",
185171
"llama-3-1-nemotron-nano-8b-v-uhu",
186172
HF_SECRET,
187173
)
188174

175+
DEDICATED_SUTS_AND_SERVERS = {
176+
"gemma-2-9b-it": "plf",
177+
"llama-3-1-tulu-3-8b": "bzk", # check
178+
"mistral-nemo-instruct-2407": "mgt",
179+
"olmo-2-0325-32b-instruct": "yft",
180+
"qwen2-5-7b-instruct": "hgy",
181+
"qwq-32b": "usw",
182+
"yi-1-5-34b-chat": "nlm", # check
183+
}
184+
185+
for sut, endpoint in DEDICATED_SUTS_AND_SERVERS.items():
186+
SUTS.register(
187+
HuggingFaceChatCompletionDedicatedSUT,
188+
sut + "-hf",
189+
sut + "-" + endpoint,
190+
HF_SECRET,
191+
)
189192

190-
SUTS.register(
191-
HuggingFaceChatCompletionDedicatedSUT,
192-
"qwen2-5-7b-instruct-hf",
193-
"qwen2-5-7b-instruct-hgy",
194-
HF_SECRET,
195-
)
196193

197194
SUTS.register(
198-
HuggingFaceChatCompletionDedicatedSUT,
199-
"olmo-2-0325-32b-instruct-hf",
200-
"olmo-2-0325-32b-instruct-yft",
195+
HuggingFaceChatCompletionServerlessSUT,
196+
"meta-llama-3_1-8b-instruct-hf",
197+
"meta-llama/Llama-3.1-8B-Instruct",
198+
"hf-inference",
201199
HF_SECRET,
202200
)
203201

0 commit comments

Comments
 (0)