@@ -165,39 +165,37 @@ def translate_text_prompt(self, prompt: TextPrompt, options: SUTOptions) -> Hugg
165165
# Injected Hugging Face inference token; passed as the final argument to the
# SUTS.register(...) calls in this module.
HF_SECRET = InjectSecret(HuggingFaceInferenceToken)
167167
168- SUTS .register (
169- HuggingFaceChatCompletionDedicatedSUT ,
170- "gemma-2-9b-it-hf" ,
171- "gemma-2-9b-it-plf" ,
172- HF_SECRET ,
173- )
174-
175- SUTS .register (
176- HuggingFaceChatCompletionDedicatedSUT ,
177- "mistral-nemo-instruct-2407-hf" ,
178- "mistral-nemo-instruct-2407-mgt" ,
179- HF_SECRET ,
180- )
181-
# The SUT key and the second name do not share a common stem here, so both
# strings are spelled out in full rather than derived from one another.
# NOTE(review): the second string is presumably the dedicated endpoint
# name -- confirm against HuggingFaceChatCompletionDedicatedSUT.
SUTS.register(
    HuggingFaceChatCompletionDedicatedSUT,
    "nvidia-llama-3-1-nemotron-nano-8b-v1",
    "llama-3-1-nemotron-nano-8b-v-uhu",
    HF_SECRET,
)
188174
# Maps a model name to the short suffix that is appended to it in the second
# string passed to SUTS.register below.
DEDICATED_SUTS_AND_SERVERS = {
    "gemma-2-9b-it": "plf",
    "llama-3-1-tulu-3-8b": "bzk",  # TODO: check (flagged by the author)
    "mistral-nemo-instruct-2407": "mgt",
    "olmo-2-0325-32b-instruct": "yft",
    "qwen2-5-7b-instruct": "hgy",
    "qwq-32b": "usw",
    "yi-1-5-34b-chat": "nlm",  # TODO: check (flagged by the author)
}

# Register one dedicated SUT per table entry: the SUT key is "<model>-hf"
# and the second string is "<model>-<suffix>".
for sut, endpoint in DEDICATED_SUTS_AND_SERVERS.items():
    SUTS.register(
        HuggingFaceChatCompletionDedicatedSUT,
        f"{sut}-hf",
        f"{sut}-{endpoint}",
        HF_SECRET,
    )
189192
190- SUTS .register (
191- HuggingFaceChatCompletionDedicatedSUT ,
192- "qwen2-5-7b-instruct-hf" ,
193- "qwen2-5-7b-instruct-hgy" ,
194- HF_SECRET ,
195- )
196193
# Serverless registration: unlike the dedicated SUTs, this call passes two
# strings after the SUT key.
# NOTE(review): these look like a Hugging Face model id and a provider
# name -- confirm against HuggingFaceChatCompletionServerlessSUT.
SUTS.register(
    HuggingFaceChatCompletionServerlessSUT,
    "meta-llama-3_1-8b-instruct-hf",
    "meta-llama/Llama-3.1-8B-Instruct",
    "hf-inference",
    HF_SECRET,
)
203201
0 commit comments