-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathresources.yaml
More file actions
62 lines (54 loc) · 2.07 KB
/
resources.yaml
File metadata and controls
62 lines (54 loc) · 2.07 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
# Model list: every item below describes one model entry
# (name, backend type, endpoint and optional extra settings).
models:
# Ollama model reached on the local machine.
- name: "gemma3:1b"
  type: "ollama"
  # Written out for illustration only; this is the default host.
  host: "http://localhost:11434"
  # Capability flags declared for this model.
  # NOTE(review): presumably read by whatever client loads this file to
  # decide which features it may use - confirm against the loader.
  info:
    family: "gemma3"
    vision: false
    function_calling: true
    json_output: true
    structured_output: true
    multiple_system_messages: false
# Good for fast testing, but the output quality is very poor.
# No `info` mapping is given for this entry.
# NOTE(review): presumably the loader supplies defaults - confirm.
- name: "qwen:0.5b"
  type: "ollama"
  host: "https://ollama.cloud.intern.mevis.fraunhofer.de"
# Ollama model on the remote Ollama host; no `info` mapping is given.
# NOTE(review): presumably the loader supplies defaults - confirm.
- name: "qwen3:8b"
  type: "ollama"
  host: "https://ollama.cloud.intern.mevis.fraunhofer.de"
# Ollama model on the remote Ollama host; no `info` mapping is given.
# NOTE(review): presumably the loader supplies defaults - confirm.
- name: "qwen3:30b-a3b"
  type: "ollama"
  host: "https://ollama.cloud.intern.mevis.fraunhofer.de"
# Good performance, but slower and more expensive than qwen3:30b-a3b.
- name: "gpt-oss:20b"
  type: "ollama"
  host: "https://ollama.cloud.intern.mevis.fraunhofer.de"
  # Capability flags declared for this model.
  # NOTE(review): presumably read by whatever client loads this file to
  # decide which features it may use - confirm against the loader.
  info:
    family: "gpt-oss"
    vision: false
    function_calling: true
    json_output: true
    structured_output: true
    multiple_system_messages: false
# --------------------------------------------------------------------
# Azure OpenAI models hosted by Fraunhofer.
# See https://fraunhofer.sharepoint.com/sites/it-sicherheit/SitePages/FhGenie-API.aspx for the available FhG models.
# OpenAI-type entry addressed through an Azure endpoint (see `api-base`).
- name: "gpt-4.1-nano"
  type: "openai"
  # Dated deployment identifier paired with the short model name above.
  deployment: "gpt-4.1-nano-2025-04-14"
  api-version: "2025-03-01-preview"
  api-base: "https://fhgenie-api-mevis-mevis-mas.openai.azure.com/openai/v1/"
  # Approximate price in USD per one million input / output tokens.
  # NOTE(review): the leading underscore suggests these keys are
  # informational only - confirm that the loader ignores them.
  _approx-cost-per-input-megatoken_usd: 0.05
  _approx-cost-per-output-megatoken_usd: 0.20
# OpenAI-type entry addressed through an Azure endpoint (see `api-base`).
- name: "gpt-5-nano"
  type: "openai"
  # Dated deployment identifier paired with the short model name above.
  deployment: "gpt-5-nano-2025-08-07"
  api-version: "2025-03-01-preview"
  api-base: "https://fhgenie-api-mevis-mevis-mas.openai.azure.com/openai/v1/"
  # Approximate price in USD per one million input / output tokens.
  # NOTE(review): the leading underscore suggests these keys are
  # informational only - confirm that the loader ignores them.
  _approx-cost-per-input-megatoken_usd: 0.05
  _approx-cost-per-output-megatoken_usd: 0.40
# OpenAI-type entry addressed through an Azure endpoint (see `api-base`).
- name: "gpt-5-mini"
  type: "openai"
  # Dated deployment identifier paired with the short model name above.
  deployment: "gpt-5-mini-2025-08-07"
  api-version: "2025-03-01-preview"
  api-base: "https://fhgenie-api-mevis-mevis-mas.openai.azure.com/openai/v1/"
  # Approximate price in USD per one million input / output tokens.
  # NOTE(review): the leading underscore suggests these keys are
  # informational only - confirm that the loader ignores them.
  _approx-cost-per-input-megatoken_usd: 0.25
  _approx-cost-per-output-megatoken_usd: 2.00