-
Notifications
You must be signed in to change notification settings - Fork 21
Expand file tree
/
Copy pathLocalModels.cs
More file actions
335 lines (290 loc) · 12.4 KB
/
LocalModels.cs
File metadata and controls
335 lines (290 loc) · 12.4 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
using MaIN.Domain.Models.Abstract;
namespace MaIN.Domain.Models.Concrete;
// ===== Gemma Family =====
/// <summary>
/// Describes the "Gemma 2B" local model: file <c>Gemma2-2b.gguf</c> with a Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Gemma2_2b()
    : LocalModel(
        Models.Local.Gemma2_2b,
        "Gemma2-2b.gguf",
        new Uri("https://huggingface.co/Inza124/gemma2_2b/resolve/main/gemma2-2b-maIN.gguf?download=true"),
        "Gemma 2B",
        8192,
        "Lightweight 2B model for general-purpose text generation and understanding");
/// <summary>
/// Describes the "Gemma3 4B" local model: file <c>Gemma3-4b.gguf</c> with a Hugging Face download URL.
/// Also implements <see cref="IVisionModel"/>.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Gemma3_4b()
    : LocalModel(
        Models.Local.Gemma3_4b,
        "Gemma3-4b.gguf",
        new Uri("https://huggingface.co/Inza124/Gemma3-4b/resolve/main/gemma3-4b.gguf?download=true"),
        "Gemma3 4B",
        8192,
        "Balanced 4B model for writing, analysis, and mathematical reasoning"),
      IVisionModel
{
    /// <summary>Fixed name of the multimodal projector file that accompanies this model.</summary>
    public string MMProjectName
    {
        get { return "mmproj-model-gemma3-4b.gguf"; }
    }
}
/// <summary>
/// Describes the "Gemma3 12B" local model: file <c>Gemma3-12b.gguf</c> with a Hugging Face download URL.
/// Also implements <see cref="IVisionModel"/>.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Gemma3_12b()
    : LocalModel(
        Models.Local.Gemma3_12b,
        "Gemma3-12b.gguf",
        new Uri("https://huggingface.co/Inza124/Gemma3-12b/resolve/main/gemma3-12b.gguf?download=true"),
        "Gemma3 12B",
        8192,
        "Large 12B model for complex analysis, research, and creative writing"),
      IVisionModel
{
    /// <summary>Fixed name of the multimodal projector file that accompanies this model.</summary>
    public string MMProjectName
    {
        get { return "mmproj-model-gemma3-12b.gguf"; }
    }
}
/// <summary>
/// Describes the "Gemma3n E4B" local model: file <c>Gemma3n-e4b.gguf</c> with a Hugging Face download URL.
/// Also implements <see cref="IVisionModel"/>.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Gemma3n_e4b()
    : LocalModel(
        Models.Local.Gemma3n_e4b,
        "Gemma3n-e4b.gguf",
        new Uri("https://huggingface.co/Inza124/Gemma-3n-e4b/resolve/main/gemma-3n-e4b.gguf?download=true"),
        "Gemma3n E4B",
        8192,
        "Compact 4B model optimized for efficient reasoning and general-purpose tasks"),
      IVisionModel
{
    /// <summary>Fixed name of the multimodal projector file that accompanies this model.</summary>
    public string MMProjectName
    {
        get { return "mmproj-model-gemma3n-e4b.gguf"; }
    }
}
// ===== Llama Family =====
/// <summary>
/// Describes the "Llama 3.2 3B" local model: file <c>Llama3.2-3b.gguf</c> with a Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Llama3_2_3b()
    : LocalModel(
        Models.Local.Llama3_2_3b,
        "Llama3.2-3b.gguf",
        new Uri("https://huggingface.co/Inza124/Llama3.2_3b/resolve/main/Llama3.2-maIN.gguf?download=true"),
        "Llama 3.2 3B",
        8192,
        "Lightweight 3B model for chatbots, content creation, and basic coding");
/// <summary>
/// Describes the "Llama 3.1 8B" local model: file <c>Llama3.1-8b.gguf</c> with a Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Llama3_1_8b()
    : LocalModel(
        Models.Local.Llama3_1_8b,
        "Llama3.1-8b.gguf",
        new Uri("https://huggingface.co/Inza124/Llama3.1_8b/resolve/main/Llama3.1-maIN.gguf?download=true"),
        "Llama 3.1 8B",
        8192,
        "Versatile 8B model for writing, coding, math, and general assistance");
/// <summary>
/// Describes the "LLaVA 7B" local model: file <c>Llava.gguf</c> with a Hugging Face download URL.
/// Also implements <see cref="IVisionModel"/>.
/// </summary>
/// <remarks>
/// The value 4096 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Llava_7b()
    : LocalModel(
        Models.Local.Llava_7b,
        "Llava.gguf",
        new Uri("https://huggingface.co/Inza124/Llava/resolve/main/Llava-maIN.gguf?download=true"),
        "LLaVA 7B",
        4096,
        "Vision-language model for image analysis, OCR, and visual Q&A"),
      IVisionModel
{
    /// <summary>Fixed name of the multimodal projector file that accompanies this model.</summary>
    public string MMProjectName
    {
        get { return "mmproj-model-llava-7b.gguf"; }
    }
}
/// <summary>
/// Describes the "LLaVA 1.6 Mistral 7B" local model: file <c>llava-1.6-mistral-7b.gguf</c> with a
/// Hugging Face download URL. Also implements <see cref="IVisionModel"/>.
/// </summary>
/// <remarks>
/// The value 4096 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Llava16Mistral_7b()
    : LocalModel(
        Models.Local.Llava16Mistral_7b,
        "llava-1.6-mistral-7b.gguf",
        new Uri("https://huggingface.co/cjpais/llava-1.6-mistral-7b-gguf/resolve/main/llava-v1.6-mistral-7b.Q3_K_XS.gguf?download=true"),
        "LLaVA 1.6 Mistral 7B",
        4096,
        "Vision-language model for image analysis, OCR, and visual Q&A"),
      IVisionModel
{
    /// <summary>Fixed name of the multimodal projector file that accompanies this model.</summary>
    public string MMProjectName
    {
        get { return "mmproj-model-llava16Mistral-7b.gguf"; }
    }
}
// ===== Hermes Family =====
/// <summary>
/// Describes the "Hermes 3 3B" local model: file <c>Hermes3-3b.gguf</c> with a Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Hermes3_3b()
    : LocalModel(
        Models.Local.Hermes3_3b,
        "Hermes3-3b.gguf",
        new Uri("https://huggingface.co/Inza124/Hermes3-3b/resolve/main/hermes3-3b.gguf?download=true"),
        "Hermes 3 3B",
        8192,
        "Efficient 3B model for dialogue, roleplay, and conversational AI");
/// <summary>
/// Describes the "Hermes 3 8B" local model: file <c>Hermes3-8b.gguf</c> with a Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Hermes3_8b()
    : LocalModel(
        Models.Local.Hermes3_8b,
        "Hermes3-8b.gguf",
        new Uri("https://huggingface.co/Inza124/Hermes3_8b/resolve/main/hermes3-8b.gguf?download=true"),
        "Hermes 3 8B",
        8192,
        "Enhanced 8B model for complex dialogue, storytelling, and advice");
// ===== Qwen Family =====
/// <summary>
/// Describes the "Qwen 2.5 0.5B" local model: file <c>Qwen2.5-0.5b.gguf</c> with a Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 4096 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Qwen2_5_0_5b()
    : LocalModel(
        Models.Local.Qwen2_5_0_5b,
        "Qwen2.5-0.5b.gguf",
        new Uri("https://huggingface.co/Inza124/Qwen2.5/resolve/main/Qwen2.5-maIN.gguf?download=true"),
        "Qwen 2.5 0.5B",
        4096,
        "Ultra-lightweight 0.5B model for simple text completion and basic tasks");
/// <summary>
/// Describes the "Qwen 2.5 Coder 3B" local model: file <c>Qwen2.5-coder-3b.gguf</c> with a
/// Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Qwen2_5_Coder_3b()
    : LocalModel(
        Models.Local.Qwen2_5_Coder_3b,
        "Qwen2.5-coder-3b.gguf",
        new Uri("https://huggingface.co/Inza124/Qwen2.5-Coder-3b/resolve/main/Qwen2.5-coder-3b.gguf?download=true"),
        "Qwen 2.5 Coder 3B",
        8192,
        "Compact 3B model for Python, JavaScript, bug fixing, and code review");
/// <summary>
/// Describes the "Qwen 2.5 Coder 7B" local model: file <c>Qwen2.5-coder-7b.gguf</c> with a
/// Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Qwen2_5_Coder_7b()
    : LocalModel(
        Models.Local.Qwen2_5_Coder_7b,
        "Qwen2.5-coder-7b.gguf",
        new Uri("https://huggingface.co/Inza124/Qwen2.5-Coder-7b/resolve/main/Qwen2.5-coder-7b.gguf?download=true"),
        "Qwen 2.5 Coder 7B",
        8192,
        "Advanced 7B model for full-stack development, API design, and testing");
/// <summary>
/// Describes the "Qwen 2.5 Coder 14B" local model: file <c>Qwen2.5-coder-14b.gguf</c> with a
/// Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Qwen2_5_Coder_14b()
    : LocalModel(
        Models.Local.Qwen2_5_Coder_14b,
        "Qwen2.5-coder-14b.gguf",
        new Uri("https://huggingface.co/Inza124/Qwen2.5-Coder-14b/resolve/main/Qwen2.5-coder-14b.gguf?download=true"),
        "Qwen 2.5 Coder 14B",
        8192,
        "Professional 14B model for system design, architecture, and code refactoring");
/// <summary>
/// Describes the "Qwen 3 8B" local model: file <c>Qwen3-8b.gguf</c> with a Hugging Face download URL.
/// Also implements <see cref="IReasoningModel"/>.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Qwen3_8b()
    : LocalModel(
        Models.Local.Qwen3_8b,
        "Qwen3-8b.gguf",
        new Uri("https://huggingface.co/Inza124/Qwen3-8b/resolve/main/Qwen3-8b.gguf?download=true"),
        "Qwen 3 8B",
        8192,
        "Fast 8B model for multilingual tasks, translation, and logical reasoning"),
      IReasoningModel
{
    /// <summary>Returns <c>ReasoningFunctions.ProcessDeepSeekToken</c> as the token handler.</summary>
    public Func<string, ThinkingState, LLMTokenValue>? ReasonFunction
    {
        get { return ReasoningFunctions.ProcessDeepSeekToken; }
    }

    /// <summary>Always <c>null</c>: this model supplies no additional prompt text.</summary>
    public string? AdditionalPrompt
    {
        get { return null; }
    }
}
/// <summary>
/// Describes the "Qwen 3 14B" local model: file <c>Qwen3-14b.gguf</c> with a Hugging Face download URL.
/// Also implements <see cref="IReasoningModel"/>.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Qwen3_14b()
    : LocalModel(
        Models.Local.Qwen3_14b,
        "Qwen3-14b.gguf",
        new Uri("https://huggingface.co/Inza124/Qwen3-14b/resolve/main/Qwen3-14b.gguf?download=true"),
        "Qwen 3 14B",
        8192,
        "Advanced 14B model for complex reasoning, research, and document analysis"),
      IReasoningModel
{
    /// <summary>Returns <c>ReasoningFunctions.ProcessDeepSeekToken</c> as the token handler.</summary>
    public Func<string, ThinkingState, LLMTokenValue>? ReasonFunction
    {
        get { return ReasoningFunctions.ProcessDeepSeekToken; }
    }

    /// <summary>Always <c>null</c>: this model supplies no additional prompt text.</summary>
    public string? AdditionalPrompt
    {
        get { return null; }
    }
}
/// <summary>
/// Describes the "QwQ 7B" local model: file <c>QwQ-7b.gguf</c> with a Hugging Face download URL.
/// Also implements <see cref="IReasoningModel"/>.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record QwQ_7b()
    : LocalModel(
        Models.Local.QwQ_7b,
        "QwQ-7b.gguf",
        new Uri("https://huggingface.co/Inza124/QwQ-7b/resolve/main/qwq-7b.gguf?download=true"),
        "QwQ 7B",
        8192,
        "Reasoning-focused 7B model for step-by-step problem solving and analysis"),
      IReasoningModel
{
    /// <summary>Returns <c>ReasoningFunctions.ProcessQwQ_QwenModToken</c> as the token handler.</summary>
    public Func<string, ThinkingState, LLMTokenValue>? ReasonFunction
    {
        get { return ReasoningFunctions.ProcessQwQ_QwenModToken; }
    }

    /// <summary>
    /// Fixed instruction text telling the model to wrap its step-by-step reasoning in think tags
    /// and to put the final answer right after the closing tag.
    /// </summary>
    public string? AdditionalPrompt
    {
        get
        {
            return "- Output nothing before <think>, enclose all step-by-step reasoning (excluding the final answer) within <think>...</think>, and place the final answer immediately after the closing </think>";
        }
    }
}
// ===== DeepSeek Family =====
/// <summary>
/// Describes the "DeepSeek R1 8B" local model: file <c>DeepSeekR1-8b.gguf</c> with a Hugging Face
/// download URL. Also implements <see cref="IReasoningModel"/>.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record DeepSeek_R1_8b()
    : LocalModel(
        Models.Local.DeepSeekR1_8b,
        "DeepSeekR1-8b.gguf",
        new Uri("https://huggingface.co/Inza124/DeepseekR1-8b/resolve/main/DeepSeekR1-8b-maIN.gguf?download=true"),
        "DeepSeek R1 8B",
        8192,
        "Advanced 8B model for math proofs, scientific reasoning, and logical puzzles"),
      IReasoningModel
{
    /// <summary>Returns <c>ReasoningFunctions.ProcessDeepSeekToken</c> as the token handler.</summary>
    public Func<string, ThinkingState, LLMTokenValue>? ReasonFunction
    {
        get { return ReasoningFunctions.ProcessDeepSeekToken; }
    }

    /// <summary>Always <c>null</c>: this model supplies no additional prompt text.</summary>
    public string? AdditionalPrompt
    {
        get { return null; }
    }
}
/// <summary>
/// Describes the "DeepSeek R1 1.5B" local model: file <c>DeepSeekR1-1.5b.gguf</c> with a Hugging Face
/// download URL. Also implements <see cref="IReasoningModel"/>.
/// </summary>
/// <remarks>
/// The value 4096 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record DeepSeek_R1_1_5b()
    : LocalModel(
        Models.Local.DeepSeekR1_1_5b,
        "DeepSeekR1-1.5b.gguf",
        new Uri("https://huggingface.co/Inza124/DeepseekR1-1.5b/resolve/main/DeepSeekR1-1.5b.gguf?download=true"),
        "DeepSeek R1 1.5B",
        4096,
        "Compact 1.5B model for basic logic, simple math, and chain-of-thought tasks"),
      IReasoningModel
{
    /// <summary>Returns <c>ReasoningFunctions.ProcessDeepSeekToken</c> as the token handler.</summary>
    public Func<string, ThinkingState, LLMTokenValue>? ReasonFunction
    {
        get { return ReasoningFunctions.ProcessDeepSeekToken; }
    }

    /// <summary>Always <c>null</c>: this model supplies no additional prompt text.</summary>
    public string? AdditionalPrompt
    {
        get { return null; }
    }
}
// ===== Phi Family =====
/// <summary>
/// Describes the "Phi 3.5 3B" local model: file <c>phi3.5-3b.gguf</c> with a Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 4096 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Phi3_5_3b()
    : LocalModel(
        Models.Local.Phi3_5_3b,
        "phi3.5-3b.gguf",
        new Uri("https://huggingface.co/Inza124/phi3.5-3b/resolve/main/phi3.5-3b.gguf?download=true"),
        "Phi 3.5 3B",
        4096,
        "Efficient 3B model for mobile apps, IoT devices, and edge computing");
/// <summary>
/// Describes the "Phi 4 4B" local model: file <c>phi4-4b.gguf</c> with a Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 4096 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Phi4_4b()
    : LocalModel(
        Models.Local.Phi4_4b,
        "phi4-4b.gguf",
        new Uri("https://huggingface.co/Inza124/Phi4-4b/resolve/main/phi4-4b.gguf?download=true"),
        "Phi 4 4B",
        4096,
        "Latest 4B model for factual Q&A, safety-focused applications, and education");
// ===== Other Models =====
/// <summary>
/// Describes the "LFM2 1.2B" local model: file <c>lfm2-1.2b.gguf</c> with a Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 4096 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record LFM2_1_2b()
    : LocalModel(
        Models.Local.Lfm2_1_2b,
        "lfm2-1.2b.gguf",
        new Uri("https://huggingface.co/Inza124/Lfm2-1.2b/resolve/main/lfm2-1.2b.gguf?download=true"),
        "LFM2 1.2B",
        4096,
        "Lightweight modern 1.2B model for fast inference and resource-constrained environments");
/// <summary>
/// Describes the "MiniCPM4 8B" local model: file <c>Minicpm4-8b.gguf</c> with a Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Minicpm4_8b()
    : LocalModel(
        Models.Local.Minicpm4_8b,
        "Minicpm4-8b.gguf",
        new Uri("https://huggingface.co/Inza124/Minicpm4-8b/resolve/main/MiniCPM4-8b.gguf?download=true"),
        "MiniCPM4 8B",
        8192,
        "Mid-size 8B model balancing performance and efficiency for diverse applications");
/// <summary>
/// Describes the "Mistral 3.2 24B" local model: file <c>Mistral3.2-24b.gguf</c> with a Hugging Face
/// download URL.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Mistral_3_2_24b()
    : LocalModel(
        Models.Local.Mistral3_2_24b,
        "Mistral3.2-24b.gguf",
        new Uri("https://huggingface.co/Inza124/Mistral3.2-24b/resolve/main/Mistral3.2-24b.gguf?download=true"),
        "Mistral 3.2 24B",
        8192,
        "Large 24B model offering advanced reasoning and comprehensive knowledge for complex tasks");
/// <summary>
/// Describes the "Webgen 4B" local model: file <c>webgen-4b.gguf</c> with a Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Webgen_4b()
    : LocalModel(
        Models.Local.Webgen_4b,
        "webgen-4b.gguf",
        new Uri("https://huggingface.co/Inza124/webgen-4b/resolve/main/Webgen-4b.gguf?download=true"),
        "Webgen 4B",
        8192,
        "Specialized 4B model optimized for web development and code generation tasks");
/// <summary>
/// Describes the "Bielik 2.5 11B" local model: file <c>Bielik2.5-11b.gguf</c> with a Hugging Face
/// download URL.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Bielik_2_5_11b()
    : LocalModel(
        Models.Local.Bielik2_5_11b,
        "Bielik2.5-11b.gguf",
        new Uri("https://huggingface.co/Inza124/Bielik2.5-11b/resolve/main/Bielik2.5-11b.gguf?download=true"),
        "Bielik 2.5 11B",
        8192,
        "Large 11B Polish language model with strong multilingual capabilities and reasoning");
/// <summary>
/// Describes the "OlympicCoder 7B" local model: file <c>Olympiccoder-7b.gguf</c> with a Hugging Face
/// download URL.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record OlympicCoder_7b()
    : LocalModel(
        Models.Local.OlympicCoder_7b,
        "Olympiccoder-7b.gguf",
        new Uri("https://huggingface.co/Inza124/OlympicCoder-7b/resolve/main/OlympicCoder-7b.gguf?download=true"),
        "OlympicCoder 7B",
        8192,
        "Specialized 7B model for algorithms, data structures, and contest programming");
/// <summary>
/// Describes the "Yi 6B" local model: file <c>Yi-6b.gguf</c> with a Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 4096 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Yi_6b()
    : LocalModel(
        Models.Local.Yi_6b,
        "Yi-6b.gguf",
        new Uri("https://huggingface.co/Inza124/yi-6b/resolve/main/yi-6b.gguf?download=true"),
        "Yi 6B",
        4096,
        "Bilingual 6B model for Chinese-English translation and cultural content");
/// <summary>
/// Describes the "SmolLM2 0.1B" local model: file <c>Smollm2-0.1b.gguf</c> with a Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 2048 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Smollm2_0_1b()
    : LocalModel(
        Models.Local.Smollm2_0_1b,
        "Smollm2-0.1b.gguf",
        new Uri("https://huggingface.co/Inza124/Smollm2-0.1b/resolve/main/smollm2-0.1b.gguf?download=true"),
        "SmolLM2 0.1B",
        2048,
        "Tiny 0.1B model for keyword extraction, simple classification, and demos");
/// <summary>
/// Describes the "OLMo2 7B" local model: file <c>Olmo2-7b.gguf</c> with a Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
public sealed record Olmo2_7b()
    : LocalModel(
        Models.Local.Olmo2_7b,
        "Olmo2-7b.gguf",
        new Uri("https://huggingface.co/Inza124/Olmo2-7b/resolve/main/olmo2-7b.gguf?download=true"),
        "OLMo2 7B",
        8192,
        "Open-source 7B model for research, benchmarking, and academic studies");
// ===== Image Generation =====
/// <summary>
/// Describes the "FLUX.1 Schnell" local image generation model; implements
/// <see cref="IImageGenerationModel"/>.
/// </summary>
/// <remarks>
/// Unlike the other records in this file, <c>null</c> is passed where they pass a download
/// <see cref="Uri"/>, so no download location is supplied here.
/// The value 4096 is passed in the numeric slot; its meaning for an image model is not visible here.
/// </remarks>
// NOTE(review): the type name and the second argument spell "Shnell" while the display name
// spells "Schnell". Renaming the public type would break callers, so it is left as is.
public sealed record Flux1Shnell()
    : LocalModel(
        Models.Local.Flux1Shnell,
        "FLUX.1_Shnell",
        null,
        "FLUX.1 Schnell",
        4096,
        "Fast local image generation model"),
      IImageGenerationModel;
// ===== Embedding Models =====
/// <summary>
/// Describes the "mxbai-embed-large v1" embedding model: file
/// <c>mxbai-embed-large-v1.Q4_K_M.gguf</c> with a Hugging Face download URL.
/// Implements <see cref="IEmbeddingModel"/> with a fixed dimension of 1024.
/// </summary>
/// <remarks>
/// The value 512 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
// NOTE(review): the identifier is the raw literal "mxbai-embedding", whereas sibling records use
// constants from Models.Local. Confirm whether a matching constant exists and should be used.
public sealed record Mxbai_Embedding()
    : LocalModel(
        "mxbai-embedding",
        "mxbai-embed-large-v1.Q4_K_M.gguf",
        new Uri("https://huggingface.co/ChristianAzinn/mxbai-embed-large-v1-gguf/resolve/main/mxbai-embed-large-v1.Q4_K_M.gguf?download=true"),
        "mxbai-embed-large v1",
        512,
        "Model used to generate embeddings with superior knowledge search recall"),
      IEmbeddingModel
{
    /// <summary>Length of the embedding vectors reported for this model (always 1024).</summary>
    public int EmbeddingDimension
    {
        get { return 1024; }
    }
}
/// <summary>
/// Describes the "Nomic Embedding" local model: file <c>nomicv2.gguf</c> with a Hugging Face download URL.
/// </summary>
/// <remarks>
/// The value 8192 is presumably the context window in tokens; confirm against <see cref="LocalModel"/>.
/// </remarks>
// NOTE(review): this record does not implement IEmbeddingModel, although Mxbai_Embedding in the
// same file does. Confirm whether that is intentional.
public sealed record Nomic_Embedding()
    : LocalModel(
        Models.Local.NomicEmbedding,
        "nomicv2.gguf",
        new Uri("https://huggingface.co/Inza124/Nomic/resolve/main/nomicv2.gguf?download=true"),
        "Nomic Embedding",
        8192,
        "Model used to generate embeddings");
// ===== TTS Model =====
/// <summary>
/// Describes the "Kokoro 82M" text-to-speech model: file <c>kokoro.onnx</c> with a GitHub release
/// download URL. Implements <see cref="ITTSModel"/>.
/// </summary>
/// <remarks>
/// The value 4096 is passed in the numeric slot; its meaning for a TTS model is not visible here.
/// </remarks>
public sealed record Kokoro_82m()
    : LocalModel(
        Models.Local.Kokoro82m,
        "kokoro.onnx",
        new Uri("https://github.com/taylorchu/kokoro-onnx/releases/download/v0.2.0/kokoro.onnx"),
        "Kokoro 82M",
        4096,
        "Frontier TTS model for its size of 82 million parameters (text in/audio out)"),
      ITTSModel;