We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 682324e commit b15bb51Copy full SHA for b15bb51
1 file changed
xinference/model/llm/llm_family.json
@@ -29821,6 +29821,24 @@
29821
}
29822
29823
},
29824
+ {
29825
+ "model_size_in_billions": 31,
29826
+ "model_format": "fp4",
29827
+ "model_src": {
29828
+ "huggingface": {
29829
+ "model_id": "nvidia/Gemma-4-31B-IT-NVFP4",
29830
+ "quantizations": [
29831
+ "FP4"
29832
+ ]
29833
+ },
29834
+ "modelscope": {
29835
+ "model_id": "nv-community/Gemma-4-31B-IT-NVFP4",
29836
29837
29838
29839
+ }
29840
29841
29842
{
29843
"model_size_in_billions": 26,
29844
"model_format": "pytorch",
@@ -30212,6 +30230,6 @@
30212
30230
]
30213
30231
30214
30232
"featured": true,
30215
- "updated_at": 1775810942
30233
+ "updated_at": 1775834800
30216
30234
30217
30235
0 commit comments