File tree Expand file tree Collapse file tree
charts/all/vllm-inference-service/templates Expand file tree Collapse file tree Original file line number Diff line number Diff line change 4141 name : models
4242 - mountPath : /cache
4343 name : cache
44+ - mountPath : /.cache
45+ name : dotcache
46+ - mountPath : /.config
47+ name : dotconfig
48+ - mountPath : /.triton
49+ name : dottriton
4450 multiModel : false
4551 supportedModelFormats :
4652 - autoSelect : true
5460 emptyDir : {}
5561 - name : cache
5662 emptyDir : {}
63+ - name : dotcache
64+ emptyDir : {}
65+ - name : dotconfig
66+ emptyDir : {}
67+ - name : dottriton
68+ emptyDir : {}
Original file line number Diff line number Diff line change 1+ global :
2+ model :
3+ vllm : ibm-granite/granite-4.0-h-350m
4+
5+ vllmServingRuntime :
6+ args :
7+ - /cache/models
8+
9+ command : []
10+
11+ image :
12+ repository : vllm/vllm-openai
13+ tag : v0.21.0
Original file line number Diff line number Diff line change @@ -75,6 +75,8 @@ clusterGroup:
7575 selfHeal : true
7676 retry :
7777 limit : 20
78+ extraValueFiles :
79+ - /overrides/vllm-inference-service-ci.yaml
7880 rag-llm :
7981 name : rag-llm
8082 namespace : rag-llm
You can’t perform that action at this time.
0 commit comments