We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents 5b473a6 + 0f6c40d commit 3de9afd
1 file changed
overrides/values-cpu.yaml
@@ -8,18 +8,20 @@ global:
8
enabled: true
9
resources:
10
limits:
11
- cpu: "4"
12
- memory: 32Gi
+ cpu: "6"
+ memory: 48Gi
13
requests:
14
- cpu: "1"
15
- memory: 16Gi
+ cpu: "2"
+ memory: 24Gi
16
args:
17
- --enable-auto-tool-choice
18
- --chat-template
19
- /chat-templates/tool_chat_template_llama3.2_json.jinja
20
- --tool-call-parser
21
- llama3_json
22
+ - --dtype
23
+ - auto
24
- --max-model-len
- - "8192"
25
+ - "16384"
26
- --max-num-seqs
- - "2"
27
+ - "1"
0 commit comments