-
Notifications
You must be signed in to change notification settings - Fork 87
Expand file tree
/
Copy pathbasic.sh
More file actions
executable file
·26 lines (24 loc) · 1015 Bytes
/
basic.sh
File metadata and controls
executable file
·26 lines (24 loc) · 1015 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
## Model server settings
# Reference: docs/standup.md
export LLMDBENCH_VLLM_COMMON_NAMESPACE='llmd'
# Deployment method. Accepted values: `modelservice` (llm-d helmchart),
# `standalone` (vLLM deployment), or the name of a SVC.
export LLMDBENCH_DEPLOY_METHODS='modelservice'
# Which model gets deployed
export LLMDBENCH_DEPLOY_MODEL_LIST='ibm-granite/granite-3.1-2b-instruct'

## Benchmark settings
# Reference: docs/run.md
export LLMDBENCH_HARNESS_NAMESPACE='llmdbench'
# Benchmark tool that drives the run
export LLMDBENCH_HARNESS_NAME='guidellm'
# Profile handed to the benchmark tool (left disabled here; uncomment to set it)
#export LLMDBENCH_HARNESS_EXPERIMENT_PROFILE='shared_prefix_synthetic'
# PVC on the cluster where results are saved
export LLMDBENCH_HARNESS_PVC_NAME='workload-pvc'
# Service account the harness is deployed with
export LLMDBENCH_HARNESS_SERVICE_ACCOUNT='default'

## Shared settings
# Local working directory where results are saved
export LLMDBENCH_CONTROL_WORK_DIR='/tmp/modelserve'
# HuggingFace token used when pulling the model/tokenizer.
# TODO: a value must be set here even if it ends up unused.
export LLMDBENCH_HF_TOKEN='llm-d-hf-token'