We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 1813eaf commit 7003793Copy full SHA for 7003793
2 files changed
examples/inference-deployments/llama2/llama2_13b.yaml
@@ -5,9 +5,8 @@ command: |- # Note this command is a workaround until we build vllm into the inf
5
pip uninstall torch -y
6
pip install torch==2.0.1
7
compute:
8
- gpus: 1
9
- instance: oci.vm.gpu.a10.1
10
-image: mosaicml/inference:0.1.37
11
-cluster: r7z15
+ gpus: 2
+ instance: oci.vm.gpu.a10.2
+image: mosaicml/inference:0.1.40
12
default_model:
13
model_type: llama2-13b
examples/inference-deployments/llama2/llama2_7b_chat.yaml
@@ -7,7 +7,6 @@ command: |- # Note this command is a workaround until we build vllm into the inf
gpus: 1
instance: oci.vm.gpu.a10.1
model_type: llama2-7b-chat
0 commit comments