Skip to content

Commit b89047d

Browse files
functionstackx, cquil11
authored and committed
remove llama 70b (#149)
1 parent 24ea7de commit b89047d

22 files changed

Lines changed: 0 additions & 1439 deletions

.github/workflows/70b-tmpl.yml

Lines changed: 0 additions & 230 deletions
This file was deleted.

.github/workflows/full-sweep-tmpl.yml

Lines changed: 0 additions & 75 deletions
Original file line number | Diff line number | Diff line change
@@ -37,31 +37,6 @@ on:
3737
default: false
3838

3939
jobs:
40-
_70b-1k1k:
41-
if: ${{ inputs.run_1k1k }}
42-
uses: ./.github/workflows/70b-tmpl.yml
43-
secrets: inherit
44-
with:
45-
exp-name: '70b_1k1k'
46-
isl: 1024
47-
osl: 1024
48-
max-model-len: 2048
49-
random-range-ratio: 0.8
50-
use_h100: ${{ inputs.use_h100 }}
51-
use_h200: ${{ inputs.use_h200 }}
52-
use_b200: ${{ inputs.use_b200 }}
53-
use_mi300x: ${{ inputs.use_mi300x }}
54-
use_mi325x: ${{ inputs.use_mi325x }}
55-
use_mi355x: ${{ inputs.use_mi355x }}
56-
57-
collect-70b-1k1k-results:
58-
needs: _70b-1k1k
59-
if: ${{ inputs.run_1k1k && always() }}
60-
uses: ./.github/workflows/collect-results.yml
61-
secrets: inherit
62-
with:
63-
exp-name: '70b_1k1k'
64-
6540
dsr1-1k1k:
6641
if: ${{ inputs.run_1k1k }}
6742
uses: ./.github/workflows/dsr1-tmpl.yml
@@ -112,31 +87,6 @@ jobs:
11287
with:
11388
exp-name: 'gptoss_1k1k'
11489

115-
_70b-8k1k:
116-
if: ${{ inputs.run_8k1k }}
117-
uses: ./.github/workflows/70b-tmpl.yml
118-
secrets: inherit
119-
with:
120-
exp-name: '70b_8k1k'
121-
isl: 8192
122-
osl: 1024
123-
max-model-len: 9216
124-
random-range-ratio: 0.8
125-
use_h100: ${{ inputs.use_h100 }}
126-
use_h200: ${{ inputs.use_h200 }}
127-
use_b200: ${{ inputs.use_b200 }}
128-
use_mi300x: ${{ inputs.use_mi300x }}
129-
use_mi325x: ${{ inputs.use_mi325x }}
130-
use_mi355x: ${{ inputs.use_mi355x }}
131-
132-
collect-70b-8k1k-results:
133-
needs: _70b-8k1k
134-
if: ${{ inputs.run_8k1k && always() }}
135-
uses: ./.github/workflows/collect-results.yml
136-
secrets: inherit
137-
with:
138-
exp-name: '70b_8k1k'
139-
14090
dsr1-8k1k:
14191
if: ${{ inputs.run_8k1k }}
14292
uses: ./.github/workflows/dsr1-tmpl.yml
@@ -187,31 +137,6 @@ jobs:
187137
with:
188138
exp-name: 'gptoss_8k1k'
189139

190-
_70b-1k8k:
191-
if: ${{ inputs.run_1k8k }}
192-
uses: ./.github/workflows/70b-tmpl.yml
193-
secrets: inherit
194-
with:
195-
exp-name: '70b_1k8k'
196-
isl: 1024
197-
osl: 8192
198-
max-model-len: 9216
199-
random-range-ratio: 0.8
200-
use_h100: ${{ inputs.use_h100 }}
201-
use_h200: ${{ inputs.use_h200 }}
202-
use_b200: ${{ inputs.use_b200 }}
203-
use_mi300x: ${{ inputs.use_mi300x }}
204-
use_mi325x: ${{ inputs.use_mi325x }}
205-
use_mi355x: ${{ inputs.use_mi355x }}
206-
207-
collect-70b-1k8k-results:
208-
needs: _70b-1k8k
209-
if: ${{ inputs.run_1k8k && always() }}
210-
uses: ./.github/workflows/collect-results.yml
211-
secrets: inherit
212-
with:
213-
exp-name: '70b_1k8k'
214-
215140
dsr1-1k8k:
216141
if: ${{ inputs.run_1k8k }}
217142
uses: ./.github/workflows/dsr1-tmpl.yml

.github/workflows/runner-model-sweep-test.yml

Lines changed: 0 additions & 11 deletions
Original file line number | Diff line number | Diff line change
@@ -33,7 +33,6 @@ jobs:
3333
- 'h100-cw_0'
3434
- 'h100-cw_1'
3535
config:
36-
- { image: 'vllm/vllm-openai:v0.10.2', model: 'nvidia/Llama-3.3-70B-Instruct-FP8', framework: 'vllm', precision: 'fp8', exp-name: '70b_test' }
3736
- { image: 'vllm/vllm-openai:v0.10.2', model: 'openai/gpt-oss-120b', framework: 'vllm', precision: 'fp4', exp-name: 'gptoss_test' }
3837

3938
name: '${{ matrix.runner }}'
@@ -70,7 +69,6 @@ jobs:
7069
- 'h200-nv_2'
7170
- 'h200-nv_3'
7271
config:
73-
- { image: 'vllm/vllm-openai:v0.10.2', model: 'nvidia/Llama-3.3-70B-Instruct-FP8', framework: 'vllm', precision: 'fp8', exp-name: '70b_test' }
7472
- { image: 'lmsysorg/sglang:v0.5.2rc2-cu126', model: 'deepseek-ai/DeepSeek-R1-0528', framework: 'sglang', precision: 'fp8', exp-name: 'dsr1_test' }
7573
- { image: 'vllm/vllm-openai:v0.10.2', model: 'openai/gpt-oss-120b', framework: 'vllm', precision: 'fp4', exp-name: 'gptoss_test' }
7674

@@ -108,7 +106,6 @@ jobs:
108106
- 'h200-nv_2'
109107
- 'h200-nv_3'
110108
config:
111-
- { image: 'nvcr.io#nvidia/tensorrt-llm/release:1.1.0rc2.post2', model: 'nvidia/Llama-3.3-70B-Instruct-FP8', framework: 'trt', precision: 'fp8', exp-name: '70b_test' }
112109
- { image: 'nvcr.io#nvidia/tensorrt-llm/release:1.1.0rc2.post2', model: 'deepseek-ai/DeepSeek-R1-0528', framework: 'trt', precision: 'fp8', exp-name: 'dsr1_test' }
113110
- { image: 'nvcr.io#nvidia/tensorrt-llm/release:1.1.0rc2.post2', model: 'openai/gpt-oss-120b', framework: 'trt', precision: 'fp4', exp-name: 'gptoss_test' }
114111

@@ -140,8 +137,6 @@ jobs:
140137
- 'b200-nvd_2'
141138
- 'b200-nvd_3'
142139
config:
143-
- { image: 'vllm/vllm-openai:v0.10.2', model: 'nvidia/Llama-3.3-70B-Instruct-FP8', framework: 'vllm', precision: 'fp8', exp-name: '70b_test' }
144-
- { image: 'vllm/vllm-openai:v0.10.2', model: 'nvidia/Llama-3.3-70B-Instruct-FP4', framework: 'vllm', precision: 'fp4', exp-name: '70b_test' }
145140
- { image: 'lmsysorg/sglang:v0.5.3rc1-cu129-b200', model: 'deepseek-ai/DeepSeek-R1-0528', framework: 'sglang', precision: 'fp8', exp-name: 'dsr1_test' }
146141
- { image: 'lmsysorg/sglang:v0.5.3rc1-cu129-b200', model: 'nvidia/DeepSeek-R1-0528-FP4', framework: 'sglang', precision: 'fp4', exp-name: 'dsr1_test' }
147142
- { image: 'vllm/vllm-openai:v0.10.2', model: 'openai/gpt-oss-120b', framework: 'vllm', precision: 'fp4', exp-name: 'gptoss_test' }
@@ -174,8 +169,6 @@ jobs:
174169
- 'b200-nb_0'
175170
- 'b200-nb_1'
176171
config:
177-
- { image: 'nvcr.io#nvidia/tensorrt-llm/release:1.1.0rc2.post2', model: 'nvidia/Llama-3.3-70B-Instruct-FP8', framework: 'trt', precision: 'fp8', exp-name: '70b_test' }
178-
- { image: 'nvcr.io#nvidia/tensorrt-llm/release:1.1.0rc2.post2', model: 'nvidia/Llama-3.3-70B-Instruct-FP4', framework: 'trt', precision: 'fp4', exp-name: '70b_test' }
179172
- { image: 'nvcr.io#nvidia/tensorrt-llm/release:1.1.0rc2.post2', model: 'deepseek-ai/DeepSeek-R1-0528', framework: 'trt', precision: 'fp8', exp-name: 'dsr1_test' }
180173
- { image: 'nvcr.io#nvidia/tensorrt-llm/release:1.1.0rc2.post2', model: 'nvidia/DeepSeek-R1-0528-FP4', framework: 'trt', precision: 'fp4', exp-name: 'dsr1_test' }
181174
- { image: 'nvcr.io#nvidia/tensorrt-llm/release:1.1.0rc2.post2', model: 'openai/gpt-oss-120b', framework: 'trt', precision: 'fp4', exp-name: 'gptoss_test' }
@@ -211,7 +204,6 @@ jobs:
211204
- 'mi300x-cr_0'
212205
- 'mi300x-oci_0'
213206
config:
214-
- { image: 'rocm/7.0:rocm7.0_ubuntu_22.04_vllm_0.10.1_instinct_20250927_rc1', model: 'amd/Llama-3.3-70B-Instruct-FP8-KV', framework: 'vllm', precision: 'fp8', exp-name: '70b_test' }
215207
- { image: 'rocm/7.0:rocm7.0_ubuntu_22.04_sgl-dev-v0.5.2-rocm7.0-mi30x-20250915', model: 'deepseek-ai/DeepSeek-R1-0528', framework: 'sglang', precision: 'fp8', exp-name: 'dsr1_test' }
216208
- { image: 'rocm/7.0:rocm7.0_ubuntu_22.04_vllm_0.10.1_instinct_20250927_rc1', model: 'openai/gpt-oss-120b', framework: 'vllm', precision: 'fp4', exp-name: 'gptoss_test' }
217209

@@ -244,7 +236,6 @@ jobs:
244236
- 'mi325x-tw_2'
245237
- 'mi325x-tw_3'
246238
config:
247-
- { image: 'rocm/7.0:rocm7.0_ubuntu_22.04_vllm_0.10.1_instinct_20250927_rc1', model: 'amd/Llama-3.3-70B-Instruct-FP8-KV', framework: 'vllm', precision: 'fp8', exp-name: '70b_test' }
248239
- { image: 'rocm/7.0:rocm7.0_ubuntu_22.04_sgl-dev-v0.5.2-rocm7.0-mi30x-20250915', model: 'deepseek-ai/DeepSeek-R1-0528', framework: 'sglang', precision: 'fp8', exp-name: 'dsr1_test' }
249240
- { image: 'rocm/7.0:rocm7.0_ubuntu_22.04_vllm_0.10.1_instinct_20250927_rc1', model: 'openai/gpt-oss-120b', framework: 'vllm', precision: 'fp4', exp-name: 'gptoss_test' }
250241

@@ -276,8 +267,6 @@ jobs:
276267
- 'mi355x-amd_2'
277268
- 'mi355x-amd_3'
278269
config:
279-
- { image: 'rocm/7.0:rocm7.0_ubuntu_22.04_vllm_0.10.1_instinct_20250927_rc1', model: 'amd/Llama-3.3-70B-Instruct-FP8-KV', framework: 'vllm', precision: 'fp8', exp-name: '70b_test' }
280-
- { image: 'rocm/7.0:rocm7.0_ubuntu_22.04_vllm_0.10.1_instinct_20250927_rc1', model: 'amd/Llama-3.3-70B-Instruct-MXFP4-Preview', framework: 'vllm', precision: 'fp4', exp-name: '70b_test' }
281270
- { image: 'rocm/7.0:rocm7.0_ubuntu_22.04_sgl-dev-v0.5.2-rocm7.0-mi35x-20250915', model: 'deepseek-ai/DeepSeek-R1-0528', framework: 'sglang', precision: 'fp8', exp-name: 'dsr1_test' }
282271
- { image: 'rocm/7.0:rocm7.0_ubuntu_22.04_sgl-dev-v0.5.2-rocm7.0-mi35x-20250915', model: 'amd/DeepSeek-R1-0528-MXFP4-Preview', framework: 'sglang', precision: 'fp4', exp-name: 'dsr1_test' }
283272
- { image: 'rocm/7.0:rocm7.0_ubuntu_22.04_vllm_0.10.1_instinct_20250927_rc1', model: 'openai/gpt-oss-120b', framework: 'vllm', precision: 'fp4', exp-name: 'gptoss_test' }

0 commit comments

Comments (0)