adding more workflows #16
Workflow file for this run
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# Benchmark sweep workflow; the name and lock group suggest the
# 1k-input / 8k-output sequence-length scenario (confirm against the
# sweep config generator).
name: "1K/8K Sweep"

# All runs of this workflow share one concurrency group, so they do not
# execute at the same time. A newer run never cancels one in progress.
concurrency:
  group: benchmark-lock-1k8k
  cancel-in-progress: false

# Single trigger mapping. The file previously declared `on:` twice, which
# is a duplicate key: invalid YAML, and with last-wins parsing the
# `schedule` trigger would be dropped silently.
on:
  # pull_request:
  workflow_dispatch:
  schedule:
    # Every day at 23:00 (GitHub evaluates cron expressions in UTC).
    - cron: '0 23 * * *'
# Pipeline shape, repeated for each model family (70b, dsr1, gptoss):
#   get-<model>-configs   -> emits the sweep matrix as JSON
#   benchmark-<model>     -> one reusable-workflow call per matrix entry
#   collect-<model>-results -> gathers results, even if benchmarks failed
jobs:
  # ---------------------------------------------------------------------
  # Config generation. Each job runs generate_sweep_configs.py in
  # `full-sweep` mode over the NVIDIA and AMD master configs, restricted
  # to `--seq-lens 1k8k` and one `--model-prefix`, and publishes the
  # result as the `search-space-config` job output.
  # NOTE(review): the `key=value` form written to GITHUB_OUTPUT assumes
  # the script prints single-line JSON; multi-line output would need the
  # heredoc delimiter syntax. Confirm against the script.
  # ---------------------------------------------------------------------
  get-70b-configs:
    runs-on: ubuntu-latest
    outputs:
      search-space-config: ${{ steps.get-70b-configs.outputs.search-space-config }}
    steps:
      - name: Checkout code
        uses: actions/checkout@v4

      - id: get-70b-configs
        run: |
          CONFIG_JSON=$(python3 "${GITHUB_WORKSPACE}/utils/matrix-logic/generate_sweep_configs.py" full-sweep \
            --config-files \
              "${GITHUB_WORKSPACE}/.github/configs/nvidia-master.yaml" \
              "${GITHUB_WORKSPACE}/.github/configs/amd-master.yaml" \
            --seq-lens 1k8k \
            --model-prefix 70b)
          echo "search-space-config=$CONFIG_JSON" >> "$GITHUB_OUTPUT"

  get-dsr1-configs:
    runs-on: ubuntu-latest
    outputs:
      search-space-config: ${{ steps.get-dsr1-configs.outputs.search-space-config }}
    steps:
      - name: Checkout code
        uses: actions/checkout@v4

      - id: get-dsr1-configs
        run: |
          CONFIG_JSON=$(python3 "${GITHUB_WORKSPACE}/utils/matrix-logic/generate_sweep_configs.py" full-sweep \
            --config-files \
              "${GITHUB_WORKSPACE}/.github/configs/nvidia-master.yaml" \
              "${GITHUB_WORKSPACE}/.github/configs/amd-master.yaml" \
            --seq-lens 1k8k \
            --model-prefix dsr1)
          echo "search-space-config=$CONFIG_JSON" >> "$GITHUB_OUTPUT"

  get-gptoss-configs:
    runs-on: ubuntu-latest
    outputs:
      search-space-config: ${{ steps.get-gptoss-configs.outputs.search-space-config }}
    steps:
      - name: Checkout code
        uses: actions/checkout@v4

      - id: get-gptoss-configs
        run: |
          CONFIG_JSON=$(python3 "${GITHUB_WORKSPACE}/utils/matrix-logic/generate_sweep_configs.py" full-sweep \
            --config-files \
              "${GITHUB_WORKSPACE}/.github/configs/nvidia-master.yaml" \
              "${GITHUB_WORKSPACE}/.github/configs/amd-master.yaml" \
            --seq-lens 1k8k \
            --model-prefix gptoss)
          echo "search-space-config=$CONFIG_JSON" >> "$GITHUB_OUTPUT"

  # ---------------------------------------------------------------------
  # Benchmark fan-out. Each job calls the benchmark template once per
  # entry of the JSON matrix produced by its config job. `fail-fast` is
  # off so one failing configuration does not cancel the others.
  #
  # Sequence lengths: this is the 1k8k sweep, so osl is 8192. The values
  # were previously osl=1024 / max-model-len=2048, i.e. the 1k1k settings,
  # which would benchmark the wrong scenario under a 1k8k experiment name.
  # max-model-len is set to isl + osl (1024 + 8192 = 9216).
  # NOTE(review): raise max-model-len if the template needs headroom
  # beyond isl + osl.
  #
  # `ep` falls back to 1 and `dp-attn` to false when a matrix entry does
  # not provide them (or provides a falsy value).
  # ---------------------------------------------------------------------
  benchmark-70b:
    name: "70b 1k8k"
    needs: get-70b-configs
    uses: ./.github/workflows/benchmark-tmpl.yml
    strategy:
      fail-fast: false
      matrix:
        config: ${{ fromJson(needs.get-70b-configs.outputs.search-space-config) }}
    secrets: inherit
    with:
      exp-name: "70b_1k8k"
      isl: 1024
      osl: 8192
      max-model-len: 9216
      runner: ${{ matrix.config.runner }}
      image: ${{ matrix.config.image }}
      model: ${{ matrix.config.model }}
      framework: ${{ matrix.config.framework }}
      precision: ${{ matrix.config.precision }}
      tp: ${{ matrix.config.tp }}
      ep: ${{ matrix.config.ep || 1 }}
      dp-attn: ${{ matrix.config.dp-attn || false }}
      conc: ${{ matrix.config.conc }}

  benchmark-dsr1:
    name: "dsr1 1k8k"
    needs: get-dsr1-configs
    uses: ./.github/workflows/benchmark-tmpl.yml
    strategy:
      fail-fast: false
      matrix:
        config: ${{ fromJson(needs.get-dsr1-configs.outputs.search-space-config) }}
    secrets: inherit
    with:
      exp-name: "dsr1_1k8k"
      isl: 1024
      osl: 8192
      max-model-len: 9216
      runner: ${{ matrix.config.runner }}
      image: ${{ matrix.config.image }}
      model: ${{ matrix.config.model }}
      framework: ${{ matrix.config.framework }}
      precision: ${{ matrix.config.precision }}
      tp: ${{ matrix.config.tp }}
      ep: ${{ matrix.config.ep || 1 }}
      dp-attn: ${{ matrix.config.dp-attn || false }}
      conc: ${{ matrix.config.conc }}

  benchmark-gptoss:
    name: "gptoss 1k8k"
    needs: get-gptoss-configs
    uses: ./.github/workflows/benchmark-tmpl.yml
    strategy:
      fail-fast: false
      matrix:
        config: ${{ fromJson(needs.get-gptoss-configs.outputs.search-space-config) }}
    secrets: inherit
    with:
      exp-name: "gptoss_1k8k"
      isl: 1024
      osl: 8192
      max-model-len: 9216
      runner: ${{ matrix.config.runner }}
      image: ${{ matrix.config.image }}
      model: ${{ matrix.config.model }}
      framework: ${{ matrix.config.framework }}
      precision: ${{ matrix.config.precision }}
      tp: ${{ matrix.config.tp }}
      ep: ${{ matrix.config.ep || 1 }}
      dp-attn: ${{ matrix.config.dp-attn || false }}
      conc: ${{ matrix.config.conc }}

  # ---------------------------------------------------------------------
  # Result collection. `always()` makes each collector run after its
  # benchmark job finishes regardless of that job's outcome. `exp-name`
  # matches the value passed to the corresponding benchmark job.
  # ---------------------------------------------------------------------
  collect-70b-results:
    needs: benchmark-70b
    if: ${{ always() }}
    uses: ./.github/workflows/collect-results.yml
    secrets: inherit
    with:
      exp-name: "70b_1k8k"

  collect-dsr1-results:
    needs: benchmark-dsr1
    if: ${{ always() }}
    uses: ./.github/workflows/collect-results.yml
    secrets: inherit
    with:
      exp-name: "dsr1_1k8k"

  collect-gptoss-results:
    needs: benchmark-gptoss
    if: ${{ always() }}
    uses: ./.github/workflows/collect-results.yml
    secrets: inherit
    with:
      exp-name: "gptoss_1k8k"