Skip to content

Commit ba9cb38

Browse files
author
Wenlei Bao
committed
Add AMD CI test
1 parent ce7162f commit ba9cb38

1 file changed

Lines changed: 62 additions & 0 deletions

File tree

.github/workflows/ci.yml

Lines changed: 62 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,62 @@
# Integration-test workflow.
# On every push to `main`, this clones Triton-distributed inside a ROCm PyTorch
# container on the runner labeled `amd-gfx942`, installs its dependencies,
# builds the Python package, and launches the AMD integration test script.
name: Integration Tests
on:
  push:
    branches: [main]

jobs:
  # TODO: Add pre commit checks
  # pre-commit:
  #   uses: ./.github/workflows/pre-commit.yml

  # TODO: Add Nvidia integration tests
  # integration-tests-nvidia:

  integration-tests-amd:
    # Display name for the job (`container` itself has no `name` key).
    name: "AMD Integration Tests"
    runs-on: ${{ matrix.runner }}
    timeout-minutes: 60
    strategy:
      matrix:
        # Every matrix dimension must be a list, even with a single value.
        runner: ["amd-gfx942"]
        include:
          # - image: "rocm/rocm-6.4-py310-torch25-241101-3"
          # `runner` matches the dimension value above, so this entry only
          # attaches `image` to that existing combination.
          - image: "rocm/pytorch:rocm6.1_ubuntu22.04_py3.10_pytorch_2.4"
            runner: "amd-gfx942"
    env:
      PYTHON: "python3"

    # `container` is a single mapping, not a list of containers.
    # NOTE(review): ROCm containers usually need GPU device passthrough
    # (e.g. --device=/dev/kfd --device=/dev/dri); confirm whether the runner
    # already provides it before relying on `--user root` alone.
    container:
      image: ${{ matrix.image }}
      options: --user root

    steps:
      - name: Checkout
        # uses: actions/checkout@v3
        # with:
        #   submodules: 'recursive'
        # Clones into ./Triton-distributed; the `cd` below only affects this
        # step, so later steps set `working-directory` explicitly.
        run: |
          git clone https://github.com/ByteDance-Seed/Triton-distributed.git
          cd Triton-distributed/
          git submodule update --init --recursive

      - name: Install dependencies
        working-directory: Triton-distributed
        run: |
          echo "Install dependencies..."
          sudo apt-get update -y
          sudo apt-get install -y libopenmpi-dev
          pip3 install --pre torch --index-url https://download.pytorch.org/whl/nightly/rocm6.3 --no-deps
          bash ./shmem/rocshmem_bind/build.sh
          # (or whatever Rocm version you have)
          # The specifier is quoted so the shell does not treat `>` as a
          # redirect to a file named `=6.3.0`.
          python3 -m pip install -i https://test.pypi.org/simple "hip-python>=6.3.0"
          pip3 install pybind11

      - name: Build
        working-directory: Triton-distributed
        run: |
          echo "Building Triton-distributed..."
          pip3 install -e python --verbose --no-build-isolation --use-pep517

      - name: Run AMD Integration Tests
        working-directory: Triton-distributed
        run: |
          echo "Running AMD integration tests..."
          bash ./scripts/launch_amd.sh ./python/triton_dist/test/amd/test_ag_gemm_intra_node.py 8192 8192 29568

0 commit comments

Comments
 (0)