---
# Integration test workflow.
# On every push to main: clone Triton-distributed inside a ROCm PyTorch
# container, install its dependencies, build it in editable mode, and run
# test_ag_gemm_intra_node.py through scripts/launch_amd.sh.
name: Integration Tests

on:
  push:
    branches: [main]

jobs:
  # TODO: Add pre commit checks
  # pre-commit:
  #   uses: ./.github/workflows/pre-commit.yml

  # TODO: Add Nvidia integration tests
  # integration-tests-nvidia:

  integration-tests-amd:
    name: AMD Integration Tests
    runs-on: ${{ matrix.runner }}
    timeout-minutes: 60
    strategy:
      matrix:
        # Each entry is one (runner label, container image) combination.
        # `runner` must be a single label here because it feeds `runs-on`.
        include:
          # - runner: amd-gfx942
          #   image: "rocm/rocm-6.4-py310-torch25-241101-3"
          - runner: amd-gfx942
            image: "rocm/pytorch:rocm6.1_ubuntu22.04_py3.10_pytorch_2.4"
    env:
      PYTHON: python3

    # `container` is a mapping (image/options/...); it has no `name` key, so
    # the human-readable label lives in the job-level `name` above.
    container:
      image: ${{ matrix.image }}
      options: --user root

    steps:
      - name: Checkout
        # uses: actions/checkout@v3
        # with:
        #   submodules: 'recursive'
        # NOTE(review): this clones the upstream default branch rather than
        # the commit that triggered the run - confirm that is intended.
        run: |
          # Remove any earlier clone so a workspace reused between runs does
          # not make `git clone` fail on an existing directory.
          rm -rf Triton-distributed
          git clone https://github.com/ByteDance-Seed/Triton-distributed.git
          cd Triton-distributed/
          git submodule update --init --recursive

      - name: Install dependencies
        # Every step starts in the workspace root, so run inside the clone
        # for the repo-relative paths below to resolve.
        working-directory: Triton-distributed
        run: |
          echo "Install dependencies..."
          sudo apt-get update -y
          sudo apt install -y libopenmpi-dev
          pip3 install --pre torch --index-url https://download.pytorch.org/whl/nightly/rocm6.3 --no-deps
          bash ./shmem/rocshmem_bind/build.sh
          # The requirement is quoted: unquoted, the shell treats `>` as a
          # redirection and writes pip's output to a file named "=6.3.0".
          python3 -m pip install -i https://test.pypi.org/simple 'hip-python>=6.3.0' # (or whatever Rocm version you have)
          pip3 install pybind11

      - name: Build
        working-directory: Triton-distributed
        run: |
          echo "Building Triton-distributed..."
          pip3 install -e python --verbose --no-build-isolation --use-pep517

      - name: Run AMD Integration Tests
        working-directory: Triton-distributed
        run: |
          echo "Running AMD integration tests..."
          bash ./scripts/launch_amd.sh ./python/triton_dist/test/amd/test_ag_gemm_intra_node.py 8192 8192 29568