-
Notifications
You must be signed in to change notification settings - Fork 134
134 lines (122 loc) · 4.26 KB
/
ci.yml
File metadata and controls
134 lines (122 loc) · 4.26 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
name: CI
on:
push:
branches:
- main
- "pull-request/[0-9]+"
workflow_dispatch:
jobs:
test:
name: Test ${{ matrix.name }}
runs-on: ${{ matrix.runner }}
timeout-minutes: ${{ matrix.timeout }}
strategy:
fail-fast: false
matrix:
include:
- name: "GPU Linux x86_64"
runner: linux-amd64-gpu-rtxpro6000-latest-1
os: linux
gpu: true
timeout: 30
- name: "CPU Linux x86_64"
runner: ubuntu-latest
os: linux
gpu: false
timeout: 15
- name: "CPU Linux ARM64"
runner: ubuntu-24.04-arm64
os: linux
gpu: false
timeout: 15
- name: "GPU Windows x86_64"
runner: windows-amd64-gpu-rtxpro6000-latest-1
os: windows
gpu: true
timeout: 30
- name: "CPU Windows x86_64"
runner: windows-latest
os: windows
gpu: false
timeout: 15
steps:
- name: Checkout
uses: actions/checkout@v4
timeout-minutes: 5
- name: Test Docker
timeout-minutes: 5
run: |
docker --version
docker run --rm hello-world
- name: Check Hardware (Linux)
if: matrix.os == 'linux'
timeout-minutes: 5
run: |
echo "=== Host Hardware Information ==="
echo "Runner: ${{ matrix.runner }}"
echo "Architecture: $(uname -m)"
if [ "${{ matrix.gpu }}" = "true" ]; then
lspci | grep -i nvidia || echo "No NVIDIA GPU found via lspci"
nvidia-smi || echo "nvidia-smi not available on host"
else
echo "CPU-only runner (no GPU access)"
lscpu | head -10 || echo "CPU info not available"
fi
- name: Check Hardware (Windows)
if: matrix.os == 'windows'
timeout-minutes: 5
shell: cmd
run: |
echo === Host Hardware Information ===
echo Runner: ${{ matrix.runner }}
if "${{ matrix.gpu }}"=="true" (
nvidia-smi || echo nvidia-smi not available
echo Checking GPU via wmic:
wmic path win32_VideoController get name
) else (
echo CPU-only runner (no GPU access)
systeminfo | findstr /C:"Processor"
)
- name: Test CUDA Image with GPU (Linux)
if: matrix.gpu == true && matrix.os == 'linux'
timeout-minutes: 10
run: |
docker pull nvidia/cuda:13.0.2-base-ubuntu24.04
echo "=== Testing with GPU access ==="
docker run --rm --gpus all nvidia/cuda:13.0.2-base-ubuntu24.04 bash -c "
echo 'Container with GPU access:'
nvidia-smi || echo 'nvidia-smi not available in container'
cat /etc/os-release
echo 'CUDA Runtime version:'
cat /usr/local/cuda/version.txt 2>/dev/null || echo 'CUDA version file not found'
" || echo "GPU access failed - may not be available on this runner"
- name: Test CUDA Image CPU Only (Linux)
if: matrix.gpu == false && matrix.os == 'linux'
timeout-minutes: 10
run: |
docker pull nvidia/cuda:13.0.2-base-ubuntu24.04
echo "=== Testing without GPU access (CPU only) ==="
docker run --rm nvidia/cuda:13.0.2-base-ubuntu24.04 bash -c "
echo 'CUDA container test successful (CPU only - no GPU access)'
cat /etc/os-release
which nvcc || echo 'nvcc not in PATH'
nvidia-smi 2>/dev/null || echo 'nvidia-smi not available without --gpus flag (expected)'
"
- name: Test Windows Container with GPU
if: matrix.gpu == true && matrix.os == 'windows'
timeout-minutes: 10
shell: cmd
run: |
echo === Testing with GPU access ===
nvidia-smi || echo nvidia-smi not available on Windows runner
echo Checking for GPU via wmic...
wmic path win32_VideoController get name
echo Windows GPU runner test completed
- name: Test Windows Container CPU Only
if: matrix.gpu == false && matrix.os == 'windows'
timeout-minutes: 10
shell: cmd
run: |
echo === Testing without GPU access (CPU only) ===
echo Windows CPU-only runner test successful
docker --version