Skip to content

chore: update fork to f8f315b (20 model architectures with LayerParti… #10

chore: update fork to f8f315b (20 model architectures with LayerParti…

chore: update fork to f8f315b (20 model architectures with LayerParti… #10

Workflow file for this run

# End-to-end test workflow: builds the Swift package in release mode on macOS,
# installs the MLX Metal library next to the built binary, and runs
# tests/test-server.sh against the resulting mlx-server executable.
name: E2E Tests

on:
  push:
    branches:
      - main
      # In GitHub's filter patterns `*` does not match `/`, so this covers
      # feature/foo but not feature/foo/bar.
      - "feature/*"
  pull_request:
    branches:
      - main

# Least privilege: the steps below only read the repository contents.
permissions:
  contents: read

# One active run per ref; a newer run on the same ref cancels the older one.
concurrency:
  group: e2e-${{ github.ref }}
  cancel-in-progress: true

jobs:
  e2e:
    runs-on: macos-15
    timeout-minutes: 30
    steps:
      - uses: actions/checkout@v4

      # Reuse the SwiftPM build directory between runs. The key is tied to
      # Package.resolved; restore-keys falls back to the most recent cache for
      # this OS when the exact key is missing.
      - name: Cache Swift packages
        uses: actions/cache@v4
        with:
          path: .build
          key: ${{ runner.os }}-spm-${{ hashFiles('Package.resolved') }}
          restore-keys: |
            ${{ runner.os }}-spm-

      - name: Build (Release)
        run: swift build -c release

      # The metallib is taken from the `mlx` Python wheel (installed into a
      # throwaway venv) and copied into the release output directory.
      # NOTE(review): presumably mlx-server loads it from beside the
      # executable at runtime — confirm.
      - name: Install MLX Metal library
        run: |
          python3 -m venv /tmp/mlx_venv
          /tmp/mlx_venv/bin/pip install --quiet mlx
          cp /tmp/mlx_venv/lib/python*/site-packages/mlx/lib/mlx.metallib .build/release/

      # Fixed cache key: the HuggingFace cache directory is reused across runs
      # until this key string is changed by hand.
      - name: Cache MLX model
        uses: actions/cache@v4
        with:
          path: ~/.cache/huggingface
          key: mlx-model-qwen2.5-0.5b-4bit

      - name: Run E2E tests
        env:
          # Quoted so the value stays a string rather than a YAML integer.
          HF_HUB_DOWNLOAD_TIMEOUT: "120"
        run: |
          chmod +x tests/test-server.sh
          # Up to 3 attempts (1 run + 2 retries) to ride out transient
          # HuggingFace download failures. The first success ends the step.
          # NOTE(review): 15413 is presumably the server port — confirm
          # against tests/test-server.sh.
          for attempt in 1 2 3; do
            echo "Attempt $attempt of 3..."
            if tests/test-server.sh .build/release/mlx-server 15413; then
              exit 0
            fi
            if [ "$attempt" -lt 3 ]; then
              echo "Test failed, retrying in 10s..."
              sleep 10
            fi
          done
          echo "All attempts failed"
          exit 1

      # Runs only when an earlier step in this job has failed.
      - name: Upload test logs on failure
        if: failure()
        uses: actions/upload-artifact@v4
        with:
          name: e2e-test-logs
          path: /tmp/mlx-server-test-*.log
          retention-days: 7