Skip to content

Commit 2ca57a7

Browse files
committed
up
1 parent 89b499b commit 2ca57a7

9 files changed

Lines changed: 819 additions & 988 deletions

File tree

.github/workflows/mlx.yml

Lines changed: 45 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -63,6 +63,51 @@ jobs:
6363
./cmake-out/backends/mlx/test/multi_thread_test_runner
6464
echo "::endgroup::"
6565
66+
echo "::group::Run gated_delta_rule op tests"
67+
${CONDA_RUN} python -m executorch.backends.mlx.model_ops.test_gated_delta_rule run -v
68+
echo "::endgroup::"
69+
70+
# Smoke test: export the tiny-test Qwen 3.5 MoE model for the MLX backend,
# then run a short generation against the exported .pte file.
test-mlx-qwen35-moe:
  uses: pytorch/test-infra/.github/workflows/macos_job.yml@main
  with:
    job-name: test-mlx-qwen35-moe
    runner: macos-14-xlarge
    python-version: "3.12"
    submodules: recursive
    # On pull requests test the PR head commit; otherwise the triggering SHA.
    ref: ${{ github.event_name == 'pull_request' && github.event.pull_request.head.sha || github.sha }}
    timeout: 90
    script: |
      set -eux

      echo "::group::Install ExecuTorch"
      ${CONDA_RUN} python install_executorch.py > /dev/null
      echo "::endgroup::"

      ${CONDA_RUN} pip list

      echo "::group::Export Qwen 3.5 MoE (tiny model)"
      ${CONDA_RUN} python -m executorch.examples.models.qwen3_5_moe.export \
        --tiny-test \
        --backend mlx \
        --qlinear 4w \
        --qlinear-group-size 32 \
        --output-dir /tmp/qwen35_moe_mlx_tiny
      echo "::endgroup::"

      echo "::group::Run Qwen 3.5 MoE inference"
      # `set -e` would abort at the assignment if the runner exits non-zero,
      # skipping the output dump, the failure message and the endgroup below.
      # Record the status instead so the failure path is always reported.
      RUN_STATUS=0
      OUTPUT=$(${CONDA_RUN} python -m executorch.examples.models.qwen3_5_moe.run \
        --pte /tmp/qwen35_moe_mlx_tiny/model.pte \
        --prompt-len 4 \
        --max-new-tokens 5 2>&1) || RUN_STATUS=$?
      echo "$OUTPUT"
      # Pass only if the runner exited cleanly AND printed the marker line.
      if [ "$RUN_STATUS" -eq 0 ] && echo "$OUTPUT" | grep -q "Generated token ids:"; then
        echo "Success: Qwen 3.5 MoE MLX export + inference completed"
      else
        echo "Failed: inference did not complete"
        # Close the log group before exiting so later log lines are not folded into it.
        echo "::endgroup::"
        exit 1
      fi
      echo "::endgroup::"
110+
66111
backend-tester:
67112
strategy:
68113
fail-fast: false

0 commit comments

Comments
 (0)