Skip to content

Commit 79d8531

Browse files
Merge branch 'main' into CSY/fix-to
2 parents ef0014a + de4c517 commit 79d8531

111 files changed

Lines changed: 6669 additions & 738 deletions

File tree

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.
Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,6 @@
11
#!/usr/bin/env bash
22
set -euo pipefail
33

4-
python -m pip install -U build twine setuptools
4+
python -m pip install uv
5+
uv pip install -U build twine setuptools
56
python -m build --sdist

.github/scripts/ci_release_test_install.sh

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -4,6 +4,7 @@ set -euo pipefail
44
pkg_name="${1:?package filename is required}"
55
venv_dir="${2:-local_uv_env}"
66

7-
uv venv "$venv_dir"
7+
python -m venv "$venv_dir"
88
source "$venv_dir/bin/activate"
9-
uv pip install "dist/$pkg_name" torch
9+
pip install uv
10+
uv pip install "dist/$pkg_name"

.github/scripts/ci_write_runner_outputs.sh

Lines changed: 2 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -3,23 +3,19 @@ set -euo pipefail
33

44
runner_ip="${1:?runner ip is required}"
55
github_run_id="${2:?github run id is required}"
6-
artifact_id="${3:-}"
7-
max_parallel="${4:-}"
6+
max_parallel="${3:-}"
87

98
if [[ -z "${GITHUB_OUTPUT:-}" ]]; then
109
echo "GITHUB_OUTPUT is required" >&2
1110
exit 1
1211
fi
1312

1413
run_id="$github_run_id"
15-
if [[ -n "$artifact_id" ]]; then
16-
run_id="$artifact_id"
17-
fi
1814

1915
echo "ip=$runner_ip" >> "$GITHUB_OUTPUT"
2016
echo "ip: $runner_ip"
2117
echo "run_id=$run_id" >> "$GITHUB_OUTPUT"
22-
echo "artifact_id=$run_id"
18+
echo "run_id=$run_id"
2319

2420
if [[ -n "$max_parallel" ]]; then
2521
max_parallel_json="{\"size\": ${max_parallel:-20}}"

.github/scripts/deps.yaml

Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -107,6 +107,9 @@ tests:
107107
- gguf
108108

109109
tests/models:
110+
test_chatglm:
111+
- sentencepiece
112+
110113
test_cohere2:
111114
- jieba
112115

@@ -123,6 +126,7 @@ tests/models:
123126
- http://10.0.13.31/files/causal_conv1d-1.6.0-cp313-cp313-linux_x86_64.whl
124127
- mamba_ssm
125128
- tiktoken
129+
- attn_gym
126130

127131
test_internlm.py:
128132
- transformers<=4.44.2
@@ -137,10 +141,26 @@ tests/models:
137141
- backoff>=2.2.1
138142
- optimum>=1.24.0
139143
- scipy
144+
- backoff
140145

141146
test_llama3_2_exllamav3.py:
142147
- pydantic
143148

149+
test_internvl_chat.py:
150+
- timm
151+
- sentencepiece
152+
- tiktoken
153+
154+
test_ling_2_6_flash_support:
155+
- flash-linear-attention
156+
157+
test_nemotron_omni_support.py:
158+
- einops
159+
- timm
160+
- open-clip-torch
161+
- librosa
162+
- mamba_ssm
163+
144164
tests/models/awq:
145165
test_qwen3_8b_base_awq.py:
146166
- peft

.github/scripts/test.yaml

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,9 @@ tests:
1616
tests/models:
1717
py: 3.13
1818

19+
test_llama3_2_fp8:
20+
sm: '12.0'
21+
1922
tests/kernels:
2023
test_asymmetric_real_models:
2124
sm: '9.0'

.github/workflows/release.yml

Lines changed: 33 additions & 35 deletions
Original file line numberDiff line numberDiff line change
@@ -54,59 +54,57 @@ concurrency:
5454
cancel-in-progress: true
5555

5656
jobs:
57-
check-vm:
58-
runs-on: [ self-hosted, linux ]
59-
container:
60-
image: modelcloud/gptqmodel:alpine-ci-v1
61-
outputs:
62-
ip: ${{ steps.get_ip.outputs.ip }}
63-
run_id: ${{ steps.get_ip.outputs.run_id }}
64-
if: ${{ inputs.github_vm == false }}
65-
steps:
66-
- name: Checkout Codes
67-
uses: actions/checkout@v6
68-
with:
69-
repository: ${{ env.repo }}
70-
ref: ${{ env.ref }}
71-
72-
- name: Print env
73-
run: |
74-
echo "event name: ${{ github.event_name }}"
75-
echo "repo: ${{ env.repo }}"
76-
echo "ref: ${{ env.ref }}"
77-
echo "upload_release: ${{ inputs.upload_release }}"
78-
echo "upload_pypi: ${{ inputs.upload_pypi }}"
79-
80-
- name: Select server
81-
id: get_ip
82-
run: |
83-
bash .github/scripts/ci_write_runner_outputs.sh "$RUNNER" "${{ github.run_id }}"
84-
8557
release-source:
8658
permissions:
8759
contents: write
8860
runs-on: [ self-hosted, xeon5 ]
89-
needs:
90-
- check-vm
9161
if: ${{ inputs.github_vm == false }}
62+
env:
63+
UV_TORCH_BACKEND: cu130
64+
TORCH_VERSION: 2.11.0
65+
PYTHON_VERSION: 3.14
66+
UV_PYTHON: 3.14
9267
container:
93-
image: ${{ needs.check-vm.outputs.ip }}:5000/nvidia/cuda:130-ubuntu24.04_0415
68+
image: 10.0.13.31:5000/nvidia/cuda:130-ubuntu24.04_0415
9469
volumes:
9570
- /monster/ci/env/entrypoint.sh:/etc/profile.d/01-entrypoint.sh
96-
- /monster/ci/uv:/opt/uv
71+
- /github/workspace/uv:/opt/uv
72+
- /github/workspace/tmp:/opt/uv/tmp
73+
- /monster/ci/uv/python:/opt/uv/python
74+
- /monster/ci/uv/cache/python:/opt/uv/cache/python
75+
- /monster/ci/uv/setup_uv_venv.sh:/opt/uv/setup_uv_venv.sh
76+
- /monster/ci/uv/uv:/opt/uv/uv
77+
- /monster/ci/uv/uvx:/opt/uv/uvx
78+
- /monster/ci/uv/env:/opt/uv/env
79+
- /monster/ci/uv/uv.toml:/opt/uv/uv.toml
80+
- /monster/ci/env:/opt/env
9781
steps:
9882
- name: Checkout Codes
9983
uses: actions/checkout@v6
10084
with:
10185
repository: ${{ env.repo }}
10286
ref: ${{ env.ref }}
10387

88+
- name: Activate uv env
89+
run: |
90+
echo "::group::-- dust uv cache dir --"
91+
dust $(uv cache dir)
92+
echo "::endgroup::"
93+
94+
bash .github/scripts/ci_unit_activate_uv_env.sh \
95+
"gptqmodel_py314t_release_source" \
96+
130 \
97+
"${{ env.TORCH_VERSION }}" \
98+
"${{ github.run_id }}" \
99+
"${{ github.run_attempt }}"
100+
104101
- name: Setup release env
105102
run: |
106-
export UV_PYTHON=3.14
107-
echo "UV_PYTHON=3.14" >> "$GITHUB_ENV"
103+
echo "::group::-- uv envs --"
104+
printenv | grep UV
105+
echo "::endgroup::"
108106
109-
env_name="gptqmodel_py314_release_source"
107+
env_name="gptqmodel_py314t_release_source"
110108
/opt/uv/setup_uv_venv.sh $env_name
111109
112110
- name: Run shared release source flow

.github/workflows/unit_tests.yml

Lines changed: 0 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -30,10 +30,6 @@ on:
3030
description: 'Regex to filter test files'
3131
required: false
3232
default: ''
33-
artifact_id:
34-
description: 'Run id for artifact to be downloaded'
35-
required: false
36-
default: ''
3733
max-parallel:
3834
description: 'Parallel jobs'
3935
required: false
@@ -113,7 +109,6 @@ jobs:
113109
run: |
114110
echo "repo: ${{ env.repo }}"
115111
echo "ref: ${{ env.ref }}"
116-
echo "artifact_id: ${{ github.event.inputs.artifact_id }}"
117112
echo "selected server: ${{ github.event.inputs.server }}"
118113
119114
- name: Set server
@@ -122,7 +117,6 @@ jobs:
122117
bash .github/scripts/ci_write_runner_outputs.sh \
123118
"$RUNNER" \
124119
"${{ github.run_id }}" \
125-
"${{ github.event.inputs.artifact_id }}" \
126120
"${{ github.event.inputs['max-parallel'] }}"
127121
128122
list-test-files:

.github/workflows/unit_tests_reusable.yml

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -71,6 +71,7 @@ env:
7171
repo: ${{ inputs.repo || github.repository }}
7272
ref: ${{ inputs.ref || github.ref }}
7373
HF_TOKEN: ${{ secrets.HF_TOKEN }}
74+
DEBUG_ON: 1
7475

7576
jobs:
7677
test:
@@ -244,7 +245,7 @@ jobs:
244245
rm -rf ./* .[^.] .??* || true
245246
echo "cleaning venv: ${{ env.VIRTUAL_ENV }}"
246247
rm -rf "${{ env.VIRTUAL_ENV }}"
247-
248+
248249
echo "::group::-- dust uv cache dir --"
249250
dust $(uv cache dir)
250251
echo "::endgroup::"

.gitignore

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -194,4 +194,6 @@ example.py
194194
/gptqmodel_ext/machete/generated/
195195
AGENT.md
196196
AGENTs.md
197-
.codex
197+
.codex
198+
temp
199+
tmp

0 commit comments

Comments
 (0)