Merge branch 'main' into qwen-image-batch-size-mismatch

chenyangzhu1 · web-flow · commit b635e65a5304 · 2026-04-08T14:26:59.000+08:00
diff --git a/.github/labeler.yml b/.github/labeler.yml
@@ -0,0 +1,97 @@
+# https://github.com/actions/labeler
+pipelines:
+    - changed-files:
+        - any-glob-to-any-file:
+            - src/diffusers/pipelines/**
+
+models:
+    - changed-files:
+        - any-glob-to-any-file:
+            - src/diffusers/models/**
+
+schedulers:
+    - changed-files:
+        - any-glob-to-any-file:
+            - src/diffusers/schedulers/**
+
+single-file:
+    - changed-files:
+        - any-glob-to-any-file:
+            - src/diffusers/loaders/single_file.py
+            - src/diffusers/loaders/single_file_model.py
+            - src/diffusers/loaders/single_file_utils.py
+
+ip-adapter:
+    - changed-files:
+        - any-glob-to-any-file:
+            - src/diffusers/loaders/ip_adapter.py
+
+lora:
+    - changed-files:
+        - any-glob-to-any-file:
+            - src/diffusers/loaders/lora_base.py
+            - src/diffusers/loaders/lora_conversion_utils.py
+            - src/diffusers/loaders/lora_pipeline.py
+            - src/diffusers/loaders/peft.py
+
+loaders:
+    - changed-files:
+        - any-glob-to-any-file:
+            - src/diffusers/loaders/textual_inversion.py
+            - src/diffusers/loaders/transformer_flux.py
+            - src/diffusers/loaders/transformer_sd3.py
+            - src/diffusers/loaders/unet.py
+            - src/diffusers/loaders/unet_loader_utils.py
+            - src/diffusers/loaders/utils.py
+            - src/diffusers/loaders/__init__.py
+
+quantization:
+    - changed-files:
+        - any-glob-to-any-file:
+            - src/diffusers/quantizers/**
+
+hooks:
+    - changed-files:
+        - any-glob-to-any-file:
+            - src/diffusers/hooks/**
+
+guiders:
+    - changed-files:
+        - any-glob-to-any-file:
+            - src/diffusers/guiders/**
+
+modular-pipelines:
+    - changed-files:
+        - any-glob-to-any-file:
+            - src/diffusers/modular_pipelines/**
+
+experimental:
+    - changed-files:
+        - any-glob-to-any-file:
+            - src/diffusers/experimental/**
+
+documentation:
+    - changed-files:
+        - any-glob-to-any-file:
+            - docs/**
+
+tests:
+    - changed-files:
+        - any-glob-to-any-file:
+            - tests/**
+
+examples:
+    - changed-files:
+        - any-glob-to-any-file:
+            - examples/**
+
+CI:
+    - changed-files:
+        - any-glob-to-any-file:
+            - .github/**
+
+utils:
+    - changed-files:
+        - any-glob-to-any-file:
+            - src/diffusers/utils/**
+            - src/diffusers/commands/**
diff --git a/.github/workflows/issue_labeler.yml b/.github/workflows/issue_labeler.yml
@@ -0,0 +1,36 @@
+name: Issue Labeler
+
+on:
+  issues:
+    types: [opened]
+
+permissions:
+  contents: read
+  issues: write
+
+jobs:
+  label:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd  # v6.0.2
+      - name: Install dependencies
+        run: pip install huggingface_hub
+      - name: Get labels from LLM
+        id: get-labels
+        env:
+          HF_TOKEN: ${{ secrets.HF_TOKEN }}
+          ISSUE_TITLE: ${{ github.event.issue.title }}
+          ISSUE_BODY: ${{ github.event.issue.body }}
+        run: |
+          LABELS=$(python utils/label_issues.py)
+          echo "labels=$LABELS" >> "$GITHUB_OUTPUT"
+      - name: Apply labels
+        if: steps.get-labels.outputs.labels != ''
+        env:
+          GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+          ISSUE_NUMBER: ${{ github.event.issue.number }}
+          LABELS: ${{ steps.get-labels.outputs.labels }}
+        run: |  # one label per line: names with spaces or glob characters must reach gh intact
+          echo "$LABELS" | python -c "import json,sys; print('\n'.join(json.load(sys.stdin)))" | while IFS= read -r label; do
+            [ -z "$label" ] || gh issue edit "$ISSUE_NUMBER" --add-label "$label" </dev/null
+          done
diff --git a/.github/workflows/pr_labeler.yml b/.github/workflows/pr_labeler.yml
@@ -0,0 +1,63 @@
+name: PR Labeler
+
+on:
+  pull_request_target:
+    types: [opened, synchronize, reopened]
+
+permissions:
+  contents: read
+  pull-requests: write
+
+jobs:
+  label:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/labeler@8558fd74291d67161a8a78ce36a881fa63b766a9  # v5
+        with:
+          sync-labels: true
+
+  missing-tests:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd  # v6.0.2
+      - name: Check for missing tests
+        id: check
+        env:
+          GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+          PR_NUMBER: ${{ github.event.pull_request.number }}
+          REPO: ${{ github.repository }}
+        run: |
+          gh api --paginate "repos/${REPO}/pulls/${PR_NUMBER}/files" \
+            | python utils/check_test_missing.py
+      - name: Add or remove missing-tests label
+        if: always()
+        env:
+          GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+          PR_NUMBER: ${{ github.event.pull_request.number }}
+        run: |
+          if [ "${{ steps.check.outcome }}" = "failure" ]; then
+            gh pr edit "$PR_NUMBER" --add-label "missing-tests"
+          else
+            gh pr edit "$PR_NUMBER" --remove-label "missing-tests" 2>/dev/null || true
+          fi
+
+  size-label:
+    runs-on: ubuntu-latest
+    steps:
+      - name: Label PR by diff size
+        env:
+          GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+          PR_NUMBER: ${{ github.event.pull_request.number }}
+          REPO: ${{ github.repository }}
+        run: |
+          DIFF_SIZE=$(gh api "repos/${REPO}/pulls/${PR_NUMBER}" --jq '.additions + .deletions')
+          for label in size/S size/M size/L; do
+            gh pr edit "$PR_NUMBER" --repo "$REPO" --remove-label "$label" 2>/dev/null || true
+          done
+          if [ "$DIFF_SIZE" -lt 50 ]; then
+            gh pr edit "$PR_NUMBER" --repo "$REPO" --add-label "size/S"
+          elif [ "$DIFF_SIZE" -lt 200 ]; then
+            gh pr edit "$PR_NUMBER" --repo "$REPO" --add-label "size/M"
+          else
+            gh pr edit "$PR_NUMBER" --repo "$REPO" --add-label "size/L"
+          fi
diff --git a/src/diffusers/models/transformers/transformer_glm_image.py b/src/diffusers/models/transformers/transformer_glm_image.py
@@ -533,10 +533,11 @@ class GlmImageTransformer2DModel(ModelMixin, ConfigMixin, PeftAdapterMixin, Cach
     """
 
     _supports_gradient_checkpointing = True
+    _repeated_blocks = ["GlmImageTransformerBlock"]
     _no_split_modules = [
         "GlmImageTransformerBlock",
         "GlmImageImageProjector",
-        "GlmImageImageProjector",
+        "GlmImageCombinedTimestepSizeEmbeddings",
     ]
     _skip_layerwise_casting_patterns = ["patch_embed", "norm", "proj_out"]
     _skip_keys = ["kv_caches"]
diff --git a/tests/models/transformers/test_models_transformer_glm_image.py b/tests/models/transformers/test_models_transformer_glm_image.py
@@ -0,0 +1,94 @@
+# coding=utf-8
+# Copyright 2025 HuggingFace Inc.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import torch
+
+from diffusers import GlmImageTransformer2DModel
+from diffusers.utils.torch_utils import randn_tensor
+
+from ...testing_utils import enable_full_determinism, torch_device
+from ..testing_utils import (
+    BaseModelTesterConfig,
+    ModelTesterMixin,
+    TrainingTesterMixin,
+)
+
+
+enable_full_determinism()
+
+
+class GlmImageTransformerTesterConfig(BaseModelTesterConfig):
+    """Tiny `GlmImageTransformer2DModel` init arguments and matching dummy inputs for the model tests."""
+
+    @property
+    def model_class(self):
+        return GlmImageTransformer2DModel
+
+    @property
+    def main_input_name(self) -> str:
+        return "hidden_states"
+
+    @property
+    def output_shape(self) -> tuple:
+        return (4, 8, 8)
+
+    @property
+    def input_shape(self) -> tuple:
+        return (4, 8, 8)
+
+    @property
+    def generator(self):
+        # Built anew on every access, so each caller gets a CPU generator seeded with 0.
+        return torch.Generator("cpu").manual_seed(0)
+
+    def get_init_dict(self) -> dict:
+        return {
+            "patch_size": 2,
+            "in_channels": 4,
+            "out_channels": 4,
+            "num_layers": 1,
+            "attention_head_dim": 8,
+            "num_attention_heads": 2,
+            "text_embed_dim": 32,
+            "time_embed_dim": 16,
+            "condition_dim": 8,
+            "prior_vq_quantizer_codebook_size": 64,
+        }
+
+    def get_dummy_inputs(self, batch_size: int = 1) -> dict[str, torch.Tensor]:
+        hidden_shape = (batch_size, 4, 8, 8)
+        encoder_shape = (batch_size, 12, 32)
+        sizes = [[8, 8]] * batch_size
+        origins = [[0, 0]] * batch_size
+
+        return {
+            "hidden_states": randn_tensor(hidden_shape, generator=self.generator, device=torch_device),
+            "encoder_hidden_states": randn_tensor(encoder_shape, generator=self.generator, device=torch_device),
+            "prior_token_id": torch.randint(0, 64, size=(batch_size,), generator=self.generator).to(torch_device),
+            "prior_token_drop": torch.zeros(batch_size, dtype=torch.bool, device=torch_device),
+            "timestep": torch.randint(0, 1000, size=(batch_size,), generator=self.generator).to(torch_device),
+            "target_size": torch.tensor(sizes, dtype=torch.float32).to(torch_device),
+            "crop_coords": torch.tensor(origins, dtype=torch.float32).to(torch_device),
+        }
+
+
+class TestGlmImageTransformer(GlmImageTransformerTesterConfig, ModelTesterMixin):
+    """Combines the GLM-Image tester config with `ModelTesterMixin`; defines no tests of its own."""
+
+
+class TestGlmImageTransformerTraining(GlmImageTransformerTesterConfig, TrainingTesterMixin):
+    def test_gradient_checkpointing_is_applied(self):
+        # Delegate to the mixin's check, passing the transformer class name as the expected set.
+        super().test_gradient_checkpointing_is_applied(expected_set={"GlmImageTransformer2DModel"})
diff --git a/utils/check_test_missing.py b/utils/check_test_missing.py
@@ -0,0 +1,86 @@
+import ast
+import json
+import sys
+
+
+SRC_DIRS = ["src/diffusers/pipelines/", "src/diffusers/models/", "src/diffusers/schedulers/"]
+MIXIN_BASES = {"ModelMixin", "SchedulerMixin", "DiffusionPipeline"}
+
+
+def extract_classes_from_file(filepath: str) -> list[str]:
+    """Return the names of classes in `filepath` that list a `MIXIN_BASES` name among their bases.
+
+    All `class` statements are inspected, nested ones included. A base counts when it is a bare
+    name (`ModelMixin`) or a dotted one whose last component matches (`pkg.ModelMixin`).
+    """
+    with open(filepath) as source_file:
+        module = ast.parse(source_file.read())
+
+    matches = []
+    for class_node in (n for n in ast.walk(module) if isinstance(n, ast.ClassDef)):
+        # Any other base expression (a call, a subscript, ...) is ignored.
+        plain = {base.id for base in class_node.bases if isinstance(base, ast.Name)}
+        dotted = {base.attr for base in class_node.bases if isinstance(base, ast.Attribute)}
+        if (plain | dotted) & MIXIN_BASES:
+            matches.append(class_node.name)
+
+    return matches
+
+
+def extract_imports_from_file(filepath: str) -> set[str]:
+    """Collect the names imported anywhere in `filepath`; `as` aliases are ignored."""
+    with open(filepath) as source_file:
+        module = ast.parse(source_file.read())
+
+    imported = set()
+    for stmt in ast.walk(module):
+        if isinstance(stmt, ast.ImportFrom):
+            imported.update(alias.name for alias in stmt.names)
+        elif isinstance(stmt, ast.Import):
+            # `import x.y.z` contributes only `z`, so dotted imports compare by their last component.
+            imported.update(alias.name.rsplit(".", 1)[-1] for alias in stmt.names)
+
+    return imported
+
+
+def main():
+    """Exit 1 when a newly added model/scheduler/pipeline class is not imported by any newly added test file.
+
+    Reads the JSON list of PR file entries (`filename`, `status`) from stdin and parses the matching files from
+    the working tree. Untested class names are printed as `missing-tests: A, B`; otherwise the exit code is 0.
+
+    NOTE(review): pr_labeler.yml runs on `pull_request_target`, whose default checkout is presumably the base
+    branch, so files added by the PR may be absent here. They are skipped, with a diagnostic on stderr.
+    """
+    pr_files = json.load(sys.stdin)
+    added_py = [f["filename"] for f in pr_files if f["status"] == "added" and f["filename"].endswith(".py")]
+
+    def parse_or_skip(extract, path):
+        # Best effort: an unreadable or unparsable file contributes nothing, but is reported on stderr.
+        try:
+            return extract(path)
+        except (FileNotFoundError, SyntaxError) as err:
+            print(f"check_test_missing: skipping {path}: {err}", file=sys.stderr)
+            return ()
+
+    new_classes = []
+    for path in added_py:
+        if path.startswith(tuple(SRC_DIRS)):
+            new_classes.extend(parse_or_skip(extract_classes_from_file, path))
+    if not new_classes:
+        sys.exit(0)
+
+    imported_names = set()
+    for path in added_py:
+        if path.startswith("tests/"):
+            imported_names.update(parse_or_skip(extract_imports_from_file, path))
+
+    untested = [cls for cls in new_classes if cls not in imported_names]
+    if untested:
+        print(f"missing-tests: {', '.join(untested)}")
+        sys.exit(1)
+    sys.exit(0)
+
+
+if __name__ == "__main__":
+    main()
diff --git a/utils/label_issues.py b/utils/label_issues.py