|
17 | 17 |
|
18 | 18 | import numpy as np |
19 | 19 | import torch |
20 | | -from transformers import BertModel, BertTokenizer, CLIPImageProcessor, MT5Tokenizer, T5EncoderModel |
| 20 | +from transformers import BertModel, BertTokenizer, CLIPImageProcessor, T5EncoderModel, T5Tokenizer |
21 | 21 |
|
22 | 22 | from diffusers.pipelines.stable_diffusion import StableDiffusionPipelineOutput |
23 | 23 |
|
@@ -173,7 +173,7 @@ class HunyuanDiTPAGPipeline(DiffusionPipeline, PAGMixin): |
173 | 173 | The HunyuanDiT model designed by Tencent Hunyuan. |
174 | 174 | text_encoder_2 (`T5EncoderModel`): |
175 | 175 | The mT5 embedder. Specifically, it is 't5-v1_1-xxl'. |
176 | | - tokenizer_2 (`MT5Tokenizer`): |
| 176 | + tokenizer_2 (`T5Tokenizer`): |
177 | 177 | The tokenizer for the mT5 embedder. |
178 | 178 | scheduler ([`DDPMScheduler`]): |
179 | 179 | A scheduler to be used in combination with HunyuanDiT to denoise the encoded image latents. |
@@ -208,7 +208,7 @@ def __init__( |
208 | 208 | feature_extractor: Optional[CLIPImageProcessor] = None, |
209 | 209 | requires_safety_checker: bool = True, |
210 | 210 | text_encoder_2: Optional[T5EncoderModel] = None, |
211 | | - tokenizer_2: Optional[MT5Tokenizer] = None, |
| 211 | + tokenizer_2: Optional[T5Tokenizer] = None, |
212 | 212 | pag_applied_layers: Union[str, List[str]] = "blocks.1", # "blocks.16.attn1", "blocks.16", "16", 16 |
213 | 213 | ): |
214 | 214 | super().__init__() |
|
0 commit comments