Skip to content

Commit 96865e4

Browse files
authored
[ci] bump transformers to 4.57.1 (#1586)
Signed-off-by: AlpinDale <alpindale@gmail.com>
1 parent e0f91e5 commit 96865e4

9 files changed

Lines changed: 16 additions & 20 deletions

File tree

aphrodite/modeling/models/moonvit.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -47,7 +47,7 @@
4747
import torch
4848
import torch.nn as nn
4949
import torch.nn.functional as F
50-
from transformers.activations import ACT2FN, PytorchGELUTanh
50+
from transformers.activations import ACT2FN
5151
from transformers.modeling_utils import PreTrainedModel
5252
from transformers.utils import is_flash_attn_2_available
5353

@@ -596,7 +596,7 @@ def __init__(
596596
"num_heads": config.num_attention_heads,
597597
"hidden_dim": config.hidden_size,
598598
"mlp_dim": config.intermediate_size,
599-
"activation": PytorchGELUTanh(),
599+
"activation": ACT2FN["gelu_pytorch_tanh"],
600600
"attn_bias": True,
601601
"attn_implementation": config._attn_implementation,
602602
},

aphrodite/modeling/models/qwen2_vl.py

Lines changed: 2 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -31,7 +31,7 @@
3131
import torch.nn as nn
3232
import torch.nn.functional as F
3333
from einops import rearrange, repeat
34-
from transformers import AutoConfig, BatchFeature, PretrainedConfig
34+
from transformers import BatchFeature, PretrainedConfig
3535
from transformers.models.qwen2_vl import Qwen2VLImageProcessor, Qwen2VLProcessor
3636
from transformers.models.qwen2_vl.configuration_qwen2_vl import Qwen2VLConfig, Qwen2VLVisionConfig
3737
from transformers.models.qwen2_vl.image_processing_qwen2_vl import smart_resize
@@ -1500,9 +1500,7 @@ def __init__(
15001500
class Tarsier2ProcessingInfo(Qwen2VLProcessingInfo):
15011501
def get_hf_config(self) -> Qwen2VLConfig:
15021502
model_path = self.ctx.model_config.model
1503-
original_config = AutoConfig.from_pretrained(model_path)
1504-
config_dict = original_config.to_dict()
1505-
correct_config = Qwen2VLConfig.from_dict(config_dict)
1503+
correct_config = Qwen2VLConfig.from_pretrained(model_path)
15061504

15071505
return correct_config
15081506

aphrodite/modeling/models/transformers/base.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -293,7 +293,7 @@ def create_attention_instances(self) -> dict[int, Attention]:
293293
# Aphrodite does not support encoder-decoder models, so if any encoder layer is
294294
# found in a text only model, we assume the whole model is an encoder model
295295
if has_encoder(self.model) and not is_multimodal(self.config):
296-
self.check_version("4.57.0.dev0", "encoder models support")
296+
self.check_version("5.0.0", "encoder models support")
297297
attn_type = AttentionType.ENCODER_ONLY
298298
else:
299299
attn_type = AttentionType.DECODER

aphrodite/modeling/models/transformers/moe.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -112,7 +112,7 @@ def transformers_moe_forward_fake(
112112

113113
class MoEMixin(MixtureOfExperts):
114114
def __init__(self, *, aphrodite_config: "AphroditeConfig", prefix: str = ""):
115-
self.check_version("4.57.0.dev0", "MoE models support")
115+
self.check_version("5.0.0", "MoE models support")
116116
# Skip MixtureOfExperts.__init__ and call the next class in MRO
117117
super(MixtureOfExperts, self).__init__(aphrodite_config=aphrodite_config, prefix=prefix)
118118

requirements/common.txt

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -7,7 +7,7 @@ requests >= 2.26.0
77
tqdm
88
blake3
99
py-cpuinfo
10-
transformers >= 4.56.0
10+
transformers >= 4.56.0, < 5
1111
tokenizers >= 0.21.1 # Required for fast incremental detokenization.
1212
protobuf # Required by LlamaTokenizer.
1313
fastapi[standard] >= 0.115.0 # Required by FastAPI's form models in the OpenAI API server's audio transcriptions endpoint.

requirements/test.in

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,7 @@ datamodel_code_generator # required for minicpm3 test
3737
# TODO: Use lm-eval[api]==0.4.10 once released
3838
lm-eval[api] @ git+https://github.com/EleutherAI/lm-evaluation-harness.git@206b7722158f58c35b7ffcd53b035fdbdda5126d # required for model evaluation test
3939
mteb[bm25s]>=1.38.11, <2 # required for mteb test
40-
transformers==4.56.2
40+
transformers==4.57.1
4141
tokenizers==0.22.0
4242
schemathesis>=3.39.15 # Required for openai schema test.
4343
# quantization

requirements/test.txt

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1196,7 +1196,7 @@ tqdm==4.66.6
11961196
# transformers
11971197
tqdm-multiprocess==0.0.11
11981198
# via lm-eval
1199-
transformers==4.56.2
1199+
transformers==4.57.1
12001200
# via
12011201
# -r requirements/test.in
12021202
# genai-perf

tests/models/registry.py

Lines changed: 6 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -745,21 +745,19 @@ def check_available_online(
745745
}
746746

747747
_TRANSFORMERS_BACKEND_MODELS = {
748-
"TransformersEmbeddingModel": _HfExamplesInfo("BAAI/bge-base-en-v1.5", min_transformers_version="4.57.0.dev0"),
748+
"TransformersEmbeddingModel": _HfExamplesInfo("BAAI/bge-base-en-v1.5", min_transformers_version="5.0.0"),
749749
"TransformersForSequenceClassification": _HfExamplesInfo(
750750
"papluca/xlm-roberta-base-language-detection",
751-
min_transformers_version="4.57.0.dev0",
751+
min_transformers_version="5.0.0",
752752
),
753753
"TransformersForCausalLM": _HfExamplesInfo("hmellor/Ilama-3.2-1B", trust_remote_code=True),
754754
"TransformersMultiModalForCausalLM": _HfExamplesInfo("BAAI/Emu3-Chat-hf"),
755-
"TransformersMoEForCausalLM": _HfExamplesInfo("allenai/OLMoE-1B-7B-0924", min_transformers_version="4.57.0.dev0"),
755+
"TransformersMoEForCausalLM": _HfExamplesInfo("allenai/OLMoE-1B-7B-0924", min_transformers_version="5.0.0"),
756756
"TransformersMultiModalMoEForCausalLM": _HfExamplesInfo(
757-
"Qwen/Qwen3-VL-30B-A3B-Instruct", min_transformers_version="4.57.0.dev0"
758-
),
759-
"TransformersMoEEmbeddingModel": _HfExamplesInfo("Qwen/Qwen3-30B-A3B", min_transformers_version="4.57.0.dev0"),
760-
"TransformersMoEForSequenceClassification": _HfExamplesInfo(
761-
"Qwen/Qwen3-30B-A3B", min_transformers_version="4.57.0.dev0"
757+
"Qwen/Qwen3-VL-30B-A3B-Instruct", min_transformers_version="5.0.0"
762758
),
759+
"TransformersMoEEmbeddingModel": _HfExamplesInfo("Qwen/Qwen3-30B-A3B", min_transformers_version="5.0.0"),
760+
"TransformersMoEForSequenceClassification": _HfExamplesInfo("Qwen/Qwen3-30B-A3B", min_transformers_version="5.0.0"),
763761
"TransformersMultiModalEmbeddingModel": _HfExamplesInfo("google/gemma-3-4b-it"),
764762
"TransformersMultiModalForSequenceClassification": _HfExamplesInfo("google/gemma-3-4b-it"),
765763
}

tests/models/test_transformers.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -80,7 +80,7 @@ def test_models(
8080
from packaging.version import Version
8181

8282
installed = Version(transformers.__version__)
83-
required = Version("4.57.0.dev0")
83+
required = Version("5.0.0")
8484
if model == "allenai/OLMoE-1B-7B-0924" and installed < required:
8585
pytest.skip(f"MoE models with the Transformers backend require transformers>={required}, but got {installed}")
8686

0 commit comments

Comments
 (0)