@@ -1043,7 +1043,7 @@ def _call_hf_processor(
10431043
10441044 # vLLM may pass add_special_tokens in tok_kwargs; we set it ourselves
10451045 tok_kwargs = {k : v for k , v in tok_kwargs .items () if k != "add_special_tokens" }
1046-
1046+
10471047 if has_encoder_data :
10481048 # Tokenize the encoder text from mm_data
10491049 encoder_texts = mm_data ["texts" ]
@@ -1155,7 +1155,8 @@ def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
11551155 config .vocab_size , config .d_model , embed_scale = embed_scale
11561156 )
11571157 # Bias added to logits after lm_head, matching HuggingFace approach
1158- self .register_buffer ("final_logits_bias" , torch .zeros ((1 , config .vocab_size )))
1158+ self .register_buffer ("final_logits_bias" ,
1159+ torch .zeros ((1 , config .vocab_size )))
11591160 self .logits_processor = LogitsProcessor (
11601161 self .unpadded_vocab_size , config .vocab_size
11611162 )
@@ -1343,9 +1344,7 @@ def load_weights(self, weights: Iterable[tuple[str, torch.Tensor]]) -> set[str]:
13431344 "Shared weight embedding already loaded with name "
13441345 "%s, skipping. This is expected on facebook/bart-large"
13451346 " like models, where the same shared embedding is "
1346- "present multiple times." ,
1347- name ,
1348- )
1347+ "present multiple times." , name )
13491348 continue
13501349
13511350 loader = AutoWeightsLoader (
@@ -1383,4 +1382,4 @@ def load_weights(self, weights: Iterable[tuple[str, torch.Tensor]]) -> set[str]:
13831382 for key in self .keys_to_ignore_on_load_missing :
13841383 loaded_params .add (key )
13851384
1386- return loaded_params
1385+ return loaded_params
0 commit comments