@@ -276,33 +276,20 @@ def get_tokenizer(ckpt_path, trust_remote_code=False, **kwargs) -> PreTrainedTok
276276 if "vila" in ckpt_path .lower ():
277277 ckpt_path += "/llm"
278278
279- # Suppress verbose tokenizer output (e.g., printing all special tokens)
280- import contextlib
281- import io
282- import logging
283- import os
284-
285- # Save current settings
286- old_verbosity = os .environ .get ("TOKENIZERS_PARALLELISM" , None )
287- transformers_log_level = logging .getLogger ("transformers" ).level
288-
289- # Suppress output
290- os .environ ["TOKENIZERS_PARALLELISM" ] = "false"
291- logging .getLogger ("transformers" ).setLevel (logging .ERROR )
292-
293- # Also capture stdout to suppress verbose tokenizer printing
294- with contextlib .redirect_stdout (io .StringIO ()):
295- try :
279+ # Some custom tokenizers (e.g., Nemotron-Parse) print verbose output when loading.
280+ # Only suppress stdout for trust_remote_code models where custom tokenizer code may be noisy.
281+ if trust_remote_code :
282+ import contextlib
283+ import io
284+
285+ with contextlib .redirect_stdout (io .StringIO ()):
296286 tokenizer = AutoTokenizer .from_pretrained (
297287 ckpt_path , trust_remote_code = trust_remote_code , ** kwargs
298288 )
299- finally :
300- # Restore original settings
301- if old_verbosity is not None :
302- os .environ ["TOKENIZERS_PARALLELISM" ] = old_verbosity
303- else :
304- os .environ .pop ("TOKENIZERS_PARALLELISM" , None )
305- logging .getLogger ("transformers" ).setLevel (transformers_log_level )
289+ else :
290+ tokenizer = AutoTokenizer .from_pretrained (
291+ ckpt_path , trust_remote_code = trust_remote_code , ** kwargs
292+ )
306293
307294 # can't set attribute 'pad_token' for "<unk>"
308295 # We skip this step for Nemo models
@@ -355,25 +342,17 @@ def get_processor(
355342
356343 return MllamaImageProcessor (processor , device )
357344 else :
358- # Try to load AutoProcessor for other VL models (e.g., Nemotron-Parse)
359- # This will only work if the model has a processor config
360- try :
361- import contextlib
362- import io
363- import logging
364-
365- # Suppress verbose output from processor/tokenizer loading
366- transformers_log_level = logging .getLogger ("transformers" ).level
367- logging .getLogger ("transformers" ).setLevel (logging .ERROR )
368-
369- with contextlib .redirect_stdout (io .StringIO ()):
370- processor = AutoProcessor .from_pretrained (
371- ckpt_path ,
372- ** model_kwargs ,
373- )
345+ # Try to load AutoProcessor for other VL models (e.g., Nemotron-Parse).
346+ # Suppress stdout for trust_remote_code models where custom processor code may be noisy.
347+ import contextlib
348+ import io
374349
375- # Restore logging
376- logging .getLogger ("transformers" ).setLevel (transformers_log_level )
350+ try :
351+ if model_kwargs .get ("trust_remote_code" , False ):
352+ with contextlib .redirect_stdout (io .StringIO ()):
353+ processor = AutoProcessor .from_pretrained (ckpt_path , ** model_kwargs )
354+ else :
355+ processor = AutoProcessor .from_pretrained (ckpt_path , ** model_kwargs )
377356
378357 print (f"Loaded AutoProcessor for model type: { model_type } " )
379358 return processor
0 commit comments