@@ -1009,7 +1009,6 @@ class _BaseModelWithGenerate(PreTrainedModel, GenerationMixin):
10091009 ("perception_lm" , "PerceptionLMForConditionalGeneration" ),
10101010 ("pi0" , "PI0ForConditionalGeneration" ),
10111011 ("pix2struct" , "Pix2StructForConditionalGeneration" ),
1012- ("pixtral" , "LlavaForConditionalGeneration" ),
10131012 ("pp_chart2table" , "GotOcr2ForConditionalGeneration" ),
10141013 ("qwen2_5_vl" , "Qwen2_5_VLForConditionalGeneration" ),
10151014 ("qwen2_vl" , "Qwen2VLForConditionalGeneration" ),
@@ -1671,7 +1670,6 @@ class _BaseModelWithGenerate(PreTrainedModel, GenerationMixin):
16711670 # Model for Text-To-Waveform mapping
16721671 ("bark" , "BarkModel" ),
16731672 ("csm" , "CsmForConditionalGeneration" ),
1674- ("fastspeech2_conformer" , "FastSpeech2ConformerWithHifiGan" ),
16751673 ("fastspeech2_conformer_with_hifigan" , "FastSpeech2ConformerWithHifiGan" ),
16761674 ("higgs_audio_v2" , "HiggsAudioV2ForConditionalGeneration" ),
16771675 ("musicgen" , "MusicgenForConditionalGeneration" ),
0 commit comments