diff --git a/src/transformers/models/auto/modeling_auto.py b/src/transformers/models/auto/modeling_auto.py index b4d928647561..21bc382e426b 100644 --- a/src/transformers/models/auto/modeling_auto.py +++ b/src/transformers/models/auto/modeling_auto.py @@ -1213,6 +1213,7 @@ class _BaseModelWithGenerate(PreTrainedModel, GenerationMixin): [ ("cohere_asr", "CohereAsrForConditionalGeneration"), ("dia", "DiaForConditionalGeneration"), + ("glmasr", "GlmAsrForConditionalGeneration"), ("granite_speech", "GraniteSpeechForConditionalGeneration"), ("kyutai_speech_to_text", "KyutaiSpeechToTextForConditionalGeneration"), ("moonshine", "MoonshineForConditionalGeneration"), @@ -1684,6 +1685,7 @@ class _BaseModelWithGenerate(PreTrainedModel, GenerationMixin): # Model for Text-To-Waveform mapping ("bark", "BarkModel"), ("csm", "CsmForConditionalGeneration"), + ("dia", "DiaForConditionalGeneration"), ("fastspeech2_conformer_with_hifigan", "FastSpeech2ConformerWithHifiGan"), ("higgs_audio_v2", "HiggsAudioV2ForConditionalGeneration"), ("musicgen", "MusicgenForConditionalGeneration"),