|
51 | 51 | ("deberta-v2", "DebertaV2Model"), |
52 | 52 | ("dpt", "DPTModel"), |
53 | 53 | ("gemma", "GemmaModel"), |
| 54 | + ("m2m_100", "M2M100Model"), |
54 | 55 | ("gemma2", "Gemma2Model"), |
55 | 56 | ("persimmon", "PersimmonModel"), |
56 | 57 | ("glm", "GlmModel"), |
|
135 | 136 | # Model with LM heads mapping |
136 | 137 | ("albert", "AlbertForMaskedLM"), |
137 | 138 | ("bart", "BartForConditionalGeneration"), |
| 139 | + ("m2m_100", "M2M100ForConditionalGeneration"), |
138 | 140 | ("bert", "BertForMaskedLM"), |
139 | 141 | ("deberta", "DebertaForMaskedLM"), |
140 | 142 | ("deberta-v2", "DebertaV2ForMaskedLM"), |
|
328 | 330 | # Model for Seq2Seq Causal LM mapping |
329 | 331 | ("bart", "BartForConditionalGeneration"), |
330 | 332 | ("led", "LEDForConditionalGeneration"), |
| 333 | + ("m2m_100", "M2M100ForConditionalGeneration"), |
331 | 334 | ("mt5", "MT5ForConditionalGeneration"), |
332 | 335 | ("qwen2_audio", "Qwen2AudioForConditionalGeneration"), |
333 | 336 | ("t5", "T5ForConditionalGeneration"), |
|
0 commit comments