|
119 | 119 | ("levit", "LevitModel"), |
120 | 120 | ("lilt", "LiltModel"), |
121 | 121 | ("llama", "LlamaModel"), |
| 122 | + ("longformer", "LongformerModel"), |
| 123 | + ("longt5", "LongT5Model"), |
122 | 124 | ("luke", "LukeModel"), |
123 | 125 | ("m2m_100", "M2M100Model"), |
124 | 126 | ("mamba", "MambaModel"), |
|
177 | 179 | ("swin2sr", "Swin2SRModel"), |
178 | 180 | ("t5", "T5Model"), |
179 | 181 | ("tapas", "TapasModel"), |
| 182 | + ("timesformer", "TimesformerModel"), |
180 | 183 | ("tvp", "TvpModel"), |
181 | 184 | ("umt5", "UMT5Model"), |
182 | 185 | ("unispeech", "UniSpeechModel"), |
|
187 | 190 | ("vit", "ViTModel"), |
188 | 191 | ("vit_msn", "ViTMSNModel"), |
189 | 192 | ("vitdet", "VitDetModel"), |
| 193 | + ("vivit", "VivitModel"), |
190 | 194 | ("wav2vec2", "Wav2Vec2Model"), |
191 | 195 | ("whisper", "WhisperModel"), |
192 | 196 | ("xclip", "XCLIPModel"), |
|
234 | 238 | ("llava_next", "LlavaNextForConditionalGeneration"), |
235 | 239 | ("llava_next_video", "LlavaNextVideoForConditionalGeneration"), |
236 | 240 | ("llava_onevision", "LlavaOnevisionForConditionalGeneration"), |
| 241 | + ("longformer", "LongformerForMaskedLM"), |
237 | 242 | ("luke", "LukeForMaskedLM"), |
| 243 | + ("mobilebert", "MobileBertForPreTraining"), |
| 244 | + ("qwen2_audio", "Qwen2AudioForConditionalGeneration"), |
| 245 | + ("roberta", "RobertaForMaskedLM"), |
238 | 246 | ("megatron-bert", "MegatronBertForPreTraining"), |
239 | 247 | ("mistral3", "Mistral3ForConditionalGeneration"), |
240 | 248 | ("mllama", "MllamaForConditionalGeneration"), |
|
287 | 295 | ("gpt2", "GPT2LMHeadModel"), |
288 | 296 | ("ibert", "IBertForMaskedLM"), |
289 | 297 | ("led", "LEDForConditionalGeneration"), |
| 298 | + ("longformer", "LongformerForMaskedLM"), |
| 299 | + ("longt5", "LongT5ForConditionalGeneration"), |
290 | 300 | ("luke", "LukeForMaskedLM"), |
| 301 | + ("camembert", "CamembertForMaskedLM"), |
291 | 302 | ("roberta", "RobertaForMaskedLM"), |
292 | 303 | ("mamba", "MambaForCausalLM"), |
293 | 304 | ("mamba2", "Mamba2ForCausalLM"), |
|
413 | 424 | ("segformer", "SegformerModel"), |
414 | 425 | ("siglip_vision_model", "SiglipVisionModel"), |
415 | 426 | ("swin2sr", "Swin2SRModel"), |
| 427 | + ("timesformer", "TimesformerModel"), |
416 | 428 | ("vit", "ViTModel"), |
417 | 429 | ("vit_msn", "ViTMSNModel"), |
418 | 430 | ("vitdet", "VitDetModel"), |
| 431 | + ("vivit", "VivitModel"), |
419 | 432 | ("yolos", "YolosModel"), |
420 | 433 | ("zamba2", "Zamba2ForCausalLM"), |
421 | 434 | ] |
|
503 | 516 | ] |
504 | 517 | ) |
505 | 518 |
|
506 | | -MODEL_FOR_VIDEO_CLASSIFICATION_MAPPING_NAMES = OrderedDict() |
| 519 | +MODEL_FOR_VIDEO_CLASSIFICATION_MAPPING_NAMES = OrderedDict( |
| 520 | + [ |
| 521 | + ("timesformer", "TimesformerForVideoClassification"), |
| 522 | + ("vivit", "VivitForVideoClassification"), |
| 523 | + ] |
| 524 | +) |
507 | 525 |
|
508 | 526 | MODEL_FOR_VISION_2_SEQ_MAPPING_NAMES = OrderedDict( |
509 | 527 | [ |
|
584 | 602 | ("electra", "ElectraForMaskedLM"), |
585 | 603 | ("funnel", "FunnelForMaskedLM"), |
586 | 604 | ("ibert", "IBertForMaskedLM"), |
| 605 | + ("longformer", "LongformerForMaskedLM"), |
587 | 606 | ("luke", "LukeForMaskedLM"), |
588 | 607 | ("mobilebert", "MobileBertForMaskedLM"), |
589 | 608 | ("mpnet", "MPNetForMaskedLM"), |
|
640 | 659 | ("blenderbot-small", "BlenderbotSmallForConditionalGeneration"), |
641 | 660 | ("fsmt", "FSMTForConditionalGeneration"), |
642 | 661 | ("led", "LEDForConditionalGeneration"), |
| 662 | + ("longt5", "LongT5ForConditionalGeneration"), |
643 | 663 | ("m2m_100", "M2M100ForConditionalGeneration"), |
644 | 664 | ("mvp", "MvpForConditionalGeneration"), |
645 | 665 | ("nllb-moe", "NllbMoeForConditionalGeneration"), |
|
698 | 718 | ("canine", "CanineForSequenceClassification"), |
699 | 719 | ("lilt", "LiltForSequenceClassification"), |
700 | 720 | ("llama", "LlamaForSequenceClassification"), |
| 721 | + ("longformer", "LongformerForSequenceClassification"), |
701 | 722 | ("opt", "OPTForSequenceClassification"), |
702 | 723 | ("persimmon", "PersimmonForSequenceClassification"), |
703 | 724 | ("mbart", "MBartForSequenceClassification"), |
|
752 | 773 | ("luke", "LukeForQuestionAnswering"), |
753 | 774 | ("convbert", "ConvBertForQuestionAnswering"), |
754 | 775 | ("llama", "LlamaForQuestionAnswering"), |
| 776 | + ("longformer", "LongformerForQuestionAnswering"), |
755 | 777 | ("mistral", "MistralForQuestionAnswering"), |
756 | 778 | ("mobilebert", "MobileBertForQuestionAnswering"), |
757 | 779 | ("mpnet", "MPNetForQuestionAnswering"), |
|
812 | 834 | ("helium", "HeliumForTokenClassification"), |
813 | 835 | ("ibert", "IBertForTokenClassification"), |
814 | 836 | ("lilt", "LiltForTokenClassification"), |
| 837 | + ("longformer", "LongformerForTokenClassification"), |
815 | 838 | ("luke", "LukeForTokenClassification"), |
816 | 839 | ("mistral", "MistralForTokenClassification"), |
817 | 840 | ("mobilebert", "MobileBertForTokenClassification"), |
|
852 | 875 | ("distilbert", "DistilBertForMultipleChoice"), |
853 | 876 | ("funnel", "FunnelForMultipleChoice"), |
854 | 877 | ("ibert", "IBertForMultipleChoice"), |
| 878 | + ("longformer", "LongformerForMultipleChoice"), |
855 | 879 | ("luke", "LukeForMultipleChoice"), |
856 | 880 | ("megatron-bert", "MegatronBertForMultipleChoice"), |
857 | 881 | ("mobilebert", "MobileBertForMultipleChoice"), |
|
971 | 995 | ("distilbert", "DistilBertModel"), |
972 | 996 | ("emu3", "Emu3TextModel"), |
973 | 997 | ("ibert", "IBertModel"), |
| 998 | + ("longformer", "LongformerModel"), |
974 | 999 | ("mllama", "MllamaTextModel"), |
975 | 1000 | ("mobilebert", "MobileBertModel"), |
976 | 1001 | ("mt5", "MT5EncoderModel"), |
|
0 commit comments