|
60 | 60 | "AquilaForCausalLM": ("llama", "LlamaForCausalLM"), # AquilaChat2 |
61 | 61 | "ArceeForCausalLM": ("arcee", "ArceeForCausalLM"), |
62 | 62 | "ArcticForCausalLM": ("arctic", "ArcticForCausalLM"), |
63 | | - "MiniMaxForCausalLM": ("minimax_text_01", "MiniMaxText01ForCausalLM"), |
64 | | - "MiniMaxText01ForCausalLM": ("minimax_text_01", "MiniMaxText01ForCausalLM"), |
65 | | - "MiniMaxM1ForCausalLM": ("minimax_text_01", "MiniMaxText01ForCausalLM"), |
66 | 63 | # baichuan-7b, upper case 'C' in the class name |
67 | 64 | "BaiChuanForCausalLM": ("baichuan", "BaiChuanForCausalLM"), |
68 | 65 | # baichuan-13b, lower case 'c' in the class name |
|
87 | 84 | "Ernie4_5_MoeForCausalLM": ("ernie45_moe", "Ernie4_5_MoeForCausalLM"), |
88 | 85 | "ExaoneForCausalLM": ("exaone", "ExaoneForCausalLM"), |
89 | 86 | "Exaone4ForCausalLM": ("exaone4", "Exaone4ForCausalLM"), |
90 | | - "FalconForCausalLM": ("falcon", "FalconForCausalLM"), |
91 | 87 | "Fairseq2LlamaForCausalLM": ("fairseq2_llama", "Fairseq2LlamaForCausalLM"), |
| 88 | + "FalconForCausalLM": ("falcon", "FalconForCausalLM"), |
| 89 | + "FalconMambaForCausalLM": ("mamba", "MambaForCausalLM"), |
| 90 | + "FalconH1ForCausalLM": ("falcon_h1", "FalconH1ForCausalLM"), |
92 | 91 | "FlexOlmoForCausalLM": ("flex_olmo", "FlexOlmoForCausalLM"), |
93 | 92 | "GemmaForCausalLM": ("gemma", "GemmaForCausalLM"), |
94 | 93 | "Gemma2ForCausalLM": ("gemma2", "Gemma2ForCausalLM"), |
|
126 | 125 | "LLaMAForCausalLM": ("llama", "LlamaForCausalLM"), |
127 | 126 | "LongcatFlashForCausalLM": ("longcat_flash", "LongcatFlashForCausalLM"), |
128 | 127 | "MambaForCausalLM": ("mamba", "MambaForCausalLM"), |
129 | | - "FalconMambaForCausalLM": ("mamba", "MambaForCausalLM"), |
130 | | - "FalconH1ForCausalLM": ("falcon_h1", "FalconH1ForCausalLM"), |
131 | 128 | "Mamba2ForCausalLM": ("mamba2", "Mamba2ForCausalLM"), |
132 | 129 | "MiniCPMForCausalLM": ("minicpm", "MiniCPMForCausalLM"), |
133 | 130 | "MiniCPM3ForCausalLM": ("minicpm3", "MiniCPM3ForCausalLM"), |
| 131 | + "MiniMaxForCausalLM": ("minimax_text_01", "MiniMaxText01ForCausalLM"), |
| 132 | + "MiniMaxText01ForCausalLM": ("minimax_text_01", "MiniMaxText01ForCausalLM"), |
| 133 | + "MiniMaxM1ForCausalLM": ("minimax_text_01", "MiniMaxText01ForCausalLM"), |
134 | 134 | "MistralForCausalLM": ("llama", "LlamaForCausalLM"), |
135 | 135 | "MixtralForCausalLM": ("mixtral", "MixtralForCausalLM"), |
136 | 136 | # transformers's mpt class has lower case |
|
0 commit comments