Skip to content

Commit fae8291

Browse files
arnavgarg1 authored and BenjaminBossan committed
Add default IA3 target modules for Mixtral (huggingface#1376)
* Add default LoRA target modules for Mixtral
* Add IA3 modules for Mixtral
* Address comments
1 parent 31b58ba commit fae8291

File tree

1 file changed

+2
-0
lines changed

1 file changed

+2
-0
lines changed

src/peft/utils/constants.py

+2
Original file line numberDiff line numberDiff line change
@@ -93,6 +93,7 @@ def starcoder_model_postprocess_past_key_value(past_key_values):
9393
"gpt_bigcode": ["c_attn", "mlp.c_proj"],
9494
"llama": ["k_proj", "v_proj", "down_proj"],
9595
"mistral": ["k_proj", "v_proj", "down_proj"],
96+
"mixtral": ["k_proj", "v_proj", "w2"],
9697
"bert": ["key", "value", "output.dense"],
9798
"deberta-v2": ["key_proj", "value_proj", "output.dense"],
9899
"deberta": ["in_proj", "output.dense"],
@@ -116,6 +117,7 @@ def starcoder_model_postprocess_past_key_value(past_key_values):
116117
"gpt_bigcode": ["mlp.c_proj"],
117118
"llama": ["down_proj"],
118119
"mistral": ["down_proj"],
120+
"mixtral": ["w2"],
119121
"bert": ["output.dense"],
120122
"deberta-v2": ["output.dense"],
121123
"deberta": ["output.dense"],

0 commit comments

Comments
 (0)