{
  "bias": "none",
  "peft_type": "MIXLORA",
  "task_type": "CAUSAL_LM",
  "base_model_name_or_path": "meta-llama/Llama-2-7b-hf",
  "r": 16,
  "lora_alpha": 32,
  "lora_dropout": 0.05,
  "target_modules": [
    "q_proj",
    "k_proj",
    "v_proj",
    "o_proj",
    "gate_proj",
    "down_proj",
    "up_proj"
  ],
  "routing_strategy": "mixlora",
  "num_experts": 8,
  "act_fn": "silu",
  "top_k": 2
}