{
  "bias": "none",
  "peft_type": "MIXLORA",
  "r": 16,
  "lora_alpha": 32,
  "lora_dropout": 0.05,
  "target_modules": [
    "q_proj",
    "k_proj",
    "v_proj",
    "o_proj",
    "gate_proj",
    "down_proj",
    "up_proj"
  ],
  "routing_strategy": "mixlora",
  "num_experts": 8,
  "act_fn": "silu",
  "top_k": 2,
  "base_model_name_or_path": "meta-llama/Llama-2-7b-hf",
  "task_type": "QUESTION_ANS"
}