-
Notifications
You must be signed in to change notification settings - Fork 6
/
mixlora_dynamic.json
37 lines (37 loc) · 1021 Bytes
/
mixlora_dynamic.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
{
"cutoff_len": 512,
"save_step": 1000,
"train_lora_candidate_num": 2,
"train_lora_simultaneously_num": 2,
"train_strategy": "optim",
"lora": [
{
"name": "mixlora",
"task_name": "",
"optim": "adamw",
"scheduler_type": "constant",
"warmup_steps": 0,
"lr": 2e-4,
"batch_size": 16,
"micro_batch_size": 8,
"evaluate_batch_size": 16,
"num_epochs": 2,
"r": 16,
"lora_alpha": 32,
"lora_dropout": 0.05,
"target_modules": {
"q_proj": true,
"k_proj": true,
"v_proj": true,
"o_proj": true,
"gate_proj": true,
"down_proj": true,
"up_proj": true
},
"routing_strategy": "mixlora-dynamic",
"num_experts": 8,
"top_p": 0.8,
"group_by_length": false
}
]
}