{
  "cutoff_len": 1900,
  "save_step": 500,
  "train_lora_candidate_num": 1,
  "train_lora_simultaneously_num": 1,
  "train_strategy": "optim",
  "evaluate_result": "./result",
  "lora": [
    {
      "name": "c2cite++",
      "task_name": "synsci++",
      "optim": "adamw",
      "scheduler_type": "constant",
      "warmup_steps": 0,
      "lr": 1e-4,
      "batch_size": 1,
      "micro_batch_size": 1,
      "evaluate_batch_size": 1,
      "num_epochs": 4,
      "r": 8,
      "lora_alpha": 16,
      "lora_dropout": 0.05,
      "target_modules": {
        "q_proj": true,
        "k_proj": true,
        "v_proj": true,
        "o_proj": true,
        "gate_proj": true,
        "down_proj": true,
        "up_proj": true
      },
      "routing_strategy": "",
      "group_by_length": false,
      "atten_mat_coin": 0.1,
      "router_coin": 0.1,
      "cite_coin": 0.2
    }
  ]
}
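
Below is a minimal sketch of how a training script might consume this file, assuming it is read directly with Python's standard json module. The field names match the config above; the loading code itself is illustrative and is not the repo's actual loader.

import json

# Illustrative only: load config/config.json and print the hyperparameters
# for each LoRA adapter entry.
with open("config/config.json") as f:
    cfg = json.load(f)

print(f"cutoff_len={cfg['cutoff_len']}, save_step={cfg['save_step']}, "
      f"strategy={cfg['train_strategy']}")

for adapter in cfg["lora"]:
    # target_modules maps module names (q_proj, k_proj, ...) to booleans;
    # keep only the enabled ones.
    enabled = [m for m, on in adapter["target_modules"].items() if on]
    print(f"{adapter['name']} (task={adapter['task_name']}): "
          f"optim={adapter['optim']}, lr={adapter['lr']}, "
          f"r={adapter['r']}, alpha={adapter['lora_alpha']}, "
          f"dropout={adapter['lora_dropout']}, "
          f"epochs={adapter['num_epochs']}, targets={enabled}")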