filco-llama2-multihop / xturing.json
{
  "model_name": "llama2_lora",
  "finetuning_config": {
    "learning_rate": 5e-05,
    "gradient_accumulation_steps": 1,
    "batch_size": 1,
    "weight_decay": 0.01,
    "warmup_steps": 50,
    "eval_steps": 5000,
    "save_steps": 5000,
    "max_length": 512,
    "num_train_epochs": 3,
    "logging_steps": 10,
    "max_grad_norm": 2.0,
    "save_total_limit": 4,
    "optimizer_name": "adamw",
    "output_dir": "./checkpoints/llama2-lora_hotpotqa-mctx_cxmi-top1"
  },
  "generation_config": {
    "penalty_alpha": 0.6,
    "top_k": 4,
    "max_new_tokens": 256,
    "do_sample": false,
    "top_p": null
  }
}
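
This file records the model name, fine-tuning hyperparameters, and decoding settings of an xTuring run for a LLaMA-2 LoRA adapter. Below is a minimal sketch of how the same configuration could be reproduced with xTuring's Python API; the dataset path used here is a placeholder (not part of this repository), and only a subset of the hyperparameters above is shown.

# Minimal sketch, assuming the standard xTuring BaseModel API.
# The dataset path "./hotpotqa_mctx_cxmi_top1" is hypothetical.
from xturing.datasets import InstructionDataset
from xturing.models import BaseModel

# "llama2_lora" matches the model_name recorded in this config.
model = BaseModel.create("llama2_lora")

# Mirror the finetuning_config block (remaining fields set analogously).
finetuning_config = model.finetuning_config()
finetuning_config.learning_rate = 5e-05
finetuning_config.batch_size = 1
finetuning_config.num_train_epochs = 3
finetuning_config.max_length = 512
finetuning_config.output_dir = "./checkpoints/llama2-lora_hotpotqa-mctx_cxmi-top1"

# Mirror the generation_config block (contrastive search: penalty_alpha + top_k).
generation_config = model.generation_config()
generation_config.penalty_alpha = 0.6
generation_config.top_k = 4
generation_config.max_new_tokens = 256
generation_config.do_sample = False

dataset = InstructionDataset("./hotpotqa_mctx_cxmi_top1")  # hypothetical local dataset
model.finetune(dataset=dataset)

# Saving writes the adapter weights together with a config file like the one above.
model.save("./checkpoints/llama2-lora_hotpotqa-mctx_cxmi-top1")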