bellm-llama-7b-nli / angle.config
SeanLee97's picture
Training in progress, step 200
c4e2359 verified
raw
history blame
435 Bytes
{
"model_name_or_path": "NousResearch/Llama-2-7b-hf",
"max_length": 50,
"model_kwargs": {},
"pooling_strategy": "cls",
"lora_config_kwargs": {
"task_type": "CAUSAL_LM",
"r": 32,
"lora_alpha": 32,
"lora_dropout": 0.1,
"bias": "none",
"target_modules": [
"q_proj",
"k_proj",
"up_proj",
"down_proj",
"v_proj",
"gate_proj",
"o_proj"
]
},
"apply_lora": 1
}