bellm-llama-7b-nli / angle.config
SeanLee97's picture
Training in progress, step 200
d331d18 verified
raw
history blame
437 Bytes
{
"model_name_or_path": "NousResearch/Llama-2-7b-hf",
"max_length": 85,
"model_kwargs": {},
"pooling_strategy": "cls",
"lora_config_kwargs": {
"task_type": "CAUSAL_LM",
"r": 256,
"lora_alpha": 128,
"lora_dropout": 0.1,
"bias": "none",
"target_modules": [
"o_proj",
"down_proj",
"v_proj",
"q_proj",
"up_proj",
"k_proj",
"gate_proj"
]
},
"apply_lora": 1
}