llama3_1_truth_model_bench_1 / training_args.yaml
Ogamon's picture
second commit
2c02d2a verified
raw
history blame contribute delete
No virus
518 Bytes
# Settings for a prediction run: do_predict is enabled and output is written
# to an eval_* directory. The mapping is flat, so the grouping below is for
# readers only and carries no meaning for the parser.
# NOTE(review): the key names look like LLaMA-Factory arguments -- confirm
# against the consuming tool before renaming or removing any of them.

# Run mode
stage: sft
do_predict: true
predict_with_generate: true
finetuning_type: full

# Model input and result locations (relative paths; both carry the same
# 2024-07-30-02-00-04 timestamp)
model_name_or_path: saves/LLaMA3.1-8B-Chat/full/train_2024-07-30-02-00-04_llama3.1_truthqa_bench_1
output_dir: saves/LLaMA3.1-8B-Chat/full/eval_2024-07-30-02-00-04_truthqa_bench1
template: llama3

# Evaluation data
dataset_dir: data
eval_dataset: truth_dev_0716
max_samples: 100000
cutoff_len: 1024
preprocessing_num_workers: 16

# Generation settings
# NOTE(review): temperature/top_p presumably enable sampled decoding, which
# would make predictions vary between runs -- confirm that is intended.
max_new_tokens: 512
temperature: 0.95
top_p: 0.7

# Runtime
# NOTE(review): no quantization bit-width key is set in this file, so
# quantization_method is presumably inert here -- verify.
per_device_eval_batch_size: 2
flash_attn: auto
quantization_method: bitsandbytes