dh-mc committed on
Commit
64655af
·
1 Parent(s): b87bc1a

fix training configs

Browse files
llama-factory/config/mgtv_template.yaml CHANGED
@@ -26,14 +26,14 @@ plot_loss: true
26
  per_device_train_batch_size: 16
27
  gradient_accumulation_steps: 8
28
  learning_rate: 1.0e-4
29
- num_train_epochs: 6.0
30
  lr_scheduler_type: cosine
31
  warmup_ratio: 0.1
32
  bf16: true
33
  ddp_timeout: 180000000
34
 
35
  ### eval
36
- val_size: 0.01
37
  per_device_eval_batch_size: 1
38
  eval_strategy: steps
39
  eval_steps: 35
 
26
  per_device_train_batch_size: 16
27
  gradient_accumulation_steps: 8
28
  learning_rate: 1.0e-4
29
+ num_train_epochs: 2.0
30
  lr_scheduler_type: cosine
31
  warmup_ratio: 0.1
32
  bf16: true
33
  ddp_timeout: 180000000
34
 
35
  ### eval
36
+ val_size: 0.1
37
  per_device_eval_batch_size: 1
38
  eval_strategy: steps
39
  eval_steps: 35
llama-factory/config/mgtv_template_4bit.yaml CHANGED
@@ -27,14 +27,14 @@ plot_loss: true
27
  per_device_train_batch_size: 16
28
  gradient_accumulation_steps: 8
29
  learning_rate: 1.0e-4
30
- num_train_epochs: 6.0
31
  lr_scheduler_type: cosine
32
  warmup_ratio: 0.1
33
  bf16: true
34
  ddp_timeout: 180000000
35
 
36
  ### eval
37
- val_size: 0.01
38
  per_device_eval_batch_size: 1
39
  eval_strategy: steps
40
  eval_steps: 35
 
27
  per_device_train_batch_size: 16
28
  gradient_accumulation_steps: 8
29
  learning_rate: 1.0e-4
30
+ num_train_epochs: 2.0
31
  lr_scheduler_type: cosine
32
  warmup_ratio: 0.1
33
  bf16: true
34
  ddp_timeout: 180000000
35
 
36
  ### eval
37
+ val_size: 0.1
38
  per_device_eval_batch_size: 1
39
  eval_strategy: steps
40
  eval_steps: 35