batch_size=128 | |
micro_batch_size=1 | |
num_epochs=5 | |
learning_rate=3e-05 | |
cutoff_len=1024 | |
val_set_size=0.1 | |
warmup_steps=2000 | |
train_on_inputs=True | |
add_eos_token=True | |
group_by_length=False | |
offload_folder= | |
ds_config_path=ds_config_zero3.json | |
batch_size=128 | |
micro_batch_size=1 | |
num_epochs=5 | |
learning_rate=3e-05 | |
cutoff_len=1024 | |
val_set_size=0.1 | |
warmup_steps=2000 | |
train_on_inputs=True | |
add_eos_token=True | |
group_by_length=False | |
offload_folder= | |
ds_config_path=ds_config_zero3.json | |