|
|
|
|
|
|
|
|
|
|
|
|
|
dataset: yahma/alpaca-cleaned |
|
seed: 42 |
|
shuffle: True |
|
|
|
|
|
|
|
|
|
checkpoint_every_n_steps: 500 |
|
|
|
|
|
model_checkpoint: model/llama2_native.tune |
|
tokenizer_checkpoint: model/tokenizer.model |
|
|
|
color_layer_initialization: zeros |
|
norm_before_color_layer: True |
|
|
|
|
|
compile: True |
|
batch_size: 8 |
|
lr: 2e-5 |
|
epochs: 4 |
|
optimizer: SGD |
|
loss: CrossEntropyLoss |
|
output_dir: output/alpaca-colorful-llama2-finetune |
|
device: cuda |
|
dtype: bf16 |
|
enable_fsdp: False |
|
enable_activation_checkpointing: True |
|
resume_from_checkpoint: False |
|
|
|
|
|
metric_logger_type: wandb |
|
project: torchtune |
|
|