--- license: gemma tags: - unsloth - trl - sft --- Experiment 1 SFT ALPACA INDO dataset: 9 millions token indo alpaca dataset max_seq_length = 8192, dataset_num_proc = 2, packing = False, args = TrainingArguments( per_device_train_batch_size = 1, gradient_accumulation_steps = 8, warmup_steps = 5, num_train_epochs = 1, learning_rate = 5e-5, fp16 = not is_bfloat16_supported(), bf16 = is_bfloat16_supported(), logging_steps = 1, optim = "adamw_8bit", weight_decay = 0.01, lr_scheduler_type = "linear", seed = 3407,