File size: 566 Bytes
8464a98
 
e75bd98
 
 
 
8464a98
 
6f191d4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
---
license: gemma
tags:
- unsloth
- trl
- sft
---

Experiment 1: supervised fine-tuning (SFT) on the Indonesian Alpaca dataset

Dataset: Indonesian Alpaca dataset (approximately 9 million tokens)

max_seq_length = 8192,
dataset_num_proc = 2,
packing = False, 
args = TrainingArguments(
    per_device_train_batch_size = 1,
    gradient_accumulation_steps = 8,
    warmup_steps = 5,
    num_train_epochs = 1,
    learning_rate = 5e-5,
    fp16 = not is_bfloat16_supported(),
    bf16 = is_bfloat16_supported(),
    logging_steps = 1,
    optim = "adamw_8bit",
    weight_decay = 0.01,
    lr_scheduler_type = "linear",
    seed = 3407,