mhenrichsen committed on
Commit
4c8ddf2
1 Parent(s): 669f1d0

New learning rate (0.0002 → 0.000005); enable sample_packing and pad_to_sequence_len

Browse files
Files changed (1) hide show
  1. examples/mistral/config.yml +4 -4
examples/mistral/config.yml CHANGED
@@ -16,8 +16,8 @@ val_set_size: 0.01
16
  output_dir: ./out
17
 
18
  sequence_len: 8192
19
- sample_packing:
20
- pad_to_sequence_len:
21
 
22
  wandb_project:
23
  wandb_entity:
@@ -30,7 +30,7 @@ micro_batch_size: 2
30
  num_epochs: 3
31
  optimizer: adamw_bnb_8bit
32
  lr_scheduler: cosine
33
- learning_rate: 0.0002
34
 
35
  train_on_inputs: false
36
  group_by_length: false
@@ -59,4 +59,4 @@ fsdp_config:
59
  special_tokens:
60
  bos_token: "<s>"
61
  eos_token: "</s>"
62
- unk_token: "<unk>"
 
16
  output_dir: ./out
17
 
18
  sequence_len: 8192
19
+ sample_packing: true
20
+ pad_to_sequence_len: true
21
 
22
  wandb_project:
23
  wandb_entity:
 
30
  num_epochs: 3
31
  optimizer: adamw_bnb_8bit
32
  lr_scheduler: cosine
33
+ learning_rate: 0.000005
34
 
35
  train_on_inputs: false
36
  group_by_length: false
 
59
  special_tokens:
60
  bos_token: "<s>"
61
  eos_token: "</s>"
62
+ unk_token: "<unk>"