andreaskoepf committed on
Commit
4d744f7
1 Parent(s): 9ec3ae0

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +56 -0
README.md CHANGED
@@ -1,3 +1,59 @@
1
  ---
2
  license: apache-2.0
3
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
  license: apache-2.0
3
  ---
4
+
5
+ wandb: https://wandb.ai/open-assistant/supervised-finetuning/runs/pcw1ejda
6
+
7
+ ```
8
+ pythia-12b-sft-8:
9
+ dtype: fp16
10
+ log_dir: "pythia_log_12b"
11
+ learning_rate: 6e-6
12
+ model_name: OpenAssistant/pythia-12b-pre-v8-12.5k-steps
13
+ output_dir: pythia_model_12b
14
+ weight_decay: 0.0
15
+ residual_dropout: 0.1
16
+ max_length: 2048
17
+ use_flash_attention: true
18
+ warmup_steps: 100
19
+ gradient_checkpointing: true
20
+ gradient_accumulation_steps: 2
21
+ per_device_train_batch_size: 4
22
+ per_device_eval_batch_size: 4
23
+ eval_steps: 251
24
+ save_steps: 500
25
+ num_train_epochs: 8
26
+ save_total_limit: 4
27
+ num_train_epochs: 8
28
+ save_total_limit: 3
29
+ use_custom_sampler: true
30
+ sort_by_length: false
31
+ save_strategy: steps
32
+ datasets:
33
+ - oasst_export:
34
+ lang: "bg,ca,cs,da,de,en,es,fr,hr,hu,it,nl,pl,pt,ro,ru,sl,sr,sv,uk"
35
+ input_file_path: 2023-05-06_OASST_labels.jsonl.gz
36
+ val_split: 0.05
37
+ - vicuna:
38
+ val_split: 0.05
39
+ max_val_set: 800
40
+ fraction: 0.4
41
+ - dolly15k:
42
+ val_split: 0.05
43
+ max_val_set: 300
44
+ - grade_school_math_instructions:
45
+ val_split: 0.05
46
+ - code_alpaca:
47
+ val_split: 0.05
48
+ max_val_set: 250
49
+ - red_pajama:
50
+ fraction: 0.05
51
+ max_val_set: 1000
52
+ - wizardlm_70k:
53
+ val_split: 0.05
54
+ max_val_set: 500
55
+ fraction: 0.4
56
+ - poem_instructions:
57
+ fraction: 0.5
58
+ val_split: 0.025
59
+ ```