Femboyuwu2000 commited on
Commit
66236ed
1 Parent(s): 70c0d37

Training in progress, step 20, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:888d6b2d183be0ad051b69e15bacc2f610a2138674c1cefb759c0b5ea44fb84b
3
  size 4725640
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e737501f2b45e7567ee47af1ddb09b9cbaa6f653e680bb4a4cad7d8ad854e388
3
  size 4725640
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3da76e9afdf003a898a487820cd7ea1d43e840d64f8865874b93117bab741801
3
  size 2423738
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b322f65dbb3d497733de58208d7e2ff958939a0bbcd4b0f1665fb36b3e6d1a6f
3
  size 2423738
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28d42be630248a5213a70ba5e163d2391a05816dbb273d1b7b48dcd47e871fb4
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d1dbd056bdba902bbd15884fe0ae45df7b81d1dab50b96a0c9b32d0eae3e262
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:da2b3df137afc8ce0bf3abe9574aa4eb50b6c5bd11e6952c66c439eade1cc134
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35b984f5d5bfe5a9a68144cbebc8463a6390d9811bce29b59e9d59016179fb2e
3
  size 1064
last-checkpoint/tokenizer_config.json CHANGED
@@ -37,12 +37,9 @@
37
  "bos_token": "<s>",
38
  "clean_up_tokenization_spaces": false,
39
  "eos_token": "</s>",
40
- "max_length": 2048,
41
  "model_max_length": 1000000000000000019884624838656,
42
  "pad_token": "</s>",
43
- "padding": true,
44
  "padding_side": "right",
45
  "tokenizer_class": "BloomTokenizer",
46
- "truncation": true,
47
  "unk_token": "<unk>"
48
  }
 
37
  "bos_token": "<s>",
38
  "clean_up_tokenization_spaces": false,
39
  "eos_token": "</s>",
 
40
  "model_max_length": 1000000000000000019884624838656,
41
  "pad_token": "</s>",
 
42
  "padding_side": "right",
43
  "tokenizer_class": "BloomTokenizer",
 
44
  "unk_token": "<unk>"
45
  }
last-checkpoint/trainer_state.json CHANGED
@@ -1,41 +1,27 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 4.669515070859891e-05,
5
  "eval_steps": 500,
6
- "global_step": 60,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.0,
13
- "grad_norm": 4.044270038604736,
14
- "learning_rate": 1.6666666666666667e-06,
15
- "loss": 3.7393,
16
  "step": 20
17
- },
18
- {
19
- "epoch": 0.0,
20
- "grad_norm": 1.908144235610962,
21
- "learning_rate": 3.2500000000000002e-06,
22
- "loss": 3.6056,
23
- "step": 40
24
- },
25
- {
26
- "epoch": 0.0,
27
- "grad_norm": 1.030365228652954,
28
- "learning_rate": 4.9166666666666665e-06,
29
- "loss": 3.526,
30
- "step": 60
31
  }
32
  ],
33
  "logging_steps": 20,
34
  "max_steps": 20000,
35
  "num_input_tokens_seen": 0,
36
- "num_train_epochs": 1,
37
  "save_steps": 20,
38
- "total_flos": 35326762795008.0,
39
  "train_batch_size": 1,
40
  "trial_name": null,
41
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.002725538293813028,
5
  "eval_steps": 500,
6
+ "global_step": 20,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.0,
13
+ "grad_norm": 0.39290162920951843,
14
+ "learning_rate": 1.5833333333333336e-06,
15
+ "loss": 4.0074,
16
  "step": 20
 
 
 
 
 
 
 
 
 
 
 
 
 
 
17
  }
18
  ],
19
  "logging_steps": 20,
20
  "max_steps": 20000,
21
  "num_input_tokens_seen": 0,
22
+ "num_train_epochs": 3,
23
  "save_steps": 20,
24
+ "total_flos": 9824796131328.0,
25
  "train_batch_size": 1,
26
  "trial_name": null,
27
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:67d9137f50a05785e0ffd11f3ee590825d65f6fa4ba75fb2184bf1dc9266179b
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e76cb4f6a41bce2aadf48ff7cb6d05ab2c9b686a1100b4a6b9867db37ed9160
3
  size 4984