xuancoblab2023 commited on
Commit
faa9bce
·
verified ·
1 Parent(s): 8d1c664

Training in progress, epoch 2

Browse files
logs/events.out.tfevents.1709876067.6c1c016b0e3e.7263.11 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e6d98aed345117a010060b30bf0c50ede7b829e269a95a23a3f2d664634f193
3
- size 5314
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01074bc52c140385b20827d95ac99b468463f9584bede1a73c48a20c3a214266
3
+ size 5984
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:361284d6cbbbf0747d1d2496b9712460a833e47055619c1ce3d78588bf871550
3
  size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e11add93b37646b53de44334884f87cfb9c0a7c95ac4d83cc9b3ffce33899bd
3
  size 17549312
run-11/checkpoint-96/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:136877ee651c62ba812d0f99f96161f0f3ecf647b0689286df48d749d4976c6b
3
  size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e11add93b37646b53de44334884f87cfb9c0a7c95ac4d83cc9b3ffce33899bd
3
  size 17549312
run-11/checkpoint-96/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:161aac7bcb6524ec9d72a681761a2576fed030a34ed7d6606ea3214ed68f32ae
3
  size 35122746
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:605e534cfde92b7c0c50efa96a9f6ba944650bf42f08a44ab81cca6b096fb3fa
3
  size 35122746
run-11/checkpoint-96/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24aa86019b8aea1c551cc1adaf38c4db2fc01de75a22af312230f6b592e0fd81
3
  size 14054
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bc13e09b59a62b6fb29cad756bfeefcce6f512c71a9054cc39e336db0b532a5
3
  size 14054
run-11/checkpoint-96/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:90937cac39589ae65d6cafbc79eb7a81e4c6f2ab317854f1cdbef198f243a770
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d0c495b8f481c81a3ed7d3d68c42b607133aa0e8efa74714f0b151ec15228ff
3
  size 1064
run-11/checkpoint-96/trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_metric": 0.7514677103718199,
3
  "best_model_checkpoint": "tiny-bert-sst2-distilled/run-11/checkpoint-96",
4
- "epoch": 1.0,
5
  "eval_steps": 500,
6
  "global_step": 96,
7
  "is_hyper_param_search": true,
@@ -10,36 +10,55 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "grad_norm": 8.867341995239258,
14
- "learning_rate": 0.00047267095070335774,
15
- "loss": 0.5752,
16
- "step": 96
17
  },
18
  {
19
  "epoch": 1.0,
20
- "eval_accuracy": 0.7514677103718199,
21
- "eval_f1": 0.765249537892791,
22
- "eval_loss": 0.501445472240448,
23
- "eval_precision": 0.7250437828371279,
24
- "eval_recall": 0.8101761252446184,
25
- "eval_runtime": 30.0696,
26
- "eval_samples_per_second": 33.988,
27
- "eval_steps_per_second": 1.064,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
28
  "step": 96
29
  }
30
  ],
31
  "logging_steps": 500,
32
- "max_steps": 192,
33
  "num_input_tokens_seen": 0,
34
- "num_train_epochs": 2,
35
  "save_steps": 500,
36
- "total_flos": 235695197280.0,
37
- "train_batch_size": 32,
38
  "trial_name": null,
39
  "trial_params": {
40
- "alpha": 0.9981740599737018,
41
- "learning_rate": 0.0009453419014067155,
42
- "num_train_epochs": 2,
43
- "temperature": 30
44
  }
45
  }
 
1
  {
2
+ "best_metric": 0.8199608610567515,
3
  "best_model_checkpoint": "tiny-bert-sst2-distilled/run-11/checkpoint-96",
4
+ "epoch": 2.0,
5
  "eval_steps": 500,
6
  "global_step": 96,
7
  "is_hyper_param_search": true,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "grad_norm": 2.152926206588745,
14
+ "learning_rate": 0.0007816128679887146,
15
+ "loss": 0.591,
16
+ "step": 48
17
  },
18
  {
19
  "epoch": 1.0,
20
+ "eval_accuracy": 0.7524461839530333,
21
+ "eval_f1": 0.7944760357432982,
22
+ "eval_loss": 0.4880000948905945,
23
+ "eval_precision": 0.6791666666666667,
24
+ "eval_recall": 0.9569471624266145,
25
+ "eval_runtime": 29.551,
26
+ "eval_samples_per_second": 34.584,
27
+ "eval_steps_per_second": 0.541,
28
+ "step": 48
29
+ },
30
+ {
31
+ "epoch": 2.0,
32
+ "grad_norm": 5.895570278167725,
33
+ "learning_rate": 0.0006513440566572622,
34
+ "loss": 0.4603,
35
+ "step": 96
36
+ },
37
+ {
38
+ "epoch": 2.0,
39
+ "eval_accuracy": 0.8199608610567515,
40
+ "eval_f1": 0.8286778398510243,
41
+ "eval_loss": 0.4088345766067505,
42
+ "eval_precision": 0.7904085257548845,
43
+ "eval_recall": 0.8708414872798435,
44
+ "eval_runtime": 30.3763,
45
+ "eval_samples_per_second": 33.645,
46
+ "eval_steps_per_second": 0.527,
47
  "step": 96
48
  }
49
  ],
50
  "logging_steps": 500,
51
+ "max_steps": 336,
52
  "num_input_tokens_seen": 0,
53
+ "num_train_epochs": 7,
54
  "save_steps": 500,
55
+ "total_flos": 471390394560.0,
56
+ "train_batch_size": 64,
57
  "trial_name": null,
58
  "trial_params": {
59
+ "alpha": 0.9971844266637861,
60
+ "learning_rate": 0.0009118816793201671,
61
+ "num_train_epochs": 7,
62
+ "temperature": 16
63
  }
64
  }
run-11/checkpoint-96/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7ad2a3b631ed3da14471b5ac8c719b5c11baabf1e37c311322e42839c08f1d3
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a283f7ca8fa712756294b7fd6d3247bcb44ee70c9bb9ae961204f34de91039c
3
  size 4920