xuancoblab2023 commited on
Commit
fa80c38
·
verified ·
1 Parent(s): d2183db

Training in progress, epoch 2

Browse files
logs/events.out.tfevents.1709873901.6c1c016b0e3e.7263.4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97a0e66e33b4d006e92f859d1584598a9a4ec459ea7d03a1903a2e96052ac436
3
- size 5315
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa03478758dca7f5d682294b4b26342374d8ba160952415e179feeb53e1e9410
3
+ size 5985
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba227b507d263c3235344fafa0ef56d9cc2df1b645639c7fd2ca60dccb81a006
3
  size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03fd9f7efee8c0f2f691ddeaa2514f0d3a7e750cabcf068212eca5745fe919ca
3
  size 17549312
run-4/checkpoint-96/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:48cf003cc2d83efb9a33c368e8ea859aa2c76a29c130a77724c87ea2b605a4f4
3
  size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03fd9f7efee8c0f2f691ddeaa2514f0d3a7e750cabcf068212eca5745fe919ca
3
  size 17549312
run-4/checkpoint-96/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04e1ae2990cf04c6f162e8ec86fdc8cb3745c3bca894e75064e22185509898ee
3
  size 35122746
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b5e885aea55dc038ba56b1d1df15d43e6a06f137603ec51216e670bb3aab5de
3
  size 35122746
run-4/checkpoint-96/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24aa86019b8aea1c551cc1adaf38c4db2fc01de75a22af312230f6b592e0fd81
3
  size 14054
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bc13e09b59a62b6fb29cad756bfeefcce6f512c71a9054cc39e336db0b532a5
3
  size 14054
run-4/checkpoint-96/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c605d5f5c6e1aaba4a4104abbfe7360b6bc2968ed7924599d9c04c6a8c953dd1
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d11807bda42acc64a1933e2f174b9739a116b6fd76032532b4c5e869e5fa4c3f
3
  size 1064
run-4/checkpoint-96/trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_metric": 0.7446183953033269,
3
- "best_model_checkpoint": "tiny-bert-sst2-distilled/run-4/checkpoint-96",
4
- "epoch": 1.0,
5
  "eval_steps": 500,
6
  "global_step": 96,
7
  "is_hyper_param_search": true,
@@ -10,36 +10,55 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "grad_norm": 1.90240478515625,
14
- "learning_rate": 0.0008040462940429662,
15
- "loss": 0.4563,
16
- "step": 96
17
  },
18
  {
19
  "epoch": 1.0,
20
- "eval_accuracy": 0.7446183953033269,
21
- "eval_f1": 0.7473378509196515,
22
- "eval_loss": 0.415781170129776,
23
- "eval_precision": 0.7394636015325671,
24
- "eval_recall": 0.7553816046966731,
25
- "eval_runtime": 25.3619,
26
- "eval_samples_per_second": 40.297,
27
- "eval_steps_per_second": 1.262,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
28
  "step": 96
29
  }
30
  ],
31
  "logging_steps": 500,
32
- "max_steps": 960,
33
  "num_input_tokens_seen": 0,
34
- "num_train_epochs": 10,
35
  "save_steps": 500,
36
- "total_flos": 235695197280.0,
37
- "train_batch_size": 32,
38
  "trial_name": null,
39
  "trial_params": {
40
- "alpha": 0.6601531096042508,
41
- "learning_rate": 0.0008933847711588513,
42
- "num_train_epochs": 10,
43
- "temperature": 4
44
  }
45
  }
 
1
  {
2
+ "best_metric": 0.5636007827788649,
3
+ "best_model_checkpoint": "tiny-bert-sst2-distilled/run-4/checkpoint-48",
4
+ "epoch": 2.0,
5
  "eval_steps": 500,
6
  "global_step": 96,
7
  "is_hyper_param_search": true,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "grad_norm": 0.5694383382797241,
14
+ "learning_rate": 0.00021480966845398845,
15
+ "loss": 0.2391,
16
+ "step": 48
17
  },
18
  {
19
  "epoch": 1.0,
20
+ "eval_accuracy": 0.5636007827788649,
21
+ "eval_f1": 0.2829581993569132,
22
+ "eval_loss": 0.21417579054832458,
23
+ "eval_precision": 0.7927927927927928,
24
+ "eval_recall": 0.17221135029354206,
25
+ "eval_runtime": 31.6316,
26
+ "eval_samples_per_second": 32.309,
27
+ "eval_steps_per_second": 0.506,
28
+ "step": 48
29
+ },
30
+ {
31
+ "epoch": 2.0,
32
+ "grad_norm": 0.45431241393089294,
33
+ "learning_rate": 0.00016110725134049132,
34
+ "loss": 0.2131,
35
+ "step": 96
36
+ },
37
+ {
38
+ "epoch": 2.0,
39
+ "eval_accuracy": 0.5547945205479452,
40
+ "eval_f1": 0.26016260162601623,
41
+ "eval_loss": 0.20607483386993408,
42
+ "eval_precision": 0.7692307692307693,
43
+ "eval_recall": 0.15655577299412915,
44
+ "eval_runtime": 29.4377,
45
+ "eval_samples_per_second": 34.717,
46
+ "eval_steps_per_second": 0.544,
47
  "step": 96
48
  }
49
  ],
50
  "logging_steps": 500,
51
+ "max_steps": 240,
52
  "num_input_tokens_seen": 0,
53
+ "num_train_epochs": 5,
54
  "save_steps": 500,
55
+ "total_flos": 471390394560.0,
56
+ "train_batch_size": 64,
57
  "trial_name": null,
58
  "trial_params": {
59
+ "alpha": 0.27492253593123683,
60
+ "learning_rate": 0.00026851208556748554,
61
+ "num_train_epochs": 5,
62
+ "temperature": 7
63
  }
64
  }
run-4/checkpoint-96/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:05a27237c59bc1684c5bc675b662fc3c971fc4d8663bd9fafef0f646ea921a93
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88ec7ec7f38e7c2427d32adb2581912875f666fa47e4e936bf0bd24c36192ea0
3
  size 4920