HikasaHana committed on
Commit
6c3256d
·
verified ·
1 Parent(s): 648e221

Training in progress, epoch 2

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca0dc6ea72694ff54a88f458db9aff463c496bd6d83166f6fb57a4e51c5bb172
3
  size 409103316
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5b3ada415323df4681659f8a3c19121e9379a2b0c7922cade957c3cc9526017
3
  size 409103316
run-0/checkpoint-534/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a2c26a4990298c617435add4fef099a107381df4b5d4dd2ceb1932c28c743541
3
  size 409103316
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5b3ada415323df4681659f8a3c19121e9379a2b0c7922cade957c3cc9526017
3
  size 409103316
run-0/checkpoint-534/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7c82d05f4ce26f22c9acaa7998473a49f5f6cbfcd52e5fa856d9f347b60ad8c
3
  size 818327802
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01fc13bfd901a55e2ac038444bc5950e036e98be6e0fb3c7670e6e8a5cef840f
3
  size 818327802
run-0/checkpoint-534/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dda5eab8086c3361f01b6da1d0d501e5d7ffcc15041db5c9a3384c00b843300f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a56050495e1938ae70b239ae8ece3c43ac800b58f0a6e02bd7ed6cd1669797d
3
  size 1064
run-0/checkpoint-534/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.5817901492118835,
3
  "best_model_checkpoint": "BERT-WMM/run-0/checkpoint-534",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
@@ -10,39 +10,39 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.7563380281690141,
14
- "eval_loss": 0.6019130349159241,
15
- "eval_runtime": 2.4228,
16
- "eval_samples_per_second": 879.158,
17
- "eval_steps_per_second": 55.309,
18
  "step": 267
19
  },
20
  {
21
  "epoch": 1.87,
22
- "grad_norm": 9.674468994140625,
23
- "learning_rate": 5.7987153604787005e-06,
24
- "loss": 0.6061,
25
  "step": 500
26
  },
27
  {
28
  "epoch": 2.0,
29
- "eval_accuracy": 0.7619718309859155,
30
- "eval_loss": 0.5817901492118835,
31
- "eval_runtime": 2.4333,
32
- "eval_samples_per_second": 875.37,
33
- "eval_steps_per_second": 55.07,
34
  "step": 534
35
  }
36
  ],
37
  "logging_steps": 500,
38
- "max_steps": 801,
39
  "num_input_tokens_seen": 0,
40
- "num_train_epochs": 3,
41
  "save_steps": 500,
42
  "total_flos": 349221394826640.0,
43
  "train_batch_size": 32,
44
  "trial_name": null,
45
  "trial_params": {
46
- "num_train_epochs": 3
47
  }
48
  }
 
1
  {
2
+ "best_metric": 0.6037774682044983,
3
  "best_model_checkpoint": "BERT-WMM/run-0/checkpoint-534",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.7530516431924883,
14
+ "eval_loss": 0.6065725684165955,
15
+ "eval_runtime": 2.5073,
16
+ "eval_samples_per_second": 849.524,
17
+ "eval_steps_per_second": 53.444,
18
  "step": 267
19
  },
20
  {
21
  "epoch": 1.87,
22
+ "grad_norm": 9.447751998901367,
23
+ "learning_rate": 9.825065893169892e-07,
24
+ "loss": 0.6083,
25
  "step": 500
26
  },
27
  {
28
  "epoch": 2.0,
29
+ "eval_accuracy": 0.7615023474178404,
30
+ "eval_loss": 0.6037774682044983,
31
+ "eval_runtime": 2.4998,
32
+ "eval_samples_per_second": 852.081,
33
+ "eval_steps_per_second": 53.605,
34
  "step": 534
35
  }
36
  ],
37
  "logging_steps": 500,
38
+ "max_steps": 534,
39
  "num_input_tokens_seen": 0,
40
+ "num_train_epochs": 2,
41
  "save_steps": 500,
42
  "total_flos": 349221394826640.0,
43
  "train_batch_size": 32,
44
  "trial_name": null,
45
  "trial_params": {
46
+ "weight_decay": 9.670788404941036e-05
47
  }
48
  }
run-0/checkpoint-534/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:11f7c65747bd635b8f0e76f611e224f7ef08b5428ba70dd1530c26977be68e0b
3
  size 4856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de07fd0528e0ec401b749f0d80d28e850e36f7e66780675fb859022ed638d382
3
  size 4856
runs/Apr19_10-19-01_dcdaa3e6ec43/events.out.tfevents.1713521944.dcdaa3e6ec43.789.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6f0b3002c4418729fd7ca23e6ae9fc9e8fac9d2478d4a388d69ecd8d2385060
3
- size 5234
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fee924e67051849fdffd25dac35c063461003059dc4fd9c69d77b70a0171a73d
3
+ size 6122