marinone94 committed on
Commit
695a47b
1 Parent(s): ed9781e

Training in progress, step 1000

Browse files
checkpoint-1000/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0d150bb1a47e890e734324095bdcd55d5623b896320a5e9a0459aa856b42b06
3
  size 2490362385
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8bbfd4ba575f9da0f10fafd071b49cb2a417b069734ec3f8f25e57b1ace80ce
3
  size 2490362385
checkpoint-1000/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4aca4a6284adca4d75ba2f01b265d187999f0c8e97b09264b7de0ae8d1cf8e73
3
  size 1262075377
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5413d438578028bae2ac5a1c47311442081ff0b4a1db9b89c2080d69df74655b
3
  size 1262075377
checkpoint-1000/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7bbf6de402af56dc2b2a14f7e42db0ebd96220f08261d4ff0afbff460336edc5
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:512798d6b261c10f4cf46e1adb2e820c4ee1ce81131c16f70b43feb653238645
3
  size 559
checkpoint-1000/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1857ca7370610b3ead1d5c1c34b6dfa40788a343fde2e87dcf51cf4b056364d1
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61c6e8fe2cbf564c32ff5b35a892290556b40ae70bfcf843d4a10850b1b863ed
3
  size 623
checkpoint-1000/trainer_state.json CHANGED
@@ -9,85 +9,85 @@
9
  "log_history": [
10
  {
11
  "epoch": 0.29,
12
- "learning_rate": 7.151470588235293e-05,
13
- "loss": 5.1135,
14
  "step": 100
15
  },
16
  {
17
  "epoch": 0.58,
18
- "learning_rate": 6.710294117647058e-05,
19
- "loss": 3.0957,
20
  "step": 200
21
  },
22
  {
23
  "epoch": 0.87,
24
- "learning_rate": 6.269117647058824e-05,
25
- "loss": 3.0078,
26
  "step": 300
27
  },
28
  {
29
  "epoch": 1.16,
30
- "learning_rate": 5.827941176470588e-05,
31
- "loss": 2.9785,
32
  "step": 400
33
  },
34
  {
35
  "epoch": 1.45,
36
- "learning_rate": 5.3867647058823525e-05,
37
- "loss": 2.9069,
38
  "step": 500
39
  },
40
  {
41
  "epoch": 1.45,
42
- "eval_loss": 2.9046826362609863,
43
- "eval_runtime": 128.7688,
44
- "eval_samples_per_second": 35.878,
45
- "eval_steps_per_second": 4.489,
46
  "eval_wer": 1.0,
47
  "step": 500
48
  },
49
  {
50
  "epoch": 1.74,
51
- "learning_rate": 4.945588235294117e-05,
52
- "loss": 2.8537,
53
  "step": 600
54
  },
55
  {
56
  "epoch": 2.03,
57
- "learning_rate": 4.504411764705882e-05,
58
- "loss": 2.7928,
59
  "step": 700
60
  },
61
  {
62
  "epoch": 2.32,
63
- "learning_rate": 4.063235294117647e-05,
64
- "loss": 2.6988,
65
  "step": 800
66
  },
67
  {
68
  "epoch": 2.61,
69
- "learning_rate": 3.6220588235294115e-05,
70
- "loss": 2.6342,
71
  "step": 900
72
  },
73
  {
74
  "epoch": 2.91,
75
- "learning_rate": 3.180882352941176e-05,
76
- "loss": 2.5875,
77
  "step": 1000
78
  },
79
  {
80
  "epoch": 2.91,
81
- "eval_loss": 2.415876865386963,
82
- "eval_runtime": 164.5912,
83
- "eval_samples_per_second": 28.07,
84
- "eval_steps_per_second": 3.512,
85
- "eval_wer": 1.199687939790736,
86
  "step": 1000
87
  }
88
  ],
89
- "max_steps": 1720,
90
- "num_train_epochs": 5,
91
  "total_flos": 2.9636799545011507e+18,
92
  "trial_name": null,
93
  "trial_params": null
 
9
  "log_history": [
10
  {
11
  "epoch": 0.29,
12
+ "learning_rate": 3.7125e-06,
13
+ "loss": 12.2713,
14
  "step": 100
15
  },
16
  {
17
  "epoch": 0.58,
18
+ "learning_rate": 7.4625e-06,
19
+ "loss": 6.2026,
20
  "step": 200
21
  },
22
  {
23
  "epoch": 0.87,
24
+ "learning_rate": 1.1212499999999998e-05,
25
+ "loss": 4.1374,
26
  "step": 300
27
  },
28
  {
29
  "epoch": 1.16,
30
+ "learning_rate": 1.49625e-05,
31
+ "loss": 3.6755,
32
  "step": 400
33
  },
34
  {
35
  "epoch": 1.45,
36
+ "learning_rate": 1.8712499999999997e-05,
37
+ "loss": 3.3332,
38
  "step": 500
39
  },
40
  {
41
  "epoch": 1.45,
42
+ "eval_loss": 3.292029857635498,
43
+ "eval_runtime": 137.2974,
44
+ "eval_samples_per_second": 33.65,
45
+ "eval_steps_per_second": 4.21,
46
  "eval_wer": 1.0,
47
  "step": 500
48
  },
49
  {
50
  "epoch": 1.74,
51
+ "learning_rate": 2.2462499999999997e-05,
52
+ "loss": 3.1418,
53
  "step": 600
54
  },
55
  {
56
  "epoch": 2.03,
57
+ "learning_rate": 2.6212499999999997e-05,
58
+ "loss": 3.0879,
59
  "step": 700
60
  },
61
  {
62
  "epoch": 2.32,
63
+ "learning_rate": 2.99625e-05,
64
+ "loss": 3.0216,
65
  "step": 800
66
  },
67
  {
68
  "epoch": 2.61,
69
+ "learning_rate": 3.37125e-05,
70
+ "loss": 2.9595,
71
  "step": 900
72
  },
73
  {
74
  "epoch": 2.91,
75
+ "learning_rate": 3.7462499999999996e-05,
76
+ "loss": 2.9269,
77
  "step": 1000
78
  },
79
  {
80
  "epoch": 2.91,
81
+ "eval_loss": 2.941540241241455,
82
+ "eval_runtime": 178.4388,
83
+ "eval_samples_per_second": 25.891,
84
+ "eval_steps_per_second": 3.239,
85
+ "eval_wer": 0.9966346448020559,
86
  "step": 1000
87
  }
88
  ],
89
+ "max_steps": 17200,
90
+ "num_train_epochs": 50,
91
  "total_flos": 2.9636799545011507e+18,
92
  "trial_name": null,
93
  "trial_params": null
checkpoint-1000/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1208f22bb7e06e1e9a51692db0520fbddfc3640941d51dfe45ba3188ada2ecbf
3
  size 2991
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a168f126d02648193e16ba893c3e1ef9f2c2de91803928caf5e25532aff1325
3
  size 2991
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ff113c93cbec054547814830ddbe3b7e8b56d08002f35055cf5facbab2743f16
3
  size 1262075377
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5413d438578028bae2ac5a1c47311442081ff0b4a1db9b89c2080d69df74655b
3
  size 1262075377