mprzibilla committed on
Commit
a5803ca
1 Parent(s): c069797

Training in progress, step 4017

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "mprzibilla/dys_base_M14",
3
  "activation_dropout": 0.0,
4
  "adapter_kernel_size": 3,
5
  "adapter_stride": 2,
 
1
  {
2
+ "_name_or_path": "facebook/wav2vec2-base",
3
  "activation_dropout": 0.0,
4
  "adapter_kernel_size": 3,
5
  "adapter_stride": 2,
last-checkpoint/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "mprzibilla/dys_base_M14",
3
  "activation_dropout": 0.0,
4
  "adapter_kernel_size": 3,
5
  "adapter_stride": 2,
 
1
  {
2
+ "_name_or_path": "facebook/wav2vec2-base",
3
  "activation_dropout": 0.0,
4
  "adapter_kernel_size": 3,
5
  "adapter_stride": 2,
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a06fabdd8e40a2415cbe05368ed03179ec54a1e5182bde3d9ba22d80f13c39fa
3
  size 721668101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db25401d6710bd1958c6f51c19bcbfc3c41763a042336726a244dae071aeb197
3
  size 721668101
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c29322461c6641c00268ddbc3ec7fbf3eac47dd6a465262f2c85a21f0e923f3
3
  size 377649505
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4971a68c9621393e9b2d50a639c8a82b0a059cb9042cec298ad92dc07e0c545a
3
  size 377649505
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:867d0fac469b0104f98602164cbc9aaefeeb58efe54cfdeef565345818c9775e
3
  size 14639
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b5161ff77ee89f2795b7a591f9b22f7fe74e0468c02497e0c2537a5b71a719a
3
  size 14639
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:614b2a06196347e24b6b4f4717f17dcc9f41c85649107516c838a44076205f5e
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7395a75c4ab5ea271598dca5da8f8c4f98245cae4f5cff35b4dbb2a0e74423c2
3
  size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6c0b6edf3b19e4b41e5e2509db370fca85acfb1ad4b630e5f2532f6549b4daa
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78c3424e1374c05636562c17e7efec21ba0140ab354c9520c0792238885bcd45
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,144 +1,32 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 30.0,
5
- "global_step": 40170,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 10.0,
12
- "learning_rate": 9.474548956408946e-05,
13
- "loss": 2.9276,
14
- "step": 13390
15
  },
16
  {
17
- "epoch": 10.0,
18
- "eval_cer": 0.17402597402597403,
19
- "eval_loss": 1.8234585523605347,
20
- "eval_runtime": 7.7319,
21
- "eval_samples_per_second": 27.16,
22
- "eval_steps_per_second": 3.492,
23
- "eval_wer": 0.319047619047619,
24
- "step": 13390
25
- },
26
- {
27
- "epoch": 12.0,
28
- "learning_rate": 6.318589172475237e-05,
29
- "loss": 0.338,
30
- "step": 16068
31
- },
32
- {
33
- "epoch": 12.0,
34
- "eval_cer": 0.13506493506493505,
35
- "eval_loss": 2.124079942703247,
36
- "eval_runtime": 7.7938,
37
- "eval_samples_per_second": 26.944,
38
- "eval_steps_per_second": 3.464,
39
- "eval_wer": 0.30952380952380953,
40
- "step": 16068
41
- },
42
- {
43
- "epoch": 15.0,
44
- "learning_rate": 5.265971385147529e-05,
45
- "loss": 0.1144,
46
- "step": 20085
47
- },
48
- {
49
- "epoch": 15.0,
50
- "eval_cer": 0.10562770562770563,
51
- "eval_loss": 1.8706998825073242,
52
- "eval_runtime": 7.8262,
53
- "eval_samples_per_second": 26.833,
54
- "eval_steps_per_second": 3.45,
55
- "eval_wer": 0.2714285714285714,
56
- "step": 20085
57
- },
58
- {
59
- "epoch": 18.0,
60
- "learning_rate": 4.21387767936691e-05,
61
- "loss": 0.087,
62
- "step": 24102
63
- },
64
- {
65
- "epoch": 18.0,
66
- "eval_cer": 0.11601731601731602,
67
- "eval_loss": 1.7962666749954224,
68
- "eval_runtime": 8.1091,
69
- "eval_samples_per_second": 25.897,
70
- "eval_steps_per_second": 3.33,
71
- "eval_wer": 0.29523809523809524,
72
- "step": 24102
73
- },
74
- {
75
- "epoch": 21.0,
76
- "learning_rate": 3.16178397358629e-05,
77
- "loss": 0.0722,
78
- "step": 28119
79
- },
80
- {
81
- "epoch": 21.0,
82
- "eval_cer": 0.09696969696969697,
83
- "eval_loss": 1.405766487121582,
84
- "eval_runtime": 7.9215,
85
- "eval_samples_per_second": 26.51,
86
- "eval_steps_per_second": 3.408,
87
- "eval_wer": 0.22857142857142856,
88
- "step": 28119
89
- },
90
- {
91
- "epoch": 24.0,
92
- "learning_rate": 2.1091661862585817e-05,
93
- "loss": 0.0558,
94
- "step": 32136
95
- },
96
- {
97
- "epoch": 24.0,
98
- "eval_cer": 0.11688311688311688,
99
- "eval_loss": 2.0048906803131104,
100
- "eval_runtime": 7.8624,
101
- "eval_samples_per_second": 26.71,
102
- "eval_steps_per_second": 3.434,
103
- "eval_wer": 0.2571428571428571,
104
- "step": 32136
105
- },
106
- {
107
- "epoch": 27.0,
108
- "learning_rate": 1.0570724804779624e-05,
109
- "loss": 0.0451,
110
- "step": 36153
111
- },
112
- {
113
- "epoch": 27.0,
114
- "eval_cer": 0.06666666666666667,
115
- "eval_loss": 0.9005960822105408,
116
- "eval_runtime": 7.9263,
117
- "eval_samples_per_second": 26.494,
118
- "eval_steps_per_second": 3.406,
119
- "eval_wer": 0.13333333333333333,
120
- "step": 36153
121
- },
122
- {
123
- "epoch": 30.0,
124
- "learning_rate": 4.9787746973429064e-08,
125
- "loss": 0.0386,
126
- "step": 40170
127
- },
128
- {
129
- "epoch": 30.0,
130
- "eval_cer": 0.09177489177489177,
131
- "eval_loss": 1.1628663539886475,
132
- "eval_runtime": 8.0633,
133
- "eval_samples_per_second": 26.044,
134
- "eval_steps_per_second": 3.349,
135
- "eval_wer": 0.20476190476190476,
136
- "step": 40170
137
  }
138
  ],
139
  "max_steps": 40170,
140
  "num_train_epochs": 30,
141
- "total_flos": 3.0777160112253587e+19,
142
  "trial_name": null,
143
  "trial_params": null
144
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.0,
5
+ "global_step": 4017,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 3.0,
12
+ "learning_rate": 9.475394371364185e-05,
13
+ "loss": 6.1685,
14
+ "step": 4017
15
  },
16
  {
17
+ "epoch": 3.0,
18
+ "eval_cer": 0.2329004329004329,
19
+ "eval_loss": 1.0849695205688477,
20
+ "eval_runtime": 7.5095,
21
+ "eval_samples_per_second": 27.965,
22
+ "eval_steps_per_second": 3.595,
23
+ "eval_wer": 0.10952380952380952,
24
+ "step": 4017
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  }
26
  ],
27
  "max_steps": 40170,
28
  "num_train_epochs": 30,
29
+ "total_flos": 3.0684859051639557e+18,
30
  "trial_name": null,
31
  "trial_params": null
32
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ffe3b5a4aad1671b33ccddc25dbba51e25a3b8b55bc57f05d04b95bad2307f39
3
  size 3451
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44a7ed8f97dac3c9e0a2af7de4d043ff4ada25dd33067d84682f5e73789b9937
3
  size 3451
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c29322461c6641c00268ddbc3ec7fbf3eac47dd6a465262f2c85a21f0e923f3
3
  size 377649505
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4971a68c9621393e9b2d50a639c8a82b0a059cb9042cec298ad92dc07e0c545a
3
  size 377649505
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ffe3b5a4aad1671b33ccddc25dbba51e25a3b8b55bc57f05d04b95bad2307f39
3
  size 3451
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44a7ed8f97dac3c9e0a2af7de4d043ff4ada25dd33067d84682f5e73789b9937
3
  size 3451