lyhourt commited on
Commit
4082eaa
1 Parent(s): 574b697

Training in progress, step 400, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b835329ef4709c0d0c8d1cc92ce20cf0824c93a00beec28c143cb8b65a626849
3
  size 966995080
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c251d99d91b1688198a576bd284d526bc8c64c668230153c5206921df22e939
3
  size 966995080
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8430cf2cfc85209ec72b14935d060f9be6b5ceeaf9fe7ebb3e07ce441c6e8d05
3
  size 1925064044
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3fccd79082e460b132de5707302dfdc687cf969faa26441cbfc3af3a2f24364
3
  size 1925064044
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00e6e721ef589f426d117d352e598663f682c797ffd64051fbd7dfcfb7bd6fac
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c5b9d591372e5065a8120169931ca394511eeff5b6e9d239a15928090e157ec
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d9bed5473f5660663309a68e94acd97d7760b053fdd2cb87c2ed61460498bb6
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45e12526c8172a948234d8cb869935e517c484d36da5eb6ac9a7382e7d268eff
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 26.55630683142924,
3
- "best_model_checkpoint": "./whisper-small-clean_6-v2/checkpoint-200",
4
- "epoch": 0.5,
5
  "eval_steps": 200,
6
- "global_step": 200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -72,6 +72,71 @@
72
  "eval_steps_per_second": 0.072,
73
  "eval_wer": 26.55630683142924,
74
  "step": 200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
75
  }
76
  ],
77
  "logging_steps": 25,
@@ -86,12 +151,12 @@
86
  "should_evaluate": false,
87
  "should_log": false,
88
  "should_save": true,
89
- "should_training_stop": false
90
  },
91
  "attributes": {}
92
  }
93
  },
94
- "total_flos": 3.693893124096e+18,
95
  "train_batch_size": 64,
96
  "trial_name": null,
97
  "trial_params": null
 
1
  {
2
+ "best_metric": 25.775238983446023,
3
+ "best_model_checkpoint": "./whisper-small-clean_6-v2/checkpoint-400",
4
+ "epoch": 1.0,
5
  "eval_steps": 200,
6
+ "global_step": 400,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
72
  "eval_steps_per_second": 0.072,
73
  "eval_wer": 26.55630683142924,
74
  "step": 200
75
+ },
76
+ {
77
+ "epoch": 0.5625,
78
+ "grad_norm": 3.616425037384033,
79
+ "learning_rate": 5e-06,
80
+ "loss": 0.2072,
81
+ "step": 225
82
+ },
83
+ {
84
+ "epoch": 0.625,
85
+ "grad_norm": 3.8101563453674316,
86
+ "learning_rate": 4.2857142857142855e-06,
87
+ "loss": 0.189,
88
+ "step": 250
89
+ },
90
+ {
91
+ "epoch": 0.6875,
92
+ "grad_norm": 3.7268102169036865,
93
+ "learning_rate": 3.5714285714285718e-06,
94
+ "loss": 0.194,
95
+ "step": 275
96
+ },
97
+ {
98
+ "epoch": 0.75,
99
+ "grad_norm": 3.762694835662842,
100
+ "learning_rate": 2.8571428571428573e-06,
101
+ "loss": 0.1853,
102
+ "step": 300
103
+ },
104
+ {
105
+ "epoch": 0.8125,
106
+ "grad_norm": 4.289006233215332,
107
+ "learning_rate": 2.1428571428571427e-06,
108
+ "loss": 0.1988,
109
+ "step": 325
110
+ },
111
+ {
112
+ "epoch": 0.875,
113
+ "grad_norm": 3.323763132095337,
114
+ "learning_rate": 1.4285714285714286e-06,
115
+ "loss": 0.1948,
116
+ "step": 350
117
+ },
118
+ {
119
+ "epoch": 0.9375,
120
+ "grad_norm": 4.1935200691223145,
121
+ "learning_rate": 7.142857142857143e-07,
122
+ "loss": 0.2095,
123
+ "step": 375
124
+ },
125
+ {
126
+ "epoch": 1.0,
127
+ "grad_norm": 3.7287049293518066,
128
+ "learning_rate": 0.0,
129
+ "loss": 0.1923,
130
+ "step": 400
131
+ },
132
+ {
133
+ "epoch": 1.0,
134
+ "eval_loss": 0.29943087697029114,
135
+ "eval_runtime": 656.7909,
136
+ "eval_samples_per_second": 2.322,
137
+ "eval_steps_per_second": 0.073,
138
+ "eval_wer": 25.775238983446023,
139
+ "step": 400
140
  }
141
  ],
142
  "logging_steps": 25,
 
151
  "should_evaluate": false,
152
  "should_log": false,
153
  "should_save": true,
154
+ "should_training_stop": true
155
  },
156
  "attributes": {}
157
  }
158
  },
159
+ "total_flos": 7.387786248192e+18,
160
  "train_batch_size": 64,
161
  "trial_name": null,
162
  "trial_params": null