Xmm committed on
Commit
92b66c5
1 Parent(s): 2151609

Upload 8 files

Browse files

Finetuned on entities

optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78f128e341188b9eacd001a6e7fc9031eda23366662ad095781567489c262699
3
  size 4921022932
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a85e06e7c385cca92f4a8f54b47798afabd1695c9355dcce12069def7eec593
3
  size 4921022932
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5db582a24c8f3cb13bacddf4482af3b34d4db048210f388d45381562bb066929
3
  size 2460468737
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8cc71cd9ef90537c1cbf650dbdb17b128ca8378784b87ba9a7ed30067db3471
3
  size 2460468737
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20721249d9b8d8bc576b72185919e68c93dae68b49c2363c0236e1172512edff
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5370b871c1a234b36198f0c8eae1923196c8067fcf05542ebf23b694806d4378
3
  size 14575
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd539ae79de480492c3270d14ced42f10b1174f0cad170e082f8fbf6aa55b60c
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a49346f519a1a9f14fcadd47fb8b2a3d1bafcf68ea79e99ae6a44a8272fb4777
3
  size 627
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.34489724040031433,
3
  "best_model_checkpoint": "./checkpoint-my/checkpoint-1500",
4
- "epoch": 5.127337945170382,
5
  "eval_steps": 500,
6
- "global_step": 5000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -167,13 +167,93 @@
167
  "eval_samples_per_second": 5.218,
168
  "eval_steps_per_second": 1.305,
169
  "step": 5000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
170
  }
171
  ],
172
  "logging_steps": 500,
173
- "max_steps": 14625,
174
  "num_train_epochs": 15,
175
  "save_steps": 500,
176
- "total_flos": 3.467034171046625e+17,
177
  "trial_name": null,
178
  "trial_params": null
179
  }
 
1
  {
2
  "best_metric": 0.34489724040031433,
3
  "best_model_checkpoint": "./checkpoint-my/checkpoint-1500",
4
+ "epoch": 7.56789812129618,
5
  "eval_steps": 500,
6
+ "global_step": 7500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
167
  "eval_samples_per_second": 5.218,
168
  "eval_steps_per_second": 1.305,
169
  "step": 5000
170
+ },
171
+ {
172
+ "epoch": 5.64,
173
+ "learning_rate": 1.247863247863248e-05,
174
+ "loss": 0.1189,
175
+ "step": 5500
176
+ },
177
+ {
178
+ "epoch": 5.64,
179
+ "eval_bleu": 27.4615,
180
+ "eval_gen_len": 32.2204,
181
+ "eval_loss": 0.34533679485321045,
182
+ "eval_runtime": 186.2569,
183
+ "eval_samples_per_second": 5.433,
184
+ "eval_steps_per_second": 1.358,
185
+ "step": 5500
186
+ },
187
+ {
188
+ "epoch": 6.15,
189
+ "learning_rate": 1.1794871794871796e-05,
190
+ "loss": 0.1166,
191
+ "step": 6000
192
+ },
193
+ {
194
+ "epoch": 6.15,
195
+ "eval_bleu": 27.6321,
196
+ "eval_gen_len": 32.2816,
197
+ "eval_loss": 0.34552034735679626,
198
+ "eval_runtime": 185.1476,
199
+ "eval_samples_per_second": 5.466,
200
+ "eval_steps_per_second": 1.366,
201
+ "step": 6000
202
+ },
203
+ {
204
+ "epoch": 6.56,
205
+ "learning_rate": 1.125462495795493e-05,
206
+ "loss": 0.1171,
207
+ "step": 6500
208
+ },
209
+ {
210
+ "epoch": 6.56,
211
+ "eval_bleu": 27.3986,
212
+ "eval_gen_len": 32.4397,
213
+ "eval_loss": 0.34709280729293823,
214
+ "eval_runtime": 204.1804,
215
+ "eval_samples_per_second": 4.956,
216
+ "eval_steps_per_second": 1.239,
217
+ "step": 6500
218
+ },
219
+ {
220
+ "epoch": 7.06,
221
+ "learning_rate": 1.0581903800874538e-05,
222
+ "loss": 0.1157,
223
+ "step": 7000
224
+ },
225
+ {
226
+ "epoch": 7.06,
227
+ "eval_bleu": 27.5083,
228
+ "eval_gen_len": 32.2816,
229
+ "eval_loss": 0.34769660234451294,
230
+ "eval_runtime": 209.4596,
231
+ "eval_samples_per_second": 4.831,
232
+ "eval_steps_per_second": 1.208,
233
+ "step": 7000
234
+ },
235
+ {
236
+ "epoch": 7.57,
237
+ "learning_rate": 9.909182643794148e-06,
238
+ "loss": 0.1121,
239
+ "step": 7500
240
+ },
241
+ {
242
+ "epoch": 7.57,
243
+ "eval_bleu": 27.4437,
244
+ "eval_gen_len": 32.2194,
245
+ "eval_loss": 0.34789395332336426,
246
+ "eval_runtime": 209.9641,
247
+ "eval_samples_per_second": 4.82,
248
+ "eval_steps_per_second": 1.205,
249
+ "step": 7500
250
  }
251
  ],
252
  "logging_steps": 500,
253
+ "max_steps": 14865,
254
  "num_train_epochs": 15,
255
  "save_steps": 500,
256
+ "total_flos": 5.2005742820563354e+17,
257
  "trial_name": null,
258
  "trial_params": null
259
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aa984e3cea098421ca0a4e48e9cd6b184a4ab34fc980cad163565e996bb9d67a
3
  size 4155
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:644b2690039d83439e28a3112267a0e4adac0af05d4ef5abe06d9d8bbb23d339
3
  size 4155