k4black commited on
Commit
650d0fc
1 Parent(s): 992edb1

Training in progress, step 6000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ab00c9ddd34f1cf2964b1096db77b9d715fbc02bdd5c7d43b00066b8085e40d
3
  size 997351173
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8228de27106e44527ce87d66105e3205dc6540a551e7cca8525ac6fda3a5396f
3
  size 997351173
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d45968dc773842b4524edf097410728d62c61752f13cc8b835d523befb79b605
3
  size 498665141
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2668a06099ffd93fb8a66976b2bedf58dc654e44d146913529cbbe24d18cf2f0
3
  size 498665141
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed4ae02de340745a578ad716a6dcb1ee42a03a56073f856062cfc5a83e2e3b94
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6d8e09ceae8c97b30c879d0a88b02e5d6f9d2c8f95483bbc40029b8fbdfe781
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:02d5d506efbd8a343664b3029e84353da8bd575421aff1c64d55aebab3313dcd
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21d2ce5a39857d286d2308d95541d019234b54f63ac7ba9f37f9448c047c7cc8
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.9870629938253499,
3
  "best_model_checkpoint": "/home3/s5431786/nlp-final-project/results/roberta-base-e-snli-classification-nli_explanation-base/checkpoint-4800",
4
- "epoch": 0.5591798695246971,
5
- "global_step": 4800,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -198,11 +198,59 @@
198
  "eval_samples_per_second": 2223.361,
199
  "eval_steps_per_second": 34.789,
200
  "step": 4800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
201
  }
202
  ],
203
  "max_steps": 25752,
204
  "num_train_epochs": 3,
205
- "total_flos": 1.2774452433289344e+16,
206
  "trial_name": null,
207
  "trial_params": null
208
  }
 
1
  {
2
  "best_metric": 0.9870629938253499,
3
  "best_model_checkpoint": "/home3/s5431786/nlp-final-project/results/roberta-base-e-snli-classification-nli_explanation-base/checkpoint-4800",
4
+ "epoch": 0.6989748369058714,
5
+ "global_step": 6000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
198
  "eval_samples_per_second": 2223.361,
199
  "eval_steps_per_second": 34.789,
200
  "step": 4800
201
+ },
202
+ {
203
+ "epoch": 0.61,
204
+ "learning_rate": 8.40091563113146e-06,
205
+ "loss": 0.071,
206
+ "step": 5200
207
+ },
208
+ {
209
+ "epoch": 0.61,
210
+ "eval_accuracy": 0.985876854297907,
211
+ "eval_f1": 0.9858488466773426,
212
+ "eval_loss": 0.0532599538564682,
213
+ "eval_runtime": 4.3538,
214
+ "eval_samples_per_second": 2260.534,
215
+ "eval_steps_per_second": 35.371,
216
+ "step": 5200
217
+ },
218
+ {
219
+ "epoch": 0.65,
220
+ "learning_rate": 8.237410071942446e-06,
221
+ "loss": 0.0723,
222
+ "step": 5600
223
+ },
224
+ {
225
+ "epoch": 0.65,
226
+ "eval_accuracy": 0.9860800650274334,
227
+ "eval_f1": 0.9860406491659012,
228
+ "eval_loss": 0.04955599084496498,
229
+ "eval_runtime": 4.2895,
230
+ "eval_samples_per_second": 2294.439,
231
+ "eval_steps_per_second": 35.902,
232
+ "step": 5600
233
+ },
234
+ {
235
+ "epoch": 0.7,
236
+ "learning_rate": 8.073904512753434e-06,
237
+ "loss": 0.0713,
238
+ "step": 6000
239
+ },
240
+ {
241
+ "epoch": 0.7,
242
+ "eval_accuracy": 0.9860800650274334,
243
+ "eval_f1": 0.9860488223249062,
244
+ "eval_loss": 0.051210932433605194,
245
+ "eval_runtime": 4.2586,
246
+ "eval_samples_per_second": 2311.113,
247
+ "eval_steps_per_second": 36.163,
248
+ "step": 6000
249
  }
250
  ],
251
  "max_steps": 25752,
252
  "num_train_epochs": 3,
253
+ "total_flos": 1.597164223963392e+16,
254
  "trial_name": null,
255
  "trial_params": null
256
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d45968dc773842b4524edf097410728d62c61752f13cc8b835d523befb79b605
3
  size 498665141
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2668a06099ffd93fb8a66976b2bedf58dc654e44d146913529cbbe24d18cf2f0
3
  size 498665141