daydrill committed on
Commit
5d19dce
1 Parent(s): 515f655

Training in progress, step 3500

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:800ce167b888c1555ce149731d7bc2c753c37b67d31170fb09caffc5792b1e4e
3
  size 880446181
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:633117411df249b67810ce444bf3fb43946a8cd66899354347e95f320178ff8d
3
  size 880446181
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc8e99aaece0e5506cc318f72aba485312ecdd92d231f7a6abf4c66a19db2012
3
  size 440235825
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89123e2ca1e8f73e8549d0b72898b6506a9d8cab0ca3f0ddf2851992906d3212
3
  size 440235825
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cfa290a26b1da9a46696e39d6f59c27396a70c365e5a24ca8436eb906badd239
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8af43f49c567fc21216a636a0b928ad3f2b478713872cde9fab7fd2e5b3bd94
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98dfa5e5e97bb43603b1e5dcc06c796459aa988da669f9bb10ae35ce686b5186
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52671e748af9f02c099fe74fa17abb19dd5557da6aa5f91f903c19df101db345
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.3124349093938763,
5
- "global_step": 3000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -102,11 +102,27 @@
102
  "eval_samples_per_second": 92.093,
103
  "eval_steps_per_second": 11.514,
104
  "step": 3000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
105
  }
106
  ],
107
  "max_steps": 28806,
108
  "num_train_epochs": 3,
109
- "total_flos": 6271122161664000.0,
110
  "trial_name": null,
111
  "trial_params": null
112
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.36450739429285567,
5
+ "global_step": 3500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
102
  "eval_samples_per_second": 92.093,
103
  "eval_steps_per_second": 11.514,
104
  "step": 3000
105
+ },
106
+ {
107
+ "epoch": 0.36,
108
+ "learning_rate": 2.6354926057071445e-05,
109
+ "loss": 0.8375,
110
+ "step": 3500
111
+ },
112
+ {
113
+ "epoch": 0.36,
114
+ "eval_exact_match": 63.82368283776734,
115
+ "eval_f1": 68.19581427410363,
116
+ "eval_loss": 0.7115561366081238,
117
+ "eval_runtime": 154.7006,
118
+ "eval_samples_per_second": 91.822,
119
+ "eval_steps_per_second": 11.48,
120
+ "step": 3500
121
  }
122
  ],
123
  "max_steps": 28806,
124
  "num_train_epochs": 3,
125
+ "total_flos": 7316309188608000.0,
126
  "trial_name": null,
127
  "trial_params": null
128
  }
nbest_predictions.json CHANGED
The diff for this file is too large to render. See raw diff
 
predictions.json CHANGED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc8e99aaece0e5506cc318f72aba485312ecdd92d231f7a6abf4c66a19db2012
3
  size 440235825
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89123e2ca1e8f73e8549d0b72898b6506a9d8cab0ca3f0ddf2851992906d3212
3
  size 440235825