ccore committed on
Commit
f6cd8b9
·
verified ·
1 Parent(s): e52a701

Training in progress, epoch 12, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:507e45593144bb2cf41c0598515e2ea5832f9e83502a991e35ca1fd8897d4b7b
3
  size 500979600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea7fc909fdc3f1ae4015f0d4750a4a63b89ee5f2effb1be178a4a372ea6822ec
3
  size 500979600
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08bee2e0984bbf63dd98e3afe5ce279648b51a871ad71dbaa9c855446f016deb
3
  size 1002078330
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e57e13a2fd122f2acccb2788d69aba473e357b7997bcdc0b72c1738b5c9421f2
3
  size 1002078330
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2816efc9f4c1de5a16c78e02f2554b79cf809e4fff588f530d63512ba1508099
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee46d463575e74c9a732147771eadee45646a33c68ec6df02d9e322d868ddf4c
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:667845ec98850da2da09c9709aecd8f85bd67e83fe7c6e52d5a2e2d27bb40110
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96a653363dc6a007bb7991143643fc45ea80be1e2dd1763a9221017fc9c83922
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.9924370050430298,
3
- "best_model_checkpoint": "./opt_trained/checkpoint-2211",
4
- "epoch": 11.0,
5
  "eval_steps": 500,
6
- "global_step": 2211,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -123,6 +123,14 @@
123
  "eval_samples_per_second": 36.992,
124
  "eval_steps_per_second": 9.248,
125
  "step": 2211
 
 
 
 
 
 
 
 
126
  }
127
  ],
128
  "logging_steps": 500,
@@ -142,7 +150,7 @@
142
  "attributes": {}
143
  }
144
  },
145
- "total_flos": 7.442986205952e+16,
146
  "train_batch_size": 16,
147
  "trial_name": null,
148
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.9905564785003662,
3
+ "best_model_checkpoint": "./opt_trained/checkpoint-2412",
4
+ "epoch": 12.0,
5
  "eval_steps": 500,
6
+ "global_step": 2412,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
123
  "eval_samples_per_second": 36.992,
124
  "eval_steps_per_second": 9.248,
125
  "step": 2211
126
+ },
127
+ {
128
+ "epoch": 12.0,
129
+ "eval_loss": 0.9905564785003662,
130
+ "eval_runtime": 77.3311,
131
+ "eval_samples_per_second": 36.932,
132
+ "eval_steps_per_second": 9.233,
133
+ "step": 2412
134
  }
135
  ],
136
  "logging_steps": 500,
 
150
  "attributes": {}
151
  }
152
  },
153
+ "total_flos": 8.119621315584e+16,
154
  "train_batch_size": 16,
155
  "trial_name": null,
156
  "trial_params": null