k4black committed on
Commit
7293f48
1 Parent(s): 4d4b7bb

Training in progress, step 18000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b724b506c07e2492f9981025b58ec651d4d50231e4dea69d9b563b9d1f865d13
3
  size 484059375
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f5a3994bec819710a835f80f8aa82d0105e0883cf8d0e3c5927322ba2bdcb50
3
  size 484059375
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54ca33f03949fc3cfbc2ebf9e438ce78fb36aa81dcfa2d97902322474874c171
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7117ba2d09b846f698338bed502fc59349bdb397b74b570b5a47983194b363fb
3
  size 242019067
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aa7c39bfc9247300062036d6b5dfb74d83183f6a98a8d7dfb5cd875d041bc74a
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25e78732c3b6c033fc1d91347e2ee95775aa5739cc10516823b35ad26afb8ffe
3
  size 14503
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c919c7365197a2b62a00c59cbb4a32fc90c08ff7bb57ea0becaf024774a80779
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39b187cde9afaec36bc905c24419c4f9acf8e94221bbda69a9e5ba0e46c99916
3
  size 559
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b505a859840f27c0c9e0931069f4e7c8f87bdd0a0944c961e0940131a2223fb6
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41b5ac1d15acc878a836769b8a70fba55d184b57275a4a7a111b126b94c0c60f
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.759707510471344,
3
  "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-selected/checkpoint-12000",
4
- "epoch": 5.12,
5
- "global_step": 16000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -158,11 +158,30 @@
158
  "eval_samples_per_second": 9.705,
159
  "eval_steps_per_second": 0.306,
160
  "step": 16000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
161
  }
162
  ],
163
  "max_steps": 62500,
164
  "num_train_epochs": 20,
165
- "total_flos": 5.777129929074278e+16,
166
  "trial_name": null,
167
  "trial_params": null
168
  }
 
1
  {
2
  "best_metric": 0.759707510471344,
3
  "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-selected/checkpoint-12000",
4
+ "epoch": 5.76,
5
+ "global_step": 18000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
158
  "eval_samples_per_second": 9.705,
159
  "eval_steps_per_second": 0.306,
160
  "step": 16000
161
+ },
162
+ {
163
+ "epoch": 5.76,
164
+ "learning_rate": 7.496084210526317e-05,
165
+ "loss": 0.4123,
166
+ "step": 18000
167
+ },
168
+ {
169
+ "epoch": 5.76,
170
+ "eval_bleu": 0.3161064543245236,
171
+ "eval_exact_match": 0.185,
172
+ "eval_loss": 0.7642457485198975,
173
+ "eval_rouge1": 0.6004680977665069,
174
+ "eval_rouge2": 0.4177038650507878,
175
+ "eval_rougeL": 0.5740117301579993,
176
+ "eval_runtime": 216.7206,
177
+ "eval_samples_per_second": 9.228,
178
+ "eval_steps_per_second": 0.291,
179
+ "step": 18000
180
  }
181
  ],
182
  "max_steps": 62500,
183
  "num_train_epochs": 20,
184
+ "total_flos": 6.49345601938391e+16,
185
  "trial_name": null,
186
  "trial_params": null
187
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54ca33f03949fc3cfbc2ebf9e438ce78fb36aa81dcfa2d97902322474874c171
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7117ba2d09b846f698338bed502fc59349bdb397b74b570b5a47983194b363fb
3
  size 242019067