k4black commited on
Commit
f4bf108
1 Parent(s): 8f72d1c

Training in progress, step 13000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e65cf37678993fe3f18088679da537fa01d85da9d152deaa0f44810aeb323ce0
3
  size 484059375
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bda6d8b01959de39ba727cf65ebf1679bca33d79e28f75e3c9a93b97bde2d98
3
  size 484059375
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:48589b74cc0dd9aca7fabf6af7fbebeded924f02e75c01d4b186662817a3fc93
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35737dd63de8dd15a434463f352af1ca13361ec6ad940d8d6d57c02ca720a0c5
3
  size 242019067
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f177c85bdffc6c35bccc14f5fae42f9fa475b3565690a355cfcb00cbcbaca2b
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec1d572066a975cce68a6728c4924f1ce1aa043904ec8fb9bf914cc37f8ce9ef
3
  size 14503
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e0411b19d02a684abea10135971df618e10478843b4b273e508440d8c839ca4
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f897fc5ea9ff3f8b4c69087123f7b049e20d61b25538299e1d2d1327ed7be47
3
  size 559
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:772a71df90a23cf1d15b47f710ae6706f64dace0a85b2ffc76c96757f3ee319e
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:752a70445102b249f7f99549c9b0595ef63200e880c377bf3d80c443b9f54831
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.7575966715812683,
3
  "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-w_special_tokens/checkpoint-12000",
4
- "epoch": 4.0,
5
- "global_step": 12500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -481,11 +481,30 @@
481
  "eval_samples_per_second": 86.596,
482
  "eval_steps_per_second": 2.728,
483
  "step": 12500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
484
  }
485
  ],
486
  "max_steps": 31250,
487
  "num_train_epochs": 10,
488
- "total_flos": 4.515048174963917e+16,
489
  "trial_name": null,
490
  "trial_params": null
491
  }
 
1
  {
2
  "best_metric": 0.7575966715812683,
3
  "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-w_special_tokens/checkpoint-12000",
4
+ "epoch": 4.16,
5
+ "global_step": 13000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
481
  "eval_samples_per_second": 86.596,
482
  "eval_steps_per_second": 2.728,
483
  "step": 12500
484
+ },
485
+ {
486
+ "epoch": 4.16,
487
+ "learning_rate": 6.149493044093374e-05,
488
+ "loss": 0.4422,
489
+ "step": 13000
490
+ },
491
+ {
492
+ "epoch": 4.16,
493
+ "eval_bleu": 0.13537517858880133,
494
+ "eval_exact_match": 0.163,
495
+ "eval_loss": 0.7656739354133606,
496
+ "eval_rouge1": 0.5705462095820004,
497
+ "eval_rouge2": 0.40541664718394044,
498
+ "eval_rougeL": 0.5548493921872111,
499
+ "eval_runtime": 24.1852,
500
+ "eval_samples_per_second": 82.695,
501
+ "eval_steps_per_second": 2.605,
502
+ "step": 13000
503
  }
504
  ],
505
  "max_steps": 31250,
506
  "num_train_epochs": 10,
507
+ "total_flos": 4.693192667037696e+16,
508
  "trial_name": null,
509
  "trial_params": null
510
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:48589b74cc0dd9aca7fabf6af7fbebeded924f02e75c01d4b186662817a3fc93
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35737dd63de8dd15a434463f352af1ca13361ec6ad940d8d6d57c02ca720a0c5
3
  size 242019067