k4black commited on
Commit
fad991b
1 Parent(s): 59d61fd

Training in progress, step 12000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a8fd14875f383b9bb0d8593b684d62436d3668082932d0a7478a733a16998ec
3
  size 484059375
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc1f7c55c8f8c0d40f4dd00c60e2187aa0a8aa139514c1b33817125b3fbdcc6f
3
  size 484059375
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:714d445e6b5862d1f88ae613af90d4976e1296d0cc0aafcdd6d58bd826a8cc9a
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01450b005a0c07927774367baf2df85370addf1ae358bb986bedd6b750669cba
3
  size 242019067
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ce949685be6274a05b6e7c619789b125fa9355ec848e49da30bf08f8f0728b60
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67e94701ea26738e0c3e8924fcfb0f3afba7ae6c7118b9610924cd0ffeaf567c
3
  size 14503
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4122a09dd635d78f97acc1da1c19d9cae63312b7d149d206a02a14b3e9635d97
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3947d449c9f4d1e0c9eb97a6f1405b24f0cb52a87ee412118f0b3e92dad7ac68
3
  size 559
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:afbfb3c8724d5e4a4b2ab6b752657e8afd02c3798521639b7d388dc2e14a79ae
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c17de809b895c3bd271032fe901af5531aab205f74c2d6adac3868824296045a
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.7635162472724915,
3
- "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-w_special_tokens/checkpoint-11500",
4
- "epoch": 3.68,
5
- "global_step": 11500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -443,11 +443,30 @@
443
  "eval_samples_per_second": 89.472,
444
  "eval_steps_per_second": 2.818,
445
  "step": 11500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
446
  }
447
  ],
448
  "max_steps": 31250,
449
  "num_train_epochs": 10,
450
- "total_flos": 4.155506758149734e+16,
451
  "trial_name": null,
452
  "trial_params": null
453
  }
 
1
  {
2
+ "best_metric": 0.7575966715812683,
3
+ "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-w_special_tokens/checkpoint-12000",
4
+ "epoch": 3.84,
5
+ "global_step": 12000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
443
  "eval_samples_per_second": 89.472,
444
  "eval_steps_per_second": 2.818,
445
  "step": 11500
446
+ },
447
+ {
448
+ "epoch": 3.84,
449
+ "learning_rate": 6.486340822582275e-05,
450
+ "loss": 0.4779,
451
+ "step": 12000
452
+ },
453
+ {
454
+ "epoch": 3.84,
455
+ "eval_bleu": 0.1349476481247351,
456
+ "eval_exact_match": 0.163,
457
+ "eval_loss": 0.7575966715812683,
458
+ "eval_rouge1": 0.5806974627802324,
459
+ "eval_rouge2": 0.4141474945527226,
460
+ "eval_rougeL": 0.5638708523820954,
461
+ "eval_runtime": 24.2543,
462
+ "eval_samples_per_second": 82.46,
463
+ "eval_steps_per_second": 2.597,
464
+ "step": 12000
465
  }
466
  ],
467
  "max_steps": 31250,
468
  "num_train_epochs": 10,
469
+ "total_flos": 4.334845641621504e+16,
470
  "trial_name": null,
471
  "trial_params": null
472
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:714d445e6b5862d1f88ae613af90d4976e1296d0cc0aafcdd6d58bd826a8cc9a
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01450b005a0c07927774367baf2df85370addf1ae358bb986bedd6b750669cba
3
  size 242019067