Training in progress, step 8000

Files changed (7) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9ce1b29e43611a1791a5461a257ae383816002d0a17a03dc277e8a719735bef5
 size 484059375

 version https://git-lfs.github.com/spec/v1
+oid sha256:9ecd2121c62b78fefadaeabf329af30965c1d5254ad8a247a2f5e1c089314099
 size 484059375

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8f43c6d7aa824d347316c8c0065dcbfdd2a290765d5457b73391e794d7a75d1e
 size 242019067

 version https://git-lfs.github.com/spec/v1
+oid sha256:f011fe99c630646ec9bff8b3f6cd382f67008dc8ff7658561572678aac30eb7e
 size 242019067

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a9a7efe2714d00ec72b63687f06a0075c6eedcfd7e2d84f5c227fd959380e312
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:f2142769294a8c158a319ee7619050123d4d200b9168f6287bd440d1df8e4983
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9a3ced63d9f6d0d2ae1b52e48fd68ad1de2d74e64a729a2f4ee7983c78f4bea5
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:3782c5183f4b3926da31cb7a03a04d622797e9ed4a0007066495827d4864b745
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ec818c000d4a367b84a97bcfa490a6705f13db5f22600d87b9b934241ca852d0
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:789abdc0646d0e04a81d17afdf777ec7127cfb77488d5350e897ba1735bdfab3
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
-  "best_metric": 0.7783799767494202,
-  "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-selected/checkpoint-6000",
-  "epoch": 1.92,
-  "global_step": 6000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -63,11 +63,30 @@
       "eval_samples_per_second": 7.699,
       "eval_steps_per_second": 0.243,
       "step": 6000
     }
   ],
   "max_steps": 62500,
   "num_train_epochs": 20,
-  "total_flos": 2.171393410911437e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
+  "best_metric": 0.7699160575866699,
+  "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-selected/checkpoint-8000",
+  "epoch": 2.56,
+  "global_step": 8000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 7.699,
       "eval_steps_per_second": 0.243,
       "step": 6000
+    },
+    {
+      "epoch": 2.56,
+      "learning_rate": 9.179957894736842e-05,
+      "loss": 0.562,
+      "step": 8000
+    },
+    {
+      "epoch": 2.56,
+      "eval_bleu": 0.2967822969771582,
+      "eval_exact_match": 0.179,
+      "eval_loss": 0.7699160575866699,
+      "eval_rouge1": 0.5769004117490721,
+      "eval_rouge2": 0.400017695314681,
+      "eval_rougeL": 0.5526377939756941,
+      "eval_runtime": 274.6962,
+      "eval_samples_per_second": 7.281,
+      "eval_steps_per_second": 0.229,
+      "step": 8000
     }
   ],
   "max_steps": 62500,
   "num_train_epochs": 20,
+  "total_flos": 2.891269685850931e+16,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8f43c6d7aa824d347316c8c0065dcbfdd2a290765d5457b73391e794d7a75d1e
 size 242019067

 version https://git-lfs.github.com/spec/v1
+oid sha256:f011fe99c630646ec9bff8b3f6cd382f67008dc8ff7658561572678aac30eb7e
 size 242019067