k4black committed on
Commit
1f83525
1 Parent(s): 06d1b6c

Training in progress, step 8000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24bbbd009d6b03b2d3187e21796a48f493cc30cbafb35880f422a1bef28e2f00
3
  size 837935
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cce9b37f48e8675d69401a4b6b60995179e62a8ffbc1f88a02a7bbea5bba909
3
  size 837935
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:47d3e0fa1b84d8087eb55cade7f014c4a642412b6534b2f635b32a5709409a01
3
  size 242012923
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19af74a938a7be689d9873da872da964364ba343bd2170276819b7a95570306c
3
  size 242012923
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c087da379d8a74162facf8df088ad54ad5a18830758e9baf4ff0c963c84f233
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f9038bd13cee7be809b870072293469c3cd227459e6b82a61f4cf6abfd04c52
3
  size 14503
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9becabe7dff860235908f1a60152bb8988922b004db913d8677aebddf68e6173
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3550fcb9eeeaf0d0c5e60b4fa40bb13ef4e2248224487e336467d1aedec98b8e
3
  size 559
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b9728bac511908fc806f53eace77527053eb9775969027422077b4bf29bd2a2e
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5d5ab462f8cc6dcbba2126c3954800aa77845e46f59352aa2ec60dd3148cb35
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.1625,
3
  "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-adafactor/checkpoint-5500",
4
- "epoch": 2.4,
5
- "global_step": 7500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -306,11 +306,31 @@
306
  "eval_samples_per_second": 69.751,
307
  "eval_steps_per_second": 2.197,
308
  "step": 7500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
309
  }
310
  ],
311
  "max_steps": 31250,
312
  "num_train_epochs": 10,
313
- "total_flos": 3.189355774161715e+16,
314
  "trial_name": null,
315
  "trial_params": null
316
  }
 
1
  {
2
  "best_metric": 0.1625,
3
  "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-adafactor/checkpoint-5500",
4
+ "epoch": 2.56,
5
+ "global_step": 8000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
306
  "eval_samples_per_second": 69.751,
307
  "eval_steps_per_second": 2.197,
308
  "step": 7500
309
+ },
310
+ {
311
+ "epoch": 2.56,
312
+ "learning_rate": 0.00023499174722942698,
313
+ "loss": 0.5172,
314
+ "step": 8000
315
+ },
316
+ {
317
+ "epoch": 2.56,
318
+ "eval_bleu": 0.12967243587670185,
319
+ "eval_exact_match": 0.1555,
320
+ "eval_loss": 0.8118115663528442,
321
+ "eval_rouge1": 0.5579744246548106,
322
+ "eval_rouge2": 0.3885609120793808,
323
+ "eval_rougeL": 0.5406865803442568,
324
+ "eval_rougeLsum": 0.5482646526079711,
325
+ "eval_runtime": 27.397,
326
+ "eval_samples_per_second": 73.001,
327
+ "eval_steps_per_second": 2.3,
328
+ "step": 8000
329
  }
330
  ],
331
  "max_steps": 31250,
332
  "num_train_epochs": 10,
333
+ "total_flos": 3.4018432483590144e+16,
334
  "trial_name": null,
335
  "trial_params": null
336
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:47d3e0fa1b84d8087eb55cade7f014c4a642412b6534b2f635b32a5709409a01
3
  size 242012923
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19af74a938a7be689d9873da872da964364ba343bd2170276819b7a95570306c
3
  size 242012923