k4black committed on
Commit
0187e01
1 Parent(s): 2e00ae9

Training in progress, step 14000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:64170c1ef9674624e302ab8f03fd25a12b89b33fbe057d4bf3fb5447f9aa9930
3
  size 484059375
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:291536c29816f728e3cba77f0913d3caa0ba585f8235f5550bc21065fbddbdd9
3
  size 484059375
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18579680032becc23d37db038694d8397ca17699b4a25ed0a513417866b3f604
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e22cc89eb2136ee82b4e796b0e29d69936f909e099bf0c4884ac8fd18e562f2c
3
  size 242019067
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0494d47a6723ec6fe3e9b22849735e2c1e99577b6fdde5984b8746167b06721c
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7759f0c472ca45389e4eae17ffad344d36d27699315b967c42957fe462ab223a
3
  size 14503
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8bd6d67b339a73b53d65263734baa465f18221257501d7c96218a456d5e52593
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0dbca853644b15a29af08332b55f3984d623fef9adee1ac942c6a31df8bd1a1
3
  size 559
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6763c28702ee464b28b3066b1b607afdc83789f4713e9068815f524e6b83d56e
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f7768db5638271ec21fc5793894a62875a3d6eda3c151f5b4e3e7da2c7e03c3
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.759707510471344,
3
  "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-selected/checkpoint-12000",
4
- "epoch": 3.84,
5
- "global_step": 12000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -120,11 +120,30 @@
120
  "eval_samples_per_second": 8.065,
121
  "eval_steps_per_second": 0.254,
122
  "step": 12000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
123
  }
124
  ],
125
  "max_steps": 62500,
126
  "num_train_epochs": 20,
127
- "total_flos": 4.334845641621504e+16,
128
  "trial_name": null,
129
  "trial_params": null
130
  }
 
1
  {
2
  "best_metric": 0.759707510471344,
3
  "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-selected/checkpoint-12000",
4
+ "epoch": 4.48,
5
+ "global_step": 14000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
120
  "eval_samples_per_second": 8.065,
121
  "eval_steps_per_second": 0.254,
122
  "step": 12000
123
+ },
124
+ {
125
+ "epoch": 4.48,
126
+ "learning_rate": 8.169431578947368e-05,
127
+ "loss": 0.4575,
128
+ "step": 14000
129
+ },
130
+ {
131
+ "epoch": 4.48,
132
+ "eval_bleu": 0.3082674516281405,
133
+ "eval_exact_match": 0.181,
134
+ "eval_loss": 0.7730007171630859,
135
+ "eval_rouge1": 0.59579739088828,
136
+ "eval_rouge2": 0.4140226910138735,
137
+ "eval_rougeL": 0.5699065207669394,
138
+ "eval_runtime": 246.1487,
139
+ "eval_samples_per_second": 8.125,
140
+ "eval_steps_per_second": 0.256,
141
+ "step": 14000
142
  }
143
  ],
144
  "max_steps": 62500,
145
  "num_train_epochs": 20,
146
+ "total_flos": 5.055885856053658e+16,
147
  "trial_name": null,
148
  "trial_params": null
149
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18579680032becc23d37db038694d8397ca17699b4a25ed0a513417866b3f604
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e22cc89eb2136ee82b4e796b0e29d69936f909e099bf0c4884ac8fd18e562f2c
3
  size 242019067