Training in progress, step 24500
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scaler.pt +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +24 -5
- pytorch_model.bin +1 -1
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 484085807
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b0071a9336a7161eb4875d8085f042f9ee20ec41a2c3ffe1b8c736abcaafba9
|
3 |
size 484085807
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 242031355
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44f8c7a70c3d2a9d75b2aa00f032c4eb62bbf677cf661d8ea540421cf0e8ec46
|
3 |
size 242031355
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:527eae81bee180cf37314d77cf9bfe68e0dadd0ae429f24dae2354b5ae26973a
|
3 |
size 14503
|
last-checkpoint/scaler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 559
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fccda41cf05d0c2582a5ae864ddced240b945973cac170056ad38621f56c053
|
3 |
size 559
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 623
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14a47b82e1c0e1303cf3ea519a24a915a49a6100912f6b988940a6848bca4178
|
3 |
size 623
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "/home2/s5431786/jb-internship/results/t5-small-CodeXGLUE-CONCODE-faster/checkpoint-
|
4 |
-
"epoch": 7.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -918,11 +918,30 @@
|
|
918 |
"eval_samples_per_second": 76.252,
|
919 |
"eval_steps_per_second": 2.402,
|
920 |
"step": 24000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
921 |
}
|
922 |
],
|
923 |
"max_steps": 62500,
|
924 |
"num_train_epochs": 20,
|
925 |
-
"total_flos": 1.
|
926 |
"trial_name": null,
|
927 |
"trial_params": null
|
928 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.656362771987915,
|
3 |
+
"best_model_checkpoint": "/home2/s5431786/jb-internship/results/t5-small-CodeXGLUE-CONCODE-faster/checkpoint-24500",
|
4 |
+
"epoch": 7.84,
|
5 |
+
"global_step": 24500,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
918 |
"eval_samples_per_second": 76.252,
|
919 |
"eval_steps_per_second": 2.402,
|
920 |
"step": 24000
|
921 |
+
},
|
922 |
+
{
|
923 |
+
"epoch": 7.84,
|
924 |
+
"learning_rate": 0.0003200757894736842,
|
925 |
+
"loss": 0.4345,
|
926 |
+
"step": 24500
|
927 |
+
},
|
928 |
+
{
|
929 |
+
"epoch": 7.84,
|
930 |
+
"eval_bleu": 0.06814284730693101,
|
931 |
+
"eval_exact_match": 0.1025,
|
932 |
+
"eval_loss": 0.656362771987915,
|
933 |
+
"eval_rouge1": 0.5143728841578871,
|
934 |
+
"eval_rouge2": 0.35808146099426286,
|
935 |
+
"eval_rougeL": 0.5020021673160826,
|
936 |
+
"eval_runtime": 26.1074,
|
937 |
+
"eval_samples_per_second": 76.607,
|
938 |
+
"eval_steps_per_second": 2.413,
|
939 |
+
"step": 24500
|
940 |
}
|
941 |
],
|
942 |
"max_steps": 62500,
|
943 |
"num_train_epochs": 20,
|
944 |
+
"total_flos": 1.0242320722034688e+17,
|
945 |
"trial_name": null,
|
946 |
"trial_params": null
|
947 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 242031355
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44f8c7a70c3d2a9d75b2aa00f032c4eb62bbf677cf661d8ea540421cf0e8ec46
|
3 |
size 242031355
|