huranokuma
committed on
Commit
•
d5e6d7b
1
Parent(s):
177df34
End of training
Browse files
- all_results.json +11 -11
- eval_results.json +7 -7
- runs/Aug15_10-57-40_09d4b99a5f37/events.out.tfevents.1660567231.09d4b99a5f37.2797.2 +3 -0
- train_results.json +5 -5
- trainer_state.json +12 -18
all_results.json
CHANGED
@@ -1,15 +1,15 @@
|
|
1 |
{
|
2 |
-
"epoch":
|
3 |
-
"eval_accuracy": 0.
|
4 |
-
"eval_loss": 1.
|
5 |
-
"eval_runtime":
|
6 |
"eval_samples": 134942,
|
7 |
-
"eval_samples_per_second": 30.
|
8 |
-
"eval_steps_per_second": 7.
|
9 |
-
"perplexity": 3.
|
10 |
-
"train_loss":
|
11 |
-
"train_runtime":
|
12 |
"train_samples": 134942,
|
13 |
-
"train_samples_per_second":
|
14 |
-
"train_steps_per_second":
|
15 |
}
|
|
|
1 |
{
|
2 |
+
"epoch": 4.98,
|
3 |
+
"eval_accuracy": 0.6914040854429856,
|
4 |
+
"eval_loss": 1.3205146789550781,
|
5 |
+
"eval_runtime": 4403.2676,
|
6 |
"eval_samples": 134942,
|
7 |
+
"eval_samples_per_second": 30.646,
|
8 |
+
"eval_steps_per_second": 7.662,
|
9 |
+
"perplexity": 3.7453485333545293,
|
10 |
+
"train_loss": 0.0,
|
11 |
+
"train_runtime": 0.0953,
|
12 |
"train_samples": 134942,
|
13 |
+
"train_samples_per_second": 4248275.036,
|
14 |
+
"train_steps_per_second": 1062084.5
|
15 |
}
|
eval_results.json
CHANGED
@@ -1,10 +1,10 @@
|
|
1 |
{
|
2 |
-
"epoch":
|
3 |
-
"eval_accuracy": 0.
|
4 |
-
"eval_loss": 1.
|
5 |
-
"eval_runtime":
|
6 |
"eval_samples": 134942,
|
7 |
-
"eval_samples_per_second": 30.
|
8 |
-
"eval_steps_per_second": 7.
|
9 |
-
"perplexity": 3.
|
10 |
}
|
|
|
1 |
{
|
2 |
+
"epoch": 4.98,
|
3 |
+
"eval_accuracy": 0.6914040854429856,
|
4 |
+
"eval_loss": 1.3205146789550781,
|
5 |
+
"eval_runtime": 4403.2676,
|
6 |
"eval_samples": 134942,
|
7 |
+
"eval_samples_per_second": 30.646,
|
8 |
+
"eval_steps_per_second": 7.662,
|
9 |
+
"perplexity": 3.7453485333545293
|
10 |
}
|
runs/Aug15_10-57-40_09d4b99a5f37/events.out.tfevents.1660567231.09d4b99a5f37.2797.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aa1c9239e1022f81b2d658efb066191e8a1c59ef84167dcb5b6fefdb1243ab3
|
3 |
+
size 369
|
train_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
-
"epoch":
|
3 |
-
"train_loss":
|
4 |
-
"train_runtime":
|
5 |
"train_samples": 134942,
|
6 |
-
"train_samples_per_second":
|
7 |
-
"train_steps_per_second":
|
8 |
}
|
|
|
1 |
{
|
2 |
+
"epoch": 4.98,
|
3 |
+
"train_loss": 0.0,
|
4 |
+
"train_runtime": 0.0953,
|
5 |
"train_samples": 134942,
|
6 |
+
"train_samples_per_second": 4248275.036,
|
7 |
+
"train_steps_per_second": 1062084.5
|
8 |
}
|
trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -2024,24 +2024,18 @@
|
|
2024 |
"step": 168000
|
2025 |
},
|
2026 |
{
|
2027 |
-
"epoch": 4.
|
2028 |
-
"
|
2029 |
-
"
|
2030 |
-
"
|
2031 |
-
|
2032 |
-
|
2033 |
-
"
|
2034 |
-
"step": 168680,
|
2035 |
-
"total_flos": 6.266036456049869e+17,
|
2036 |
-
"train_loss": 1.6101340950849867,
|
2037 |
-
"train_runtime": 65579.3531,
|
2038 |
-
"train_samples_per_second": 10.288,
|
2039 |
-
"train_steps_per_second": 2.572
|
2040 |
}
|
2041 |
],
|
2042 |
-
"max_steps":
|
2043 |
-
"num_train_epochs":
|
2044 |
-
"total_flos": 6.
|
2045 |
"trial_name": null,
|
2046 |
"trial_params": null
|
2047 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 4.979843490633152,
|
5 |
+
"global_step": 168000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
2024 |
"step": 168000
|
2025 |
},
|
2026 |
{
|
2027 |
+
"epoch": 4.98,
|
2028 |
+
"step": 168000,
|
2029 |
+
"total_flos": 6.240794371172598e+17,
|
2030 |
+
"train_loss": 0.0,
|
2031 |
+
"train_runtime": 0.0953,
|
2032 |
+
"train_samples_per_second": 4248275.036,
|
2033 |
+
"train_steps_per_second": 1062084.5
|
|
|
|
|
|
|
|
|
|
|
|
|
2034 |
}
|
2035 |
],
|
2036 |
+
"max_steps": 101208,
|
2037 |
+
"num_train_epochs": 3,
|
2038 |
+
"total_flos": 6.240794371172598e+17,
|
2039 |
"trial_name": null,
|
2040 |
"trial_params": null
|
2041 |
}
|