Jazzweller
committed on
Commit
•
3181777
1
Parent(s):
b1eb970
End of training
Browse files
all_results.json
CHANGED
@@ -2,12 +2,12 @@
|
|
2 |
"epoch": 3.0,
|
3 |
"eval_accuracy": 0.2857142857142857,
|
4 |
"eval_loss": 0.7827825546264648,
|
5 |
-
"eval_runtime": 0.
|
6 |
-
"eval_samples_per_second": 9.
|
7 |
-
"eval_steps_per_second": 1.
|
8 |
"total_flos": 4250374116581376.0,
|
9 |
"train_loss": 0.17864632606506348,
|
10 |
-
"train_runtime":
|
11 |
-
"train_samples_per_second": 3.
|
12 |
-
"train_steps_per_second": 0.
|
13 |
}
|
|
|
2 |
"epoch": 3.0,
|
3 |
"eval_accuracy": 0.2857142857142857,
|
4 |
"eval_loss": 0.7827825546264648,
|
5 |
+
"eval_runtime": 0.7719,
|
6 |
+
"eval_samples_per_second": 9.069,
|
7 |
+
"eval_steps_per_second": 1.296,
|
8 |
"total_flos": 4250374116581376.0,
|
9 |
"train_loss": 0.17864632606506348,
|
10 |
+
"train_runtime": 45.1081,
|
11 |
+
"train_samples_per_second": 3.791,
|
12 |
+
"train_steps_per_second": 0.067
|
13 |
}
|
eval_results.json
CHANGED
@@ -2,7 +2,7 @@
|
|
2 |
"epoch": 3.0,
|
3 |
"eval_accuracy": 0.2857142857142857,
|
4 |
"eval_loss": 0.7827825546264648,
|
5 |
-
"eval_runtime": 0.
|
6 |
-
"eval_samples_per_second": 9.
|
7 |
-
"eval_steps_per_second": 1.
|
8 |
}
|
|
|
2 |
"epoch": 3.0,
|
3 |
"eval_accuracy": 0.2857142857142857,
|
4 |
"eval_loss": 0.7827825546264648,
|
5 |
+
"eval_runtime": 0.7719,
|
6 |
+
"eval_samples_per_second": 9.069,
|
7 |
+
"eval_steps_per_second": 1.296
|
8 |
}
|
runs/May28_20-29-12_38183ecde2ad/events.out.tfevents.1653769965.38183ecde2ad.92.13
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0314f2fc5883fd130b79edb3239ac9872e4642746d66e561b0076e0b154a05ce
|
3 |
+
size 357
|
train_results.json
CHANGED
@@ -2,7 +2,7 @@
|
|
2 |
"epoch": 3.0,
|
3 |
"total_flos": 4250374116581376.0,
|
4 |
"train_loss": 0.17864632606506348,
|
5 |
-
"train_runtime":
|
6 |
-
"train_samples_per_second": 3.
|
7 |
-
"train_steps_per_second": 0.
|
8 |
}
|
|
|
2 |
"epoch": 3.0,
|
3 |
"total_flos": 4250374116581376.0,
|
4 |
"train_loss": 0.17864632606506348,
|
5 |
+
"train_runtime": 45.1081,
|
6 |
+
"train_samples_per_second": 3.791,
|
7 |
+
"train_steps_per_second": 0.067
|
8 |
}
|
trainer_state.json
CHANGED
@@ -11,27 +11,27 @@
|
|
11 |
"epoch": 1.0,
|
12 |
"eval_accuracy": 0.2857142857142857,
|
13 |
"eval_loss": 0.7827825546264648,
|
14 |
-
"eval_runtime": 0.
|
15 |
-
"eval_samples_per_second": 9.
|
16 |
-
"eval_steps_per_second": 1.
|
17 |
"step": 1
|
18 |
},
|
19 |
{
|
20 |
"epoch": 2.0,
|
21 |
"eval_accuracy": 0.14285714285714285,
|
22 |
"eval_loss": 0.8606036901473999,
|
23 |
-
"eval_runtime": 0.
|
24 |
-
"eval_samples_per_second":
|
25 |
-
"eval_steps_per_second": 1.
|
26 |
"step": 2
|
27 |
},
|
28 |
{
|
29 |
"epoch": 3.0,
|
30 |
"eval_accuracy": 0.2857142857142857,
|
31 |
-
"eval_loss": 0.
|
32 |
-
"eval_runtime": 0.
|
33 |
-
"eval_samples_per_second":
|
34 |
-
"eval_steps_per_second": 1.
|
35 |
"step": 3
|
36 |
},
|
37 |
{
|
@@ -39,9 +39,9 @@
|
|
39 |
"step": 3,
|
40 |
"total_flos": 4250374116581376.0,
|
41 |
"train_loss": 0.17864632606506348,
|
42 |
-
"train_runtime":
|
43 |
-
"train_samples_per_second": 3.
|
44 |
-
"train_steps_per_second": 0.
|
45 |
}
|
46 |
],
|
47 |
"max_steps": 3,
|
|
|
11 |
"epoch": 1.0,
|
12 |
"eval_accuracy": 0.2857142857142857,
|
13 |
"eval_loss": 0.7827825546264648,
|
14 |
+
"eval_runtime": 0.7023,
|
15 |
+
"eval_samples_per_second": 9.967,
|
16 |
+
"eval_steps_per_second": 1.424,
|
17 |
"step": 1
|
18 |
},
|
19 |
{
|
20 |
"epoch": 2.0,
|
21 |
"eval_accuracy": 0.14285714285714285,
|
22 |
"eval_loss": 0.8606036901473999,
|
23 |
+
"eval_runtime": 0.6969,
|
24 |
+
"eval_samples_per_second": 10.044,
|
25 |
+
"eval_steps_per_second": 1.435,
|
26 |
"step": 2
|
27 |
},
|
28 |
{
|
29 |
"epoch": 3.0,
|
30 |
"eval_accuracy": 0.2857142857142857,
|
31 |
+
"eval_loss": 0.8618678450584412,
|
32 |
+
"eval_runtime": 0.7824,
|
33 |
+
"eval_samples_per_second": 8.947,
|
34 |
+
"eval_steps_per_second": 1.278,
|
35 |
"step": 3
|
36 |
},
|
37 |
{
|
|
|
39 |
"step": 3,
|
40 |
"total_flos": 4250374116581376.0,
|
41 |
"train_loss": 0.17864632606506348,
|
42 |
+
"train_runtime": 45.1081,
|
43 |
+
"train_samples_per_second": 3.791,
|
44 |
+
"train_steps_per_second": 0.067
|
45 |
}
|
46 |
],
|
47 |
"max_steps": 3,
|