tarekziade
committed on
Commit
•
569c1e3
1
Parent(s):
ad7371e
Update README.md
Browse files
README.md
CHANGED
@@ -40,24 +40,27 @@ You can find the code used to create the model here: https://github.com/mozilla/
|
|
40 |
|
41 |
# training results
|
42 |
|
43 |
-
|
44 |
-
|
45 |
-
|
46 |
-
|
47 |
-
|
48 |
-
|
49 |
-
|
50 |
-
|
51 |
-
|
52 |
-
|
53 |
-
|
54 |
-
|
55 |
-
|
56 |
-
|
57 |
-
|
58 |
-
|
59 |
-
|
60 |
-
|
61 |
-
|
62 |
-
|
|
|
|
|
|
|
63 |
|
|
|
40 |
|
41 |
# training results
|
42 |
|
43 |
+
```
|
44 |
+
{
|
45 |
+
"train/loss": 0.0781,
|
46 |
+
"train/learning_rate": 0.00003793103448275862,
|
47 |
+
"train/epoch": 2.41,
|
48 |
+
"train/global_step": 700,
|
49 |
+
"eval/loss": 0.09741172194480896,
|
50 |
+
"eval/rouge1": 60.382,
|
51 |
+
"eval/rouge2": 38.0754,
|
52 |
+
"eval/rougeL": 56.9132,
|
53 |
+
"eval/rougeLsum": 56.9214,
|
54 |
+
"eval/meteor": 0.5448683804505693,
|
55 |
+
"eval/gen_len": 9.864678265672467,
|
56 |
+
"eval/runtime": 343.0443,
|
57 |
+
"eval/samples_per_second": 10.555,
|
58 |
+
"eval/steps_per_second": 0.108,
|
59 |
+
"train/train_runtime": 10567.9413,
|
60 |
+
"train/train_samples_per_second": 27.414,
|
61 |
+
"train/train_steps_per_second": 0.274,
|
62 |
+
"train/total_flos": 9039628706135409000,
|
63 |
+
"train/train_loss": 0.09852950266429356
|
64 |
+
}
|
65 |
+
```
|
66 |
|