tarekziade committed on
Commit
569c1e3
1 Parent(s): ad7371e

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +23 -20
README.md CHANGED
@@ -40,24 +40,27 @@ You can find the code used to create the model here: https://github.com/mozilla/
40
 
41
  # training results
42
 
43
- - eval/gen_len 14.99729
44
- - eval/loss 0.17093
45
- - eval/meteor 0.51479
46
- - eval/rouge1 57.8066
47
- - eval/rouge2 35.0888
48
- - eval/rougeL 52.9138
49
- - eval/rougeLsum 52.9101
50
- - eval/runtime 760.2135
51
- - eval/samples_per_second 11.18
52
- - eval/steps_per_second 0.112
53
- - train/epoch 8.0
54
- - train/global_step 11752
55
- - train/learning_rate 0.0
56
- - train/loss 0.1034
57
- - train/total_flos 1.518634875573869e+20
58
- - train/train_loss 0.14875
59
- - train/train_runtime 91405.9053
60
- - train/train_samples_per_second 12.855
61
- - train/train_steps_per_second 0.129
62
-
 
 
 
63
 
 
40
 
41
  # training results
42
 
43
+ ```
44
+ {
45
+ "train/loss": 0.0781,
46
+ "train/learning_rate": 0.00003793103448275862,
47
+ "train/epoch": 2.41,
48
+ "train/global_step": 700,
49
+ "eval/loss": 0.09741172194480896,
50
+ "eval/rouge1": 60.382,
51
+ "eval/rouge2": 38.0754,
52
+ "eval/rougeL": 56.9132,
53
+ "eval/rougeLsum": 56.9214,
54
+ "eval/meteor": 0.5448683804505693,
55
+ "eval/gen_len": 9.864678265672467,
56
+ "eval/runtime": 343.0443,
57
+ "eval/samples_per_second": 10.555,
58
+ "eval/steps_per_second": 0.108,
59
+ "train/train_runtime": 10567.9413,
60
+ "train/train_samples_per_second": 27.414,
61
+ "train/train_steps_per_second": 0.274,
62
+ "train/total_flos": 9039628706135409000,
63
+ "train/train_loss": 0.09852950266429356
64
+ }
65
+ ```
66