anas-awadalla commited on
Commit
d9ffa7f
1 Parent(s): a245d0f

Upload trainer_state.json

Browse files
Files changed (1) hide show
  1. trainer_state.json +104 -0
trainer_state.json ADDED
@@ -0,0 +1,104 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 2.168413444163354,
5
+ "global_step": 6000,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.18,
12
+ "learning_rate": 1.9819298879653056e-05,
13
+ "loss": 2.6489,
14
+ "step": 500
15
+ },
16
+ {
17
+ "epoch": 0.36,
18
+ "learning_rate": 1.9638597759306108e-05,
19
+ "loss": 1.7223,
20
+ "step": 1000
21
+ },
22
+ {
23
+ "epoch": 0.54,
24
+ "learning_rate": 1.9457896638959163e-05,
25
+ "loss": 1.4874,
26
+ "step": 1500
27
+ },
28
+ {
29
+ "epoch": 0.72,
30
+ "learning_rate": 1.9277195518612218e-05,
31
+ "loss": 1.3632,
32
+ "step": 2000
33
+ },
34
+ {
35
+ "epoch": 0.9,
36
+ "learning_rate": 1.909649439826527e-05,
37
+ "loss": 1.2963,
38
+ "step": 2500
39
+ },
40
+ {
41
+ "epoch": 1.0,
42
+ "eval_loss": 1.1749399900436401,
43
+ "eval_runtime": 25.9529,
44
+ "eval_samples_per_second": 415.522,
45
+ "eval_steps_per_second": 12.985,
46
+ "step": 2767
47
+ },
48
+ {
49
+ "epoch": 1.08,
50
+ "learning_rate": 1.8915793277918324e-05,
51
+ "loss": 1.1963,
52
+ "step": 3000
53
+ },
54
+ {
55
+ "epoch": 1.26,
56
+ "learning_rate": 1.873509215757138e-05,
57
+ "loss": 1.0687,
58
+ "step": 3500
59
+ },
60
+ {
61
+ "epoch": 1.45,
62
+ "learning_rate": 1.8554391037224433e-05,
63
+ "loss": 1.0932,
64
+ "step": 4000
65
+ },
66
+ {
67
+ "epoch": 1.63,
68
+ "learning_rate": 1.8373689916877485e-05,
69
+ "loss": 1.0549,
70
+ "step": 4500
71
+ },
72
+ {
73
+ "epoch": 1.81,
74
+ "learning_rate": 1.819298879653054e-05,
75
+ "loss": 1.0376,
76
+ "step": 5000
77
+ },
78
+ {
79
+ "epoch": 1.99,
80
+ "learning_rate": 1.8012287676183594e-05,
81
+ "loss": 1.0317,
82
+ "step": 5500
83
+ },
84
+ {
85
+ "epoch": 2.0,
86
+ "eval_loss": 1.1026474237442017,
87
+ "eval_runtime": 25.9642,
88
+ "eval_samples_per_second": 415.342,
89
+ "eval_steps_per_second": 12.979,
90
+ "step": 5534
91
+ },
92
+ {
93
+ "epoch": 2.17,
94
+ "learning_rate": 1.783158655583665e-05,
95
+ "loss": 0.861,
96
+ "step": 6000
97
+ }
98
+ ],
99
+ "max_steps": 55340,
100
+ "num_train_epochs": 20,
101
+ "total_flos": 1.115469291829248e+16,
102
+ "trial_name": null,
103
+ "trial_params": null
104
+ }