ShihTing committed on
Commit
f8403f9
1 Parent(s): 6b5599e

Upload trainer_state.json

Browse files
Files changed (1) hide show
  1. trainer_state.json +127 -3
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 5.347593582887701,
5
- "global_step": 1000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -68,11 +68,135 @@
68
  "eval_samples_per_second": 18.484,
69
  "eval_steps_per_second": 4.646,
70
  "step": 1000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
71
  }
72
  ],
73
  "max_steps": 5610,
74
  "num_train_epochs": 30,
75
- "total_flos": 1049850814279680.0,
76
  "trial_name": null,
77
  "trial_params": null
78
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 16.0427807486631,
5
+ "global_step": 3000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
68
  "eval_samples_per_second": 18.484,
69
  "eval_steps_per_second": 4.646,
70
  "step": 1000
71
+ },
72
+ {
73
+ "epoch": 6.42,
74
+ "eval_accuracy": 0.9037433155080213,
75
+ "eval_loss": 0.8681638240814209,
76
+ "eval_recall": 0.7755102040816326,
77
+ "eval_runtime": 10.157,
78
+ "eval_samples_per_second": 18.411,
79
+ "eval_steps_per_second": 4.627,
80
+ "step": 1200
81
+ },
82
+ {
83
+ "epoch": 7.49,
84
+ "eval_accuracy": 0.8823529411764706,
85
+ "eval_loss": 0.9168533682823181,
86
+ "eval_recall": 0.6938775510204082,
87
+ "eval_runtime": 10.271,
88
+ "eval_samples_per_second": 18.207,
89
+ "eval_steps_per_second": 4.576,
90
+ "step": 1400
91
+ },
92
+ {
93
+ "epoch": 8.02,
94
+ "learning_rate": 3.6631016042780753e-05,
95
+ "loss": 0.0555,
96
+ "step": 1500
97
+ },
98
+ {
99
+ "epoch": 8.56,
100
+ "eval_accuracy": 0.8556149732620321,
101
+ "eval_loss": 0.9982467293739319,
102
+ "eval_recall": 0.7346938775510204,
103
+ "eval_runtime": 10.134,
104
+ "eval_samples_per_second": 18.453,
105
+ "eval_steps_per_second": 4.638,
106
+ "step": 1600
107
+ },
108
+ {
109
+ "epoch": 9.63,
110
+ "eval_accuracy": 0.8663101604278075,
111
+ "eval_loss": 1.04860258102417,
112
+ "eval_recall": 0.7142857142857143,
113
+ "eval_runtime": 10.225,
114
+ "eval_samples_per_second": 18.289,
115
+ "eval_steps_per_second": 4.597,
116
+ "step": 1800
117
+ },
118
+ {
119
+ "epoch": 10.7,
120
+ "learning_rate": 3.2174688057041004e-05,
121
+ "loss": 0.0224,
122
+ "step": 2000
123
+ },
124
+ {
125
+ "epoch": 10.7,
126
+ "eval_accuracy": 0.8770053475935828,
127
+ "eval_loss": 1.0292185544967651,
128
+ "eval_recall": 0.673469387755102,
129
+ "eval_runtime": 10.362,
130
+ "eval_samples_per_second": 18.047,
131
+ "eval_steps_per_second": 4.536,
132
+ "step": 2000
133
+ },
134
+ {
135
+ "epoch": 11.76,
136
+ "eval_accuracy": 0.8663101604278075,
137
+ "eval_loss": 1.1402537822723389,
138
+ "eval_recall": 0.673469387755102,
139
+ "eval_runtime": 10.233,
140
+ "eval_samples_per_second": 18.274,
141
+ "eval_steps_per_second": 4.593,
142
+ "step": 2200
143
+ },
144
+ {
145
+ "epoch": 12.83,
146
+ "eval_accuracy": 0.8716577540106952,
147
+ "eval_loss": 1.1431100368499756,
148
+ "eval_recall": 0.673469387755102,
149
+ "eval_runtime": 10.226,
150
+ "eval_samples_per_second": 18.287,
151
+ "eval_steps_per_second": 4.596,
152
+ "step": 2400
153
+ },
154
+ {
155
+ "epoch": 13.37,
156
+ "learning_rate": 2.7718360071301247e-05,
157
+ "loss": 0.0001,
158
+ "step": 2500
159
+ },
160
+ {
161
+ "epoch": 13.9,
162
+ "eval_accuracy": 0.8770053475935828,
163
+ "eval_loss": 1.1465816497802734,
164
+ "eval_recall": 0.6530612244897959,
165
+ "eval_runtime": 10.254,
166
+ "eval_samples_per_second": 18.237,
167
+ "eval_steps_per_second": 4.584,
168
+ "step": 2600
169
+ },
170
+ {
171
+ "epoch": 14.97,
172
+ "eval_accuracy": 0.8716577540106952,
173
+ "eval_loss": 1.1757899522781372,
174
+ "eval_recall": 0.6530612244897959,
175
+ "eval_runtime": 10.346,
176
+ "eval_samples_per_second": 18.075,
177
+ "eval_steps_per_second": 4.543,
178
+ "step": 2800
179
+ },
180
+ {
181
+ "epoch": 16.04,
182
+ "learning_rate": 2.32620320855615e-05,
183
+ "loss": 0.0,
184
+ "step": 3000
185
+ },
186
+ {
187
+ "epoch": 16.04,
188
+ "eval_accuracy": 0.8823529411764706,
189
+ "eval_loss": 1.1856350898742676,
190
+ "eval_recall": 0.6530612244897959,
191
+ "eval_runtime": 10.397,
192
+ "eval_samples_per_second": 17.986,
193
+ "eval_steps_per_second": 4.521,
194
+ "step": 3000
195
  }
196
  ],
197
  "max_steps": 5610,
198
  "num_train_epochs": 30,
199
+ "total_flos": 3149026201829376.0,
200
  "trial_name": null,
201
  "trial_params": null
202
  }