vincentmin committed on
Commit
d5857b7
1 Parent(s): 2a74db6

End of training

Browse files
Files changed (3) hide show
  1. README.md +13 -0
  2. score-params.pt +0 -3
  3. trainer_state.json +221 -107
README.md CHANGED
@@ -7,6 +7,7 @@ metrics:
7
  model-index:
8
  - name: llama-2-7b-reward-oasst1
9
  results: []
 
10
  ---
11
 
12
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -33,6 +34,17 @@ More information needed
33
 
34
  ## Training procedure
35
 
 
 
 
 
 
 
 
 
 
 
 
36
  ### Training hyperparameters
37
 
38
  The following hyperparameters were used during training:
@@ -64,6 +76,7 @@ The following hyperparameters were used during training:
64
 
65
  ### Framework versions
66
 
 
67
  - Transformers 4.32.0.dev0
68
  - Pytorch 2.0.1+cu118
69
  - Datasets 2.14.0
 
7
  model-index:
8
  - name: llama-2-7b-reward-oasst1
9
  results: []
10
+ library_name: peft
11
  ---
12
 
13
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
34
 
35
  ## Training procedure
36
 
37
+
38
+ The following `bitsandbytes` quantization config was used during training:
39
+ - load_in_8bit: False
40
+ - load_in_4bit: True
41
+ - llm_int8_threshold: 6.0
42
+ - llm_int8_skip_modules: None
43
+ - llm_int8_enable_fp32_cpu_offload: False
44
+ - llm_int8_has_fp16_weight: False
45
+ - bnb_4bit_quant_type: nf4
46
+ - bnb_4bit_use_double_quant: False
47
+ - bnb_4bit_compute_dtype: float16
48
  ### Training hyperparameters
49
 
50
  The following hyperparameters were used during training:
 
76
 
77
  ### Framework versions
78
 
79
+ - PEFT 0.5.0.dev0
80
  - Transformers 4.32.0.dev0
81
  - Pytorch 2.0.1+cu118
82
  - Datasets 2.14.0
score-params.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:004dfe6b5ceb18d6a8e7a0c4010af0e72a2b3c2156d39ac2f0b42541bafb4dc0
3
- size 34043
 
 
 
 
trainer_state.json CHANGED
@@ -1,296 +1,410 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.7584,
5
- "global_step": 1896,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.02,
12
- "learning_rate": 1.9624e-05,
13
- "loss": 0.9388,
14
  "step": 50
15
  },
16
  {
17
  "epoch": 0.04,
18
  "learning_rate": 1.9232e-05,
19
- "loss": 0.9522,
20
  "step": 100
21
  },
22
  {
23
  "epoch": 0.06,
24
  "learning_rate": 1.8832000000000002e-05,
25
- "loss": 0.8005,
26
  "step": 150
27
  },
28
  {
29
  "epoch": 0.08,
30
  "learning_rate": 1.8432000000000002e-05,
31
- "loss": 0.6908,
32
  "step": 200
33
  },
34
  {
35
  "epoch": 0.1,
36
  "learning_rate": 1.8032e-05,
37
- "loss": 0.7927,
38
  "step": 250
39
  },
40
  {
41
  "epoch": 0.1,
42
- "eval_accuracy": 0.6659167604049494,
43
- "eval_loss": 0.7351371645927429,
44
- "eval_runtime": 434.6411,
45
- "eval_samples_per_second": 2.045,
46
- "eval_steps_per_second": 2.045,
47
  "step": 250
48
  },
49
  {
50
  "epoch": 0.12,
51
- "learning_rate": 1.764e-05,
52
- "loss": 0.5962,
53
  "step": 300
54
  },
55
  {
56
  "epoch": 0.14,
57
- "learning_rate": 1.724e-05,
58
- "loss": 0.6989,
59
  "step": 350
60
  },
61
  {
62
  "epoch": 0.16,
63
- "learning_rate": 1.684e-05,
64
- "loss": 0.7051,
65
  "step": 400
66
  },
67
  {
68
  "epoch": 0.18,
69
- "learning_rate": 1.6440000000000002e-05,
70
- "loss": 0.6664,
71
  "step": 450
72
  },
73
  {
74
  "epoch": 0.2,
75
- "learning_rate": 1.6040000000000002e-05,
76
- "loss": 0.6547,
77
  "step": 500
78
  },
79
  {
80
  "epoch": 0.2,
81
- "eval_accuracy": 0.7041619797525309,
82
- "eval_loss": 0.6934666037559509,
83
- "eval_runtime": 436.2176,
84
- "eval_samples_per_second": 2.038,
85
- "eval_steps_per_second": 2.038,
86
  "step": 500
87
  },
88
  {
89
  "epoch": 0.22,
90
- "learning_rate": 1.5640000000000003e-05,
91
- "loss": 0.665,
92
  "step": 550
93
  },
94
  {
95
  "epoch": 0.24,
96
- "learning_rate": 1.5240000000000001e-05,
97
- "loss": 0.654,
98
  "step": 600
99
  },
100
  {
101
  "epoch": 0.26,
102
- "learning_rate": 1.4840000000000002e-05,
103
- "loss": 0.6714,
104
  "step": 650
105
  },
106
  {
107
  "epoch": 0.28,
108
- "learning_rate": 1.444e-05,
109
- "loss": 0.7395,
110
  "step": 700
111
  },
112
  {
113
  "epoch": 0.3,
114
- "learning_rate": 1.4040000000000001e-05,
115
- "loss": 0.5393,
116
  "step": 750
117
  },
118
  {
119
  "epoch": 0.3,
120
- "eval_accuracy": 0.7142857142857143,
121
- "eval_loss": 0.621578574180603,
122
- "eval_runtime": 436.3187,
123
- "eval_samples_per_second": 2.038,
124
- "eval_steps_per_second": 2.038,
125
  "step": 750
126
  },
127
  {
128
  "epoch": 0.32,
129
- "learning_rate": 1.3640000000000002e-05,
130
- "loss": 0.5185,
131
  "step": 800
132
  },
133
  {
134
  "epoch": 0.34,
135
- "learning_rate": 1.3240000000000002e-05,
136
- "loss": 0.6009,
137
  "step": 850
138
  },
139
  {
140
  "epoch": 0.36,
141
- "learning_rate": 1.284e-05,
142
- "loss": 0.6588,
143
  "step": 900
144
  },
145
  {
146
  "epoch": 0.38,
147
- "learning_rate": 1.2440000000000001e-05,
148
- "loss": 0.6022,
149
  "step": 950
150
  },
151
  {
152
  "epoch": 0.4,
153
- "learning_rate": 1.204e-05,
154
- "loss": 0.7316,
155
  "step": 1000
156
  },
157
  {
158
  "epoch": 0.4,
159
- "eval_accuracy": 0.734533183352081,
160
- "eval_loss": 0.5916205644607544,
161
- "eval_runtime": 436.6514,
162
- "eval_samples_per_second": 2.036,
163
- "eval_steps_per_second": 2.036,
164
  "step": 1000
165
  },
166
  {
167
  "epoch": 0.42,
168
- "learning_rate": 1.164e-05,
169
- "loss": 0.6086,
170
  "step": 1050
171
  },
172
  {
173
  "epoch": 0.44,
174
- "learning_rate": 1.1240000000000002e-05,
175
- "loss": 0.5806,
176
  "step": 1100
177
  },
178
  {
179
  "epoch": 0.46,
180
- "learning_rate": 1.0840000000000001e-05,
181
- "loss": 0.5992,
182
  "step": 1150
183
  },
184
  {
185
  "epoch": 0.48,
186
- "learning_rate": 1.0440000000000002e-05,
187
- "loss": 0.5807,
188
  "step": 1200
189
  },
190
  {
191
  "epoch": 0.5,
192
- "learning_rate": 1.004e-05,
193
- "loss": 0.5667,
194
  "step": 1250
195
  },
196
  {
197
  "epoch": 0.5,
198
- "eval_accuracy": 0.734533183352081,
199
- "eval_loss": 0.5785398483276367,
200
- "eval_runtime": 436.2096,
201
- "eval_samples_per_second": 2.038,
202
- "eval_steps_per_second": 2.038,
203
  "step": 1250
204
  },
205
  {
206
  "epoch": 0.52,
207
- "learning_rate": 9.640000000000001e-06,
208
- "loss": 0.4989,
209
  "step": 1300
210
  },
211
  {
212
  "epoch": 0.54,
213
- "learning_rate": 9.240000000000001e-06,
214
- "loss": 0.6015,
215
  "step": 1350
216
  },
217
  {
218
  "epoch": 0.56,
219
- "learning_rate": 8.848e-06,
220
- "loss": 0.5728,
221
  "step": 1400
222
  },
223
  {
224
  "epoch": 0.58,
225
- "learning_rate": 8.448000000000001e-06,
226
- "loss": 0.6285,
227
  "step": 1450
228
  },
229
  {
230
  "epoch": 0.6,
231
- "learning_rate": 8.048e-06,
232
- "loss": 0.498,
233
  "step": 1500
234
  },
235
  {
236
  "epoch": 0.6,
237
- "eval_accuracy": 0.7435320584926884,
238
- "eval_loss": 0.5632913708686829,
239
- "eval_runtime": 436.3374,
240
- "eval_samples_per_second": 2.037,
241
- "eval_steps_per_second": 2.037,
242
  "step": 1500
243
  },
244
  {
245
  "epoch": 0.62,
246
- "learning_rate": 7.648e-06,
247
- "loss": 0.5134,
248
  "step": 1550
249
  },
250
  {
251
  "epoch": 0.64,
252
- "learning_rate": 7.248000000000001e-06,
253
- "loss": 0.4582,
254
  "step": 1600
255
  },
256
  {
257
  "epoch": 0.66,
258
- "learning_rate": 6.848e-06,
259
- "loss": 0.534,
260
  "step": 1650
261
  },
262
  {
263
  "epoch": 0.68,
264
- "learning_rate": 6.448000000000001e-06,
265
- "loss": 0.6765,
266
  "step": 1700
267
  },
268
  {
269
  "epoch": 0.7,
270
- "learning_rate": 6.048e-06,
271
- "loss": 0.6598,
272
  "step": 1750
273
  },
274
  {
275
  "epoch": 0.7,
276
- "eval_accuracy": 0.7457817772778402,
277
- "eval_loss": 0.565944254398346,
278
- "eval_runtime": 435.7582,
279
- "eval_samples_per_second": 2.04,
280
- "eval_steps_per_second": 2.04,
281
  "step": 1750
282
  },
283
  {
284
  "epoch": 0.72,
285
- "learning_rate": 5.648e-06,
286
- "loss": 0.5006,
287
  "step": 1800
288
  },
289
  {
290
  "epoch": 0.74,
291
- "learning_rate": 5.248000000000001e-06,
292
- "loss": 0.579,
293
  "step": 1850
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
294
  }
295
  ],
296
  "max_steps": 2500,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.0,
5
+ "global_step": 2500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.02,
12
+ "learning_rate": 1.9632e-05,
13
+ "loss": 0.9899,
14
  "step": 50
15
  },
16
  {
17
  "epoch": 0.04,
18
  "learning_rate": 1.9232e-05,
19
+ "loss": 0.9949,
20
  "step": 100
21
  },
22
  {
23
  "epoch": 0.06,
24
  "learning_rate": 1.8832000000000002e-05,
25
+ "loss": 0.828,
26
  "step": 150
27
  },
28
  {
29
  "epoch": 0.08,
30
  "learning_rate": 1.8432000000000002e-05,
31
+ "loss": 0.8372,
32
  "step": 200
33
  },
34
  {
35
  "epoch": 0.1,
36
  "learning_rate": 1.8032e-05,
37
+ "loss": 0.8409,
38
  "step": 250
39
  },
40
  {
41
  "epoch": 0.1,
42
+ "eval_accuracy": 0.6220472440944882,
43
+ "eval_loss": 0.8243474364280701,
44
+ "eval_runtime": 435.8774,
45
+ "eval_samples_per_second": 2.04,
46
+ "eval_steps_per_second": 2.04,
47
  "step": 250
48
  },
49
  {
50
  "epoch": 0.12,
51
+ "learning_rate": 1.7632000000000003e-05,
52
+ "loss": 0.694,
53
  "step": 300
54
  },
55
  {
56
  "epoch": 0.14,
57
+ "learning_rate": 1.7232000000000004e-05,
58
+ "loss": 0.6918,
59
  "step": 350
60
  },
61
  {
62
  "epoch": 0.16,
63
+ "learning_rate": 1.6832e-05,
64
+ "loss": 0.6794,
65
  "step": 400
66
  },
67
  {
68
  "epoch": 0.18,
69
+ "learning_rate": 1.6432e-05,
70
+ "loss": 0.6338,
71
  "step": 450
72
  },
73
  {
74
  "epoch": 0.2,
75
+ "learning_rate": 1.6032e-05,
76
+ "loss": 0.6288,
77
  "step": 500
78
  },
79
  {
80
  "epoch": 0.2,
81
+ "eval_accuracy": 0.671541057367829,
82
+ "eval_loss": 0.7539446949958801,
83
+ "eval_runtime": 434.4073,
84
+ "eval_samples_per_second": 2.046,
85
+ "eval_steps_per_second": 2.046,
86
  "step": 500
87
  },
88
  {
89
  "epoch": 0.22,
90
+ "learning_rate": 1.5632000000000002e-05,
91
+ "loss": 0.6622,
92
  "step": 550
93
  },
94
  {
95
  "epoch": 0.24,
96
+ "learning_rate": 1.5232000000000003e-05,
97
+ "loss": 0.773,
98
  "step": 600
99
  },
100
  {
101
  "epoch": 0.26,
102
+ "learning_rate": 1.4832000000000001e-05,
103
+ "loss": 0.6051,
104
  "step": 650
105
  },
106
  {
107
  "epoch": 0.28,
108
+ "learning_rate": 1.4432000000000002e-05,
109
+ "loss": 0.7805,
110
  "step": 700
111
  },
112
  {
113
  "epoch": 0.3,
114
+ "learning_rate": 1.4032e-05,
115
+ "loss": 0.5882,
116
  "step": 750
117
  },
118
  {
119
  "epoch": 0.3,
120
+ "eval_accuracy": 0.7075365579302587,
121
+ "eval_loss": 0.6791747808456421,
122
+ "eval_runtime": 433.8268,
123
+ "eval_samples_per_second": 2.049,
124
+ "eval_steps_per_second": 2.049,
125
  "step": 750
126
  },
127
  {
128
  "epoch": 0.32,
129
+ "learning_rate": 1.3632000000000001e-05,
130
+ "loss": 0.5672,
131
  "step": 800
132
  },
133
  {
134
  "epoch": 0.34,
135
+ "learning_rate": 1.3232e-05,
136
+ "loss": 0.6807,
137
  "step": 850
138
  },
139
  {
140
  "epoch": 0.36,
141
+ "learning_rate": 1.2832e-05,
142
+ "loss": 0.6796,
143
  "step": 900
144
  },
145
  {
146
  "epoch": 0.38,
147
+ "learning_rate": 1.2432000000000002e-05,
148
+ "loss": 0.6922,
149
  "step": 950
150
  },
151
  {
152
  "epoch": 0.4,
153
+ "learning_rate": 1.2032000000000001e-05,
154
+ "loss": 0.7671,
155
  "step": 1000
156
  },
157
  {
158
  "epoch": 0.4,
159
+ "eval_accuracy": 0.7334083239595051,
160
+ "eval_loss": 0.6129724383354187,
161
+ "eval_runtime": 433.287,
162
+ "eval_samples_per_second": 2.052,
163
+ "eval_steps_per_second": 2.052,
164
  "step": 1000
165
  },
166
  {
167
  "epoch": 0.42,
168
+ "learning_rate": 1.1632000000000001e-05,
169
+ "loss": 0.645,
170
  "step": 1050
171
  },
172
  {
173
  "epoch": 0.44,
174
+ "learning_rate": 1.1232e-05,
175
+ "loss": 0.5891,
176
  "step": 1100
177
  },
178
  {
179
  "epoch": 0.46,
180
+ "learning_rate": 1.0832e-05,
181
+ "loss": 0.6426,
182
  "step": 1150
183
  },
184
  {
185
  "epoch": 0.48,
186
+ "learning_rate": 1.0432e-05,
187
+ "loss": 0.567,
188
  "step": 1200
189
  },
190
  {
191
  "epoch": 0.5,
192
+ "learning_rate": 1.0032000000000002e-05,
193
+ "loss": 0.5782,
194
  "step": 1250
195
  },
196
  {
197
  "epoch": 0.5,
198
+ "eval_accuracy": 0.7255343082114736,
199
+ "eval_loss": 0.6114887595176697,
200
+ "eval_runtime": 433.3273,
201
+ "eval_samples_per_second": 2.052,
202
+ "eval_steps_per_second": 2.052,
203
  "step": 1250
204
  },
205
  {
206
  "epoch": 0.52,
207
+ "learning_rate": 9.632e-06,
208
+ "loss": 0.5736,
209
  "step": 1300
210
  },
211
  {
212
  "epoch": 0.54,
213
+ "learning_rate": 9.232e-06,
214
+ "loss": 0.6849,
215
  "step": 1350
216
  },
217
  {
218
  "epoch": 0.56,
219
+ "learning_rate": 8.832000000000001e-06,
220
+ "loss": 0.5305,
221
  "step": 1400
222
  },
223
  {
224
  "epoch": 0.58,
225
+ "learning_rate": 8.432e-06,
226
+ "loss": 0.7265,
227
  "step": 1450
228
  },
229
  {
230
  "epoch": 0.6,
231
+ "learning_rate": 8.032e-06,
232
+ "loss": 0.5691,
233
  "step": 1500
234
  },
235
  {
236
  "epoch": 0.6,
237
+ "eval_accuracy": 0.7412823397075365,
238
+ "eval_loss": 0.5794617533683777,
239
+ "eval_runtime": 433.4136,
240
+ "eval_samples_per_second": 2.051,
241
+ "eval_steps_per_second": 2.051,
242
  "step": 1500
243
  },
244
  {
245
  "epoch": 0.62,
246
+ "learning_rate": 7.632e-06,
247
+ "loss": 0.519,
248
  "step": 1550
249
  },
250
  {
251
  "epoch": 0.64,
252
+ "learning_rate": 7.232e-06,
253
+ "loss": 0.5378,
254
  "step": 1600
255
  },
256
  {
257
  "epoch": 0.66,
258
+ "learning_rate": 6.832000000000001e-06,
259
+ "loss": 0.5982,
260
  "step": 1650
261
  },
262
  {
263
  "epoch": 0.68,
264
+ "learning_rate": 6.432e-06,
265
+ "loss": 0.7027,
266
  "step": 1700
267
  },
268
  {
269
  "epoch": 0.7,
270
+ "learning_rate": 6.032e-06,
271
+ "loss": 0.6579,
272
  "step": 1750
273
  },
274
  {
275
  "epoch": 0.7,
276
+ "eval_accuracy": 0.7469066366704162,
277
+ "eval_loss": 0.5774183869361877,
278
+ "eval_runtime": 433.4068,
279
+ "eval_samples_per_second": 2.051,
280
+ "eval_steps_per_second": 2.051,
281
  "step": 1750
282
  },
283
  {
284
  "epoch": 0.72,
285
+ "learning_rate": 5.6320000000000005e-06,
286
+ "loss": 0.5044,
287
  "step": 1800
288
  },
289
  {
290
  "epoch": 0.74,
291
+ "learning_rate": 5.232e-06,
292
+ "loss": 0.6482,
293
  "step": 1850
294
+ },
295
+ {
296
+ "epoch": 0.76,
297
+ "learning_rate": 4.8320000000000005e-06,
298
+ "loss": 0.5406,
299
+ "step": 1900
300
+ },
301
+ {
302
+ "epoch": 0.78,
303
+ "learning_rate": 4.432e-06,
304
+ "loss": 0.5372,
305
+ "step": 1950
306
+ },
307
+ {
308
+ "epoch": 0.8,
309
+ "learning_rate": 4.0320000000000005e-06,
310
+ "loss": 0.6107,
311
+ "step": 2000
312
+ },
313
+ {
314
+ "epoch": 0.8,
315
+ "eval_accuracy": 0.7401574803149606,
316
+ "eval_loss": 0.5690832734107971,
317
+ "eval_runtime": 433.3967,
318
+ "eval_samples_per_second": 2.051,
319
+ "eval_steps_per_second": 2.051,
320
+ "step": 2000
321
+ },
322
+ {
323
+ "epoch": 0.82,
324
+ "learning_rate": 3.6320000000000005e-06,
325
+ "loss": 0.4043,
326
+ "step": 2050
327
+ },
328
+ {
329
+ "epoch": 0.84,
330
+ "learning_rate": 3.2400000000000003e-06,
331
+ "loss": 0.5344,
332
+ "step": 2100
333
+ },
334
+ {
335
+ "epoch": 0.86,
336
+ "learning_rate": 2.84e-06,
337
+ "loss": 0.7056,
338
+ "step": 2150
339
+ },
340
+ {
341
+ "epoch": 0.88,
342
+ "learning_rate": 2.4400000000000004e-06,
343
+ "loss": 0.5719,
344
+ "step": 2200
345
+ },
346
+ {
347
+ "epoch": 0.9,
348
+ "learning_rate": 2.04e-06,
349
+ "loss": 0.6255,
350
+ "step": 2250
351
+ },
352
+ {
353
+ "epoch": 0.9,
354
+ "eval_accuracy": 0.7435320584926884,
355
+ "eval_loss": 0.570974588394165,
356
+ "eval_runtime": 433.4106,
357
+ "eval_samples_per_second": 2.051,
358
+ "eval_steps_per_second": 2.051,
359
+ "step": 2250
360
+ },
361
+ {
362
+ "epoch": 0.92,
363
+ "learning_rate": 1.6400000000000002e-06,
364
+ "loss": 0.5958,
365
+ "step": 2300
366
+ },
367
+ {
368
+ "epoch": 0.94,
369
+ "learning_rate": 1.2400000000000002e-06,
370
+ "loss": 0.5984,
371
+ "step": 2350
372
+ },
373
+ {
374
+ "epoch": 0.96,
375
+ "learning_rate": 8.480000000000001e-07,
376
+ "loss": 0.6103,
377
+ "step": 2400
378
+ },
379
+ {
380
+ "epoch": 0.98,
381
+ "learning_rate": 4.4800000000000004e-07,
382
+ "loss": 0.612,
383
+ "step": 2450
384
+ },
385
+ {
386
+ "epoch": 1.0,
387
+ "learning_rate": 4.8e-08,
388
+ "loss": 0.7034,
389
+ "step": 2500
390
+ },
391
+ {
392
+ "epoch": 1.0,
393
+ "eval_accuracy": 0.7435320584926884,
394
+ "eval_loss": 0.5713425874710083,
395
+ "eval_runtime": 434.3078,
396
+ "eval_samples_per_second": 2.047,
397
+ "eval_steps_per_second": 2.047,
398
+ "step": 2500
399
+ },
400
+ {
401
+ "epoch": 1.0,
402
+ "step": 2500,
403
+ "total_flos": 0.0,
404
+ "train_loss": 0.6507886672973633,
405
+ "train_runtime": 17457.236,
406
+ "train_samples_per_second": 0.573,
407
+ "train_steps_per_second": 0.143
408
  }
409
  ],
410
  "max_steps": 2500,