nicholasKluge commited on
Commit
7c4cc9e
1 Parent(s): 048fcf1

Upload 13 files

Browse files
RewardModel.ipynb CHANGED
The diff for this file is too large to render. See raw diff
 
RewardModel_emissions.csv CHANGED
@@ -1,2 +1,2 @@
1
  timestamp,project_name,run_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,on_cloud,pue
2
- 2023-06-13T15:03:57,RewardModel_emissions,34e3fabc-108d-42d0-8a10-d218a32c89f6,4812.4118773937225,0.17002787857474966,3.5331115230068865e-05,42.5,273.41,31.30528450012207,0.056805772867467685,0.3882571562884012,0.04180739816835735,0.4868703273242265,United States,USA,nevada,,,Linux-5.15.107+-x86_64-with-glibc2.31,3.10.12,2.2.3,12,Intel(R) Xeon(R) CPU @ 2.20GHz,1,1 x NVIDIA A100-SXM4-40GB,-115.1164,36.1685,83.48075866699219,machine,N,1.0
 
1
  timestamp,project_name,run_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,on_cloud,pue
2
+ 2023-08-27T21:29:04,RewardModel_emissions,9291717a-8ff3-4969-bbfc-56d01299f93b,1671.9951930046082,0.0811242018304008,4.851939896108135e-05,42.5,230.790533112253,31.305280208587646,0.019736131072872216,0.13199262364957,0.014530827622001492,0.16625958234444363,Singapore,SGP,,,,Linux-5.15.109+-x86_64-with-glibc2.35,3.10.12,2.3.1,12,Intel(R) Xeon(R) CPU @ 2.20GHz,1,1 x NVIDIA A100-SXM4-40GB,103.8547,1.2929,83.48074722290039,machine,N,1.0
config.json CHANGED
@@ -25,7 +25,7 @@
25
  "pad_token_id": 0,
26
  "position_embedding_type": "absolute",
27
  "torch_dtype": "float32",
28
- "transformers_version": "4.30.1",
29
  "type_vocab_size": 2,
30
  "use_cache": true,
31
  "vocab_size": 28996
 
25
  "pad_token_id": 0,
26
  "position_embedding_type": "absolute",
27
  "torch_dtype": "float32",
28
+ "transformers_version": "4.32.0",
29
  "type_vocab_size": 2,
30
  "use_cache": true,
31
  "vocab_size": 28996
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c52bed61e330ec59d12c04564eb6df59e95ccd9bad6cc5adf5e754358c57566
3
- size 866606277
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b3d650a3141b2e0c2326bf226ade42125fe25070c17c0181b629ef58e54cd18
3
+ size 866656005
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:41545686d6ccaf2f3efe0173dacc4c4634b0ade6710f046361ab31987f195591
3
- size 433316981
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5569d11e5bad1d5aded31c9cfa2b7faca36fca2d867e8d5e971fdb9d6271a8b0
3
+ size 433312561
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:008304bdd46c688bbf5feaf85cbcc083837da7f9be6bf363f309170ac62a6d4e
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34328d2f695efeba4db88f7e971d7409bfd04e499cbb6e22c019df50401e0447
3
  size 14575
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24c083a5f4303f0b59a009934c6dcb05a44520e05c10e837a7e2149a6d4a68d1
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67da5128d498ca4756021811370417b993fb803d16f9d8450b5e82ca5ddbb387
3
  size 627
tokenizer.json CHANGED
@@ -2,13 +2,13 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 350,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
- "Fixed": 350
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 400,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
+ "Fixed": 400
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
trainer_state.json CHANGED
@@ -1,240 +1,54 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 4.901960784313726,
5
- "global_step": 3000,
 
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.33,
12
- "learning_rate": 4.673202614379085e-05,
13
- "loss": 0.0803,
14
  "step": 200
15
  },
16
  {
17
- "epoch": 0.33,
18
- "eval_accuracy": 0.9874985395490128,
19
- "eval_loss": 0.03710582107305527,
20
- "eval_runtime": 80.6999,
21
- "eval_samples_per_second": 106.06,
22
- "eval_steps_per_second": 2.528,
23
- "step": 200
24
- },
25
- {
26
- "epoch": 0.65,
27
- "learning_rate": 4.3464052287581704e-05,
28
- "loss": 0.0393,
29
  "step": 400
30
  },
31
  {
32
- "epoch": 0.65,
33
- "eval_accuracy": 0.9884332281808622,
34
- "eval_loss": 0.03642109036445618,
35
- "eval_runtime": 80.6008,
36
- "eval_samples_per_second": 106.19,
37
- "eval_steps_per_second": 2.531,
38
- "step": 400
39
- },
40
- {
41
- "epoch": 0.98,
42
- "learning_rate": 4.0196078431372555e-05,
43
- "loss": 0.0372,
44
- "step": 600
45
- },
46
- {
47
- "epoch": 0.98,
48
- "eval_accuracy": 0.986447014838182,
49
- "eval_loss": 0.04179869592189789,
50
- "eval_runtime": 80.6457,
51
- "eval_samples_per_second": 106.131,
52
- "eval_steps_per_second": 2.53,
53
  "step": 600
54
  },
55
  {
56
- "epoch": 1.31,
57
- "learning_rate": 3.6928104575163405e-05,
58
- "loss": 0.0114,
59
  "step": 800
60
  },
61
  {
62
- "epoch": 1.31,
63
- "eval_accuracy": 0.9896015889706742,
64
- "eval_loss": 0.0394107885658741,
65
- "eval_runtime": 80.6065,
66
- "eval_samples_per_second": 106.182,
67
- "eval_steps_per_second": 2.531,
68
- "step": 800
69
- },
70
- {
71
- "epoch": 1.63,
72
- "learning_rate": 3.366013071895425e-05,
73
- "loss": 0.0138,
74
- "step": 1000
75
- },
76
- {
77
- "epoch": 1.63,
78
- "eval_accuracy": 0.9897184250496553,
79
- "eval_loss": 0.0397811159491539,
80
- "eval_runtime": 80.5677,
81
- "eval_samples_per_second": 106.234,
82
- "eval_steps_per_second": 2.532,
83
  "step": 1000
84
  },
85
  {
86
- "epoch": 1.96,
87
- "learning_rate": 3.0392156862745097e-05,
88
- "loss": 0.0127,
89
- "step": 1200
90
- },
91
- {
92
- "epoch": 1.96,
93
- "eval_accuracy": 0.9908867858394672,
94
- "eval_loss": 0.034337081015110016,
95
- "eval_runtime": 80.5302,
96
- "eval_samples_per_second": 106.283,
97
- "eval_steps_per_second": 2.533,
98
- "step": 1200
99
- },
100
- {
101
- "epoch": 2.29,
102
- "learning_rate": 2.7124183006535947e-05,
103
- "loss": 0.0052,
104
- "step": 1400
105
- },
106
- {
107
- "epoch": 2.29,
108
- "eval_accuracy": 0.9911204579974296,
109
- "eval_loss": 0.037403274327516556,
110
- "eval_runtime": 80.6258,
111
- "eval_samples_per_second": 106.157,
112
- "eval_steps_per_second": 2.53,
113
- "step": 1400
114
- },
115
- {
116
- "epoch": 2.61,
117
- "learning_rate": 2.38562091503268e-05,
118
- "loss": 0.0018,
119
- "step": 1600
120
- },
121
- {
122
- "epoch": 2.61,
123
- "eval_accuracy": 0.9906531136815049,
124
- "eval_loss": 0.04766124114394188,
125
- "eval_runtime": 80.6271,
126
- "eval_samples_per_second": 106.155,
127
- "eval_steps_per_second": 2.53,
128
- "step": 1600
129
- },
130
- {
131
- "epoch": 2.94,
132
- "learning_rate": 2.058823529411765e-05,
133
  "loss": 0.0009,
134
- "step": 1800
135
- },
136
- {
137
- "epoch": 2.94,
138
- "eval_accuracy": 0.9912372940764108,
139
- "eval_loss": 0.0513538159430027,
140
- "eval_runtime": 80.6405,
141
- "eval_samples_per_second": 106.138,
142
- "eval_steps_per_second": 2.53,
143
- "step": 1800
144
- },
145
- {
146
- "epoch": 3.27,
147
- "learning_rate": 1.7320261437908496e-05,
148
- "loss": 0.001,
149
- "step": 2000
150
- },
151
- {
152
- "epoch": 3.27,
153
- "eval_accuracy": 0.9904194415235424,
154
- "eval_loss": 0.046223659068346024,
155
- "eval_runtime": 80.5163,
156
- "eval_samples_per_second": 106.301,
157
- "eval_steps_per_second": 2.534,
158
- "step": 2000
159
- },
160
- {
161
- "epoch": 3.59,
162
- "learning_rate": 1.4052287581699347e-05,
163
- "loss": 0.0002,
164
- "step": 2200
165
- },
166
- {
167
- "epoch": 3.59,
168
- "eval_accuracy": 0.9911204579974296,
169
- "eval_loss": 0.04658184573054314,
170
- "eval_runtime": 80.6281,
171
- "eval_samples_per_second": 106.154,
172
- "eval_steps_per_second": 2.53,
173
- "step": 2200
174
- },
175
- {
176
- "epoch": 3.92,
177
- "learning_rate": 1.0784313725490197e-05,
178
- "loss": 0.0006,
179
- "step": 2400
180
- },
181
- {
182
- "epoch": 3.92,
183
- "eval_accuracy": 0.9905362776025236,
184
- "eval_loss": 0.046631619334220886,
185
- "eval_runtime": 80.5126,
186
- "eval_samples_per_second": 106.306,
187
- "eval_steps_per_second": 2.534,
188
- "step": 2400
189
- },
190
- {
191
- "epoch": 4.25,
192
- "learning_rate": 7.5163398692810456e-06,
193
- "loss": 0.0001,
194
- "step": 2600
195
- },
196
- {
197
- "epoch": 4.25,
198
- "eval_accuracy": 0.990769949760486,
199
- "eval_loss": 0.05143677070736885,
200
- "eval_runtime": 80.6039,
201
- "eval_samples_per_second": 106.186,
202
- "eval_steps_per_second": 2.531,
203
- "step": 2600
204
- },
205
- {
206
- "epoch": 4.58,
207
- "learning_rate": 4.2483660130718954e-06,
208
- "loss": 0.0005,
209
- "step": 2800
210
- },
211
- {
212
- "epoch": 4.58,
213
- "eval_accuracy": 0.9908867858394672,
214
- "eval_loss": 0.04908544197678566,
215
- "eval_runtime": 80.4782,
216
- "eval_samples_per_second": 106.352,
217
- "eval_steps_per_second": 2.535,
218
- "step": 2800
219
- },
220
- {
221
- "epoch": 4.9,
222
- "learning_rate": 9.80392156862745e-07,
223
- "loss": 0.0004,
224
- "step": 3000
225
- },
226
- {
227
- "epoch": 4.9,
228
- "eval_accuracy": 0.9910036219184484,
229
- "eval_loss": 0.049937766045331955,
230
- "eval_runtime": 80.6026,
231
- "eval_samples_per_second": 106.188,
232
- "eval_steps_per_second": 2.531,
233
- "step": 3000
234
  }
235
  ],
236
- "max_steps": 3060,
237
- "num_train_epochs": 5,
 
 
238
  "total_flos": 0.0,
239
  "trial_name": null,
240
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.5424164524421595,
5
+ "eval_steps": 500,
6
+ "global_step": 1200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.26,
13
+ "learning_rate": 4.166666666666667e-05,
14
+ "loss": 0.0423,
15
  "step": 200
16
  },
17
  {
18
+ "epoch": 0.51,
19
+ "learning_rate": 3.3333333333333335e-05,
20
+ "loss": 0.0085,
 
 
 
 
 
 
 
 
 
21
  "step": 400
22
  },
23
  {
24
+ "epoch": 0.77,
25
+ "learning_rate": 2.5e-05,
26
+ "loss": 0.0069,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
27
  "step": 600
28
  },
29
  {
30
+ "epoch": 1.03,
31
+ "learning_rate": 1.6666666666666667e-05,
32
+ "loss": 0.005,
33
  "step": 800
34
  },
35
  {
36
+ "epoch": 1.29,
37
+ "learning_rate": 8.333333333333334e-06,
38
+ "loss": 0.0012,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
39
  "step": 1000
40
  },
41
  {
42
+ "epoch": 1.54,
43
+ "learning_rate": 0.0,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
44
  "loss": 0.0009,
45
+ "step": 1200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
46
  }
47
  ],
48
+ "logging_steps": 200,
49
+ "max_steps": 1200,
50
+ "num_train_epochs": 2,
51
+ "save_steps": 400,
52
  "total_flos": 0.0,
53
  "trial_name": null,
54
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6715260d8f8dc2d9b6f203feba5b1e85999035d08e8d456813784a2d7ce39f95
3
- size 4027
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e31258ce773b88b8066de7b3863038689fcaaa25ca7099e45b4283397681f1e0
3
+ size 4091