nicholasKluge committed on
Commit
5d5bd89
1 Parent(s): 1d9789c

Upload 14 files

Browse files
.gitattributes CHANGED
@@ -25,6 +25,7 @@
25
  *.safetensors filter=lfs diff=lfs merge=lfs -text
26
  saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
  *.tar.* filter=lfs diff=lfs merge=lfs -text
 
28
  *.tflite filter=lfs diff=lfs merge=lfs -text
29
  *.tgz filter=lfs diff=lfs merge=lfs -text
30
  *.wasm filter=lfs diff=lfs merge=lfs -text
 
25
  *.safetensors filter=lfs diff=lfs merge=lfs -text
26
  saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
  *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
  *.tflite filter=lfs diff=lfs merge=lfs -text
30
  *.tgz filter=lfs diff=lfs merge=lfs -text
31
  *.wasm filter=lfs diff=lfs merge=lfs -text
RewardModel.ipynb CHANGED
The diff for this file is too large to render. See raw diff
 
RewardModel_emissions.csv CHANGED
@@ -1,2 +1,2 @@
1
  timestamp,project_name,run_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,on_cloud,pue
2
- 2023-06-13T19:45:49,RewardModel_emissions,28b84f34-fd57-4f25-961c-9f6528e5c397,4601.62472319603,0.2357451806109479,5.1230857532252777e-05,42.5,151.204,31.30528450012207,0.054317600807878674,0.38820106547692845,0.039978418433687345,0.48249708471849406,Singapore,SGP,,,,Linux-5.15.107+-x86_64-with-glibc2.31,3.10.12,2.2.3,12,Intel(R) Xeon(R) CPU @ 2.20GHz,1,1 x NVIDIA A100-SXM4-40GB,103.8547,1.2929,83.48075866699219,machine,N,1.0
 
1
  timestamp,project_name,run_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,on_cloud,pue
2
+ 2023-08-30T21:51:28,RewardModelPT_emissions,96cbbbe3-62c5-41c9-b8d3-52185e05b85d,1674.8272371292114,0.0797799671652134,4.7634744286797414e-05,42.5,239.12942128798596,31.305280208587646,0.019769437138570673,0.12917863306504598,0.0145565772513079,0.16350464745492432,Singapore,SGP,,,,Linux-5.15.109+-x86_64-with-glibc2.35,3.10.12,2.3.1,12,Intel(R) Xeon(R) CPU @ 2.20GHz,1,1 x NVIDIA A100-SXM4-40GB,103.8547,1.2929,83.48074722290039,machine,N,1.0
config.json CHANGED
@@ -31,7 +31,7 @@
31
  "pooler_type": "first_token_transform",
32
  "position_embedding_type": "absolute",
33
  "torch_dtype": "float32",
34
- "transformers_version": "4.30.1",
35
  "type_vocab_size": 2,
36
  "use_cache": true,
37
  "vocab_size": 29794
 
31
  "pooler_type": "first_token_transform",
32
  "position_embedding_type": "absolute",
33
  "torch_dtype": "float32",
34
+ "transformers_version": "4.32.1",
35
  "type_vocab_size": 2,
36
  "use_cache": true,
37
  "vocab_size": 29794
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:42127a92fb8636f60c5268afc9bd5e2885fda45b635559f5d75a5cccd05b5de6
3
- size 871509189
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8c3139a8c3e4279e2a9924bc864d843241a89c526bc8fdc6ea432a88c8d4e10
3
+ size 871558917
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e09aab5cc0f696d5dc7bb319ec42158f0d8241bd8060a7285ec77bec19718c97
3
- size 435768437
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edd62695424c023985a0d6b34f7b764da509f9b6437b6d7af5274f07fc4c6cf6
3
+ size 435764017
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5a5bf9f43a8b55cc2c935d5c586202803aafae6b7e25833430938be6e97ddb9b
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34328d2f695efeba4db88f7e971d7409bfd04e499cbb6e22c019df50401e0447
3
  size 14575
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:68dd66f43268be9abd400bd2e864096b73cf1d96aedbf4ec9feacc73aa567580
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67da5128d498ca4756021811370417b993fb803d16f9d8450b5e82ca5ddbb387
3
  size 627
tokenizer.json CHANGED
@@ -2,13 +2,13 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 350,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
- "Fixed": 350
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 400,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
+ "Fixed": 400
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
trainer_state.json CHANGED
@@ -1,195 +1,54 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 4.187604690117253,
5
- "global_step": 2500,
 
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.34,
12
- "learning_rate": 4.66499162479062e-05,
13
- "loss": 0.0795,
14
  "step": 200
15
  },
16
  {
17
- "epoch": 0.34,
18
- "eval_accuracy": 0.9863571086644327,
19
- "eval_loss": 0.04342207312583923,
20
- "eval_runtime": 78.4916,
21
- "eval_samples_per_second": 106.457,
22
- "eval_steps_per_second": 2.535,
23
- "step": 200
24
- },
25
- {
26
- "epoch": 0.67,
27
- "learning_rate": 4.32998324958124e-05,
28
- "loss": 0.0434,
29
- "step": 400
30
- },
31
- {
32
- "epoch": 0.67,
33
- "eval_accuracy": 0.9869554810914313,
34
- "eval_loss": 0.035848040133714676,
35
- "eval_runtime": 78.5171,
36
- "eval_samples_per_second": 106.423,
37
- "eval_steps_per_second": 2.534,
38
  "step": 400
39
  },
40
  {
41
- "epoch": 1.01,
42
- "learning_rate": 3.9949748743718597e-05,
43
- "loss": 0.0375,
44
  "step": 600
45
  },
46
  {
47
- "epoch": 1.01,
48
- "eval_accuracy": 0.9876735280038296,
49
- "eval_loss": 0.03416126221418381,
50
- "eval_runtime": 78.4728,
51
- "eval_samples_per_second": 106.483,
52
- "eval_steps_per_second": 2.536,
53
- "step": 600
54
- },
55
- {
56
- "epoch": 1.34,
57
- "learning_rate": 3.6599664991624795e-05,
58
- "loss": 0.0112,
59
  "step": 800
60
  },
61
  {
62
- "epoch": 1.34,
63
- "eval_accuracy": 0.9885112494016276,
64
- "eval_loss": 0.03930915519595146,
65
- "eval_runtime": 78.5108,
66
- "eval_samples_per_second": 106.431,
67
- "eval_steps_per_second": 2.535,
68
- "step": 800
69
- },
70
- {
71
- "epoch": 1.68,
72
- "learning_rate": 3.324958123953099e-05,
73
- "loss": 0.0089,
74
  "step": 1000
75
  },
76
  {
77
- "epoch": 1.68,
78
- "eval_accuracy": 0.9877932024892293,
79
- "eval_loss": 0.04387575387954712,
80
- "eval_runtime": 78.5288,
81
- "eval_samples_per_second": 106.407,
82
- "eval_steps_per_second": 2.534,
83
- "step": 1000
84
- },
85
- {
86
- "epoch": 2.01,
87
- "learning_rate": 2.989949748743719e-05,
88
- "loss": 0.0117,
89
- "step": 1200
90
- },
91
- {
92
- "epoch": 2.01,
93
- "eval_accuracy": 0.989588319770225,
94
- "eval_loss": 0.04102291911840439,
95
- "eval_runtime": 78.5424,
96
- "eval_samples_per_second": 106.388,
97
- "eval_steps_per_second": 2.534,
98
  "step": 1200
99
- },
100
- {
101
- "epoch": 2.35,
102
- "learning_rate": 2.6549413735343385e-05,
103
- "loss": 0.0028,
104
- "step": 1400
105
- },
106
- {
107
- "epoch": 2.35,
108
- "eval_accuracy": 0.989588319770225,
109
- "eval_loss": 0.055005114525556564,
110
- "eval_runtime": 78.492,
111
- "eval_samples_per_second": 106.457,
112
- "eval_steps_per_second": 2.535,
113
- "step": 1400
114
- },
115
- {
116
- "epoch": 2.68,
117
- "learning_rate": 2.3199329983249583e-05,
118
- "loss": 0.0014,
119
- "step": 1600
120
- },
121
- {
122
- "epoch": 2.68,
123
- "eval_accuracy": 0.9889899473432264,
124
- "eval_loss": 0.054427579045295715,
125
- "eval_runtime": 78.5005,
126
- "eval_samples_per_second": 106.445,
127
- "eval_steps_per_second": 2.535,
128
- "step": 1600
129
- },
130
- {
131
- "epoch": 3.02,
132
- "learning_rate": 1.984924623115578e-05,
133
- "loss": 0.0011,
134
- "step": 1800
135
- },
136
- {
137
- "epoch": 3.02,
138
- "eval_accuracy": 0.989588319770225,
139
- "eval_loss": 0.05314817279577255,
140
- "eval_runtime": 78.5501,
141
- "eval_samples_per_second": 106.378,
142
- "eval_steps_per_second": 2.533,
143
- "step": 1800
144
- },
145
- {
146
- "epoch": 3.35,
147
- "learning_rate": 1.6499162479061976e-05,
148
- "loss": 0.0002,
149
- "step": 2000
150
- },
151
- {
152
- "epoch": 3.35,
153
- "eval_accuracy": 0.9894686452848253,
154
- "eval_loss": 0.058279525488615036,
155
- "eval_runtime": 78.4971,
156
- "eval_samples_per_second": 106.45,
157
- "eval_steps_per_second": 2.535,
158
- "step": 2000
159
- },
160
- {
161
- "epoch": 3.69,
162
- "learning_rate": 1.3149078726968176e-05,
163
- "loss": 0.0002,
164
- "step": 2200
165
- },
166
- {
167
- "epoch": 3.69,
168
- "eval_accuracy": 0.9897079942556247,
169
- "eval_loss": 0.05424511060118675,
170
- "eval_runtime": 78.4985,
171
- "eval_samples_per_second": 106.448,
172
- "eval_steps_per_second": 2.535,
173
- "step": 2200
174
- },
175
- {
176
- "epoch": 4.02,
177
- "learning_rate": 9.798994974874372e-06,
178
- "loss": 0.0002,
179
- "step": 2400
180
- },
181
- {
182
- "epoch": 4.02,
183
- "eval_accuracy": 0.989588319770225,
184
- "eval_loss": 0.05800911784172058,
185
- "eval_runtime": 78.5022,
186
- "eval_samples_per_second": 106.443,
187
- "eval_steps_per_second": 2.535,
188
- "step": 2400
189
  }
190
  ],
191
- "max_steps": 2985,
192
- "num_train_epochs": 5,
 
 
193
  "total_flos": 0.0,
194
  "trial_name": null,
195
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.5424164524421595,
5
+ "eval_steps": 500,
6
+ "global_step": 1200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.26,
13
+ "learning_rate": 4.166666666666667e-05,
14
+ "loss": 0.0396,
15
  "step": 200
16
  },
17
  {
18
+ "epoch": 0.51,
19
+ "learning_rate": 3.3333333333333335e-05,
20
+ "loss": 0.0083,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
21
  "step": 400
22
  },
23
  {
24
+ "epoch": 0.77,
25
+ "learning_rate": 2.5e-05,
26
+ "loss": 0.0074,
27
  "step": 600
28
  },
29
  {
30
+ "epoch": 1.03,
31
+ "learning_rate": 1.6666666666666667e-05,
32
+ "loss": 0.0062,
 
 
 
 
 
 
 
 
 
33
  "step": 800
34
  },
35
  {
36
+ "epoch": 1.29,
37
+ "learning_rate": 8.333333333333334e-06,
38
+ "loss": 0.002,
 
 
 
 
 
 
 
 
 
39
  "step": 1000
40
  },
41
  {
42
+ "epoch": 1.54,
43
+ "learning_rate": 0.0,
44
+ "loss": 0.0013,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
45
  "step": 1200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
46
  }
47
  ],
48
+ "logging_steps": 200,
49
+ "max_steps": 1200,
50
+ "num_train_epochs": 2,
51
+ "save_steps": 400,
52
  "total_flos": 0.0,
53
  "trial_name": null,
54
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f250a5c08e1e9c5ee5dcaeb636fb35a215c6505d2392dc80f8e0d6af40a76a8c
3
- size 4027
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5ef9405a9d75dbc3d85f18ad44a184070e8187d74f7026a41a46fb38b61a3ad
3
+ size 4091