Shresthadev403 committed on
Commit
1d5674e
1 Parent(s): 6789a54

End of training

Browse files
config.json CHANGED
@@ -63,42 +63,7 @@
63
  "50": "LABEL_50",
64
  "51": "LABEL_51",
65
  "52": "LABEL_52",
66
- "53": "LABEL_53",
67
- "54": "LABEL_54",
68
- "55": "LABEL_55",
69
- "56": "LABEL_56",
70
- "57": "LABEL_57",
71
- "58": "LABEL_58",
72
- "59": "LABEL_59",
73
- "60": "LABEL_60",
74
- "61": "LABEL_61",
75
- "62": "LABEL_62",
76
- "63": "LABEL_63",
77
- "64": "LABEL_64",
78
- "65": "LABEL_65",
79
- "66": "LABEL_66",
80
- "67": "LABEL_67",
81
- "68": "LABEL_68",
82
- "69": "LABEL_69",
83
- "70": "LABEL_70",
84
- "71": "LABEL_71",
85
- "72": "LABEL_72",
86
- "73": "LABEL_73",
87
- "74": "LABEL_74",
88
- "75": "LABEL_75",
89
- "76": "LABEL_76",
90
- "77": "LABEL_77",
91
- "78": "LABEL_78",
92
- "79": "LABEL_79",
93
- "80": "LABEL_80",
94
- "81": "LABEL_81",
95
- "82": "LABEL_82",
96
- "83": "LABEL_83",
97
- "84": "LABEL_84",
98
- "85": "LABEL_85",
99
- "86": "LABEL_86",
100
- "87": "LABEL_87",
101
- "88": "LABEL_88"
102
  },
103
  "initializer_range": 0.02,
104
  "intermediate_size": 3072,
@@ -153,44 +118,9 @@
153
  "LABEL_51": 51,
154
  "LABEL_52": 52,
155
  "LABEL_53": 53,
156
- "LABEL_54": 54,
157
- "LABEL_55": 55,
158
- "LABEL_56": 56,
159
- "LABEL_57": 57,
160
- "LABEL_58": 58,
161
- "LABEL_59": 59,
162
  "LABEL_6": 6,
163
- "LABEL_60": 60,
164
- "LABEL_61": 61,
165
- "LABEL_62": 62,
166
- "LABEL_63": 63,
167
- "LABEL_64": 64,
168
- "LABEL_65": 65,
169
- "LABEL_66": 66,
170
- "LABEL_67": 67,
171
- "LABEL_68": 68,
172
- "LABEL_69": 69,
173
  "LABEL_7": 7,
174
- "LABEL_70": 70,
175
- "LABEL_71": 71,
176
- "LABEL_72": 72,
177
- "LABEL_73": 73,
178
- "LABEL_74": 74,
179
- "LABEL_75": 75,
180
- "LABEL_76": 76,
181
- "LABEL_77": 77,
182
- "LABEL_78": 78,
183
- "LABEL_79": 79,
184
  "LABEL_8": 8,
185
- "LABEL_80": 80,
186
- "LABEL_81": 81,
187
- "LABEL_82": 82,
188
- "LABEL_83": 83,
189
- "LABEL_84": 84,
190
- "LABEL_85": 85,
191
- "LABEL_86": 86,
192
- "LABEL_87": 87,
193
- "LABEL_88": 88,
194
  "LABEL_9": 9
195
  },
196
  "layer_norm_eps": 1e-12,
 
63
  "50": "LABEL_50",
64
  "51": "LABEL_51",
65
  "52": "LABEL_52",
66
+ "53": "LABEL_53"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
67
  },
68
  "initializer_range": 0.02,
69
  "intermediate_size": 3072,
 
118
  "LABEL_51": 51,
119
  "LABEL_52": 52,
120
  "LABEL_53": 53,
 
 
 
 
 
 
121
  "LABEL_6": 6,
 
 
 
 
 
 
 
 
 
 
122
  "LABEL_7": 7,
 
 
 
 
 
 
 
 
 
 
123
  "LABEL_8": 8,
 
 
 
 
 
 
 
 
 
124
  "LABEL_9": 9
125
  },
126
  "layer_norm_eps": 1e-12,
logs/events.out.tfevents.1705981471.70e47a1f5afe.42.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f45493947e1d099fa617c89478315c8ca24f4a96bff6a29ec349377d035f830
3
+ size 6624
logs/events.out.tfevents.1705981596.70e47a1f5afe.42.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2a52d8b5735b82151db217365714e96e44f55139cb6f85cd578b826fd06a9ff
3
+ size 6972
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5dbfecedd805a055d558e713fdab59dc3f5ce6a3cc40f43d3abc6ed1ac915a0b
3
- size 435863700
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15a258d9f93851cdd6ad47d4a89e6e843cd17df5266b4472832d1351b19749f8
3
+ size 435756040
trainer_state.json CHANGED
@@ -11,11 +11,11 @@
11
  {
12
  "epoch": 50.0,
13
  "step": 50,
14
- "total_flos": 32636710679400.0,
15
- "train_loss": 0.2473917007446289,
16
- "train_runtime": 8.5287,
17
- "train_samples_per_second": 52.763,
18
- "train_steps_per_second": 5.863
19
  }
20
  ],
21
  "logging_steps": 750,
@@ -23,7 +23,7 @@
23
  "num_input_tokens_seen": 0,
24
  "num_train_epochs": 50,
25
  "save_steps": 750,
26
- "total_flos": 32636710679400.0,
27
  "train_batch_size": 16,
28
  "trial_name": null,
29
  "trial_params": null
 
11
  {
12
  "epoch": 50.0,
13
  "step": 50,
14
+ "total_flos": 32856154788600.0,
15
+ "train_loss": 0.16719268798828124,
16
+ "train_runtime": 179.6035,
17
+ "train_samples_per_second": 2.506,
18
+ "train_steps_per_second": 0.278
19
  }
20
  ],
21
  "logging_steps": 750,
 
23
  "num_input_tokens_seen": 0,
24
  "num_train_epochs": 50,
25
  "save_steps": 750,
26
+ "total_flos": 32856154788600.0,
27
  "train_batch_size": 16,
28
  "trial_name": null,
29
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:539f836c129844c7433ce90ce7a776a98d7e07cfa66853d433c5135b23816fc8
3
  size 4283
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8557c2036849cd866e8408772ea1bd305acc077f79dba43b158110308a074332
3
  size 4283