Phanh2532 committed on
Commit
99e2fc4
1 Parent(s): 17d1172

Upload folder using huggingface_hub

Browse files
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1912b4b957d908b8bfc710c3e58558d93617ba78eeee6b44cea5846184e311aa
3
  size 109069176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e962fe1a008096446bba2f5f0939a027f2337b0c8d54a86662f4b97eb3ce56e7
3
  size 109069176
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f61189ba8e2df9508d8734043f68c2833bde41baa22941571ec4278f299a891b
3
  size 218182458
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b9013e63a2c92f1d852bfa0120360bf3b76ec267a1e0375845d5663d98ee45b
3
  size 218182458
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e8d2ce26e6c0f5a47ca9bc5544c0f80a1d4937019d9d7af01320826a96817c0
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1218d6cf5250ca208e3f4fa5667046fe64d6adcd8f3e76f241175ded98a71c5
3
  size 14244
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:51c0ed39e99f88f21247352263bae5548e8fbac6d6858a19cd7d11c82b12390d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a9cac68c495800a4bdcb66ffc3cc1e8f81886b9e59bf61baf66314bb15b9839
3
  size 1064
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.9323671497584543,
5
  "eval_steps": 25,
6
- "global_step": 200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -127,6 +127,36 @@
127
  "eval_samples_per_second": 3.915,
128
  "eval_steps_per_second": 0.492,
129
  "step": 200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
130
  }
131
  ],
132
  "logging_steps": 25,
@@ -141,12 +171,12 @@
141
  "should_evaluate": false,
142
  "should_log": false,
143
  "should_save": true,
144
- "should_training_stop": false
145
  },
146
  "attributes": {}
147
  }
148
  },
149
- "total_flos": 1.5515046692683776e+16,
150
  "train_batch_size": 1,
151
  "trial_name": null,
152
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.4154589371980677,
5
  "eval_steps": 25,
6
+ "global_step": 250,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
127
  "eval_samples_per_second": 3.915,
128
  "eval_steps_per_second": 0.492,
129
  "step": 200
130
+ },
131
+ {
132
+ "epoch": 2.1739130434782608,
133
+ "grad_norm": 0.11684705317020416,
134
+ "learning_rate": 1.305099728150655e-05,
135
+ "loss": 0.8363,
136
+ "step": 225
137
+ },
138
+ {
139
+ "epoch": 2.1739130434782608,
140
+ "eval_loss": 0.8260972499847412,
141
+ "eval_runtime": 52.8873,
142
+ "eval_samples_per_second": 3.914,
143
+ "eval_steps_per_second": 0.492,
144
+ "step": 225
145
+ },
146
+ {
147
+ "epoch": 2.4154589371980677,
148
+ "grad_norm": 0.12228501588106155,
149
+ "learning_rate": 0.0,
150
+ "loss": 0.8416,
151
+ "step": 250
152
+ },
153
+ {
154
+ "epoch": 2.4154589371980677,
155
+ "eval_loss": 0.8257294297218323,
156
+ "eval_runtime": 52.5215,
157
+ "eval_samples_per_second": 3.941,
158
+ "eval_steps_per_second": 0.495,
159
+ "step": 250
160
  }
161
  ],
162
  "logging_steps": 25,
 
171
  "should_evaluate": false,
172
  "should_log": false,
173
  "should_save": true,
174
+ "should_training_stop": true
175
  },
176
  "attributes": {}
177
  }
178
  },
179
+ "total_flos": 1.9398176774774784e+16,
180
  "train_batch_size": 1,
181
  "trial_name": null,
182
  "trial_params": null