duyvt6663 committed on
Commit
b0226b8
1 Parent(s): 02cd23d

Training in progress, step 50, checkpoint

Browse files
checkpoint-50/README.md CHANGED
@@ -254,4 +254,23 @@ The following `bitsandbytes` quantization config was used during training:
254
  ### Framework versions
255
 
256
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
257
  - PEFT 0.6.0.dev0
 
254
  ### Framework versions
255
 
256
 
257
+ - PEFT 0.6.0.dev0
258
+ ## Training procedure
259
+
260
+
261
+ The following `bitsandbytes` quantization config was used during training:
262
+ - quant_method: bitsandbytes
263
+ - load_in_8bit: True
264
+ - load_in_4bit: False
265
+ - llm_int8_threshold: 6.0
266
+ - llm_int8_skip_modules: None
267
+ - llm_int8_enable_fp32_cpu_offload: False
268
+ - llm_int8_has_fp16_weight: False
269
+ - bnb_4bit_quant_type: fp4
270
+ - bnb_4bit_use_double_quant: False
271
+ - bnb_4bit_compute_dtype: float32
272
+
273
+ ### Framework versions
274
+
275
+
276
  - PEFT 0.6.0.dev0
checkpoint-50/adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52f3e2863a99621fe2385df6cddf1bcd468da4073e58c4120b23dac6c05e517b
3
  size 9873829
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efcd616d78aee5801b26823ff845c7a11cb8437ad33b7f54dd9d8c1d6d55430c
3
  size 9873829
checkpoint-50/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:583134c5aa4c8a4be35c76d3ef2147918ca197900e94a9bd441bc6b37318017b
3
  size 42724
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1c19a314df24e848b955548a7f413702cd6ca621d7171dd290931ec47d2a49f
3
  size 42724
checkpoint-50/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc74b07bbeaa07754a3167eed2100e9c261c9fbfeeead9fd2401e092e61ce5ba
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d5f3946af7bb77e06a589294e88390029883f4d85063278eb29d1e1dd7fdf0d
3
  size 14244
checkpoint-50/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9cd64bd8bbd74e4d9ac50e02a85e7f6d62a9cf61cc8888584e2b49a46bcf05e3
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d0fe70547b4c794870547a1163a5866d6ce45ad88bdeba0273a31e4c75090e4
3
  size 1064
checkpoint-50/trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_metric": 0.6568556427955627,
3
  "best_model_checkpoint": "output/checkpoint-50",
4
- "epoch": 0.11347517730496454,
5
  "eval_steps": 50,
6
  "global_step": 50,
7
  "is_hyper_param_search": false,
@@ -10,31 +10,31 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.0,
13
- "learning_rate": 1.25e-06,
14
- "loss": 0.5043,
15
  "step": 1
16
  },
17
  {
18
- "epoch": 0.11,
19
- "learning_rate": 5.7499999999999995e-05,
20
- "loss": 0.4906,
21
  "step": 50
22
  },
23
  {
24
- "epoch": 0.11,
25
- "eval_accuracy": 0.608955223880597,
26
- "eval_loss": 0.6568556427955627,
27
- "eval_runtime": 61.5694,
28
- "eval_samples_per_second": 5.441,
29
- "eval_steps_per_second": 1.364,
30
  "step": 50
31
  }
32
  ],
33
  "logging_steps": 50,
34
- "max_steps": 440,
35
- "num_train_epochs": 1,
36
  "save_steps": 50,
37
- "total_flos": 1.846347914809344e+16,
38
  "trial_name": null,
39
  "trial_params": null
40
  }
 
1
  {
2
+ "best_metric": 0.665068507194519,
3
  "best_model_checkpoint": "output/checkpoint-50",
4
+ "epoch": 0.20460358056265984,
5
  "eval_steps": 50,
6
  "global_step": 50,
7
  "is_hyper_param_search": false,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.0,
13
+ "learning_rate": 7.575757575757576e-07,
14
+ "loss": 0.4968,
15
  "step": 1
16
  },
17
  {
18
+ "epoch": 0.2,
19
+ "learning_rate": 3.484848484848485e-05,
20
+ "loss": 0.5254,
21
  "step": 50
22
  },
23
  {
24
+ "epoch": 0.2,
25
+ "eval_accuracy": 0.6507462686567164,
26
+ "eval_loss": 0.665068507194519,
27
+ "eval_runtime": 61.5592,
28
+ "eval_samples_per_second": 5.442,
29
+ "eval_steps_per_second": 1.365,
30
  "step": 50
31
  }
32
  ],
33
  "logging_steps": 50,
34
+ "max_steps": 732,
35
+ "num_train_epochs": 3,
36
  "save_steps": 50,
37
+ "total_flos": 2.16199352573952e+16,
38
  "trial_name": null,
39
  "trial_params": null
40
  }
checkpoint-50/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87bd30bd4b21b4a0c66f1fd545858ef6e2d33b5984a8d292e79011acc3affd6b
3
  size 4472
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9feea516a8a208c393c324d84d047c0ab5036bbdf3fb1f3eea6a2563e9c79a6b
3
  size 4472