jeffrey03 commited on
Commit
740b1b6
·
verified ·
1 Parent(s): 0dbb857

Training in progress, step 1875, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:73dcc728bd3117c3ddcb580ef3f1b393dfb729105f5e1d2fdab99854f2758874
3
  size 109086416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a3668c48907d6be9c34a6d02741c3750faabcfd1d5a6333cafe608af5a229ae
3
  size 109086416
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:446a3af6fdee1a0dd1551c20907478e105e6522c7cc9df77f10f1fae6b402ec6
3
  size 218260730
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38c90ddf4352401e02b05f9c5ac779323fe0e9cba9deb1ed0ba3fadee738b6bc
3
  size 218260730
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a1fc5a9c9f608c99649f2e480872fa8be5ea1043623c84a23661e662266b584
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4d45a4286ba74a8054247c8bb988cbde8153b7096a421868e4e6e75e1d96fe8
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f70d0c9a1f2ec5616d0ea31f304bbe8c20a9687c5c28d05c761302a0b97133f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69b45defeb8acd40b1f654b531ab2159e89f65aca484da94094d0271343bc0bd
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 1.675691843032837,
3
  "best_model_checkpoint": "Pricer-FineTune-OpenSource-2024-10-23_08.48.15/checkpoint-1250",
4
- "epoch": 2.8,
5
  "eval_steps": 50,
6
- "global_step": 1750,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -532,6 +532,36 @@
532
  "eval_samples_per_second": 20.045,
533
  "eval_steps_per_second": 5.011,
534
  "step": 1750
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
535
  }
536
  ],
537
  "logging_steps": 50,
@@ -546,12 +576,12 @@
546
  "should_evaluate": false,
547
  "should_log": false,
548
  "should_save": true,
549
- "should_training_stop": false
550
  },
551
  "attributes": {}
552
  }
553
  },
554
- "total_flos": 4.4981043586832794e+17,
555
  "train_batch_size": 16,
556
  "trial_name": null,
557
  "trial_params": null
 
1
  {
2
  "best_metric": 1.675691843032837,
3
  "best_model_checkpoint": "Pricer-FineTune-OpenSource-2024-10-23_08.48.15/checkpoint-1250",
4
+ "epoch": 3.0,
5
  "eval_steps": 50,
6
+ "global_step": 1875,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
532
  "eval_samples_per_second": 20.045,
533
  "eval_steps_per_second": 5.011,
534
  "step": 1750
535
+ },
536
+ {
537
+ "epoch": 2.88,
538
+ "grad_norm": 3.2328884601593018,
539
+ "learning_rate": 4.1934023124329257e-07,
540
+ "loss": 1.4583,
541
+ "step": 1800
542
+ },
543
+ {
544
+ "epoch": 2.88,
545
+ "eval_loss": 1.7641412019729614,
546
+ "eval_runtime": 4.9803,
547
+ "eval_samples_per_second": 20.079,
548
+ "eval_steps_per_second": 5.02,
549
+ "step": 1800
550
+ },
551
+ {
552
+ "epoch": 2.96,
553
+ "grad_norm": 4.39493465423584,
554
+ "learning_rate": 4.665137700333166e-08,
555
+ "loss": 1.4495,
556
+ "step": 1850
557
+ },
558
+ {
559
+ "epoch": 2.96,
560
+ "eval_loss": 1.765012502670288,
561
+ "eval_runtime": 4.9788,
562
+ "eval_samples_per_second": 20.085,
563
+ "eval_steps_per_second": 5.021,
564
+ "step": 1850
565
  }
566
  ],
567
  "logging_steps": 50,
 
576
  "should_evaluate": false,
577
  "should_log": false,
578
  "should_save": true,
579
+ "should_training_stop": true
580
  },
581
  "attributes": {}
582
  }
583
  },
584
+ "total_flos": 4.819416637396746e+17,
585
  "train_batch_size": 16,
586
  "trial_name": null,
587
  "trial_params": null