TachyHealthResearch commited on
Commit
93b5f99
1 Parent(s): d2e0ac1

Training in progress, step 150, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d3124d5fb3a13a9a5d4ef239279632be8d7d427b5585c408c08388e6b5908ee
3
  size 72673016
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2551bca4904088520c6015d446c497d0568f830a7c7fd330b16e1171d06a87b5
3
  size 72673016
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:891f31b05a0835f1f16ade116db6505b177bd225d6898a18b058dd350e0393e9
3
  size 36892116
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c96241bf468c472cac5346ac7ec3308c004be9a7dd5eb6c621fa82bb6f34ec62
3
  size 36892116
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a058db9c54d7f1b53d3bad727f4153301963dc03c27b73419a8068cc21981f0
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07c76075dc60dc956ebfb1873f21cf2e223089eed32957f63e252eecb72848e3
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9702192071987640411db8cd497f9de57450f22a9586d9cce5affbc116fe7983
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:194456d3c9e165255d5406a0f3f62973b0bede79d91784f72431350783e27ae7
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.056,
5
  "eval_steps": 1000,
6
- "global_step": 140,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -847,13 +847,73 @@
847
  "learning_rate": 1.3793103448275863e-05,
848
  "loss": 1.8603,
849
  "step": 140
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
850
  }
851
  ],
852
  "logging_steps": 1,
853
  "max_steps": 150,
854
  "num_train_epochs": 1,
855
  "save_steps": 10,
856
- "total_flos": 7007817370042368.0,
857
  "trial_name": null,
858
  "trial_params": null
859
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.06,
5
  "eval_steps": 1000,
6
+ "global_step": 150,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
847
  "learning_rate": 1.3793103448275863e-05,
848
  "loss": 1.8603,
849
  "step": 140
850
+ },
851
+ {
852
+ "epoch": 0.06,
853
+ "learning_rate": 1.2413793103448277e-05,
854
+ "loss": 1.7057,
855
+ "step": 141
856
+ },
857
+ {
858
+ "epoch": 0.06,
859
+ "learning_rate": 1.103448275862069e-05,
860
+ "loss": 1.6926,
861
+ "step": 142
862
+ },
863
+ {
864
+ "epoch": 0.06,
865
+ "learning_rate": 9.655172413793103e-06,
866
+ "loss": 1.6525,
867
+ "step": 143
868
+ },
869
+ {
870
+ "epoch": 0.06,
871
+ "learning_rate": 8.275862068965518e-06,
872
+ "loss": 1.7455,
873
+ "step": 144
874
+ },
875
+ {
876
+ "epoch": 0.06,
877
+ "learning_rate": 6.896551724137932e-06,
878
+ "loss": 1.775,
879
+ "step": 145
880
+ },
881
+ {
882
+ "epoch": 0.06,
883
+ "learning_rate": 5.517241379310345e-06,
884
+ "loss": 1.6912,
885
+ "step": 146
886
+ },
887
+ {
888
+ "epoch": 0.06,
889
+ "learning_rate": 4.137931034482759e-06,
890
+ "loss": 1.8147,
891
+ "step": 147
892
+ },
893
+ {
894
+ "epoch": 0.06,
895
+ "learning_rate": 2.7586206896551725e-06,
896
+ "loss": 1.8314,
897
+ "step": 148
898
+ },
899
+ {
900
+ "epoch": 0.06,
901
+ "learning_rate": 1.3793103448275862e-06,
902
+ "loss": 1.9115,
903
+ "step": 149
904
+ },
905
+ {
906
+ "epoch": 0.06,
907
+ "learning_rate": 0.0,
908
+ "loss": 1.6862,
909
+ "step": 150
910
  }
911
  ],
912
  "logging_steps": 1,
913
  "max_steps": 150,
914
  "num_train_epochs": 1,
915
  "save_steps": 10,
916
+ "total_flos": 7574630234062848.0,
917
  "trial_name": null,
918
  "trial_params": null
919
  }