ncbateman commited on
Commit
7cbb671
·
verified ·
1 Parent(s): 4cc6987

Training in progress, step 410, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f3ba083b80a5ba86c78573397f43c5755304ed3a937a891778f373046687e85a
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:486f843fd963ad047e108ad6e2177b02194372d7badc986147d584a09dce4090
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f7bdba3f023857413f670e1a267e69714b283f392e2ead25387966136304530
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09813614e11f944a54535b49907271670faa0fd78f62de6107511458c58eb3bc
3
  size 49846644
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87c82db480424801d4bb33b59a50589e1c04688890a2475f7053ae263b3756f4
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f7913630d73a37908980f47087984697274289698afc9a9db6afe7e4f8cb1c4
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33cf1fc2a7a88cf2a60a50e566aaa7e8972cd330e2ff6eb55fa333ccfaf32fd5
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:960df08ce745ddc135f0c492f6181a23fd839f7222d0b2b71af63986ebe995a6
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.5241022322872857,
5
  "eval_steps": 386,
6
- "global_step": 405,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -2858,6 +2858,41 @@
2858
  "learning_rate": 9.787311878343157e-05,
2859
  "loss": 0.8378,
2860
  "step": 405
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2861
  }
2862
  ],
2863
  "logging_steps": 1,
@@ -2877,7 +2912,7 @@
2877
  "attributes": {}
2878
  }
2879
  },
2880
- "total_flos": 4.5276455453589504e+17,
2881
  "train_batch_size": 4,
2882
  "trial_name": null,
2883
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.5305726302167584,
5
  "eval_steps": 386,
6
+ "global_step": 410,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
2858
  "learning_rate": 9.787311878343157e-05,
2859
  "loss": 0.8378,
2860
  "step": 405
2861
+ },
2862
+ {
2863
+ "epoch": 0.5253963118731803,
2864
+ "grad_norm": 0.7899916768074036,
2865
+ "learning_rate": 9.786120576305682e-05,
2866
+ "loss": 0.8917,
2867
+ "step": 406
2868
+ },
2869
+ {
2870
+ "epoch": 0.5266903914590747,
2871
+ "grad_norm": 0.8242781758308411,
2872
+ "learning_rate": 9.784926020149398e-05,
2873
+ "loss": 0.9778,
2874
+ "step": 407
2875
+ },
2876
+ {
2877
+ "epoch": 0.5279844710449693,
2878
+ "grad_norm": 0.9736928343772888,
2879
+ "learning_rate": 9.783728210686496e-05,
2880
+ "loss": 1.0145,
2881
+ "step": 408
2882
+ },
2883
+ {
2884
+ "epoch": 0.5292785506308638,
2885
+ "grad_norm": 0.8070263862609863,
2886
+ "learning_rate": 9.782527148731372e-05,
2887
+ "loss": 0.9923,
2888
+ "step": 409
2889
+ },
2890
+ {
2891
+ "epoch": 0.5305726302167584,
2892
+ "grad_norm": 0.861262857913971,
2893
+ "learning_rate": 9.781322835100638e-05,
2894
+ "loss": 1.0261,
2895
+ "step": 410
2896
  }
2897
  ],
2898
  "logging_steps": 1,
 
2912
  "attributes": {}
2913
  }
2914
  },
2915
+ "total_flos": 4.583542403943629e+17,
2916
  "train_batch_size": 4,
2917
  "trial_name": null,
2918
  "trial_params": null