AmberYifan committed on
Commit
b51bed0
1 Parent(s): 10f4aa1

Training in progress, step 558, checkpoint

Browse files
last-checkpoint/global_step558/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48f47872b153568880f63e929f3bdd430ab3ca165a871dd7f35283aa5d93a46a
3
+ size 14483467880
last-checkpoint/global_step558/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31af3feb2ec011fbc257818fdd66bf54c64e3e6ec1df17f7899a6b1810530e7f
3
+ size 14483467880
last-checkpoint/global_step558/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69abf6db88945f5bb6be0b9788b523a8a5a12986dbdd173ee2aa9ffbf50dd455
3
+ size 14483467880
last-checkpoint/global_step558/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5083abeebe436b485703d56249238c09c2540c14bc747f5a94d83da7bb496bb7
3
+ size 14483467880
last-checkpoint/global_step558/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d3c39cc7165a6ee3bd278e657b74091c7d7445454546c0632393fe1b8f5dbe7
3
+ size 150629
last-checkpoint/global_step558/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:246a94e167835a45d3933514047a1ec029f5a0b7f89c6dee634f7d034f972677
3
+ size 150629
last-checkpoint/global_step558/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7470e6434a5c8e46bb43a523a725387c3308156d296ee1210e546cad75ca81e
3
+ size 150629
last-checkpoint/global_step558/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12d186b915651468c281bfc724da55a5e8e424664df1f100081a2cdc05745ae4
3
+ size 150629
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step496
 
1
+ global_step558
last-checkpoint/model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9a7a17d4560692c6bbac7a5803c9ef7966094cd085d51b14cecd1df2d86e64a
3
  size 4943162336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c6a528fcebfa81ad94dc98b813bc2eaf50e2093983c66f1cf062eee248c9ce3
3
  size 4943162336
last-checkpoint/model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d20ac5c3151e609b424576af7297e14857b8b7da6100a1a7704e41612dd7bc42
3
  size 4999819336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87205acf168a99a505e46e06b76a61a6a87e6e70876881ff030e4dad2cd7aa43
3
  size 4999819336
last-checkpoint/model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0fbc99432985410ff6c43ff6c0882c1950b2b1368324dc2ad9f035c1fb4e9ac4
3
  size 4540516344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c09c12a0ba4fd95fb32e1df06312c869712e92aa026283345f20f3f5ad8b86a
3
  size 4540516344
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6115ef4a3972dc95f8b5f42d8b349e0290ad816095675fd656394e06736eed54
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb3d4793d6c7fda650513b6f3d24fe7afd643475a576b0104a85cb659ed441d3
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8698a8fe21a6c40aa81c13fa783f7b480800d0e1c8b8bbfc0f7d795856c9a9d
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e44567105884943a8351ea71e9a71011cceee34a8f2a067be69948ea21390f49
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22995e1828e61a6ae15a2c3ebe4ca0a2b8b2daa337082a4762176b1ca46f3953
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c3a6f11c1c82a313f717b58d29d20267d0bfc621c79116ac6f752e0c1ba1f50
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:49f599372909f19fb45797a334f06b5100cf004b284caa24cedf789d1047c5c7
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aaa97839e10563397740560600a86ccaf5a6fe1e5f41084453cab0f732a05570
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:239793f1a741f8e5a4de788cdc2c78f5187e67d38900b549f3e1a188c27ddb9c
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41569355a67e5d54cd2e41fbdb883692602ceaf27587e7a1c779dc0f9f2d51fd
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.5872000000000002,
5
  "eval_steps": 62,
6
- "global_step": 496,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -885,6 +885,112 @@
885
  "eval_samples_per_second": 5.286,
886
  "eval_steps_per_second": 0.344,
887
  "step": 496
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
888
  }
889
  ],
890
  "logging_steps": 10,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.7856,
5
  "eval_steps": 62,
6
+ "global_step": 558,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
885
  "eval_samples_per_second": 5.286,
886
  "eval_steps_per_second": 0.344,
887
  "step": 496
888
+ },
889
+ {
890
+ "epoch": 1.6,
891
+ "grad_norm": 33.14482905038865,
892
+ "learning_rate": 2.589073634204275e-07,
893
+ "logits/generated": -2.348078727722168,
894
+ "logits/real": -2.3059887886047363,
895
+ "logps/generated": -123.2630615234375,
896
+ "logps/real": -101.59033966064453,
897
+ "loss": 0.3313,
898
+ "rewards/accuracies": 0.987500011920929,
899
+ "rewards/generated": -0.09043073654174805,
900
+ "rewards/margins": 3.036623477935791,
901
+ "rewards/real": 2.946192502975464,
902
+ "step": 500
903
+ },
904
+ {
905
+ "epoch": 1.6320000000000001,
906
+ "grad_norm": 58.37181281947162,
907
+ "learning_rate": 2.529691211401425e-07,
908
+ "logits/generated": -2.3784213066101074,
909
+ "logits/real": -2.445460557937622,
910
+ "logps/generated": -137.46278381347656,
911
+ "logps/real": -98.52521514892578,
912
+ "loss": 0.3326,
913
+ "rewards/accuracies": 0.887499988079071,
914
+ "rewards/generated": -0.19049878418445587,
915
+ "rewards/margins": 3.1443653106689453,
916
+ "rewards/real": 2.953866958618164,
917
+ "step": 510
918
+ },
919
+ {
920
+ "epoch": 1.6640000000000001,
921
+ "grad_norm": 51.7755109683276,
922
+ "learning_rate": 2.4703087885985747e-07,
923
+ "logits/generated": -2.6047139167785645,
924
+ "logits/real": -2.575225353240967,
925
+ "logps/generated": -125.86954498291016,
926
+ "logps/real": -115.58686828613281,
927
+ "loss": 0.3731,
928
+ "rewards/accuracies": 0.9125000238418579,
929
+ "rewards/generated": 0.010144609026610851,
930
+ "rewards/margins": 2.9819352626800537,
931
+ "rewards/real": 2.9920802116394043,
932
+ "step": 520
933
+ },
934
+ {
935
+ "epoch": 1.696,
936
+ "grad_norm": 61.11300533777711,
937
+ "learning_rate": 2.410926365795724e-07,
938
+ "logits/generated": -2.598510503768921,
939
+ "logits/real": -2.6134636402130127,
940
+ "logps/generated": -130.40304565429688,
941
+ "logps/real": -119.8432846069336,
942
+ "loss": 0.4011,
943
+ "rewards/accuracies": 0.925000011920929,
944
+ "rewards/generated": 0.22392193973064423,
945
+ "rewards/margins": 3.1454458236694336,
946
+ "rewards/real": 3.3693675994873047,
947
+ "step": 530
948
+ },
949
+ {
950
+ "epoch": 1.728,
951
+ "grad_norm": 52.94216878715562,
952
+ "learning_rate": 2.351543942992874e-07,
953
+ "logits/generated": -2.54017972946167,
954
+ "logits/real": -2.611607074737549,
955
+ "logps/generated": -123.71136474609375,
956
+ "logps/real": -117.9095687866211,
957
+ "loss": 0.3699,
958
+ "rewards/accuracies": 0.925000011920929,
959
+ "rewards/generated": 0.34511905908584595,
960
+ "rewards/margins": 2.8268630504608154,
961
+ "rewards/real": 3.1719822883605957,
962
+ "step": 540
963
+ },
964
+ {
965
+ "epoch": 1.76,
966
+ "grad_norm": 34.291195649117704,
967
+ "learning_rate": 2.2921615201900234e-07,
968
+ "logits/generated": -2.530885696411133,
969
+ "logits/real": -2.5769619941711426,
970
+ "logps/generated": -129.57070922851562,
971
+ "logps/real": -107.8799057006836,
972
+ "loss": 0.3611,
973
+ "rewards/accuracies": 0.9624999761581421,
974
+ "rewards/generated": 0.188289612531662,
975
+ "rewards/margins": 3.124110460281372,
976
+ "rewards/real": 3.3124001026153564,
977
+ "step": 550
978
+ },
979
+ {
980
+ "epoch": 1.7856,
981
+ "eval_logits/generated": -2.432302951812744,
982
+ "eval_logits/real": -2.436417818069458,
983
+ "eval_logps/generated": -104.27023315429688,
984
+ "eval_logps/real": -115.58291625976562,
985
+ "eval_loss": 0.7119041681289673,
986
+ "eval_rewards/accuracies": 0.6730769276618958,
987
+ "eval_rewards/generated": 1.704530119895935,
988
+ "eval_rewards/margins": 0.6285931468009949,
989
+ "eval_rewards/real": 2.333123207092285,
990
+ "eval_runtime": 37.2029,
991
+ "eval_samples_per_second": 5.376,
992
+ "eval_steps_per_second": 0.349,
993
+ "step": 558
994
  }
995
  ],
996
  "logging_steps": 10,