AmberYifan
committed on
Commit
•
b51bed0
1
Parent(s):
10f4aa1
Training in progress, step 558, checkpoint
Browse files- last-checkpoint/global_step558/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step558/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step558/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step558/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step558/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step558/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step558/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step558/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/model-00001-of-00003.safetensors +1 -1
- last-checkpoint/model-00002-of-00003.safetensors +1 -1
- last-checkpoint/model-00003-of-00003.safetensors +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +108 -2
last-checkpoint/global_step558/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48f47872b153568880f63e929f3bdd430ab3ca165a871dd7f35283aa5d93a46a
|
3 |
+
size 14483467880
|
last-checkpoint/global_step558/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31af3feb2ec011fbc257818fdd66bf54c64e3e6ec1df17f7899a6b1810530e7f
|
3 |
+
size 14483467880
|
last-checkpoint/global_step558/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69abf6db88945f5bb6be0b9788b523a8a5a12986dbdd173ee2aa9ffbf50dd455
|
3 |
+
size 14483467880
|
last-checkpoint/global_step558/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5083abeebe436b485703d56249238c09c2540c14bc747f5a94d83da7bb496bb7
|
3 |
+
size 14483467880
|
last-checkpoint/global_step558/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d3c39cc7165a6ee3bd278e657b74091c7d7445454546c0632393fe1b8f5dbe7
|
3 |
+
size 150629
|
last-checkpoint/global_step558/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:246a94e167835a45d3933514047a1ec029f5a0b7f89c6dee634f7d034f972677
|
3 |
+
size 150629
|
last-checkpoint/global_step558/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7470e6434a5c8e46bb43a523a725387c3308156d296ee1210e546cad75ca81e
|
3 |
+
size 150629
|
last-checkpoint/global_step558/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12d186b915651468c281bfc724da55a5e8e424664df1f100081a2cdc05745ae4
|
3 |
+
size 150629
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step558
|
last-checkpoint/model-00001-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4943162336
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c6a528fcebfa81ad94dc98b813bc2eaf50e2093983c66f1cf062eee248c9ce3
|
3 |
size 4943162336
|
last-checkpoint/model-00002-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999819336
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87205acf168a99a505e46e06b76a61a6a87e6e70876881ff030e4dad2cd7aa43
|
3 |
size 4999819336
|
last-checkpoint/model-00003-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4540516344
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c09c12a0ba4fd95fb32e1df06312c869712e92aa026283345f20f3f5ad8b86a
|
3 |
size 4540516344
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb3d4793d6c7fda650513b6f3d24fe7afd643475a576b0104a85cb659ed441d3
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e44567105884943a8351ea71e9a71011cceee34a8f2a067be69948ea21390f49
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c3a6f11c1c82a313f717b58d29d20267d0bfc621c79116ac6f752e0c1ba1f50
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aaa97839e10563397740560600a86ccaf5a6fe1e5f41084453cab0f732a05570
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41569355a67e5d54cd2e41fbdb883692602ceaf27587e7a1c779dc0f9f2d51fd
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 1.5872,
|
5 |
"eval_steps": 62,
|
6 |
-
"global_step": 496,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -885,6 +885,112 @@
|
|
885 |
"eval_samples_per_second": 5.286,
|
886 |
"eval_steps_per_second": 0.344,
|
887 |
"step": 496
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
888 |
}
|
889 |
],
|
890 |
"logging_steps": 10,
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 1.7856,
|
5 |
"eval_steps": 62,
|
6 |
+
"global_step": 558,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
885 |
"eval_samples_per_second": 5.286,
|
886 |
"eval_steps_per_second": 0.344,
|
887 |
"step": 496
|
888 |
+
},
|
889 |
+
{
|
890 |
+
"epoch": 1.6,
|
891 |
+
"grad_norm": 33.14482905038865,
|
892 |
+
"learning_rate": 2.589073634204275e-07,
|
893 |
+
"logits/generated": -2.348078727722168,
|
894 |
+
"logits/real": -2.3059887886047363,
|
895 |
+
"logps/generated": -123.2630615234375,
|
896 |
+
"logps/real": -101.59033966064453,
|
897 |
+
"loss": 0.3313,
|
898 |
+
"rewards/accuracies": 0.987500011920929,
|
899 |
+
"rewards/generated": -0.09043073654174805,
|
900 |
+
"rewards/margins": 3.036623477935791,
|
901 |
+
"rewards/real": 2.946192502975464,
|
902 |
+
"step": 500
|
903 |
+
},
|
904 |
+
{
|
905 |
+
"epoch": 1.6320000000000001,
|
906 |
+
"grad_norm": 58.37181281947162,
|
907 |
+
"learning_rate": 2.529691211401425e-07,
|
908 |
+
"logits/generated": -2.3784213066101074,
|
909 |
+
"logits/real": -2.445460557937622,
|
910 |
+
"logps/generated": -137.46278381347656,
|
911 |
+
"logps/real": -98.52521514892578,
|
912 |
+
"loss": 0.3326,
|
913 |
+
"rewards/accuracies": 0.887499988079071,
|
914 |
+
"rewards/generated": -0.19049878418445587,
|
915 |
+
"rewards/margins": 3.1443653106689453,
|
916 |
+
"rewards/real": 2.953866958618164,
|
917 |
+
"step": 510
|
918 |
+
},
|
919 |
+
{
|
920 |
+
"epoch": 1.6640000000000001,
|
921 |
+
"grad_norm": 51.7755109683276,
|
922 |
+
"learning_rate": 2.4703087885985747e-07,
|
923 |
+
"logits/generated": -2.6047139167785645,
|
924 |
+
"logits/real": -2.575225353240967,
|
925 |
+
"logps/generated": -125.86954498291016,
|
926 |
+
"logps/real": -115.58686828613281,
|
927 |
+
"loss": 0.3731,
|
928 |
+
"rewards/accuracies": 0.9125000238418579,
|
929 |
+
"rewards/generated": 0.010144609026610851,
|
930 |
+
"rewards/margins": 2.9819352626800537,
|
931 |
+
"rewards/real": 2.9920802116394043,
|
932 |
+
"step": 520
|
933 |
+
},
|
934 |
+
{
|
935 |
+
"epoch": 1.696,
|
936 |
+
"grad_norm": 61.11300533777711,
|
937 |
+
"learning_rate": 2.410926365795724e-07,
|
938 |
+
"logits/generated": -2.598510503768921,
|
939 |
+
"logits/real": -2.6134636402130127,
|
940 |
+
"logps/generated": -130.40304565429688,
|
941 |
+
"logps/real": -119.8432846069336,
|
942 |
+
"loss": 0.4011,
|
943 |
+
"rewards/accuracies": 0.925000011920929,
|
944 |
+
"rewards/generated": 0.22392193973064423,
|
945 |
+
"rewards/margins": 3.1454458236694336,
|
946 |
+
"rewards/real": 3.3693675994873047,
|
947 |
+
"step": 530
|
948 |
+
},
|
949 |
+
{
|
950 |
+
"epoch": 1.728,
|
951 |
+
"grad_norm": 52.94216878715562,
|
952 |
+
"learning_rate": 2.351543942992874e-07,
|
953 |
+
"logits/generated": -2.54017972946167,
|
954 |
+
"logits/real": -2.611607074737549,
|
955 |
+
"logps/generated": -123.71136474609375,
|
956 |
+
"logps/real": -117.9095687866211,
|
957 |
+
"loss": 0.3699,
|
958 |
+
"rewards/accuracies": 0.925000011920929,
|
959 |
+
"rewards/generated": 0.34511905908584595,
|
960 |
+
"rewards/margins": 2.8268630504608154,
|
961 |
+
"rewards/real": 3.1719822883605957,
|
962 |
+
"step": 540
|
963 |
+
},
|
964 |
+
{
|
965 |
+
"epoch": 1.76,
|
966 |
+
"grad_norm": 34.291195649117704,
|
967 |
+
"learning_rate": 2.2921615201900234e-07,
|
968 |
+
"logits/generated": -2.530885696411133,
|
969 |
+
"logits/real": -2.5769619941711426,
|
970 |
+
"logps/generated": -129.57070922851562,
|
971 |
+
"logps/real": -107.8799057006836,
|
972 |
+
"loss": 0.3611,
|
973 |
+
"rewards/accuracies": 0.9624999761581421,
|
974 |
+
"rewards/generated": 0.188289612531662,
|
975 |
+
"rewards/margins": 3.124110460281372,
|
976 |
+
"rewards/real": 3.3124001026153564,
|
977 |
+
"step": 550
|
978 |
+
},
|
979 |
+
{
|
980 |
+
"epoch": 1.7856,
|
981 |
+
"eval_logits/generated": -2.432302951812744,
|
982 |
+
"eval_logits/real": -2.436417818069458,
|
983 |
+
"eval_logps/generated": -104.27023315429688,
|
984 |
+
"eval_logps/real": -115.58291625976562,
|
985 |
+
"eval_loss": 0.7119041681289673,
|
986 |
+
"eval_rewards/accuracies": 0.6730769276618958,
|
987 |
+
"eval_rewards/generated": 1.704530119895935,
|
988 |
+
"eval_rewards/margins": 0.6285931468009949,
|
989 |
+
"eval_rewards/real": 2.333123207092285,
|
990 |
+
"eval_runtime": 37.2029,
|
991 |
+
"eval_samples_per_second": 5.376,
|
992 |
+
"eval_steps_per_second": 0.349,
|
993 |
+
"step": 558
|
994 |
}
|
995 |
],
|
996 |
"logging_steps": 10,
|