AmberYifan commited on
Commit
8d50dc9
1 Parent(s): b51bed0

Training in progress, step 620, checkpoint

Browse files
last-checkpoint/global_step620/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e3d89c95f89e37f37a87b8e0d63cd51f8eeb84490d139724c37038dafc9c203
3
+ size 14483467880
last-checkpoint/global_step620/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e1a351165427eee6ccf8fb35b75b1c2fa9eeffcf04caa9a69ac29237ad504ce
3
+ size 14483467880
last-checkpoint/global_step620/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f66ebabfdb278389ef82f3a6f5a8a735d49f9fdca8e6e092c4ec0268834a0bb
3
+ size 14483467880
last-checkpoint/global_step620/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fe93e20eaf14ebf1c121193ab084652ac50265019dd4edcfea5758f0b5da0bb
3
+ size 14483467880
last-checkpoint/global_step620/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:353189acafcf58d5522234859c339a3ad63dfa657023ee5b281282dde523627b
3
+ size 150629
last-checkpoint/global_step620/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b4fe5daad0262291e805a44bf4b497bf7ed953be022e301762905bce089f127
3
+ size 150629
last-checkpoint/global_step620/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:faed547d8f0a20c92d47f05e5fc5be1f95b522a0e4134205ef062d68da5f1c17
3
+ size 150629
last-checkpoint/global_step620/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e6ce5170fce92ddc28458c28e80546ad5fc11d1afa4dce327a0105ded5be944
3
+ size 150629
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step558
 
1
+ global_step620
last-checkpoint/model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1c6a528fcebfa81ad94dc98b813bc2eaf50e2093983c66f1cf062eee248c9ce3
3
  size 4943162336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93daaec3380eb160ed1b2b55d7e6a40b3148f5806a93acda8285c13c6ed11ec4
3
  size 4943162336
last-checkpoint/model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87205acf168a99a505e46e06b76a61a6a87e6e70876881ff030e4dad2cd7aa43
3
  size 4999819336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d99f0e63f5427ff1eb28a5e26e8a6cb5f108907e9ec53956cf11addbcacf1c34
3
  size 4999819336
last-checkpoint/model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c09c12a0ba4fd95fb32e1df06312c869712e92aa026283345f20f3f5ad8b86a
3
  size 4540516344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dd3351df120c66885127c540da0c2667724cb06d47ddfb327a851ef7dace34c
3
  size 4540516344
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb3d4793d6c7fda650513b6f3d24fe7afd643475a576b0104a85cb659ed441d3
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3ea85ce0faf4f25f8f01506659575c6ffa73d2668e6dcf972bea416c2f14cf7
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e44567105884943a8351ea71e9a71011cceee34a8f2a067be69948ea21390f49
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6df02d244f55294fc3a1bed06a850d7dc043249b3e97a2a1f72408d7e378d44b
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8c3a6f11c1c82a313f717b58d29d20267d0bfc621c79116ac6f752e0c1ba1f50
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbafb0c52cec706b84eb0e477953ab4950ffc8e931e49bbc7a37cd7d5d929a69
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aaa97839e10563397740560600a86ccaf5a6fe1e5f41084453cab0f732a05570
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:007e6b920b3c7dfd19dd00d30bc01c0cd1682b25270dc31952d9b737d039f1d1
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:41569355a67e5d54cd2e41fbdb883692602ceaf27587e7a1c779dc0f9f2d51fd
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44a438c4653759e5a86be993ca4420444015d4e70859f1f853dd1fc989248fda
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.7856,
5
  "eval_steps": 62,
6
- "global_step": 558,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -991,6 +991,127 @@
991
  "eval_samples_per_second": 5.376,
992
  "eval_steps_per_second": 0.349,
993
  "step": 558
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
994
  }
995
  ],
996
  "logging_steps": 10,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.984,
5
  "eval_steps": 62,
6
+ "global_step": 620,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
991
  "eval_samples_per_second": 5.376,
992
  "eval_steps_per_second": 0.349,
993
  "step": 558
994
+ },
995
+ {
996
+ "epoch": 1.792,
997
+ "grad_norm": 36.45272717171445,
998
+ "learning_rate": 2.2327790973871732e-07,
999
+ "logits/generated": -2.4495067596435547,
1000
+ "logits/real": -2.4794678688049316,
1001
+ "logps/generated": -132.83074951171875,
1002
+ "logps/real": -119.1983413696289,
1003
+ "loss": 0.3839,
1004
+ "rewards/accuracies": 0.8999999761581421,
1005
+ "rewards/generated": 0.6143507957458496,
1006
+ "rewards/margins": 2.7835047245025635,
1007
+ "rewards/real": 3.397855281829834,
1008
+ "step": 560
1009
+ },
1010
+ {
1011
+ "epoch": 1.8239999999999998,
1012
+ "grad_norm": 47.41784238396275,
1013
+ "learning_rate": 2.173396674584323e-07,
1014
+ "logits/generated": -2.371821641921997,
1015
+ "logits/real": -2.4102165699005127,
1016
+ "logps/generated": -118.35310363769531,
1017
+ "logps/real": -104.9133529663086,
1018
+ "loss": 0.3493,
1019
+ "rewards/accuracies": 0.925000011920929,
1020
+ "rewards/generated": 0.35018137097358704,
1021
+ "rewards/margins": 2.667248487472534,
1022
+ "rewards/real": 3.017429828643799,
1023
+ "step": 570
1024
+ },
1025
+ {
1026
+ "epoch": 1.8559999999999999,
1027
+ "grad_norm": 49.63769156744519,
1028
+ "learning_rate": 2.1140142517814726e-07,
1029
+ "logits/generated": -2.4235947132110596,
1030
+ "logits/real": -2.425346851348877,
1031
+ "logps/generated": -111.2136001586914,
1032
+ "logps/real": -107.47050476074219,
1033
+ "loss": 0.3654,
1034
+ "rewards/accuracies": 0.9125000238418579,
1035
+ "rewards/generated": 0.31659263372421265,
1036
+ "rewards/margins": 2.903308153152466,
1037
+ "rewards/real": 3.219900608062744,
1038
+ "step": 580
1039
+ },
1040
+ {
1041
+ "epoch": 1.888,
1042
+ "grad_norm": 58.661910753155134,
1043
+ "learning_rate": 2.0546318289786222e-07,
1044
+ "logits/generated": -2.431994676589966,
1045
+ "logits/real": -2.488813638687134,
1046
+ "logps/generated": -129.04559326171875,
1047
+ "logps/real": -119.28230285644531,
1048
+ "loss": 0.4107,
1049
+ "rewards/accuracies": 0.9125000238418579,
1050
+ "rewards/generated": 0.3402375876903534,
1051
+ "rewards/margins": 2.8488047122955322,
1052
+ "rewards/real": 3.189042091369629,
1053
+ "step": 590
1054
+ },
1055
+ {
1056
+ "epoch": 1.92,
1057
+ "grad_norm": 21.619481492021077,
1058
+ "learning_rate": 1.9952494061757718e-07,
1059
+ "logits/generated": -2.436246871948242,
1060
+ "logits/real": -2.466956377029419,
1061
+ "logps/generated": -116.15250396728516,
1062
+ "logps/real": -107.74141693115234,
1063
+ "loss": 0.4577,
1064
+ "rewards/accuracies": 0.8999999761581421,
1065
+ "rewards/generated": 0.5984365344047546,
1066
+ "rewards/margins": 2.591343641281128,
1067
+ "rewards/real": 3.1897804737091064,
1068
+ "step": 600
1069
+ },
1070
+ {
1071
+ "epoch": 1.952,
1072
+ "grad_norm": 45.346853109328364,
1073
+ "learning_rate": 1.9358669833729216e-07,
1074
+ "logits/generated": -2.4542717933654785,
1075
+ "logits/real": -2.4808132648468018,
1076
+ "logps/generated": -101.80671691894531,
1077
+ "logps/real": -96.19842529296875,
1078
+ "loss": 0.4562,
1079
+ "rewards/accuracies": 0.8999999761581421,
1080
+ "rewards/generated": 0.5814850330352783,
1081
+ "rewards/margins": 2.2760722637176514,
1082
+ "rewards/real": 2.8575568199157715,
1083
+ "step": 610
1084
+ },
1085
+ {
1086
+ "epoch": 1.984,
1087
+ "grad_norm": 44.76458950174624,
1088
+ "learning_rate": 1.876484560570071e-07,
1089
+ "logits/generated": -2.506688356399536,
1090
+ "logits/real": -2.5051321983337402,
1091
+ "logps/generated": -109.52842712402344,
1092
+ "logps/real": -100.06086730957031,
1093
+ "loss": 0.3933,
1094
+ "rewards/accuracies": 0.949999988079071,
1095
+ "rewards/generated": 0.37385421991348267,
1096
+ "rewards/margins": 2.584712266921997,
1097
+ "rewards/real": 2.958566665649414,
1098
+ "step": 620
1099
+ },
1100
+ {
1101
+ "epoch": 1.984,
1102
+ "eval_logits/generated": -2.432065725326538,
1103
+ "eval_logits/real": -2.426744222640991,
1104
+ "eval_logps/generated": -104.29174041748047,
1105
+ "eval_logps/real": -115.62232971191406,
1106
+ "eval_loss": 0.7168198227882385,
1107
+ "eval_rewards/accuracies": 0.6730769276618958,
1108
+ "eval_rewards/generated": 1.7023800611495972,
1109
+ "eval_rewards/margins": 0.6268020868301392,
1110
+ "eval_rewards/real": 2.3291821479797363,
1111
+ "eval_runtime": 36.5982,
1112
+ "eval_samples_per_second": 5.465,
1113
+ "eval_steps_per_second": 0.355,
1114
+ "step": 620
1115
  }
1116
  ],
1117
  "logging_steps": 10,