Training in progress, step 1250, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/global_step1250/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step1250/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step1250/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step1250/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step1250/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step1250/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step1250/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step1250/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +95 -6
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 18516456
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7be96f406ec55e2af59cd5b109f6e76e8a66fbf4acb9841a45fb6d6c486af7d2
|
3 |
size 18516456
|
last-checkpoint/global_step1250/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26d09c9878e4f364e6befa045ded86fab302872674a59212b06946d48f71a3c3
|
3 |
+
size 27700976
|
last-checkpoint/global_step1250/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:886bc6c03f6cad686e8dd5c787093beeb2bc00a1998bf1af23028d58b438c19f
|
3 |
+
size 27700976
|
last-checkpoint/global_step1250/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47214be91922f9512a7d8629e3d1f57cce2325e145959a01509955e36efeeaf6
|
3 |
+
size 27700976
|
last-checkpoint/global_step1250/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:beb878cc2717bc78d554c6024454aab9d12e9133b4c67d70fb744bfc48093465
|
3 |
+
size 27700976
|
last-checkpoint/global_step1250/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b63ad4dccc38b42d9e0c6d07c7d8b737dfc65e0309919f86bae8e3dcb0bcafc
|
3 |
+
size 411571
|
last-checkpoint/global_step1250/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce32ab81f64451d7ae4cfc34fc23370ba1931f6e3064a5e10d1c060bd513c1a1
|
3 |
+
size 411507
|
last-checkpoint/global_step1250/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5690617325b666134fb4899a7252c0c721cd060c834a7b7ea14b436a5a1513bb
|
3 |
+
size 411507
|
last-checkpoint/global_step1250/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ec5f102391e11f082bf283dfedabe7199e9df698d2f513d3e140cd8748b7627
|
3 |
+
size 411507
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step1250
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15bbef9a4c878a05b4f189e9f77701a153dc9faf093499714094cb36ac0ca030
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a7122760cfda3f3e13eac4f7e56d09b0fd3beac4bd49b2f0e58da9519469ff9
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71edf044d4ea96e62ffecab515d42b58ae56cd64abd0092a897468e0e0d7c10f
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef5ca30351deca9d83675a183b2186ef346093f56e0d5a6dacdf62ef921f12c2
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e821d0d4ad1c6c22d1f5fd3b6821d2a85d44ee21d649d544e34dfcb627d9b580
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "saves/CADICA_qwenvl_stenosis_classily_scale4_frozenVision/lora/sft/checkpoint-
|
4 |
-
"epoch": 0.
|
5 |
"eval_steps": 50,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -2143,11 +2143,100 @@
|
|
2143 |
"eval_steps_per_second": 0.93,
|
2144 |
"num_input_tokens_seen": 14035544,
|
2145 |
"step": 1200
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2146 |
}
|
2147 |
],
|
2148 |
"logging_steps": 5,
|
2149 |
"max_steps": 3400,
|
2150 |
-
"num_input_tokens_seen":
|
2151 |
"num_train_epochs": 2,
|
2152 |
"save_steps": 50,
|
2153 |
"stateful_callbacks": {
|
@@ -2162,7 +2251,7 @@
|
|
2162 |
"attributes": {}
|
2163 |
}
|
2164 |
},
|
2165 |
-
"total_flos":
|
2166 |
"train_batch_size": 1,
|
2167 |
"trial_name": null,
|
2168 |
"trial_params": null
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.7407085299491882,
|
3 |
+
"best_model_checkpoint": "saves/CADICA_qwenvl_stenosis_classily_scale4_frozenVision/lora/sft/checkpoint-1250",
|
4 |
+
"epoch": 0.6438320885912954,
|
5 |
"eval_steps": 50,
|
6 |
+
"global_step": 1250,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
2143 |
"eval_steps_per_second": 0.93,
|
2144 |
"num_input_tokens_seen": 14035544,
|
2145 |
"step": 1200
|
2146 |
+
},
|
2147 |
+
{
|
2148 |
+
"epoch": 0.6206541334020087,
|
2149 |
+
"grad_norm": 1.0526811295206564,
|
2150 |
+
"learning_rate": 7.673382966299163e-05,
|
2151 |
+
"loss": 0.7871,
|
2152 |
+
"num_input_tokens_seen": 14094024,
|
2153 |
+
"step": 1205
|
2154 |
+
},
|
2155 |
+
{
|
2156 |
+
"epoch": 0.623229461756374,
|
2157 |
+
"grad_norm": 1.832697637344859,
|
2158 |
+
"learning_rate": 7.65280325993715e-05,
|
2159 |
+
"loss": 0.7594,
|
2160 |
+
"num_input_tokens_seen": 14152504,
|
2161 |
+
"step": 1210
|
2162 |
+
},
|
2163 |
+
{
|
2164 |
+
"epoch": 0.6258047901107391,
|
2165 |
+
"grad_norm": 1.6875031192331054,
|
2166 |
+
"learning_rate": 7.63216081438678e-05,
|
2167 |
+
"loss": 0.7833,
|
2168 |
+
"num_input_tokens_seen": 14210992,
|
2169 |
+
"step": 1215
|
2170 |
+
},
|
2171 |
+
{
|
2172 |
+
"epoch": 0.6283801184651043,
|
2173 |
+
"grad_norm": 1.867117238207419,
|
2174 |
+
"learning_rate": 7.611456117844934e-05,
|
2175 |
+
"loss": 0.8445,
|
2176 |
+
"num_input_tokens_seen": 14269488,
|
2177 |
+
"step": 1220
|
2178 |
+
},
|
2179 |
+
{
|
2180 |
+
"epoch": 0.6309554468194695,
|
2181 |
+
"grad_norm": 0.9089614634143406,
|
2182 |
+
"learning_rate": 7.59068965998074e-05,
|
2183 |
+
"loss": 0.7857,
|
2184 |
+
"num_input_tokens_seen": 14327968,
|
2185 |
+
"step": 1225
|
2186 |
+
},
|
2187 |
+
{
|
2188 |
+
"epoch": 0.6335307751738347,
|
2189 |
+
"grad_norm": 2.3911537408111214,
|
2190 |
+
"learning_rate": 7.569861931923989e-05,
|
2191 |
+
"loss": 0.8064,
|
2192 |
+
"num_input_tokens_seen": 14386448,
|
2193 |
+
"step": 1230
|
2194 |
+
},
|
2195 |
+
{
|
2196 |
+
"epoch": 0.6361061035281999,
|
2197 |
+
"grad_norm": 1.6500224851295993,
|
2198 |
+
"learning_rate": 7.548973426253521e-05,
|
2199 |
+
"loss": 0.7117,
|
2200 |
+
"num_input_tokens_seen": 14444912,
|
2201 |
+
"step": 1235
|
2202 |
+
},
|
2203 |
+
{
|
2204 |
+
"epoch": 0.638681431882565,
|
2205 |
+
"grad_norm": 1.508924461189316,
|
2206 |
+
"learning_rate": 7.528024636985575e-05,
|
2207 |
+
"loss": 0.7449,
|
2208 |
+
"num_input_tokens_seen": 14503392,
|
2209 |
+
"step": 1240
|
2210 |
+
},
|
2211 |
+
{
|
2212 |
+
"epoch": 0.6412567602369302,
|
2213 |
+
"grad_norm": 1.3801142620835953,
|
2214 |
+
"learning_rate": 7.507016059562107e-05,
|
2215 |
+
"loss": 0.7507,
|
2216 |
+
"num_input_tokens_seen": 14561872,
|
2217 |
+
"step": 1245
|
2218 |
+
},
|
2219 |
+
{
|
2220 |
+
"epoch": 0.6438320885912954,
|
2221 |
+
"grad_norm": 1.2994701535106117,
|
2222 |
+
"learning_rate": 7.485948190839077e-05,
|
2223 |
+
"loss": 0.7917,
|
2224 |
+
"num_input_tokens_seen": 14620336,
|
2225 |
+
"step": 1250
|
2226 |
+
},
|
2227 |
+
{
|
2228 |
+
"epoch": 0.6438320885912954,
|
2229 |
+
"eval_loss": 0.7407085299491882,
|
2230 |
+
"eval_runtime": 16.1168,
|
2231 |
+
"eval_samples_per_second": 3.723,
|
2232 |
+
"eval_steps_per_second": 0.931,
|
2233 |
+
"num_input_tokens_seen": 14620336,
|
2234 |
+
"step": 1250
|
2235 |
}
|
2236 |
],
|
2237 |
"logging_steps": 5,
|
2238 |
"max_steps": 3400,
|
2239 |
+
"num_input_tokens_seen": 14620336,
|
2240 |
"num_train_epochs": 2,
|
2241 |
"save_steps": 50,
|
2242 |
"stateful_callbacks": {
|
|
|
2251 |
"attributes": {}
|
2252 |
}
|
2253 |
},
|
2254 |
+
"total_flos": 820953557762048.0,
|
2255 |
"train_batch_size": 1,
|
2256 |
"trial_name": null,
|
2257 |
"trial_params": null
|