Training in progress, epoch 60, checkpoint
Browse files
last-checkpoint/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 166496880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f383c6a569aa1757f42c068466838ac2ad34601c735c42e76c4b0eccec7ec251
|
3 |
size 166496880
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 330495866
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7985126ab91293b3d360f1dc2d798595b418d44dce13ead2ff7d367e826b6e16
|
3 |
size 330495866
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:521682efd6d19f4a9e6242718069a7e8eb91340f3ce03656684bc97ecd02f9fa
|
3 |
size 14244
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c5b71df2955d83314469d7d171689f62e78d85dd182a8d60c5a5ca2b526ce72
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": 0.28454330563545227,
|
3 |
"best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-28500",
|
4 |
-
"epoch":
|
5 |
"eval_steps": 500,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -8422,6 +8422,151 @@
|
|
8422 |
"eval_samples_per_second": 17.921,
|
8423 |
"eval_steps_per_second": 2.33,
|
8424 |
"step": 29500
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8425 |
}
|
8426 |
],
|
8427 |
"logging_steps": 30,
|
@@ -8436,12 +8581,12 @@
|
|
8436 |
"should_evaluate": false,
|
8437 |
"should_log": false,
|
8438 |
"should_save": true,
|
8439 |
-
"should_training_stop":
|
8440 |
},
|
8441 |
"attributes": {}
|
8442 |
}
|
8443 |
},
|
8444 |
-
"total_flos": 1.
|
8445 |
"train_batch_size": 2,
|
8446 |
"trial_name": null,
|
8447 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": 0.28454330563545227,
|
3 |
"best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-28500",
|
4 |
+
"epoch": 60.0,
|
5 |
"eval_steps": 500,
|
6 |
+
"global_step": 30000,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
8422 |
"eval_samples_per_second": 17.921,
|
8423 |
"eval_steps_per_second": 2.33,
|
8424 |
"step": 29500
|
8425 |
+
},
|
8426 |
+
{
|
8427 |
+
"epoch": 59.04,
|
8428 |
+
"grad_norm": 29.91386604309082,
|
8429 |
+
"learning_rate": 6.315216969912663e-09,
|
8430 |
+
"loss": 0.3851,
|
8431 |
+
"step": 29520
|
8432 |
+
},
|
8433 |
+
{
|
8434 |
+
"epoch": 59.1,
|
8435 |
+
"grad_norm": 505.2102355957031,
|
8436 |
+
"learning_rate": 5.5506251901504825e-09,
|
8437 |
+
"loss": 0.3666,
|
8438 |
+
"step": 29550
|
8439 |
+
},
|
8440 |
+
{
|
8441 |
+
"epoch": 59.16,
|
8442 |
+
"grad_norm": 45.7656135559082,
|
8443 |
+
"learning_rate": 4.835326609376468e-09,
|
8444 |
+
"loss": 0.4178,
|
8445 |
+
"step": 29580
|
8446 |
+
},
|
8447 |
+
{
|
8448 |
+
"epoch": 59.22,
|
8449 |
+
"grad_norm": 56.061153411865234,
|
8450 |
+
"learning_rate": 4.169328287299545e-09,
|
8451 |
+
"loss": 0.4697,
|
8452 |
+
"step": 29610
|
8453 |
+
},
|
8454 |
+
{
|
8455 |
+
"epoch": 59.28,
|
8456 |
+
"grad_norm": 93.67945098876953,
|
8457 |
+
"learning_rate": 3.5526367970539765e-09,
|
8458 |
+
"loss": 0.3581,
|
8459 |
+
"step": 29640
|
8460 |
+
},
|
8461 |
+
{
|
8462 |
+
"epoch": 59.34,
|
8463 |
+
"grad_norm": 56.09961700439453,
|
8464 |
+
"learning_rate": 2.9852582251355124e-09,
|
8465 |
+
"loss": 0.4007,
|
8466 |
+
"step": 29670
|
8467 |
+
},
|
8468 |
+
{
|
8469 |
+
"epoch": 59.4,
|
8470 |
+
"grad_norm": 95.72340393066406,
|
8471 |
+
"learning_rate": 2.4671981713420003e-09,
|
8472 |
+
"loss": 0.4338,
|
8473 |
+
"step": 29700
|
8474 |
+
},
|
8475 |
+
{
|
8476 |
+
"epoch": 59.46,
|
8477 |
+
"grad_norm": 73.806884765625,
|
8478 |
+
"learning_rate": 1.9984617487173174e-09,
|
8479 |
+
"loss": 0.4488,
|
8480 |
+
"step": 29730
|
8481 |
+
},
|
8482 |
+
{
|
8483 |
+
"epoch": 59.52,
|
8484 |
+
"grad_norm": 63.850746154785156,
|
8485 |
+
"learning_rate": 1.5790535835003006e-09,
|
8486 |
+
"loss": 0.4424,
|
8487 |
+
"step": 29760
|
8488 |
+
},
|
8489 |
+
{
|
8490 |
+
"epoch": 59.58,
|
8491 |
+
"grad_norm": 54.269371032714844,
|
8492 |
+
"learning_rate": 1.2089778150797816e-09,
|
8493 |
+
"loss": 0.4145,
|
8494 |
+
"step": 29790
|
8495 |
+
},
|
8496 |
+
{
|
8497 |
+
"epoch": 59.64,
|
8498 |
+
"grad_norm": 45.143714904785156,
|
8499 |
+
"learning_rate": 8.88238095955174e-10,
|
8500 |
+
"loss": 0.4422,
|
8501 |
+
"step": 29820
|
8502 |
+
},
|
8503 |
+
{
|
8504 |
+
"epoch": 59.7,
|
8505 |
+
"grad_norm": 32.879642486572266,
|
8506 |
+
"learning_rate": 6.168375916970615e-10,
|
8507 |
+
"loss": 0.3915,
|
8508 |
+
"step": 29850
|
8509 |
+
},
|
8510 |
+
{
|
8511 |
+
"epoch": 59.76,
|
8512 |
+
"grad_norm": 68.58180236816406,
|
8513 |
+
"learning_rate": 3.9477898091944135e-10,
|
8514 |
+
"loss": 0.423,
|
8515 |
+
"step": 29880
|
8516 |
+
},
|
8517 |
+
{
|
8518 |
+
"epoch": 59.82,
|
8519 |
+
"grad_norm": 57.879634857177734,
|
8520 |
+
"learning_rate": 2.2206445525085886e-10,
|
8521 |
+
"loss": 0.4619,
|
8522 |
+
"step": 29910
|
8523 |
+
},
|
8524 |
+
{
|
8525 |
+
"epoch": 59.88,
|
8526 |
+
"grad_norm": 133.5286102294922,
|
8527 |
+
"learning_rate": 9.869571931442334e-11,
|
8528 |
+
"loss": 0.3987,
|
8529 |
+
"step": 29940
|
8530 |
+
},
|
8531 |
+
{
|
8532 |
+
"epoch": 59.94,
|
8533 |
+
"grad_norm": 63.78921127319336,
|
8534 |
+
"learning_rate": 2.467399070893439e-11,
|
8535 |
+
"loss": 0.3533,
|
8536 |
+
"step": 29970
|
8537 |
+
},
|
8538 |
+
{
|
8539 |
+
"epoch": 60.0,
|
8540 |
+
"grad_norm": 65.49594116210938,
|
8541 |
+
"learning_rate": 0.0,
|
8542 |
+
"loss": 0.4504,
|
8543 |
+
"step": 30000
|
8544 |
+
},
|
8545 |
+
{
|
8546 |
+
"epoch": 60.0,
|
8547 |
+
"eval_loss": 0.28507041931152344,
|
8548 |
+
"eval_map": 0.8003,
|
8549 |
+
"eval_map_50": 0.9645,
|
8550 |
+
"eval_map_75": 0.9196,
|
8551 |
+
"eval_map_chicken": 0.8072,
|
8552 |
+
"eval_map_duck": 0.7689,
|
8553 |
+
"eval_map_large": 0.8772,
|
8554 |
+
"eval_map_medium": 0.7999,
|
8555 |
+
"eval_map_plant": 0.8248,
|
8556 |
+
"eval_map_small": 0.2246,
|
8557 |
+
"eval_mar_1": 0.3086,
|
8558 |
+
"eval_mar_10": 0.8346,
|
8559 |
+
"eval_mar_100": 0.8384,
|
8560 |
+
"eval_mar_100_chicken": 0.8413,
|
8561 |
+
"eval_mar_100_duck": 0.799,
|
8562 |
+
"eval_mar_100_plant": 0.8749,
|
8563 |
+
"eval_mar_large": 0.918,
|
8564 |
+
"eval_mar_medium": 0.8496,
|
8565 |
+
"eval_mar_small": 0.3614,
|
8566 |
+
"eval_runtime": 5.2733,
|
8567 |
+
"eval_samples_per_second": 18.963,
|
8568 |
+
"eval_steps_per_second": 2.465,
|
8569 |
+
"step": 30000
|
8570 |
}
|
8571 |
],
|
8572 |
"logging_steps": 30,
|
|
|
8581 |
"should_evaluate": false,
|
8582 |
"should_log": false,
|
8583 |
"should_save": true,
|
8584 |
+
"should_training_stop": true
|
8585 |
},
|
8586 |
"attributes": {}
|
8587 |
}
|
8588 |
},
|
8589 |
+
"total_flos": 1.0320693387264e+19,
|
8590 |
"train_batch_size": 2,
|
8591 |
"trial_name": null,
|
8592 |
"trial_params": null
|