nicolasdupuisroy
commited on
Commit
•
f1f012a
1
Parent(s):
175a421
End of training
Browse files- README.md +2 -0
- all_results.json +10 -10
- eval_results.json +6 -6
- runs/Jan17_19-49-28_d06676088071/events.out.tfevents.1705521910.d06676088071.25430.1 +3 -0
- train_results.json +5 -5
- trainer_state.json +280 -7
README.md
CHANGED
@@ -2,6 +2,8 @@
|
|
2 |
license: apache-2.0
|
3 |
base_model: google/vit-base-patch16-224-in21k
|
4 |
tags:
|
|
|
|
|
5 |
- generated_from_trainer
|
6 |
datasets:
|
7 |
- imagefolder
|
|
|
2 |
license: apache-2.0
|
3 |
base_model: google/vit-base-patch16-224-in21k
|
4 |
tags:
|
5 |
+
- image-classification
|
6 |
+
- vision
|
7 |
- generated_from_trainer
|
8 |
datasets:
|
9 |
- imagefolder
|
all_results.json
CHANGED
@@ -1,12 +1,12 @@
|
|
1 |
{
|
2 |
-
"epoch":
|
3 |
-
"eval_accuracy": 0.
|
4 |
-
"eval_loss": 2.
|
5 |
-
"eval_runtime": 2.
|
6 |
-
"eval_samples_per_second":
|
7 |
-
"eval_steps_per_second": 0.
|
8 |
-
"train_loss":
|
9 |
-
"train_runtime":
|
10 |
-
"train_samples_per_second":
|
11 |
-
"train_steps_per_second": 0.
|
12 |
}
|
|
|
1 |
{
|
2 |
+
"epoch": 120.0,
|
3 |
+
"eval_accuracy": 0.5846153846153846,
|
4 |
+
"eval_loss": 2.5402629375457764,
|
5 |
+
"eval_runtime": 2.5184,
|
6 |
+
"eval_samples_per_second": 51.619,
|
7 |
+
"eval_steps_per_second": 0.794,
|
8 |
+
"train_loss": 0.3072653747740246,
|
9 |
+
"train_runtime": 892.0889,
|
10 |
+
"train_samples_per_second": 69.948,
|
11 |
+
"train_steps_per_second": 0.942
|
12 |
}
|
eval_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
-
"epoch":
|
3 |
-
"eval_accuracy": 0.
|
4 |
-
"eval_loss": 2.
|
5 |
-
"eval_runtime": 2.
|
6 |
-
"eval_samples_per_second":
|
7 |
-
"eval_steps_per_second": 0.
|
8 |
}
|
|
|
1 |
{
|
2 |
+
"epoch": 120.0,
|
3 |
+
"eval_accuracy": 0.5846153846153846,
|
4 |
+
"eval_loss": 2.5402629375457764,
|
5 |
+
"eval_runtime": 2.5184,
|
6 |
+
"eval_samples_per_second": 51.619,
|
7 |
+
"eval_steps_per_second": 0.794
|
8 |
}
|
runs/Jan17_19-49-28_d06676088071/events.out.tfevents.1705521910.d06676088071.25430.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8e1b9986a9eded89b9fae2faf40d5fd9e7da1fb8a2921cc370881f18a4eb1f4
|
3 |
+
size 411
|
train_results.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
-
"epoch":
|
3 |
-
"train_loss":
|
4 |
-
"train_runtime":
|
5 |
-
"train_samples_per_second":
|
6 |
-
"train_steps_per_second": 0.
|
7 |
}
|
|
|
1 |
{
|
2 |
+
"epoch": 120.0,
|
3 |
+
"train_loss": 0.3072653747740246,
|
4 |
+
"train_runtime": 892.0889,
|
5 |
+
"train_samples_per_second": 69.948,
|
6 |
+
"train_steps_per_second": 0.942
|
7 |
}
|
trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
-
"best_metric": 2.
|
3 |
-
"best_model_checkpoint": "./drive/MyDrive/repositories/torch_example_image-classification/outputs_letter3/checkpoint-
|
4 |
-
"epoch":
|
5 |
"eval_steps": 500,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -1336,14 +1336,287 @@
|
|
1336 |
"train_runtime": 4344.3701,
|
1337 |
"train_samples_per_second": 11.97,
|
1338 |
"train_steps_per_second": 0.161
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1339 |
}
|
1340 |
],
|
1341 |
"logging_steps": 10,
|
1342 |
-
"max_steps":
|
1343 |
"num_input_tokens_seen": 0,
|
1344 |
-
"num_train_epochs":
|
1345 |
"save_steps": 500,
|
1346 |
-
"total_flos": 4.
|
1347 |
"train_batch_size": 80,
|
1348 |
"trial_name": null,
|
1349 |
"trial_params": null
|
|
|
1 |
{
|
2 |
+
"best_metric": 2.5402629375457764,
|
3 |
+
"best_model_checkpoint": "./drive/MyDrive/repositories/torch_example_image-classification/outputs_letter3/checkpoint-840",
|
4 |
+
"epoch": 120.0,
|
5 |
"eval_steps": 500,
|
6 |
+
"global_step": 840,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
1336 |
"train_runtime": 4344.3701,
|
1337 |
"train_samples_per_second": 11.97,
|
1338 |
"train_steps_per_second": 0.161
|
1339 |
+
},
|
1340 |
+
{
|
1341 |
+
"epoch": 101.0,
|
1342 |
+
"eval_accuracy": 0.5153846153846153,
|
1343 |
+
"eval_loss": 2.84305477142334,
|
1344 |
+
"eval_runtime": 2.1617,
|
1345 |
+
"eval_samples_per_second": 60.137,
|
1346 |
+
"eval_steps_per_second": 0.925,
|
1347 |
+
"step": 707
|
1348 |
+
},
|
1349 |
+
{
|
1350 |
+
"epoch": 101.43,
|
1351 |
+
"learning_rate": 1.9761904761904763e-05,
|
1352 |
+
"loss": 2.067,
|
1353 |
+
"step": 710
|
1354 |
+
},
|
1355 |
+
{
|
1356 |
+
"epoch": 102.0,
|
1357 |
+
"eval_accuracy": 0.5,
|
1358 |
+
"eval_loss": 2.8063366413116455,
|
1359 |
+
"eval_runtime": 2.1563,
|
1360 |
+
"eval_samples_per_second": 60.288,
|
1361 |
+
"eval_steps_per_second": 0.928,
|
1362 |
+
"step": 714
|
1363 |
+
},
|
1364 |
+
{
|
1365 |
+
"epoch": 102.86,
|
1366 |
+
"learning_rate": 1.9523809523809524e-05,
|
1367 |
+
"loss": 2.0234,
|
1368 |
+
"step": 720
|
1369 |
+
},
|
1370 |
+
{
|
1371 |
+
"epoch": 103.0,
|
1372 |
+
"eval_accuracy": 0.5230769230769231,
|
1373 |
+
"eval_loss": 2.7845773696899414,
|
1374 |
+
"eval_runtime": 2.1676,
|
1375 |
+
"eval_samples_per_second": 59.974,
|
1376 |
+
"eval_steps_per_second": 0.923,
|
1377 |
+
"step": 721
|
1378 |
+
},
|
1379 |
+
{
|
1380 |
+
"epoch": 104.0,
|
1381 |
+
"eval_accuracy": 0.5307692307692308,
|
1382 |
+
"eval_loss": 2.762021541595459,
|
1383 |
+
"eval_runtime": 2.2767,
|
1384 |
+
"eval_samples_per_second": 57.1,
|
1385 |
+
"eval_steps_per_second": 0.878,
|
1386 |
+
"step": 728
|
1387 |
+
},
|
1388 |
+
{
|
1389 |
+
"epoch": 104.29,
|
1390 |
+
"learning_rate": 1.928571428571429e-05,
|
1391 |
+
"loss": 1.9979,
|
1392 |
+
"step": 730
|
1393 |
+
},
|
1394 |
+
{
|
1395 |
+
"epoch": 105.0,
|
1396 |
+
"eval_accuracy": 0.5538461538461539,
|
1397 |
+
"eval_loss": 2.7421603202819824,
|
1398 |
+
"eval_runtime": 2.2859,
|
1399 |
+
"eval_samples_per_second": 56.871,
|
1400 |
+
"eval_steps_per_second": 0.875,
|
1401 |
+
"step": 735
|
1402 |
+
},
|
1403 |
+
{
|
1404 |
+
"epoch": 105.71,
|
1405 |
+
"learning_rate": 1.904761904761905e-05,
|
1406 |
+
"loss": 1.9515,
|
1407 |
+
"step": 740
|
1408 |
+
},
|
1409 |
+
{
|
1410 |
+
"epoch": 106.0,
|
1411 |
+
"eval_accuracy": 0.5615384615384615,
|
1412 |
+
"eval_loss": 2.722872734069824,
|
1413 |
+
"eval_runtime": 2.3487,
|
1414 |
+
"eval_samples_per_second": 55.35,
|
1415 |
+
"eval_steps_per_second": 0.852,
|
1416 |
+
"step": 742
|
1417 |
+
},
|
1418 |
+
{
|
1419 |
+
"epoch": 107.0,
|
1420 |
+
"eval_accuracy": 0.5384615384615384,
|
1421 |
+
"eval_loss": 2.7145817279815674,
|
1422 |
+
"eval_runtime": 2.3976,
|
1423 |
+
"eval_samples_per_second": 54.221,
|
1424 |
+
"eval_steps_per_second": 0.834,
|
1425 |
+
"step": 749
|
1426 |
+
},
|
1427 |
+
{
|
1428 |
+
"epoch": 107.14,
|
1429 |
+
"learning_rate": 1.880952380952381e-05,
|
1430 |
+
"loss": 1.9095,
|
1431 |
+
"step": 750
|
1432 |
+
},
|
1433 |
+
{
|
1434 |
+
"epoch": 108.0,
|
1435 |
+
"eval_accuracy": 0.5538461538461539,
|
1436 |
+
"eval_loss": 2.6905264854431152,
|
1437 |
+
"eval_runtime": 2.3887,
|
1438 |
+
"eval_samples_per_second": 54.422,
|
1439 |
+
"eval_steps_per_second": 0.837,
|
1440 |
+
"step": 756
|
1441 |
+
},
|
1442 |
+
{
|
1443 |
+
"epoch": 108.57,
|
1444 |
+
"learning_rate": 1.8571428571428575e-05,
|
1445 |
+
"loss": 1.8759,
|
1446 |
+
"step": 760
|
1447 |
+
},
|
1448 |
+
{
|
1449 |
+
"epoch": 109.0,
|
1450 |
+
"eval_accuracy": 0.5538461538461539,
|
1451 |
+
"eval_loss": 2.6840174198150635,
|
1452 |
+
"eval_runtime": 2.369,
|
1453 |
+
"eval_samples_per_second": 54.876,
|
1454 |
+
"eval_steps_per_second": 0.844,
|
1455 |
+
"step": 763
|
1456 |
+
},
|
1457 |
+
{
|
1458 |
+
"epoch": 110.0,
|
1459 |
+
"learning_rate": 1.8333333333333333e-05,
|
1460 |
+
"loss": 1.8561,
|
1461 |
+
"step": 770
|
1462 |
+
},
|
1463 |
+
{
|
1464 |
+
"epoch": 110.0,
|
1465 |
+
"eval_accuracy": 0.5461538461538461,
|
1466 |
+
"eval_loss": 2.6554973125457764,
|
1467 |
+
"eval_runtime": 2.3964,
|
1468 |
+
"eval_samples_per_second": 54.248,
|
1469 |
+
"eval_steps_per_second": 0.835,
|
1470 |
+
"step": 770
|
1471 |
+
},
|
1472 |
+
{
|
1473 |
+
"epoch": 111.0,
|
1474 |
+
"eval_accuracy": 0.5692307692307692,
|
1475 |
+
"eval_loss": 2.6465163230895996,
|
1476 |
+
"eval_runtime": 2.5418,
|
1477 |
+
"eval_samples_per_second": 51.146,
|
1478 |
+
"eval_steps_per_second": 0.787,
|
1479 |
+
"step": 777
|
1480 |
+
},
|
1481 |
+
{
|
1482 |
+
"epoch": 111.43,
|
1483 |
+
"learning_rate": 1.8095238095238097e-05,
|
1484 |
+
"loss": 1.8147,
|
1485 |
+
"step": 780
|
1486 |
+
},
|
1487 |
+
{
|
1488 |
+
"epoch": 112.0,
|
1489 |
+
"eval_accuracy": 0.5384615384615384,
|
1490 |
+
"eval_loss": 2.6321260929107666,
|
1491 |
+
"eval_runtime": 2.6607,
|
1492 |
+
"eval_samples_per_second": 48.859,
|
1493 |
+
"eval_steps_per_second": 0.752,
|
1494 |
+
"step": 784
|
1495 |
+
},
|
1496 |
+
{
|
1497 |
+
"epoch": 112.86,
|
1498 |
+
"learning_rate": 1.785714285714286e-05,
|
1499 |
+
"loss": 1.799,
|
1500 |
+
"step": 790
|
1501 |
+
},
|
1502 |
+
{
|
1503 |
+
"epoch": 113.0,
|
1504 |
+
"eval_accuracy": 0.5384615384615384,
|
1505 |
+
"eval_loss": 2.6352975368499756,
|
1506 |
+
"eval_runtime": 2.3449,
|
1507 |
+
"eval_samples_per_second": 55.439,
|
1508 |
+
"eval_steps_per_second": 0.853,
|
1509 |
+
"step": 791
|
1510 |
+
},
|
1511 |
+
{
|
1512 |
+
"epoch": 114.0,
|
1513 |
+
"eval_accuracy": 0.5461538461538461,
|
1514 |
+
"eval_loss": 2.6188342571258545,
|
1515 |
+
"eval_runtime": 2.5585,
|
1516 |
+
"eval_samples_per_second": 50.811,
|
1517 |
+
"eval_steps_per_second": 0.782,
|
1518 |
+
"step": 798
|
1519 |
+
},
|
1520 |
+
{
|
1521 |
+
"epoch": 114.29,
|
1522 |
+
"learning_rate": 1.761904761904762e-05,
|
1523 |
+
"loss": 1.7536,
|
1524 |
+
"step": 800
|
1525 |
+
},
|
1526 |
+
{
|
1527 |
+
"epoch": 115.0,
|
1528 |
+
"eval_accuracy": 0.5461538461538461,
|
1529 |
+
"eval_loss": 2.6063857078552246,
|
1530 |
+
"eval_runtime": 2.5441,
|
1531 |
+
"eval_samples_per_second": 51.098,
|
1532 |
+
"eval_steps_per_second": 0.786,
|
1533 |
+
"step": 805
|
1534 |
+
},
|
1535 |
+
{
|
1536 |
+
"epoch": 115.71,
|
1537 |
+
"learning_rate": 1.7380952380952384e-05,
|
1538 |
+
"loss": 1.7162,
|
1539 |
+
"step": 810
|
1540 |
+
},
|
1541 |
+
{
|
1542 |
+
"epoch": 116.0,
|
1543 |
+
"eval_accuracy": 0.5538461538461539,
|
1544 |
+
"eval_loss": 2.591280937194824,
|
1545 |
+
"eval_runtime": 2.5836,
|
1546 |
+
"eval_samples_per_second": 50.316,
|
1547 |
+
"eval_steps_per_second": 0.774,
|
1548 |
+
"step": 812
|
1549 |
+
},
|
1550 |
+
{
|
1551 |
+
"epoch": 117.0,
|
1552 |
+
"eval_accuracy": 0.5923076923076923,
|
1553 |
+
"eval_loss": 2.5749051570892334,
|
1554 |
+
"eval_runtime": 2.5441,
|
1555 |
+
"eval_samples_per_second": 51.099,
|
1556 |
+
"eval_steps_per_second": 0.786,
|
1557 |
+
"step": 819
|
1558 |
+
},
|
1559 |
+
{
|
1560 |
+
"epoch": 117.14,
|
1561 |
+
"learning_rate": 1.7142857142857142e-05,
|
1562 |
+
"loss": 1.7225,
|
1563 |
+
"step": 820
|
1564 |
+
},
|
1565 |
+
{
|
1566 |
+
"epoch": 118.0,
|
1567 |
+
"eval_accuracy": 0.5846153846153846,
|
1568 |
+
"eval_loss": 2.563140869140625,
|
1569 |
+
"eval_runtime": 2.6117,
|
1570 |
+
"eval_samples_per_second": 49.777,
|
1571 |
+
"eval_steps_per_second": 0.766,
|
1572 |
+
"step": 826
|
1573 |
+
},
|
1574 |
+
{
|
1575 |
+
"epoch": 118.57,
|
1576 |
+
"learning_rate": 1.6904761904761906e-05,
|
1577 |
+
"loss": 1.6841,
|
1578 |
+
"step": 830
|
1579 |
+
},
|
1580 |
+
{
|
1581 |
+
"epoch": 119.0,
|
1582 |
+
"eval_accuracy": 0.5923076923076923,
|
1583 |
+
"eval_loss": 2.547883987426758,
|
1584 |
+
"eval_runtime": 2.5689,
|
1585 |
+
"eval_samples_per_second": 50.605,
|
1586 |
+
"eval_steps_per_second": 0.779,
|
1587 |
+
"step": 833
|
1588 |
+
},
|
1589 |
+
{
|
1590 |
+
"epoch": 120.0,
|
1591 |
+
"learning_rate": 1.6666666666666667e-05,
|
1592 |
+
"loss": 1.6388,
|
1593 |
+
"step": 840
|
1594 |
+
},
|
1595 |
+
{
|
1596 |
+
"epoch": 120.0,
|
1597 |
+
"eval_accuracy": 0.5846153846153846,
|
1598 |
+
"eval_loss": 2.5402629375457764,
|
1599 |
+
"eval_runtime": 2.4843,
|
1600 |
+
"eval_samples_per_second": 52.328,
|
1601 |
+
"eval_steps_per_second": 0.805,
|
1602 |
+
"step": 840
|
1603 |
+
},
|
1604 |
+
{
|
1605 |
+
"epoch": 120.0,
|
1606 |
+
"step": 840,
|
1607 |
+
"total_flos": 4.837667104869581e+18,
|
1608 |
+
"train_loss": 0.3072653747740246,
|
1609 |
+
"train_runtime": 892.0889,
|
1610 |
+
"train_samples_per_second": 69.948,
|
1611 |
+
"train_steps_per_second": 0.942
|
1612 |
}
|
1613 |
],
|
1614 |
"logging_steps": 10,
|
1615 |
+
"max_steps": 840,
|
1616 |
"num_input_tokens_seen": 0,
|
1617 |
+
"num_train_epochs": 120,
|
1618 |
"save_steps": 500,
|
1619 |
+
"total_flos": 4.837667104869581e+18,
|
1620 |
"train_batch_size": 80,
|
1621 |
"trial_name": null,
|
1622 |
"trial_params": null
|