nicolasdupuisroy commited on
Commit
f1f012a
1 Parent(s): 175a421

End of training

Browse files
README.md CHANGED
@@ -2,6 +2,8 @@
2
  license: apache-2.0
3
  base_model: google/vit-base-patch16-224-in21k
4
  tags:
 
 
5
  - generated_from_trainer
6
  datasets:
7
  - imagefolder
 
2
  license: apache-2.0
3
  base_model: google/vit-base-patch16-224-in21k
4
  tags:
5
+ - image-classification
6
+ - vision
7
  - generated_from_trainer
8
  datasets:
9
  - imagefolder
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 100.0,
3
- "eval_accuracy": 0.5461538461538461,
4
- "eval_loss": 2.859877347946167,
5
- "eval_runtime": 2.5644,
6
- "eval_samples_per_second": 50.694,
7
- "eval_steps_per_second": 0.78,
8
- "train_loss": 2.6316724504743303,
9
- "train_runtime": 4344.3701,
10
- "train_samples_per_second": 11.97,
11
- "train_steps_per_second": 0.161
12
  }
 
1
  {
2
+ "epoch": 120.0,
3
+ "eval_accuracy": 0.5846153846153846,
4
+ "eval_loss": 2.5402629375457764,
5
+ "eval_runtime": 2.5184,
6
+ "eval_samples_per_second": 51.619,
7
+ "eval_steps_per_second": 0.794,
8
+ "train_loss": 0.3072653747740246,
9
+ "train_runtime": 892.0889,
10
+ "train_samples_per_second": 69.948,
11
+ "train_steps_per_second": 0.942
12
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 100.0,
3
- "eval_accuracy": 0.5461538461538461,
4
- "eval_loss": 2.859877347946167,
5
- "eval_runtime": 2.5644,
6
- "eval_samples_per_second": 50.694,
7
- "eval_steps_per_second": 0.78
8
  }
 
1
  {
2
+ "epoch": 120.0,
3
+ "eval_accuracy": 0.5846153846153846,
4
+ "eval_loss": 2.5402629375457764,
5
+ "eval_runtime": 2.5184,
6
+ "eval_samples_per_second": 51.619,
7
+ "eval_steps_per_second": 0.794
8
  }
runs/Jan17_19-49-28_d06676088071/events.out.tfevents.1705521910.d06676088071.25430.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8e1b9986a9eded89b9fae2faf40d5fd9e7da1fb8a2921cc370881f18a4eb1f4
3
+ size 411
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 100.0,
3
- "train_loss": 2.6316724504743303,
4
- "train_runtime": 4344.3701,
5
- "train_samples_per_second": 11.97,
6
- "train_steps_per_second": 0.161
7
  }
 
1
  {
2
+ "epoch": 120.0,
3
+ "train_loss": 0.3072653747740246,
4
+ "train_runtime": 892.0889,
5
+ "train_samples_per_second": 69.948,
6
+ "train_steps_per_second": 0.942
7
  }
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 2.859877347946167,
3
- "best_model_checkpoint": "./drive/MyDrive/repositories/torch_example_image-classification/outputs_letter3/checkpoint-644",
4
- "epoch": 100.0,
5
  "eval_steps": 500,
6
- "global_step": 700,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1336,14 +1336,287 @@
1336
  "train_runtime": 4344.3701,
1337
  "train_samples_per_second": 11.97,
1338
  "train_steps_per_second": 0.161
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1339
  }
1340
  ],
1341
  "logging_steps": 10,
1342
- "max_steps": 700,
1343
  "num_input_tokens_seen": 0,
1344
- "num_train_epochs": 100,
1345
  "save_steps": 500,
1346
- "total_flos": 4.031389254057984e+18,
1347
  "train_batch_size": 80,
1348
  "trial_name": null,
1349
  "trial_params": null
 
1
  {
2
+ "best_metric": 2.5402629375457764,
3
+ "best_model_checkpoint": "./drive/MyDrive/repositories/torch_example_image-classification/outputs_letter3/checkpoint-840",
4
+ "epoch": 120.0,
5
  "eval_steps": 500,
6
+ "global_step": 840,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1336
  "train_runtime": 4344.3701,
1337
  "train_samples_per_second": 11.97,
1338
  "train_steps_per_second": 0.161
1339
+ },
1340
+ {
1341
+ "epoch": 101.0,
1342
+ "eval_accuracy": 0.5153846153846153,
1343
+ "eval_loss": 2.84305477142334,
1344
+ "eval_runtime": 2.1617,
1345
+ "eval_samples_per_second": 60.137,
1346
+ "eval_steps_per_second": 0.925,
1347
+ "step": 707
1348
+ },
1349
+ {
1350
+ "epoch": 101.43,
1351
+ "learning_rate": 1.9761904761904763e-05,
1352
+ "loss": 2.067,
1353
+ "step": 710
1354
+ },
1355
+ {
1356
+ "epoch": 102.0,
1357
+ "eval_accuracy": 0.5,
1358
+ "eval_loss": 2.8063366413116455,
1359
+ "eval_runtime": 2.1563,
1360
+ "eval_samples_per_second": 60.288,
1361
+ "eval_steps_per_second": 0.928,
1362
+ "step": 714
1363
+ },
1364
+ {
1365
+ "epoch": 102.86,
1366
+ "learning_rate": 1.9523809523809524e-05,
1367
+ "loss": 2.0234,
1368
+ "step": 720
1369
+ },
1370
+ {
1371
+ "epoch": 103.0,
1372
+ "eval_accuracy": 0.5230769230769231,
1373
+ "eval_loss": 2.7845773696899414,
1374
+ "eval_runtime": 2.1676,
1375
+ "eval_samples_per_second": 59.974,
1376
+ "eval_steps_per_second": 0.923,
1377
+ "step": 721
1378
+ },
1379
+ {
1380
+ "epoch": 104.0,
1381
+ "eval_accuracy": 0.5307692307692308,
1382
+ "eval_loss": 2.762021541595459,
1383
+ "eval_runtime": 2.2767,
1384
+ "eval_samples_per_second": 57.1,
1385
+ "eval_steps_per_second": 0.878,
1386
+ "step": 728
1387
+ },
1388
+ {
1389
+ "epoch": 104.29,
1390
+ "learning_rate": 1.928571428571429e-05,
1391
+ "loss": 1.9979,
1392
+ "step": 730
1393
+ },
1394
+ {
1395
+ "epoch": 105.0,
1396
+ "eval_accuracy": 0.5538461538461539,
1397
+ "eval_loss": 2.7421603202819824,
1398
+ "eval_runtime": 2.2859,
1399
+ "eval_samples_per_second": 56.871,
1400
+ "eval_steps_per_second": 0.875,
1401
+ "step": 735
1402
+ },
1403
+ {
1404
+ "epoch": 105.71,
1405
+ "learning_rate": 1.904761904761905e-05,
1406
+ "loss": 1.9515,
1407
+ "step": 740
1408
+ },
1409
+ {
1410
+ "epoch": 106.0,
1411
+ "eval_accuracy": 0.5615384615384615,
1412
+ "eval_loss": 2.722872734069824,
1413
+ "eval_runtime": 2.3487,
1414
+ "eval_samples_per_second": 55.35,
1415
+ "eval_steps_per_second": 0.852,
1416
+ "step": 742
1417
+ },
1418
+ {
1419
+ "epoch": 107.0,
1420
+ "eval_accuracy": 0.5384615384615384,
1421
+ "eval_loss": 2.7145817279815674,
1422
+ "eval_runtime": 2.3976,
1423
+ "eval_samples_per_second": 54.221,
1424
+ "eval_steps_per_second": 0.834,
1425
+ "step": 749
1426
+ },
1427
+ {
1428
+ "epoch": 107.14,
1429
+ "learning_rate": 1.880952380952381e-05,
1430
+ "loss": 1.9095,
1431
+ "step": 750
1432
+ },
1433
+ {
1434
+ "epoch": 108.0,
1435
+ "eval_accuracy": 0.5538461538461539,
1436
+ "eval_loss": 2.6905264854431152,
1437
+ "eval_runtime": 2.3887,
1438
+ "eval_samples_per_second": 54.422,
1439
+ "eval_steps_per_second": 0.837,
1440
+ "step": 756
1441
+ },
1442
+ {
1443
+ "epoch": 108.57,
1444
+ "learning_rate": 1.8571428571428575e-05,
1445
+ "loss": 1.8759,
1446
+ "step": 760
1447
+ },
1448
+ {
1449
+ "epoch": 109.0,
1450
+ "eval_accuracy": 0.5538461538461539,
1451
+ "eval_loss": 2.6840174198150635,
1452
+ "eval_runtime": 2.369,
1453
+ "eval_samples_per_second": 54.876,
1454
+ "eval_steps_per_second": 0.844,
1455
+ "step": 763
1456
+ },
1457
+ {
1458
+ "epoch": 110.0,
1459
+ "learning_rate": 1.8333333333333333e-05,
1460
+ "loss": 1.8561,
1461
+ "step": 770
1462
+ },
1463
+ {
1464
+ "epoch": 110.0,
1465
+ "eval_accuracy": 0.5461538461538461,
1466
+ "eval_loss": 2.6554973125457764,
1467
+ "eval_runtime": 2.3964,
1468
+ "eval_samples_per_second": 54.248,
1469
+ "eval_steps_per_second": 0.835,
1470
+ "step": 770
1471
+ },
1472
+ {
1473
+ "epoch": 111.0,
1474
+ "eval_accuracy": 0.5692307692307692,
1475
+ "eval_loss": 2.6465163230895996,
1476
+ "eval_runtime": 2.5418,
1477
+ "eval_samples_per_second": 51.146,
1478
+ "eval_steps_per_second": 0.787,
1479
+ "step": 777
1480
+ },
1481
+ {
1482
+ "epoch": 111.43,
1483
+ "learning_rate": 1.8095238095238097e-05,
1484
+ "loss": 1.8147,
1485
+ "step": 780
1486
+ },
1487
+ {
1488
+ "epoch": 112.0,
1489
+ "eval_accuracy": 0.5384615384615384,
1490
+ "eval_loss": 2.6321260929107666,
1491
+ "eval_runtime": 2.6607,
1492
+ "eval_samples_per_second": 48.859,
1493
+ "eval_steps_per_second": 0.752,
1494
+ "step": 784
1495
+ },
1496
+ {
1497
+ "epoch": 112.86,
1498
+ "learning_rate": 1.785714285714286e-05,
1499
+ "loss": 1.799,
1500
+ "step": 790
1501
+ },
1502
+ {
1503
+ "epoch": 113.0,
1504
+ "eval_accuracy": 0.5384615384615384,
1505
+ "eval_loss": 2.6352975368499756,
1506
+ "eval_runtime": 2.3449,
1507
+ "eval_samples_per_second": 55.439,
1508
+ "eval_steps_per_second": 0.853,
1509
+ "step": 791
1510
+ },
1511
+ {
1512
+ "epoch": 114.0,
1513
+ "eval_accuracy": 0.5461538461538461,
1514
+ "eval_loss": 2.6188342571258545,
1515
+ "eval_runtime": 2.5585,
1516
+ "eval_samples_per_second": 50.811,
1517
+ "eval_steps_per_second": 0.782,
1518
+ "step": 798
1519
+ },
1520
+ {
1521
+ "epoch": 114.29,
1522
+ "learning_rate": 1.761904761904762e-05,
1523
+ "loss": 1.7536,
1524
+ "step": 800
1525
+ },
1526
+ {
1527
+ "epoch": 115.0,
1528
+ "eval_accuracy": 0.5461538461538461,
1529
+ "eval_loss": 2.6063857078552246,
1530
+ "eval_runtime": 2.5441,
1531
+ "eval_samples_per_second": 51.098,
1532
+ "eval_steps_per_second": 0.786,
1533
+ "step": 805
1534
+ },
1535
+ {
1536
+ "epoch": 115.71,
1537
+ "learning_rate": 1.7380952380952384e-05,
1538
+ "loss": 1.7162,
1539
+ "step": 810
1540
+ },
1541
+ {
1542
+ "epoch": 116.0,
1543
+ "eval_accuracy": 0.5538461538461539,
1544
+ "eval_loss": 2.591280937194824,
1545
+ "eval_runtime": 2.5836,
1546
+ "eval_samples_per_second": 50.316,
1547
+ "eval_steps_per_second": 0.774,
1548
+ "step": 812
1549
+ },
1550
+ {
1551
+ "epoch": 117.0,
1552
+ "eval_accuracy": 0.5923076923076923,
1553
+ "eval_loss": 2.5749051570892334,
1554
+ "eval_runtime": 2.5441,
1555
+ "eval_samples_per_second": 51.099,
1556
+ "eval_steps_per_second": 0.786,
1557
+ "step": 819
1558
+ },
1559
+ {
1560
+ "epoch": 117.14,
1561
+ "learning_rate": 1.7142857142857142e-05,
1562
+ "loss": 1.7225,
1563
+ "step": 820
1564
+ },
1565
+ {
1566
+ "epoch": 118.0,
1567
+ "eval_accuracy": 0.5846153846153846,
1568
+ "eval_loss": 2.563140869140625,
1569
+ "eval_runtime": 2.6117,
1570
+ "eval_samples_per_second": 49.777,
1571
+ "eval_steps_per_second": 0.766,
1572
+ "step": 826
1573
+ },
1574
+ {
1575
+ "epoch": 118.57,
1576
+ "learning_rate": 1.6904761904761906e-05,
1577
+ "loss": 1.6841,
1578
+ "step": 830
1579
+ },
1580
+ {
1581
+ "epoch": 119.0,
1582
+ "eval_accuracy": 0.5923076923076923,
1583
+ "eval_loss": 2.547883987426758,
1584
+ "eval_runtime": 2.5689,
1585
+ "eval_samples_per_second": 50.605,
1586
+ "eval_steps_per_second": 0.779,
1587
+ "step": 833
1588
+ },
1589
+ {
1590
+ "epoch": 120.0,
1591
+ "learning_rate": 1.6666666666666667e-05,
1592
+ "loss": 1.6388,
1593
+ "step": 840
1594
+ },
1595
+ {
1596
+ "epoch": 120.0,
1597
+ "eval_accuracy": 0.5846153846153846,
1598
+ "eval_loss": 2.5402629375457764,
1599
+ "eval_runtime": 2.4843,
1600
+ "eval_samples_per_second": 52.328,
1601
+ "eval_steps_per_second": 0.805,
1602
+ "step": 840
1603
+ },
1604
+ {
1605
+ "epoch": 120.0,
1606
+ "step": 840,
1607
+ "total_flos": 4.837667104869581e+18,
1608
+ "train_loss": 0.3072653747740246,
1609
+ "train_runtime": 892.0889,
1610
+ "train_samples_per_second": 69.948,
1611
+ "train_steps_per_second": 0.942
1612
  }
1613
  ],
1614
  "logging_steps": 10,
1615
+ "max_steps": 840,
1616
  "num_input_tokens_seen": 0,
1617
+ "num_train_epochs": 120,
1618
  "save_steps": 500,
1619
+ "total_flos": 4.837667104869581e+18,
1620
  "train_batch_size": 80,
1621
  "trial_name": null,
1622
  "trial_params": null