sam1120 commited on
Commit
5fcd0d1
β€’
1 Parent(s): 1196364

Training in progress, step 400

Browse files
{checkpoint-200 β†’ checkpoint-400}/config.json RENAMED
File without changes
{checkpoint-200 β†’ checkpoint-400}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e99eb4915a9c031a0b238e9073d954872575f197f86729f13bd6de811dc502db
3
- size 677455103
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e54f857826893e028207db4828854c48872645de01cbffaf1c9c8f288a96ad75
3
+ size 677456319
{checkpoint-200 β†’ checkpoint-400}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:88fe2ae83719c292921d03b4192e0d782b3402a59cb46e6de4ceb965265fa3e4
3
  size 338796489
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be03cc2a8293c04c55f9def52f92927e02d3469ef2fa6683e2b8860f35537827
3
  size 338796489
{checkpoint-200 β†’ checkpoint-400}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5b7b56f6f509b9d6af4a8829333dc0b928df99677c599ea55fdff7b16712277
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fec8739d5e70d46b759ea2d0095fbbbcaf5dc92c068ebace89ac7569bccb6b8
3
  size 14575
{checkpoint-200 β†’ checkpoint-400}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:033b316679f5034e83037222bb4baf2744ad7787f08506bc291b759537ecdf96
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85a22e5c54682a87dd513d30658d95e6732243a33a4a9c744d3a42982e6c919f
3
  size 627
{checkpoint-200 β†’ checkpoint-400}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.5992904305458069,
3
- "best_model_checkpoint": "/robodata/smodak/Projects/nspl/scripts/terrainseg/training/models/safety-utcustom-train-SF-RGB-b5/checkpoint-200",
4
- "epoch": 18.181818181818183,
5
- "global_step": 200,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1546,11 +1546,1551 @@
1546
  "eval_samples_per_second": 6.882,
1547
  "eval_steps_per_second": 0.514,
1548
  "step": 200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1549
  }
1550
  ],
1551
- "max_steps": 330,
1552
- "num_train_epochs": 30,
1553
- "total_flos": 1.1184809584455844e+18,
1554
  "trial_name": null,
1555
  "trial_params": null
1556
  }
 
1
  {
2
+ "best_metric": 0.44339337944984436,
3
+ "best_model_checkpoint": "/robodata/smodak/Projects/nspl/scripts/terrainseg/training/models/safety-utcustom-train-SF-RGB-b5/checkpoint-400",
4
+ "epoch": 36.36363636363637,
5
+ "global_step": 400,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1546
  "eval_samples_per_second": 6.882,
1547
  "eval_steps_per_second": 0.514,
1548
  "step": 200
1549
+ },
1550
+ {
1551
+ "epoch": 18.27,
1552
+ "learning_rate": 1.2364217252396168e-06,
1553
+ "loss": 0.6677,
1554
+ "step": 201
1555
+ },
1556
+ {
1557
+ "epoch": 18.36,
1558
+ "learning_rate": 1.2268370607028754e-06,
1559
+ "loss": 0.6658,
1560
+ "step": 202
1561
+ },
1562
+ {
1563
+ "epoch": 18.45,
1564
+ "learning_rate": 1.2172523961661342e-06,
1565
+ "loss": 0.649,
1566
+ "step": 203
1567
+ },
1568
+ {
1569
+ "epoch": 18.55,
1570
+ "learning_rate": 1.207667731629393e-06,
1571
+ "loss": 0.6342,
1572
+ "step": 204
1573
+ },
1574
+ {
1575
+ "epoch": 18.64,
1576
+ "learning_rate": 1.198083067092652e-06,
1577
+ "loss": 0.6441,
1578
+ "step": 205
1579
+ },
1580
+ {
1581
+ "epoch": 18.73,
1582
+ "learning_rate": 1.1884984025559105e-06,
1583
+ "loss": 0.6429,
1584
+ "step": 206
1585
+ },
1586
+ {
1587
+ "epoch": 18.82,
1588
+ "learning_rate": 1.1789137380191693e-06,
1589
+ "loss": 0.6155,
1590
+ "step": 207
1591
+ },
1592
+ {
1593
+ "epoch": 18.91,
1594
+ "learning_rate": 1.1693290734824281e-06,
1595
+ "loss": 0.6347,
1596
+ "step": 208
1597
+ },
1598
+ {
1599
+ "epoch": 19.0,
1600
+ "learning_rate": 1.159744408945687e-06,
1601
+ "loss": 0.6611,
1602
+ "step": 209
1603
+ },
1604
+ {
1605
+ "epoch": 19.09,
1606
+ "learning_rate": 1.1501597444089457e-06,
1607
+ "loss": 0.6398,
1608
+ "step": 210
1609
+ },
1610
+ {
1611
+ "epoch": 19.09,
1612
+ "eval_accuracy_safe": 0.6413602877398313,
1613
+ "eval_accuracy_unlabeled": NaN,
1614
+ "eval_accuracy_unsafe": 0.9258418644556835,
1615
+ "eval_iou_safe": 0.26823363821482293,
1616
+ "eval_iou_unlabeled": 0.0,
1617
+ "eval_iou_unsafe": 0.9159351131912487,
1618
+ "eval_loss": 0.5784907341003418,
1619
+ "eval_mean_accuracy": 0.7836010760977574,
1620
+ "eval_mean_iou": 0.39472291713535723,
1621
+ "eval_overall_accuracy": 0.9174387348231985,
1622
+ "eval_runtime": 11.2723,
1623
+ "eval_samples_per_second": 5.944,
1624
+ "eval_steps_per_second": 0.444,
1625
+ "step": 210
1626
+ },
1627
+ {
1628
+ "epoch": 19.18,
1629
+ "learning_rate": 1.1405750798722045e-06,
1630
+ "loss": 0.6403,
1631
+ "step": 211
1632
+ },
1633
+ {
1634
+ "epoch": 19.27,
1635
+ "learning_rate": 1.1309904153354633e-06,
1636
+ "loss": 0.6271,
1637
+ "step": 212
1638
+ },
1639
+ {
1640
+ "epoch": 19.36,
1641
+ "learning_rate": 1.121405750798722e-06,
1642
+ "loss": 0.679,
1643
+ "step": 213
1644
+ },
1645
+ {
1646
+ "epoch": 19.45,
1647
+ "learning_rate": 1.1118210862619809e-06,
1648
+ "loss": 0.6239,
1649
+ "step": 214
1650
+ },
1651
+ {
1652
+ "epoch": 19.55,
1653
+ "learning_rate": 1.1022364217252397e-06,
1654
+ "loss": 0.6527,
1655
+ "step": 215
1656
+ },
1657
+ {
1658
+ "epoch": 19.64,
1659
+ "learning_rate": 1.0926517571884984e-06,
1660
+ "loss": 0.6228,
1661
+ "step": 216
1662
+ },
1663
+ {
1664
+ "epoch": 19.73,
1665
+ "learning_rate": 1.0830670926517572e-06,
1666
+ "loss": 0.6227,
1667
+ "step": 217
1668
+ },
1669
+ {
1670
+ "epoch": 19.82,
1671
+ "learning_rate": 1.073482428115016e-06,
1672
+ "loss": 0.6347,
1673
+ "step": 218
1674
+ },
1675
+ {
1676
+ "epoch": 19.91,
1677
+ "learning_rate": 1.0638977635782748e-06,
1678
+ "loss": 0.6374,
1679
+ "step": 219
1680
+ },
1681
+ {
1682
+ "epoch": 20.0,
1683
+ "learning_rate": 1.0543130990415336e-06,
1684
+ "loss": 0.5845,
1685
+ "step": 220
1686
+ },
1687
+ {
1688
+ "epoch": 20.0,
1689
+ "eval_accuracy_safe": 0.6426151017151052,
1690
+ "eval_accuracy_unlabeled": NaN,
1691
+ "eval_accuracy_unsafe": 0.9286315640516787,
1692
+ "eval_iou_safe": 0.26982054857603477,
1693
+ "eval_iou_unlabeled": 0.0,
1694
+ "eval_iou_unsafe": 0.9187221572756564,
1695
+ "eval_loss": 0.5641139149665833,
1696
+ "eval_mean_accuracy": 0.7856233328833919,
1697
+ "eval_mean_iou": 0.39618090195056377,
1698
+ "eval_overall_accuracy": 0.9201830963590252,
1699
+ "eval_runtime": 9.4874,
1700
+ "eval_samples_per_second": 7.062,
1701
+ "eval_steps_per_second": 0.527,
1702
+ "step": 220
1703
+ },
1704
+ {
1705
+ "epoch": 20.09,
1706
+ "learning_rate": 1.0447284345047924e-06,
1707
+ "loss": 0.606,
1708
+ "step": 221
1709
+ },
1710
+ {
1711
+ "epoch": 20.18,
1712
+ "learning_rate": 1.0351437699680512e-06,
1713
+ "loss": 0.6491,
1714
+ "step": 222
1715
+ },
1716
+ {
1717
+ "epoch": 20.27,
1718
+ "learning_rate": 1.02555910543131e-06,
1719
+ "loss": 0.6396,
1720
+ "step": 223
1721
+ },
1722
+ {
1723
+ "epoch": 20.36,
1724
+ "learning_rate": 1.0159744408945688e-06,
1725
+ "loss": 0.617,
1726
+ "step": 224
1727
+ },
1728
+ {
1729
+ "epoch": 20.45,
1730
+ "learning_rate": 1.0063897763578276e-06,
1731
+ "loss": 0.614,
1732
+ "step": 225
1733
+ },
1734
+ {
1735
+ "epoch": 20.55,
1736
+ "learning_rate": 9.968051118210861e-07,
1737
+ "loss": 0.6281,
1738
+ "step": 226
1739
+ },
1740
+ {
1741
+ "epoch": 20.64,
1742
+ "learning_rate": 9.872204472843452e-07,
1743
+ "loss": 0.6374,
1744
+ "step": 227
1745
+ },
1746
+ {
1747
+ "epoch": 20.73,
1748
+ "learning_rate": 9.77635782747604e-07,
1749
+ "loss": 0.6394,
1750
+ "step": 228
1751
+ },
1752
+ {
1753
+ "epoch": 20.82,
1754
+ "learning_rate": 9.680511182108625e-07,
1755
+ "loss": 0.6351,
1756
+ "step": 229
1757
+ },
1758
+ {
1759
+ "epoch": 20.91,
1760
+ "learning_rate": 9.584664536741213e-07,
1761
+ "loss": 0.6062,
1762
+ "step": 230
1763
+ },
1764
+ {
1765
+ "epoch": 20.91,
1766
+ "eval_accuracy_safe": 0.6519963300064379,
1767
+ "eval_accuracy_unlabeled": NaN,
1768
+ "eval_accuracy_unsafe": 0.9252195649054266,
1769
+ "eval_iou_safe": 0.2640576051310034,
1770
+ "eval_iou_unlabeled": 0.0,
1771
+ "eval_iou_unsafe": 0.9156001170929594,
1772
+ "eval_loss": 0.5693235397338867,
1773
+ "eval_mean_accuracy": 0.7886079474559322,
1774
+ "eval_mean_iou": 0.3932192407413209,
1775
+ "eval_overall_accuracy": 0.9171489886383513,
1776
+ "eval_runtime": 11.0762,
1777
+ "eval_samples_per_second": 6.049,
1778
+ "eval_steps_per_second": 0.451,
1779
+ "step": 230
1780
+ },
1781
+ {
1782
+ "epoch": 21.0,
1783
+ "learning_rate": 9.488817891373802e-07,
1784
+ "loss": 0.6456,
1785
+ "step": 231
1786
+ },
1787
+ {
1788
+ "epoch": 21.09,
1789
+ "learning_rate": 9.39297124600639e-07,
1790
+ "loss": 0.6055,
1791
+ "step": 232
1792
+ },
1793
+ {
1794
+ "epoch": 21.18,
1795
+ "learning_rate": 9.297124600638977e-07,
1796
+ "loss": 0.6134,
1797
+ "step": 233
1798
+ },
1799
+ {
1800
+ "epoch": 21.27,
1801
+ "learning_rate": 9.201277955271566e-07,
1802
+ "loss": 0.5718,
1803
+ "step": 234
1804
+ },
1805
+ {
1806
+ "epoch": 21.36,
1807
+ "learning_rate": 9.105431309904154e-07,
1808
+ "loss": 0.5939,
1809
+ "step": 235
1810
+ },
1811
+ {
1812
+ "epoch": 21.45,
1813
+ "learning_rate": 9.009584664536742e-07,
1814
+ "loss": 0.5917,
1815
+ "step": 236
1816
+ },
1817
+ {
1818
+ "epoch": 21.55,
1819
+ "learning_rate": 8.913738019169329e-07,
1820
+ "loss": 0.599,
1821
+ "step": 237
1822
+ },
1823
+ {
1824
+ "epoch": 21.64,
1825
+ "learning_rate": 8.817891373801916e-07,
1826
+ "loss": 0.6239,
1827
+ "step": 238
1828
+ },
1829
+ {
1830
+ "epoch": 21.73,
1831
+ "learning_rate": 8.722044728434505e-07,
1832
+ "loss": 0.5946,
1833
+ "step": 239
1834
+ },
1835
+ {
1836
+ "epoch": 21.82,
1837
+ "learning_rate": 8.626198083067093e-07,
1838
+ "loss": 0.6071,
1839
+ "step": 240
1840
+ },
1841
+ {
1842
+ "epoch": 21.82,
1843
+ "eval_accuracy_safe": 0.6591840432380754,
1844
+ "eval_accuracy_unlabeled": NaN,
1845
+ "eval_accuracy_unsafe": 0.9282916959179331,
1846
+ "eval_iou_safe": 0.267531459702011,
1847
+ "eval_iou_unlabeled": 0.0,
1848
+ "eval_iou_unsafe": 0.9188227497665283,
1849
+ "eval_loss": 0.5627052187919617,
1850
+ "eval_mean_accuracy": 0.7937378695780043,
1851
+ "eval_mean_iou": 0.39545140315617977,
1852
+ "eval_overall_accuracy": 0.9203426873506005,
1853
+ "eval_runtime": 9.7383,
1854
+ "eval_samples_per_second": 6.88,
1855
+ "eval_steps_per_second": 0.513,
1856
+ "step": 240
1857
+ },
1858
+ {
1859
+ "epoch": 21.91,
1860
+ "learning_rate": 8.53035143769968e-07,
1861
+ "loss": 0.5784,
1862
+ "step": 241
1863
+ },
1864
+ {
1865
+ "epoch": 22.0,
1866
+ "learning_rate": 8.434504792332268e-07,
1867
+ "loss": 0.6049,
1868
+ "step": 242
1869
+ },
1870
+ {
1871
+ "epoch": 22.09,
1872
+ "learning_rate": 8.338658146964857e-07,
1873
+ "loss": 0.5871,
1874
+ "step": 243
1875
+ },
1876
+ {
1877
+ "epoch": 22.18,
1878
+ "learning_rate": 8.242811501597445e-07,
1879
+ "loss": 0.5894,
1880
+ "step": 244
1881
+ },
1882
+ {
1883
+ "epoch": 22.27,
1884
+ "learning_rate": 8.146964856230032e-07,
1885
+ "loss": 0.5801,
1886
+ "step": 245
1887
+ },
1888
+ {
1889
+ "epoch": 22.36,
1890
+ "learning_rate": 8.05111821086262e-07,
1891
+ "loss": 0.5719,
1892
+ "step": 246
1893
+ },
1894
+ {
1895
+ "epoch": 22.45,
1896
+ "learning_rate": 7.955271565495208e-07,
1897
+ "loss": 0.5979,
1898
+ "step": 247
1899
+ },
1900
+ {
1901
+ "epoch": 22.55,
1902
+ "learning_rate": 7.859424920127797e-07,
1903
+ "loss": 0.5855,
1904
+ "step": 248
1905
+ },
1906
+ {
1907
+ "epoch": 22.64,
1908
+ "learning_rate": 7.763578274760382e-07,
1909
+ "loss": 0.5975,
1910
+ "step": 249
1911
+ },
1912
+ {
1913
+ "epoch": 22.73,
1914
+ "learning_rate": 7.667731629392971e-07,
1915
+ "loss": 0.6209,
1916
+ "step": 250
1917
+ },
1918
+ {
1919
+ "epoch": 22.73,
1920
+ "eval_accuracy_safe": 0.6618690752926936,
1921
+ "eval_accuracy_unlabeled": NaN,
1922
+ "eval_accuracy_unsafe": 0.9299528432231069,
1923
+ "eval_iou_safe": 0.2724302598559697,
1924
+ "eval_iou_unlabeled": 0.0,
1925
+ "eval_iou_unsafe": 0.9205411497943506,
1926
+ "eval_loss": 0.5631816983222961,
1927
+ "eval_mean_accuracy": 0.7959109592579002,
1928
+ "eval_mean_iou": 0.39765713655010676,
1929
+ "eval_overall_accuracy": 0.9220340785695545,
1930
+ "eval_runtime": 10.1606,
1931
+ "eval_samples_per_second": 6.594,
1932
+ "eval_steps_per_second": 0.492,
1933
+ "step": 250
1934
+ },
1935
+ {
1936
+ "epoch": 22.82,
1937
+ "learning_rate": 7.571884984025559e-07,
1938
+ "loss": 0.5852,
1939
+ "step": 251
1940
+ },
1941
+ {
1942
+ "epoch": 22.91,
1943
+ "learning_rate": 7.476038338658147e-07,
1944
+ "loss": 0.5775,
1945
+ "step": 252
1946
+ },
1947
+ {
1948
+ "epoch": 23.0,
1949
+ "learning_rate": 7.380191693290735e-07,
1950
+ "loss": 0.6365,
1951
+ "step": 253
1952
+ },
1953
+ {
1954
+ "epoch": 23.09,
1955
+ "learning_rate": 7.284345047923323e-07,
1956
+ "loss": 0.6243,
1957
+ "step": 254
1958
+ },
1959
+ {
1960
+ "epoch": 23.18,
1961
+ "learning_rate": 7.188498402555911e-07,
1962
+ "loss": 0.5995,
1963
+ "step": 255
1964
+ },
1965
+ {
1966
+ "epoch": 23.27,
1967
+ "learning_rate": 7.092651757188499e-07,
1968
+ "loss": 0.6019,
1969
+ "step": 256
1970
+ },
1971
+ {
1972
+ "epoch": 23.36,
1973
+ "learning_rate": 6.996805111821087e-07,
1974
+ "loss": 0.5883,
1975
+ "step": 257
1976
+ },
1977
+ {
1978
+ "epoch": 23.45,
1979
+ "learning_rate": 6.900958466453674e-07,
1980
+ "loss": 0.589,
1981
+ "step": 258
1982
+ },
1983
+ {
1984
+ "epoch": 23.55,
1985
+ "learning_rate": 6.805111821086263e-07,
1986
+ "loss": 0.5717,
1987
+ "step": 259
1988
+ },
1989
+ {
1990
+ "epoch": 23.64,
1991
+ "learning_rate": 6.709265175718849e-07,
1992
+ "loss": 0.5609,
1993
+ "step": 260
1994
+ },
1995
+ {
1996
+ "epoch": 23.64,
1997
+ "eval_accuracy_safe": 0.6504639534928547,
1998
+ "eval_accuracy_unlabeled": NaN,
1999
+ "eval_accuracy_unsafe": 0.9378781128324656,
2000
+ "eval_iou_safe": 0.2868443063281154,
2001
+ "eval_iou_unlabeled": 0.0,
2002
+ "eval_iou_unsafe": 0.9280609954701114,
2003
+ "eval_loss": 0.5416346192359924,
2004
+ "eval_mean_accuracy": 0.7941710331626601,
2005
+ "eval_mean_iou": 0.40496843393274223,
2006
+ "eval_overall_accuracy": 0.9293883594114389,
2007
+ "eval_runtime": 9.5225,
2008
+ "eval_samples_per_second": 7.036,
2009
+ "eval_steps_per_second": 0.525,
2010
+ "step": 260
2011
+ },
2012
+ {
2013
+ "epoch": 23.73,
2014
+ "learning_rate": 6.613418530351438e-07,
2015
+ "loss": 0.5557,
2016
+ "step": 261
2017
+ },
2018
+ {
2019
+ "epoch": 23.82,
2020
+ "learning_rate": 6.517571884984025e-07,
2021
+ "loss": 0.5968,
2022
+ "step": 262
2023
+ },
2024
+ {
2025
+ "epoch": 23.91,
2026
+ "learning_rate": 6.421725239616614e-07,
2027
+ "loss": 0.5673,
2028
+ "step": 263
2029
+ },
2030
+ {
2031
+ "epoch": 24.0,
2032
+ "learning_rate": 6.325878594249201e-07,
2033
+ "loss": 0.6091,
2034
+ "step": 264
2035
+ },
2036
+ {
2037
+ "epoch": 24.09,
2038
+ "learning_rate": 6.230031948881789e-07,
2039
+ "loss": 0.5776,
2040
+ "step": 265
2041
+ },
2042
+ {
2043
+ "epoch": 24.18,
2044
+ "learning_rate": 6.134185303514377e-07,
2045
+ "loss": 0.5562,
2046
+ "step": 266
2047
+ },
2048
+ {
2049
+ "epoch": 24.27,
2050
+ "learning_rate": 6.038338658146965e-07,
2051
+ "loss": 0.5863,
2052
+ "step": 267
2053
+ },
2054
+ {
2055
+ "epoch": 24.36,
2056
+ "learning_rate": 5.942492012779553e-07,
2057
+ "loss": 0.5565,
2058
+ "step": 268
2059
+ },
2060
+ {
2061
+ "epoch": 24.45,
2062
+ "learning_rate": 5.846645367412141e-07,
2063
+ "loss": 0.5858,
2064
+ "step": 269
2065
+ },
2066
+ {
2067
+ "epoch": 24.55,
2068
+ "learning_rate": 5.750798722044729e-07,
2069
+ "loss": 0.5752,
2070
+ "step": 270
2071
+ },
2072
+ {
2073
+ "epoch": 24.55,
2074
+ "eval_accuracy_safe": 0.6412195789530495,
2075
+ "eval_accuracy_unlabeled": NaN,
2076
+ "eval_accuracy_unsafe": 0.945148932410419,
2077
+ "eval_iou_safe": 0.2982960328042603,
2078
+ "eval_iou_unlabeled": 0.0,
2079
+ "eval_iou_unsafe": 0.9349957034087992,
2080
+ "eval_loss": 0.5140887498855591,
2081
+ "eval_mean_accuracy": 0.7931842556817342,
2082
+ "eval_mean_iou": 0.41109724540435316,
2083
+ "eval_overall_accuracy": 0.9361713466359608,
2084
+ "eval_runtime": 10.0336,
2085
+ "eval_samples_per_second": 6.678,
2086
+ "eval_steps_per_second": 0.498,
2087
+ "step": 270
2088
+ },
2089
+ {
2090
+ "epoch": 24.64,
2091
+ "learning_rate": 5.654952076677316e-07,
2092
+ "loss": 0.5881,
2093
+ "step": 271
2094
+ },
2095
+ {
2096
+ "epoch": 24.73,
2097
+ "learning_rate": 5.559105431309904e-07,
2098
+ "loss": 0.6124,
2099
+ "step": 272
2100
+ },
2101
+ {
2102
+ "epoch": 24.82,
2103
+ "learning_rate": 5.463258785942492e-07,
2104
+ "loss": 0.5648,
2105
+ "step": 273
2106
+ },
2107
+ {
2108
+ "epoch": 24.91,
2109
+ "learning_rate": 5.36741214057508e-07,
2110
+ "loss": 0.578,
2111
+ "step": 274
2112
+ },
2113
+ {
2114
+ "epoch": 25.0,
2115
+ "learning_rate": 5.271565495207668e-07,
2116
+ "loss": 0.5605,
2117
+ "step": 275
2118
+ },
2119
+ {
2120
+ "epoch": 25.09,
2121
+ "learning_rate": 5.175718849840256e-07,
2122
+ "loss": 0.588,
2123
+ "step": 276
2124
+ },
2125
+ {
2126
+ "epoch": 25.18,
2127
+ "learning_rate": 5.079872204472844e-07,
2128
+ "loss": 0.5814,
2129
+ "step": 277
2130
+ },
2131
+ {
2132
+ "epoch": 25.27,
2133
+ "learning_rate": 4.984025559105431e-07,
2134
+ "loss": 0.5671,
2135
+ "step": 278
2136
+ },
2137
+ {
2138
+ "epoch": 25.36,
2139
+ "learning_rate": 4.88817891373802e-07,
2140
+ "loss": 0.5237,
2141
+ "step": 279
2142
+ },
2143
+ {
2144
+ "epoch": 25.45,
2145
+ "learning_rate": 4.792332268370607e-07,
2146
+ "loss": 0.6004,
2147
+ "step": 280
2148
+ },
2149
+ {
2150
+ "epoch": 25.45,
2151
+ "eval_accuracy_safe": 0.6491917918589365,
2152
+ "eval_accuracy_unlabeled": NaN,
2153
+ "eval_accuracy_unsafe": 0.9412261630289883,
2154
+ "eval_iou_safe": 0.2907094372975922,
2155
+ "eval_iou_unlabeled": 0.0,
2156
+ "eval_iou_unsafe": 0.9313366391036164,
2157
+ "eval_loss": 0.5255351662635803,
2158
+ "eval_mean_accuracy": 0.7952089774439624,
2159
+ "eval_mean_iou": 0.4073486921337362,
2160
+ "eval_overall_accuracy": 0.9325999359586346,
2161
+ "eval_runtime": 9.8685,
2162
+ "eval_samples_per_second": 6.789,
2163
+ "eval_steps_per_second": 0.507,
2164
+ "step": 280
2165
+ },
2166
+ {
2167
+ "epoch": 25.55,
2168
+ "learning_rate": 4.696485623003195e-07,
2169
+ "loss": 0.5482,
2170
+ "step": 281
2171
+ },
2172
+ {
2173
+ "epoch": 25.64,
2174
+ "learning_rate": 4.600638977635783e-07,
2175
+ "loss": 0.5764,
2176
+ "step": 282
2177
+ },
2178
+ {
2179
+ "epoch": 25.73,
2180
+ "learning_rate": 4.504792332268371e-07,
2181
+ "loss": 0.5608,
2182
+ "step": 283
2183
+ },
2184
+ {
2185
+ "epoch": 25.82,
2186
+ "learning_rate": 4.408945686900958e-07,
2187
+ "loss": 0.5698,
2188
+ "step": 284
2189
+ },
2190
+ {
2191
+ "epoch": 25.91,
2192
+ "learning_rate": 4.3130990415335466e-07,
2193
+ "loss": 0.5502,
2194
+ "step": 285
2195
+ },
2196
+ {
2197
+ "epoch": 26.0,
2198
+ "learning_rate": 4.217252396166134e-07,
2199
+ "loss": 0.5975,
2200
+ "step": 286
2201
+ },
2202
+ {
2203
+ "epoch": 26.09,
2204
+ "learning_rate": 4.1214057507987225e-07,
2205
+ "loss": 0.5736,
2206
+ "step": 287
2207
+ },
2208
+ {
2209
+ "epoch": 26.18,
2210
+ "learning_rate": 4.02555910543131e-07,
2211
+ "loss": 0.5498,
2212
+ "step": 288
2213
+ },
2214
+ {
2215
+ "epoch": 26.27,
2216
+ "learning_rate": 3.9297124600638983e-07,
2217
+ "loss": 0.5682,
2218
+ "step": 289
2219
+ },
2220
+ {
2221
+ "epoch": 26.36,
2222
+ "learning_rate": 3.8338658146964857e-07,
2223
+ "loss": 0.5524,
2224
+ "step": 290
2225
+ },
2226
+ {
2227
+ "epoch": 26.36,
2228
+ "eval_accuracy_safe": 0.6587715544658655,
2229
+ "eval_accuracy_unlabeled": NaN,
2230
+ "eval_accuracy_unsafe": 0.9386905578378355,
2231
+ "eval_iou_safe": 0.28676309565062713,
2232
+ "eval_iou_unlabeled": 0.0,
2233
+ "eval_iou_unsafe": 0.9290998927343179,
2234
+ "eval_loss": 0.5313962697982788,
2235
+ "eval_mean_accuracy": 0.7987310561518506,
2236
+ "eval_mean_iou": 0.4052876627949817,
2237
+ "eval_overall_accuracy": 0.9304221993062034,
2238
+ "eval_runtime": 9.5415,
2239
+ "eval_samples_per_second": 7.022,
2240
+ "eval_steps_per_second": 0.524,
2241
+ "step": 290
2242
+ },
2243
+ {
2244
+ "epoch": 26.45,
2245
+ "learning_rate": 3.7380191693290736e-07,
2246
+ "loss": 0.5519,
2247
+ "step": 291
2248
+ },
2249
+ {
2250
+ "epoch": 26.55,
2251
+ "learning_rate": 3.6421725239616615e-07,
2252
+ "loss": 0.5424,
2253
+ "step": 292
2254
+ },
2255
+ {
2256
+ "epoch": 26.64,
2257
+ "learning_rate": 3.5463258785942494e-07,
2258
+ "loss": 0.583,
2259
+ "step": 293
2260
+ },
2261
+ {
2262
+ "epoch": 26.73,
2263
+ "learning_rate": 3.450479233226837e-07,
2264
+ "loss": 0.5798,
2265
+ "step": 294
2266
+ },
2267
+ {
2268
+ "epoch": 26.82,
2269
+ "learning_rate": 3.3546325878594247e-07,
2270
+ "loss": 0.5284,
2271
+ "step": 295
2272
+ },
2273
+ {
2274
+ "epoch": 26.91,
2275
+ "learning_rate": 3.2587859424920126e-07,
2276
+ "loss": 0.5681,
2277
+ "step": 296
2278
+ },
2279
+ {
2280
+ "epoch": 27.0,
2281
+ "learning_rate": 3.1629392971246005e-07,
2282
+ "loss": 0.6352,
2283
+ "step": 297
2284
+ },
2285
+ {
2286
+ "epoch": 27.09,
2287
+ "learning_rate": 3.0670926517571884e-07,
2288
+ "loss": 0.5651,
2289
+ "step": 298
2290
+ },
2291
+ {
2292
+ "epoch": 27.18,
2293
+ "learning_rate": 2.9712460063897763e-07,
2294
+ "loss": 0.5707,
2295
+ "step": 299
2296
+ },
2297
+ {
2298
+ "epoch": 27.27,
2299
+ "learning_rate": 2.875399361022364e-07,
2300
+ "loss": 0.5758,
2301
+ "step": 300
2302
+ },
2303
+ {
2304
+ "epoch": 27.27,
2305
+ "eval_accuracy_safe": 0.6544115095932552,
2306
+ "eval_accuracy_unlabeled": NaN,
2307
+ "eval_accuracy_unsafe": 0.9423355893036522,
2308
+ "eval_iou_safe": 0.291325116977104,
2309
+ "eval_iou_unlabeled": 0.0,
2310
+ "eval_iou_unsafe": 0.9325746804551616,
2311
+ "eval_loss": 0.526845395565033,
2312
+ "eval_mean_accuracy": 0.7983735494484537,
2313
+ "eval_mean_iou": 0.40796659914408856,
2314
+ "eval_overall_accuracy": 0.9338307736524895,
2315
+ "eval_runtime": 10.1793,
2316
+ "eval_samples_per_second": 6.582,
2317
+ "eval_steps_per_second": 0.491,
2318
+ "step": 300
2319
+ },
2320
+ {
2321
+ "epoch": 27.36,
2322
+ "learning_rate": 2.779552715654952e-07,
2323
+ "loss": 0.5541,
2324
+ "step": 301
2325
+ },
2326
+ {
2327
+ "epoch": 27.45,
2328
+ "learning_rate": 2.68370607028754e-07,
2329
+ "loss": 0.5143,
2330
+ "step": 302
2331
+ },
2332
+ {
2333
+ "epoch": 27.55,
2334
+ "learning_rate": 2.587859424920128e-07,
2335
+ "loss": 0.5392,
2336
+ "step": 303
2337
+ },
2338
+ {
2339
+ "epoch": 27.64,
2340
+ "learning_rate": 2.4920127795527154e-07,
2341
+ "loss": 0.5803,
2342
+ "step": 304
2343
+ },
2344
+ {
2345
+ "epoch": 27.73,
2346
+ "learning_rate": 2.3961661341853033e-07,
2347
+ "loss": 0.5733,
2348
+ "step": 305
2349
+ },
2350
+ {
2351
+ "epoch": 27.82,
2352
+ "learning_rate": 2.3003194888178915e-07,
2353
+ "loss": 0.5799,
2354
+ "step": 306
2355
+ },
2356
+ {
2357
+ "epoch": 27.91,
2358
+ "learning_rate": 2.204472843450479e-07,
2359
+ "loss": 0.5737,
2360
+ "step": 307
2361
+ },
2362
+ {
2363
+ "epoch": 28.0,
2364
+ "learning_rate": 2.108626198083067e-07,
2365
+ "loss": 0.507,
2366
+ "step": 308
2367
+ },
2368
+ {
2369
+ "epoch": 28.09,
2370
+ "learning_rate": 2.012779552715655e-07,
2371
+ "loss": 0.5913,
2372
+ "step": 309
2373
+ },
2374
+ {
2375
+ "epoch": 28.18,
2376
+ "learning_rate": 1.9169329073482428e-07,
2377
+ "loss": 0.5598,
2378
+ "step": 310
2379
+ },
2380
+ {
2381
+ "epoch": 28.18,
2382
+ "eval_accuracy_safe": 0.6604831901187737,
2383
+ "eval_accuracy_unlabeled": NaN,
2384
+ "eval_accuracy_unsafe": 0.9407892567641855,
2385
+ "eval_iou_safe": 0.2896690945241332,
2386
+ "eval_iou_unlabeled": 0.0,
2387
+ "eval_iou_unsafe": 0.9312167321135931,
2388
+ "eval_loss": 0.5239936709403992,
2389
+ "eval_mean_accuracy": 0.8006362234414796,
2390
+ "eval_mean_iou": 0.4069619422125754,
2391
+ "eval_overall_accuracy": 0.9325094650040812,
2392
+ "eval_runtime": 9.6243,
2393
+ "eval_samples_per_second": 6.962,
2394
+ "eval_steps_per_second": 0.52,
2395
+ "step": 310
2396
+ },
2397
+ {
2398
+ "epoch": 28.27,
2399
+ "learning_rate": 1.8210862619808307e-07,
2400
+ "loss": 0.5394,
2401
+ "step": 311
2402
+ },
2403
+ {
2404
+ "epoch": 28.36,
2405
+ "learning_rate": 1.7252396166134184e-07,
2406
+ "loss": 0.5312,
2407
+ "step": 312
2408
+ },
2409
+ {
2410
+ "epoch": 28.45,
2411
+ "learning_rate": 1.6293929712460063e-07,
2412
+ "loss": 0.5313,
2413
+ "step": 313
2414
+ },
2415
+ {
2416
+ "epoch": 28.55,
2417
+ "learning_rate": 1.5335463258785942e-07,
2418
+ "loss": 0.5188,
2419
+ "step": 314
2420
+ },
2421
+ {
2422
+ "epoch": 28.64,
2423
+ "learning_rate": 1.437699680511182e-07,
2424
+ "loss": 0.5497,
2425
+ "step": 315
2426
+ },
2427
+ {
2428
+ "epoch": 28.73,
2429
+ "learning_rate": 1.34185303514377e-07,
2430
+ "loss": 0.5908,
2431
+ "step": 316
2432
+ },
2433
+ {
2434
+ "epoch": 28.82,
2435
+ "learning_rate": 1.2460063897763577e-07,
2436
+ "loss": 0.56,
2437
+ "step": 317
2438
+ },
2439
+ {
2440
+ "epoch": 28.91,
2441
+ "learning_rate": 1.1501597444089457e-07,
2442
+ "loss": 0.5792,
2443
+ "step": 318
2444
+ },
2445
+ {
2446
+ "epoch": 29.0,
2447
+ "learning_rate": 1.0543130990415335e-07,
2448
+ "loss": 0.6318,
2449
+ "step": 319
2450
+ },
2451
+ {
2452
+ "epoch": 29.09,
2453
+ "learning_rate": 9.584664536741214e-08,
2454
+ "loss": 0.5505,
2455
+ "step": 320
2456
+ },
2457
+ {
2458
+ "epoch": 29.09,
2459
+ "eval_accuracy_safe": 0.6582414871183997,
2460
+ "eval_accuracy_unlabeled": NaN,
2461
+ "eval_accuracy_unsafe": 0.9420817295738547,
2462
+ "eval_iou_safe": 0.29588640634788055,
2463
+ "eval_iou_unlabeled": 0.0,
2464
+ "eval_iou_unsafe": 0.9324414181256692,
2465
+ "eval_loss": 0.5165032744407654,
2466
+ "eval_mean_accuracy": 0.8001616083461272,
2467
+ "eval_mean_iou": 0.4094426081578499,
2468
+ "eval_overall_accuracy": 0.933697543927093,
2469
+ "eval_runtime": 11.4418,
2470
+ "eval_samples_per_second": 5.856,
2471
+ "eval_steps_per_second": 0.437,
2472
+ "step": 320
2473
+ },
2474
+ {
2475
+ "epoch": 29.18,
2476
+ "learning_rate": 1.3160919540229885e-06,
2477
+ "loss": 0.5725,
2478
+ "step": 321
2479
+ },
2480
+ {
2481
+ "epoch": 29.27,
2482
+ "learning_rate": 1.310344827586207e-06,
2483
+ "loss": 0.5195,
2484
+ "step": 322
2485
+ },
2486
+ {
2487
+ "epoch": 29.36,
2488
+ "learning_rate": 1.3045977011494253e-06,
2489
+ "loss": 0.5441,
2490
+ "step": 323
2491
+ },
2492
+ {
2493
+ "epoch": 29.45,
2494
+ "learning_rate": 1.2988505747126436e-06,
2495
+ "loss": 0.5896,
2496
+ "step": 324
2497
+ },
2498
+ {
2499
+ "epoch": 29.55,
2500
+ "learning_rate": 1.293103448275862e-06,
2501
+ "loss": 0.5837,
2502
+ "step": 325
2503
+ },
2504
+ {
2505
+ "epoch": 29.64,
2506
+ "learning_rate": 1.2873563218390806e-06,
2507
+ "loss": 0.5317,
2508
+ "step": 326
2509
+ },
2510
+ {
2511
+ "epoch": 29.73,
2512
+ "learning_rate": 1.2816091954022989e-06,
2513
+ "loss": 0.5395,
2514
+ "step": 327
2515
+ },
2516
+ {
2517
+ "epoch": 29.82,
2518
+ "learning_rate": 1.2758620689655172e-06,
2519
+ "loss": 0.5642,
2520
+ "step": 328
2521
+ },
2522
+ {
2523
+ "epoch": 29.91,
2524
+ "learning_rate": 1.2701149425287357e-06,
2525
+ "loss": 0.5314,
2526
+ "step": 329
2527
+ },
2528
+ {
2529
+ "epoch": 30.0,
2530
+ "learning_rate": 1.2643678160919542e-06,
2531
+ "loss": 0.5754,
2532
+ "step": 330
2533
+ },
2534
+ {
2535
+ "epoch": 30.0,
2536
+ "eval_accuracy_safe": 0.657778882887884,
2537
+ "eval_accuracy_unlabeled": NaN,
2538
+ "eval_accuracy_unsafe": 0.9432738201330771,
2539
+ "eval_iou_safe": 0.2958553359937371,
2540
+ "eval_iou_unlabeled": 0.0,
2541
+ "eval_iou_unsafe": 0.9336061303908306,
2542
+ "eval_loss": 0.5145326852798462,
2543
+ "eval_mean_accuracy": 0.8005263515104806,
2544
+ "eval_mean_iou": 0.40982048879485594,
2545
+ "eval_overall_accuracy": 0.9348407574553987,
2546
+ "eval_runtime": 8.5617,
2547
+ "eval_samples_per_second": 7.826,
2548
+ "eval_steps_per_second": 0.584,
2549
+ "step": 330
2550
+ },
2551
+ {
2552
+ "epoch": 30.09,
2553
+ "learning_rate": 1.2586206896551725e-06,
2554
+ "loss": 0.5332,
2555
+ "step": 331
2556
+ },
2557
+ {
2558
+ "epoch": 30.18,
2559
+ "learning_rate": 1.252873563218391e-06,
2560
+ "loss": 0.5386,
2561
+ "step": 332
2562
+ },
2563
+ {
2564
+ "epoch": 30.27,
2565
+ "learning_rate": 1.2471264367816092e-06,
2566
+ "loss": 0.5446,
2567
+ "step": 333
2568
+ },
2569
+ {
2570
+ "epoch": 30.36,
2571
+ "learning_rate": 1.2413793103448275e-06,
2572
+ "loss": 0.524,
2573
+ "step": 334
2574
+ },
2575
+ {
2576
+ "epoch": 30.45,
2577
+ "learning_rate": 1.235632183908046e-06,
2578
+ "loss": 0.5337,
2579
+ "step": 335
2580
+ },
2581
+ {
2582
+ "epoch": 30.55,
2583
+ "learning_rate": 1.2298850574712645e-06,
2584
+ "loss": 0.5228,
2585
+ "step": 336
2586
+ },
2587
+ {
2588
+ "epoch": 30.64,
2589
+ "learning_rate": 1.2241379310344828e-06,
2590
+ "loss": 0.5856,
2591
+ "step": 337
2592
+ },
2593
+ {
2594
+ "epoch": 30.73,
2595
+ "learning_rate": 1.2183908045977011e-06,
2596
+ "loss": 0.5221,
2597
+ "step": 338
2598
+ },
2599
+ {
2600
+ "epoch": 30.82,
2601
+ "learning_rate": 1.2126436781609196e-06,
2602
+ "loss": 0.5505,
2603
+ "step": 339
2604
+ },
2605
+ {
2606
+ "epoch": 30.91,
2607
+ "learning_rate": 1.206896551724138e-06,
2608
+ "loss": 0.5284,
2609
+ "step": 340
2610
+ },
2611
+ {
2612
+ "epoch": 30.91,
2613
+ "eval_accuracy_safe": 0.6718902394362396,
2614
+ "eval_accuracy_unlabeled": NaN,
2615
+ "eval_accuracy_unsafe": 0.9410974437668724,
2616
+ "eval_iou_safe": 0.29405467602594526,
2617
+ "eval_iou_unlabeled": 0.0,
2618
+ "eval_iou_unsafe": 0.9318466838959976,
2619
+ "eval_loss": 0.5174660086631775,
2620
+ "eval_mean_accuracy": 0.806493841601556,
2621
+ "eval_mean_iou": 0.4086337866406476,
2622
+ "eval_overall_accuracy": 0.933145494603399,
2623
+ "eval_runtime": 8.5465,
2624
+ "eval_samples_per_second": 7.839,
2625
+ "eval_steps_per_second": 0.585,
2626
+ "step": 340
2627
+ },
2628
+ {
2629
+ "epoch": 31.0,
2630
+ "learning_rate": 1.2011494252873564e-06,
2631
+ "loss": 0.5315,
2632
+ "step": 341
2633
+ },
2634
+ {
2635
+ "epoch": 31.09,
2636
+ "learning_rate": 1.1954022988505747e-06,
2637
+ "loss": 0.511,
2638
+ "step": 342
2639
+ },
2640
+ {
2641
+ "epoch": 31.18,
2642
+ "learning_rate": 1.1896551724137932e-06,
2643
+ "loss": 0.5607,
2644
+ "step": 343
2645
+ },
2646
+ {
2647
+ "epoch": 31.27,
2648
+ "learning_rate": 1.1839080459770115e-06,
2649
+ "loss": 0.5254,
2650
+ "step": 344
2651
+ },
2652
+ {
2653
+ "epoch": 31.36,
2654
+ "learning_rate": 1.1781609195402298e-06,
2655
+ "loss": 0.4814,
2656
+ "step": 345
2657
+ },
2658
+ {
2659
+ "epoch": 31.45,
2660
+ "learning_rate": 1.1724137931034483e-06,
2661
+ "loss": 0.5376,
2662
+ "step": 346
2663
+ },
2664
+ {
2665
+ "epoch": 31.55,
2666
+ "learning_rate": 1.1666666666666668e-06,
2667
+ "loss": 0.5253,
2668
+ "step": 347
2669
+ },
2670
+ {
2671
+ "epoch": 31.64,
2672
+ "learning_rate": 1.160919540229885e-06,
2673
+ "loss": 0.5591,
2674
+ "step": 348
2675
+ },
2676
+ {
2677
+ "epoch": 31.73,
2678
+ "learning_rate": 1.1551724137931034e-06,
2679
+ "loss": 0.5161,
2680
+ "step": 349
2681
+ },
2682
+ {
2683
+ "epoch": 31.82,
2684
+ "learning_rate": 1.1494252873563219e-06,
2685
+ "loss": 0.5463,
2686
+ "step": 350
2687
+ },
2688
+ {
2689
+ "epoch": 31.82,
2690
+ "eval_accuracy_safe": 0.6683590271433032,
2691
+ "eval_accuracy_unlabeled": NaN,
2692
+ "eval_accuracy_unsafe": 0.9448280729553086,
2693
+ "eval_iou_safe": 0.3019912053572595,
2694
+ "eval_iou_unlabeled": 0.0,
2695
+ "eval_iou_unsafe": 0.9354427723232134,
2696
+ "eval_loss": 0.5016354918479919,
2697
+ "eval_mean_accuracy": 0.8065935500493059,
2698
+ "eval_mean_iou": 0.4124779925601576,
2699
+ "eval_overall_accuracy": 0.9366616206382637,
2700
+ "eval_runtime": 8.7504,
2701
+ "eval_samples_per_second": 7.657,
2702
+ "eval_steps_per_second": 0.571,
2703
+ "step": 350
2704
+ },
2705
+ {
2706
+ "epoch": 31.91,
2707
+ "learning_rate": 1.1436781609195402e-06,
2708
+ "loss": 0.4994,
2709
+ "step": 351
2710
+ },
2711
+ {
2712
+ "epoch": 32.0,
2713
+ "learning_rate": 1.1379310344827587e-06,
2714
+ "loss": 0.5251,
2715
+ "step": 352
2716
+ },
2717
+ {
2718
+ "epoch": 32.09,
2719
+ "learning_rate": 1.1321839080459772e-06,
2720
+ "loss": 0.5379,
2721
+ "step": 353
2722
+ },
2723
+ {
2724
+ "epoch": 32.18,
2725
+ "learning_rate": 1.1264367816091955e-06,
2726
+ "loss": 0.4885,
2727
+ "step": 354
2728
+ },
2729
+ {
2730
+ "epoch": 32.27,
2731
+ "learning_rate": 1.1206896551724137e-06,
2732
+ "loss": 0.5029,
2733
+ "step": 355
2734
+ },
2735
+ {
2736
+ "epoch": 32.36,
2737
+ "learning_rate": 1.1149425287356322e-06,
2738
+ "loss": 0.5273,
2739
+ "step": 356
2740
+ },
2741
+ {
2742
+ "epoch": 32.45,
2743
+ "learning_rate": 1.1091954022988505e-06,
2744
+ "loss": 0.5111,
2745
+ "step": 357
2746
+ },
2747
+ {
2748
+ "epoch": 32.55,
2749
+ "learning_rate": 1.103448275862069e-06,
2750
+ "loss": 0.5102,
2751
+ "step": 358
2752
+ },
2753
+ {
2754
+ "epoch": 32.64,
2755
+ "learning_rate": 1.0977011494252873e-06,
2756
+ "loss": 0.5197,
2757
+ "step": 359
2758
+ },
2759
+ {
2760
+ "epoch": 32.73,
2761
+ "learning_rate": 1.0919540229885058e-06,
2762
+ "loss": 0.4923,
2763
+ "step": 360
2764
+ },
2765
+ {
2766
+ "epoch": 32.73,
2767
+ "eval_accuracy_safe": 0.6687907910917845,
2768
+ "eval_accuracy_unlabeled": NaN,
2769
+ "eval_accuracy_unsafe": 0.9462536065154241,
2770
+ "eval_iou_safe": 0.3065972713134455,
2771
+ "eval_iou_unlabeled": 0.0,
2772
+ "eval_iou_unsafe": 0.936872865769379,
2773
+ "eval_loss": 0.4946950674057007,
2774
+ "eval_mean_accuracy": 0.8075221988036043,
2775
+ "eval_mean_iou": 0.41449004569427483,
2776
+ "eval_overall_accuracy": 0.9380577998374825,
2777
+ "eval_runtime": 9.7999,
2778
+ "eval_samples_per_second": 6.837,
2779
+ "eval_steps_per_second": 0.51,
2780
+ "step": 360
2781
+ },
2782
+ {
2783
+ "epoch": 32.82,
2784
+ "learning_rate": 1.0862068965517241e-06,
2785
+ "loss": 0.4919,
2786
+ "step": 361
2787
+ },
2788
+ {
2789
+ "epoch": 32.91,
2790
+ "learning_rate": 1.0804597701149424e-06,
2791
+ "loss": 0.5359,
2792
+ "step": 362
2793
+ },
2794
+ {
2795
+ "epoch": 33.0,
2796
+ "learning_rate": 1.0747126436781611e-06,
2797
+ "loss": 0.5646,
2798
+ "step": 363
2799
+ },
2800
+ {
2801
+ "epoch": 33.09,
2802
+ "learning_rate": 1.0689655172413794e-06,
2803
+ "loss": 0.5186,
2804
+ "step": 364
2805
+ },
2806
+ {
2807
+ "epoch": 33.18,
2808
+ "learning_rate": 1.0632183908045977e-06,
2809
+ "loss": 0.4801,
2810
+ "step": 365
2811
+ },
2812
+ {
2813
+ "epoch": 33.27,
2814
+ "learning_rate": 1.057471264367816e-06,
2815
+ "loss": 0.4874,
2816
+ "step": 366
2817
+ },
2818
+ {
2819
+ "epoch": 33.36,
2820
+ "learning_rate": 1.0517241379310345e-06,
2821
+ "loss": 0.5092,
2822
+ "step": 367
2823
+ },
2824
+ {
2825
+ "epoch": 33.45,
2826
+ "learning_rate": 1.045977011494253e-06,
2827
+ "loss": 0.503,
2828
+ "step": 368
2829
+ },
2830
+ {
2831
+ "epoch": 33.55,
2832
+ "learning_rate": 1.0402298850574713e-06,
2833
+ "loss": 0.5327,
2834
+ "step": 369
2835
+ },
2836
+ {
2837
+ "epoch": 33.64,
2838
+ "learning_rate": 1.0344827586206898e-06,
2839
+ "loss": 0.4922,
2840
+ "step": 370
2841
+ },
2842
+ {
2843
+ "epoch": 33.64,
2844
+ "eval_accuracy_safe": 0.6685016634477122,
2845
+ "eval_accuracy_unlabeled": NaN,
2846
+ "eval_accuracy_unsafe": 0.9503706868340143,
2847
+ "eval_iou_safe": 0.3165045602136191,
2848
+ "eval_iou_unlabeled": 0.0,
2849
+ "eval_iou_unsafe": 0.9409432282460215,
2850
+ "eval_loss": 0.4738222360610962,
2851
+ "eval_mean_accuracy": 0.8094361751408632,
2852
+ "eval_mean_iou": 0.41914926281988024,
2853
+ "eval_overall_accuracy": 0.9420447278378615,
2854
+ "eval_runtime": 10.1885,
2855
+ "eval_samples_per_second": 6.576,
2856
+ "eval_steps_per_second": 0.491,
2857
+ "step": 370
2858
+ },
2859
+ {
2860
+ "epoch": 33.73,
2861
+ "learning_rate": 1.028735632183908e-06,
2862
+ "loss": 0.5358,
2863
+ "step": 371
2864
+ },
2865
+ {
2866
+ "epoch": 33.82,
2867
+ "learning_rate": 1.0229885057471264e-06,
2868
+ "loss": 0.4633,
2869
+ "step": 372
2870
+ },
2871
+ {
2872
+ "epoch": 33.91,
2873
+ "learning_rate": 1.0172413793103449e-06,
2874
+ "loss": 0.4886,
2875
+ "step": 373
2876
+ },
2877
+ {
2878
+ "epoch": 34.0,
2879
+ "learning_rate": 1.0114942528735634e-06,
2880
+ "loss": 0.531,
2881
+ "step": 374
2882
+ },
2883
+ {
2884
+ "epoch": 34.09,
2885
+ "learning_rate": 1.0057471264367817e-06,
2886
+ "loss": 0.5054,
2887
+ "step": 375
2888
+ },
2889
+ {
2890
+ "epoch": 34.18,
2891
+ "learning_rate": 1e-06,
2892
+ "loss": 0.498,
2893
+ "step": 376
2894
+ },
2895
+ {
2896
+ "epoch": 34.27,
2897
+ "learning_rate": 9.942528735632185e-07,
2898
+ "loss": 0.5071,
2899
+ "step": 377
2900
+ },
2901
+ {
2902
+ "epoch": 34.36,
2903
+ "learning_rate": 9.885057471264367e-07,
2904
+ "loss": 0.4907,
2905
+ "step": 378
2906
+ },
2907
+ {
2908
+ "epoch": 34.45,
2909
+ "learning_rate": 9.827586206896552e-07,
2910
+ "loss": 0.4967,
2911
+ "step": 379
2912
+ },
2913
+ {
2914
+ "epoch": 34.55,
2915
+ "learning_rate": 9.770114942528735e-07,
2916
+ "loss": 0.4976,
2917
+ "step": 380
2918
+ },
2919
+ {
2920
+ "epoch": 34.55,
2921
+ "eval_accuracy_safe": 0.6747757333240813,
2922
+ "eval_accuracy_unlabeled": NaN,
2923
+ "eval_accuracy_unsafe": 0.9535474829165368,
2924
+ "eval_iou_safe": 0.3232939737984814,
2925
+ "eval_iou_unlabeled": 0.0,
2926
+ "eval_iou_unsafe": 0.944264577460996,
2927
+ "eval_loss": 0.46629098057746887,
2928
+ "eval_mean_accuracy": 0.814161608120309,
2929
+ "eval_mean_iou": 0.42251951708649244,
2930
+ "eval_overall_accuracy": 0.9453130124220207,
2931
+ "eval_runtime": 8.7895,
2932
+ "eval_samples_per_second": 7.623,
2933
+ "eval_steps_per_second": 0.569,
2934
+ "step": 380
2935
+ },
2936
+ {
2937
+ "epoch": 34.64,
2938
+ "learning_rate": 9.71264367816092e-07,
2939
+ "loss": 0.4647,
2940
+ "step": 381
2941
+ },
2942
+ {
2943
+ "epoch": 34.73,
2944
+ "learning_rate": 9.655172413793103e-07,
2945
+ "loss": 0.4782,
2946
+ "step": 382
2947
+ },
2948
+ {
2949
+ "epoch": 34.82,
2950
+ "learning_rate": 9.597701149425286e-07,
2951
+ "loss": 0.4785,
2952
+ "step": 383
2953
+ },
2954
+ {
2955
+ "epoch": 34.91,
2956
+ "learning_rate": 9.540229885057471e-07,
2957
+ "loss": 0.4996,
2958
+ "step": 384
2959
+ },
2960
+ {
2961
+ "epoch": 35.0,
2962
+ "learning_rate": 9.482758620689655e-07,
2963
+ "loss": 0.437,
2964
+ "step": 385
2965
+ },
2966
+ {
2967
+ "epoch": 35.09,
2968
+ "learning_rate": 9.425287356321839e-07,
2969
+ "loss": 0.4617,
2970
+ "step": 386
2971
+ },
2972
+ {
2973
+ "epoch": 35.18,
2974
+ "learning_rate": 9.367816091954024e-07,
2975
+ "loss": 0.4486,
2976
+ "step": 387
2977
+ },
2978
+ {
2979
+ "epoch": 35.27,
2980
+ "learning_rate": 9.310344827586207e-07,
2981
+ "loss": 0.5012,
2982
+ "step": 388
2983
+ },
2984
+ {
2985
+ "epoch": 35.36,
2986
+ "learning_rate": 9.252873563218391e-07,
2987
+ "loss": 0.4752,
2988
+ "step": 389
2989
+ },
2990
+ {
2991
+ "epoch": 35.45,
2992
+ "learning_rate": 9.195402298850574e-07,
2993
+ "loss": 0.4922,
2994
+ "step": 390
2995
+ },
2996
+ {
2997
+ "epoch": 35.45,
2998
+ "eval_accuracy_safe": 0.650909210064726,
2999
+ "eval_accuracy_unlabeled": NaN,
3000
+ "eval_accuracy_unsafe": 0.9652786537349766,
3001
+ "eval_iou_safe": 0.3483788236580638,
3002
+ "eval_iou_unlabeled": 0.0,
3003
+ "eval_iou_unsafe": 0.9551696231808672,
3004
+ "eval_loss": 0.4295278489589691,
3005
+ "eval_mean_accuracy": 0.8080939318998512,
3006
+ "eval_mean_iou": 0.4345161489463103,
3007
+ "eval_overall_accuracy": 0.9559926844354886,
3008
+ "eval_runtime": 9.5593,
3009
+ "eval_samples_per_second": 7.009,
3010
+ "eval_steps_per_second": 0.523,
3011
+ "step": 390
3012
+ },
3013
+ {
3014
+ "epoch": 35.55,
3015
+ "learning_rate": 9.137931034482759e-07,
3016
+ "loss": 0.4963,
3017
+ "step": 391
3018
+ },
3019
+ {
3020
+ "epoch": 35.64,
3021
+ "learning_rate": 9.080459770114943e-07,
3022
+ "loss": 0.4951,
3023
+ "step": 392
3024
+ },
3025
+ {
3026
+ "epoch": 35.73,
3027
+ "learning_rate": 9.022988505747126e-07,
3028
+ "loss": 0.4667,
3029
+ "step": 393
3030
+ },
3031
+ {
3032
+ "epoch": 35.82,
3033
+ "learning_rate": 8.965517241379311e-07,
3034
+ "loss": 0.4694,
3035
+ "step": 394
3036
+ },
3037
+ {
3038
+ "epoch": 35.91,
3039
+ "learning_rate": 8.908045977011495e-07,
3040
+ "loss": 0.471,
3041
+ "step": 395
3042
+ },
3043
+ {
3044
+ "epoch": 36.0,
3045
+ "learning_rate": 8.850574712643678e-07,
3046
+ "loss": 0.5268,
3047
+ "step": 396
3048
+ },
3049
+ {
3050
+ "epoch": 36.09,
3051
+ "learning_rate": 8.793103448275862e-07,
3052
+ "loss": 0.4383,
3053
+ "step": 397
3054
+ },
3055
+ {
3056
+ "epoch": 36.18,
3057
+ "learning_rate": 8.735632183908047e-07,
3058
+ "loss": 0.48,
3059
+ "step": 398
3060
+ },
3061
+ {
3062
+ "epoch": 36.27,
3063
+ "learning_rate": 8.67816091954023e-07,
3064
+ "loss": 0.4727,
3065
+ "step": 399
3066
+ },
3067
+ {
3068
+ "epoch": 36.36,
3069
+ "learning_rate": 8.620689655172414e-07,
3070
+ "loss": 0.4608,
3071
+ "step": 400
3072
+ },
3073
+ {
3074
+ "epoch": 36.36,
3075
+ "eval_accuracy_safe": 0.6580178950736505,
3076
+ "eval_accuracy_unlabeled": NaN,
3077
+ "eval_accuracy_unsafe": 0.9636894929998194,
3078
+ "eval_iou_safe": 0.35071600798452407,
3079
+ "eval_iou_unlabeled": 0.0,
3080
+ "eval_iou_unsafe": 0.9538031459361976,
3081
+ "eval_loss": 0.44339337944984436,
3082
+ "eval_mean_accuracy": 0.810853694036735,
3083
+ "eval_mean_iou": 0.4348397179735739,
3084
+ "eval_overall_accuracy": 0.9546604441173041,
3085
+ "eval_runtime": 9.0957,
3086
+ "eval_samples_per_second": 7.366,
3087
+ "eval_steps_per_second": 0.55,
3088
+ "step": 400
3089
  }
3090
  ],
3091
+ "max_steps": 550,
3092
+ "num_train_epochs": 50,
3093
+ "total_flos": 2.2369619168911688e+18,
3094
  "trial_name": null,
3095
  "trial_params": null
3096
  }
{checkpoint-200 β†’ checkpoint-400}/training_args.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f030ee6346022874816800d95eb680870a6f0608d7f7d70d11613eaa9ed9ab3
3
  size 4155
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f697330840b2c8edcf38f52d8f9d3ff8699296fe028ab72ebfa8c7f0ffa9e501
3
  size 4155
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d99ed0b372c42b217b30d271e9669c849981b78d4e728284a629d54daf3fe948
3
  size 338796489
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be03cc2a8293c04c55f9def52f92927e02d3469ef2fa6683e2b8860f35537827
3
  size 338796489
runs/Feb07_22-35-51_robovision.csres.utexas.edu/events.out.tfevents.1707366957.robovision.csres.utexas.edu.754189.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04127becb52cd254ec08d45cd19f991605fd2af3597f6936155bb2983c5b9585
3
- size 14155
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:463f8d9cd683ec2b7fd6c5abd3e67bb04ebfb29112a9418caebd195992048af4
3
+ size 23559