sam1120 committed on
Commit
ff657d7
•
1 Parent(s): cb622cf

Training in progress, step 320

Browse files
{checkpoint-120 → checkpoint-320}/config.json RENAMED
File without changes
{checkpoint-120 → checkpoint-320}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0a0b8f8fa238bda226b9b536c2b6ca08f45cb34421e13d6c66ca83b071f322ed
3
- size 677455103
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15ceff5290a696dfc950965cfc2401833f617bcb0e78d9e593f50368e218d888
3
+ size 677456319
{checkpoint-120 → checkpoint-320}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c766452e39d4a3b19bc433ad1b8e0ef99636b21632c3752fdd48b17ff02b73ba
3
  size 338796489
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8f1820205b4b98713df2a49ff37a9a65771547246a6b06bb8594ee68aa08012
3
  size 338796489
{checkpoint-120 → checkpoint-320}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8498eb2343beddb85ffcc133ccb294e09d3f4149f2d49947ba2c257937583963
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0660d6831501b7ffc617750340e6664c7ef6f4f765e3dcbb8057a746a50c104b
3
  size 14575
{checkpoint-120 → checkpoint-320}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a203cfafd7b21afdd3e3a99a270006d632619b10442f125bd17f5039f93e556b
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d55b28c4f509a3a5a4f57e5a695e1f6bb36e94dddd8abd6cbf432b0c2feb6809
3
  size 627
{checkpoint-120 → checkpoint-320}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.7439588308334351,
3
- "best_model_checkpoint": "/robodata/smodak/Projects/nspl/scripts/terrainseg/training/models/safety-utcustom-train-SF-RGB-b5/checkpoint-120",
4
- "epoch": 10.909090909090908,
5
- "global_step": 120,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -930,11 +930,1551 @@
930
  "eval_samples_per_second": 7.053,
931
  "eval_steps_per_second": 0.526,
932
  "step": 120
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
933
  }
934
  ],
935
  "max_steps": 330,
936
  "num_train_epochs": 30,
937
- "total_flos": 6.746012918533325e+17,
938
  "trial_name": null,
939
  "trial_params": null
940
  }
 
1
  {
2
+ "best_metric": 0.5165032744407654,
3
+ "best_model_checkpoint": "/robodata/smodak/Projects/nspl/scripts/terrainseg/training/models/safety-utcustom-train-SF-RGB-b5/checkpoint-320",
4
+ "epoch": 29.09090909090909,
5
+ "global_step": 320,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
930
  "eval_samples_per_second": 7.053,
931
  "eval_steps_per_second": 0.526,
932
  "step": 120
933
+ },
934
+ {
935
+ "epoch": 11.0,
936
+ "learning_rate": 2.003194888178914e-06,
937
+ "loss": 0.8343,
938
+ "step": 121
939
+ },
940
+ {
941
+ "epoch": 11.09,
942
+ "learning_rate": 1.9936102236421723e-06,
943
+ "loss": 0.8413,
944
+ "step": 122
945
+ },
946
+ {
947
+ "epoch": 11.18,
948
+ "learning_rate": 1.9840255591054315e-06,
949
+ "loss": 0.8037,
950
+ "step": 123
951
+ },
952
+ {
953
+ "epoch": 11.27,
954
+ "learning_rate": 1.9744408945686903e-06,
955
+ "loss": 0.8284,
956
+ "step": 124
957
+ },
958
+ {
959
+ "epoch": 11.36,
960
+ "learning_rate": 1.9648562300319487e-06,
961
+ "loss": 0.8023,
962
+ "step": 125
963
+ },
964
+ {
965
+ "epoch": 11.45,
966
+ "learning_rate": 1.955271565495208e-06,
967
+ "loss": 0.8176,
968
+ "step": 126
969
+ },
970
+ {
971
+ "epoch": 11.55,
972
+ "learning_rate": 1.9456869009584667e-06,
973
+ "loss": 0.8078,
974
+ "step": 127
975
+ },
976
+ {
977
+ "epoch": 11.64,
978
+ "learning_rate": 1.936102236421725e-06,
979
+ "loss": 0.8074,
980
+ "step": 128
981
+ },
982
+ {
983
+ "epoch": 11.73,
984
+ "learning_rate": 1.9265175718849843e-06,
985
+ "loss": 0.8139,
986
+ "step": 129
987
+ },
988
+ {
989
+ "epoch": 11.82,
990
+ "learning_rate": 1.9169329073482426e-06,
991
+ "loss": 0.8152,
992
+ "step": 130
993
+ },
994
+ {
995
+ "epoch": 11.82,
996
+ "eval_accuracy_safe": 0.6688004286799203,
997
+ "eval_accuracy_unlabeled": NaN,
998
+ "eval_accuracy_unsafe": 0.8589712690862681,
999
+ "eval_iou_safe": 0.20063653201077156,
1000
+ "eval_iou_unlabeled": 0.0,
1001
+ "eval_iou_unsafe": 0.8506617582762998,
1002
+ "eval_loss": 0.7270171046257019,
1003
+ "eval_mean_accuracy": 0.7638858488830942,
1004
+ "eval_mean_iou": 0.3504327634290238,
1005
+ "eval_overall_accuracy": 0.8533539273845616,
1006
+ "eval_runtime": 11.0671,
1007
+ "eval_samples_per_second": 6.054,
1008
+ "eval_steps_per_second": 0.452,
1009
+ "step": 130
1010
+ },
1011
+ {
1012
+ "epoch": 11.91,
1013
+ "learning_rate": 1.9073482428115018e-06,
1014
+ "loss": 0.8102,
1015
+ "step": 131
1016
+ },
1017
+ {
1018
+ "epoch": 12.0,
1019
+ "learning_rate": 1.8977635782747604e-06,
1020
+ "loss": 0.8192,
1021
+ "step": 132
1022
+ },
1023
+ {
1024
+ "epoch": 12.09,
1025
+ "learning_rate": 1.888178913738019e-06,
1026
+ "loss": 0.8246,
1027
+ "step": 133
1028
+ },
1029
+ {
1030
+ "epoch": 12.18,
1031
+ "learning_rate": 1.878594249201278e-06,
1032
+ "loss": 0.7864,
1033
+ "step": 134
1034
+ },
1035
+ {
1036
+ "epoch": 12.27,
1037
+ "learning_rate": 1.8690095846645368e-06,
1038
+ "loss": 0.7718,
1039
+ "step": 135
1040
+ },
1041
+ {
1042
+ "epoch": 12.36,
1043
+ "learning_rate": 1.8594249201277954e-06,
1044
+ "loss": 0.8074,
1045
+ "step": 136
1046
+ },
1047
+ {
1048
+ "epoch": 12.45,
1049
+ "learning_rate": 1.8498402555910544e-06,
1050
+ "loss": 0.7569,
1051
+ "step": 137
1052
+ },
1053
+ {
1054
+ "epoch": 12.55,
1055
+ "learning_rate": 1.8402555910543132e-06,
1056
+ "loss": 0.7989,
1057
+ "step": 138
1058
+ },
1059
+ {
1060
+ "epoch": 12.64,
1061
+ "learning_rate": 1.8306709265175722e-06,
1062
+ "loss": 0.7987,
1063
+ "step": 139
1064
+ },
1065
+ {
1066
+ "epoch": 12.73,
1067
+ "learning_rate": 1.8210862619808307e-06,
1068
+ "loss": 0.7929,
1069
+ "step": 140
1070
+ },
1071
+ {
1072
+ "epoch": 12.73,
1073
+ "eval_accuracy_safe": 0.6659920354971646,
1074
+ "eval_accuracy_unlabeled": NaN,
1075
+ "eval_accuracy_unsafe": 0.8656634973410731,
1076
+ "eval_iou_safe": 0.20852726465106847,
1077
+ "eval_iou_unlabeled": 0.0,
1078
+ "eval_iou_unsafe": 0.8572303764577973,
1079
+ "eval_loss": 0.7045122981071472,
1080
+ "eval_mean_accuracy": 0.7658277664191189,
1081
+ "eval_mean_iou": 0.3552525470362886,
1082
+ "eval_overall_accuracy": 0.8597655225155959,
1083
+ "eval_runtime": 9.4502,
1084
+ "eval_samples_per_second": 7.09,
1085
+ "eval_steps_per_second": 0.529,
1086
+ "step": 140
1087
+ },
1088
+ {
1089
+ "epoch": 12.82,
1090
+ "learning_rate": 1.8115015974440893e-06,
1091
+ "loss": 0.7703,
1092
+ "step": 141
1093
+ },
1094
+ {
1095
+ "epoch": 12.91,
1096
+ "learning_rate": 1.8019169329073483e-06,
1097
+ "loss": 0.768,
1098
+ "step": 142
1099
+ },
1100
+ {
1101
+ "epoch": 13.0,
1102
+ "learning_rate": 1.7923322683706071e-06,
1103
+ "loss": 0.8397,
1104
+ "step": 143
1105
+ },
1106
+ {
1107
+ "epoch": 13.09,
1108
+ "learning_rate": 1.7827476038338657e-06,
1109
+ "loss": 0.775,
1110
+ "step": 144
1111
+ },
1112
+ {
1113
+ "epoch": 13.18,
1114
+ "learning_rate": 1.7731629392971247e-06,
1115
+ "loss": 0.7718,
1116
+ "step": 145
1117
+ },
1118
+ {
1119
+ "epoch": 13.27,
1120
+ "learning_rate": 1.7635782747603833e-06,
1121
+ "loss": 0.7544,
1122
+ "step": 146
1123
+ },
1124
+ {
1125
+ "epoch": 13.36,
1126
+ "learning_rate": 1.7539936102236423e-06,
1127
+ "loss": 0.7585,
1128
+ "step": 147
1129
+ },
1130
+ {
1131
+ "epoch": 13.45,
1132
+ "learning_rate": 1.744408945686901e-06,
1133
+ "loss": 0.742,
1134
+ "step": 148
1135
+ },
1136
+ {
1137
+ "epoch": 13.55,
1138
+ "learning_rate": 1.7348242811501597e-06,
1139
+ "loss": 0.7629,
1140
+ "step": 149
1141
+ },
1142
+ {
1143
+ "epoch": 13.64,
1144
+ "learning_rate": 1.7252396166134187e-06,
1145
+ "loss": 0.7568,
1146
+ "step": 150
1147
+ },
1148
+ {
1149
+ "epoch": 13.64,
1150
+ "eval_accuracy_safe": 0.657079193989229,
1151
+ "eval_accuracy_unlabeled": NaN,
1152
+ "eval_accuracy_unsafe": 0.8838084544735693,
1153
+ "eval_iou_safe": 0.21846087789622765,
1154
+ "eval_iou_unlabeled": 0.0,
1155
+ "eval_iou_unsafe": 0.874847055157359,
1156
+ "eval_loss": 0.6744459867477417,
1157
+ "eval_mean_accuracy": 0.7704438242313991,
1158
+ "eval_mean_iou": 0.3644359776845289,
1159
+ "eval_overall_accuracy": 0.8771112356612931,
1160
+ "eval_runtime": 10.8117,
1161
+ "eval_samples_per_second": 6.197,
1162
+ "eval_steps_per_second": 0.462,
1163
+ "step": 150
1164
+ },
1165
+ {
1166
+ "epoch": 13.73,
1167
+ "learning_rate": 1.7156549520766772e-06,
1168
+ "loss": 0.7311,
1169
+ "step": 151
1170
+ },
1171
+ {
1172
+ "epoch": 13.82,
1173
+ "learning_rate": 1.706070287539936e-06,
1174
+ "loss": 0.7352,
1175
+ "step": 152
1176
+ },
1177
+ {
1178
+ "epoch": 13.91,
1179
+ "learning_rate": 1.696485623003195e-06,
1180
+ "loss": 0.7661,
1181
+ "step": 153
1182
+ },
1183
+ {
1184
+ "epoch": 14.0,
1185
+ "learning_rate": 1.6869009584664536e-06,
1186
+ "loss": 0.7335,
1187
+ "step": 154
1188
+ },
1189
+ {
1190
+ "epoch": 14.09,
1191
+ "learning_rate": 1.6773162939297126e-06,
1192
+ "loss": 0.7491,
1193
+ "step": 155
1194
+ },
1195
+ {
1196
+ "epoch": 14.18,
1197
+ "learning_rate": 1.6677316293929714e-06,
1198
+ "loss": 0.715,
1199
+ "step": 156
1200
+ },
1201
+ {
1202
+ "epoch": 14.27,
1203
+ "learning_rate": 1.65814696485623e-06,
1204
+ "loss": 0.7349,
1205
+ "step": 157
1206
+ },
1207
+ {
1208
+ "epoch": 14.36,
1209
+ "learning_rate": 1.648562300319489e-06,
1210
+ "loss": 0.7127,
1211
+ "step": 158
1212
+ },
1213
+ {
1214
+ "epoch": 14.45,
1215
+ "learning_rate": 1.6389776357827476e-06,
1216
+ "loss": 0.718,
1217
+ "step": 159
1218
+ },
1219
+ {
1220
+ "epoch": 14.55,
1221
+ "learning_rate": 1.6293929712460064e-06,
1222
+ "loss": 0.7085,
1223
+ "step": 160
1224
+ },
1225
+ {
1226
+ "epoch": 14.55,
1227
+ "eval_accuracy_safe": 0.6519423595128777,
1228
+ "eval_accuracy_unlabeled": NaN,
1229
+ "eval_accuracy_unsafe": 0.8934174588611713,
1230
+ "eval_iou_safe": 0.2259934305828019,
1231
+ "eval_iou_unlabeled": 0.0,
1232
+ "eval_iou_unsafe": 0.8842020655315154,
1233
+ "eval_loss": 0.65559983253479,
1234
+ "eval_mean_accuracy": 0.7726799091870244,
1235
+ "eval_mean_iou": 0.3700651653714391,
1236
+ "eval_overall_accuracy": 0.8862846716126399,
1237
+ "eval_runtime": 9.325,
1238
+ "eval_samples_per_second": 7.185,
1239
+ "eval_steps_per_second": 0.536,
1240
+ "step": 160
1241
+ },
1242
+ {
1243
+ "epoch": 14.64,
1244
+ "learning_rate": 1.6198083067092654e-06,
1245
+ "loss": 0.753,
1246
+ "step": 161
1247
+ },
1248
+ {
1249
+ "epoch": 14.73,
1250
+ "learning_rate": 1.610223642172524e-06,
1251
+ "loss": 0.7376,
1252
+ "step": 162
1253
+ },
1254
+ {
1255
+ "epoch": 14.82,
1256
+ "learning_rate": 1.600638977635783e-06,
1257
+ "loss": 0.7256,
1258
+ "step": 163
1259
+ },
1260
+ {
1261
+ "epoch": 14.91,
1262
+ "learning_rate": 1.5910543130990415e-06,
1263
+ "loss": 0.7132,
1264
+ "step": 164
1265
+ },
1266
+ {
1267
+ "epoch": 15.0,
1268
+ "learning_rate": 1.5814696485623003e-06,
1269
+ "loss": 0.722,
1270
+ "step": 165
1271
+ },
1272
+ {
1273
+ "epoch": 15.09,
1274
+ "learning_rate": 1.5718849840255593e-06,
1275
+ "loss": 0.7015,
1276
+ "step": 166
1277
+ },
1278
+ {
1279
+ "epoch": 15.18,
1280
+ "learning_rate": 1.562300319488818e-06,
1281
+ "loss": 0.7176,
1282
+ "step": 167
1283
+ },
1284
+ {
1285
+ "epoch": 15.27,
1286
+ "learning_rate": 1.5527156549520765e-06,
1287
+ "loss": 0.7147,
1288
+ "step": 168
1289
+ },
1290
+ {
1291
+ "epoch": 15.36,
1292
+ "learning_rate": 1.5431309904153355e-06,
1293
+ "loss": 0.7217,
1294
+ "step": 169
1295
+ },
1296
+ {
1297
+ "epoch": 15.45,
1298
+ "learning_rate": 1.5335463258785943e-06,
1299
+ "loss": 0.7147,
1300
+ "step": 170
1301
+ },
1302
+ {
1303
+ "epoch": 15.45,
1304
+ "eval_accuracy_safe": 0.6561000150346374,
1305
+ "eval_accuracy_unlabeled": NaN,
1306
+ "eval_accuracy_unsafe": 0.8963761831582403,
1307
+ "eval_iou_safe": 0.22827906452703248,
1308
+ "eval_iou_unlabeled": 0.0,
1309
+ "eval_iou_unsafe": 0.8872234626234047,
1310
+ "eval_loss": 0.6508952975273132,
1311
+ "eval_mean_accuracy": 0.7762380990964388,
1312
+ "eval_mean_iou": 0.3718341757168124,
1313
+ "eval_overall_accuracy": 0.889278810415695,
1314
+ "eval_runtime": 10.5537,
1315
+ "eval_samples_per_second": 6.348,
1316
+ "eval_steps_per_second": 0.474,
1317
+ "step": 170
1318
+ },
1319
+ {
1320
+ "epoch": 15.55,
1321
+ "learning_rate": 1.5239616613418533e-06,
1322
+ "loss": 0.7212,
1323
+ "step": 171
1324
+ },
1325
+ {
1326
+ "epoch": 15.64,
1327
+ "learning_rate": 1.5143769968051119e-06,
1328
+ "loss": 0.7196,
1329
+ "step": 172
1330
+ },
1331
+ {
1332
+ "epoch": 15.73,
1333
+ "learning_rate": 1.5047923322683706e-06,
1334
+ "loss": 0.6797,
1335
+ "step": 173
1336
+ },
1337
+ {
1338
+ "epoch": 15.82,
1339
+ "learning_rate": 1.4952076677316294e-06,
1340
+ "loss": 0.6626,
1341
+ "step": 174
1342
+ },
1343
+ {
1344
+ "epoch": 15.91,
1345
+ "learning_rate": 1.4856230031948882e-06,
1346
+ "loss": 0.6783,
1347
+ "step": 175
1348
+ },
1349
+ {
1350
+ "epoch": 16.0,
1351
+ "learning_rate": 1.476038338658147e-06,
1352
+ "loss": 0.7436,
1353
+ "step": 176
1354
+ },
1355
+ {
1356
+ "epoch": 16.09,
1357
+ "learning_rate": 1.4664536741214058e-06,
1358
+ "loss": 0.7123,
1359
+ "step": 177
1360
+ },
1361
+ {
1362
+ "epoch": 16.18,
1363
+ "learning_rate": 1.4568690095846646e-06,
1364
+ "loss": 0.7241,
1365
+ "step": 178
1366
+ },
1367
+ {
1368
+ "epoch": 16.27,
1369
+ "learning_rate": 1.4472843450479234e-06,
1370
+ "loss": 0.6914,
1371
+ "step": 179
1372
+ },
1373
+ {
1374
+ "epoch": 16.36,
1375
+ "learning_rate": 1.4376996805111822e-06,
1376
+ "loss": 0.6991,
1377
+ "step": 180
1378
+ },
1379
+ {
1380
+ "epoch": 16.36,
1381
+ "eval_accuracy_safe": 0.6619847263503225,
1382
+ "eval_accuracy_unlabeled": NaN,
1383
+ "eval_accuracy_unsafe": 0.8964291023808605,
1384
+ "eval_iou_safe": 0.22672413565462626,
1385
+ "eval_iou_unlabeled": 0.0,
1386
+ "eval_iou_unsafe": 0.8874142561414083,
1387
+ "eval_loss": 0.6502141952514648,
1388
+ "eval_mean_accuracy": 0.7792069143655915,
1389
+ "eval_mean_iou": 0.37137946393201154,
1390
+ "eval_overall_accuracy": 0.889503991425927,
1391
+ "eval_runtime": 9.3648,
1392
+ "eval_samples_per_second": 7.154,
1393
+ "eval_steps_per_second": 0.534,
1394
+ "step": 180
1395
+ },
1396
+ {
1397
+ "epoch": 16.45,
1398
+ "learning_rate": 1.428115015974441e-06,
1399
+ "loss": 0.6552,
1400
+ "step": 181
1401
+ },
1402
+ {
1403
+ "epoch": 16.55,
1404
+ "learning_rate": 1.4185303514376998e-06,
1405
+ "loss": 0.6621,
1406
+ "step": 182
1407
+ },
1408
+ {
1409
+ "epoch": 16.64,
1410
+ "learning_rate": 1.4089456869009586e-06,
1411
+ "loss": 0.6742,
1412
+ "step": 183
1413
+ },
1414
+ {
1415
+ "epoch": 16.73,
1416
+ "learning_rate": 1.3993610223642173e-06,
1417
+ "loss": 0.6462,
1418
+ "step": 184
1419
+ },
1420
+ {
1421
+ "epoch": 16.82,
1422
+ "learning_rate": 1.3897763578274761e-06,
1423
+ "loss": 0.6759,
1424
+ "step": 185
1425
+ },
1426
+ {
1427
+ "epoch": 16.91,
1428
+ "learning_rate": 1.3801916932907347e-06,
1429
+ "loss": 0.6773,
1430
+ "step": 186
1431
+ },
1432
+ {
1433
+ "epoch": 17.0,
1434
+ "learning_rate": 1.3706070287539937e-06,
1435
+ "loss": 0.7158,
1436
+ "step": 187
1437
+ },
1438
+ {
1439
+ "epoch": 17.09,
1440
+ "learning_rate": 1.3610223642172525e-06,
1441
+ "loss": 0.6958,
1442
+ "step": 188
1443
+ },
1444
+ {
1445
+ "epoch": 17.18,
1446
+ "learning_rate": 1.3514376996805113e-06,
1447
+ "loss": 0.6747,
1448
+ "step": 189
1449
+ },
1450
+ {
1451
+ "epoch": 17.27,
1452
+ "learning_rate": 1.3418530351437699e-06,
1453
+ "loss": 0.6357,
1454
+ "step": 190
1455
+ },
1456
+ {
1457
+ "epoch": 17.27,
1458
+ "eval_accuracy_safe": 0.6611674588764114,
1459
+ "eval_accuracy_unlabeled": NaN,
1460
+ "eval_accuracy_unsafe": 0.9051011079830231,
1461
+ "eval_iou_safe": 0.24110413837507133,
1462
+ "eval_iou_unlabeled": 0.0,
1463
+ "eval_iou_unsafe": 0.895975219611748,
1464
+ "eval_loss": 0.6229549646377563,
1465
+ "eval_mean_accuracy": 0.7831342834297172,
1466
+ "eval_mean_iou": 0.3790264526622731,
1467
+ "eval_overall_accuracy": 0.8978956991167211,
1468
+ "eval_runtime": 10.2719,
1469
+ "eval_samples_per_second": 6.523,
1470
+ "eval_steps_per_second": 0.487,
1471
+ "step": 190
1472
+ },
1473
+ {
1474
+ "epoch": 17.36,
1475
+ "learning_rate": 1.3322683706070287e-06,
1476
+ "loss": 0.6769,
1477
+ "step": 191
1478
+ },
1479
+ {
1480
+ "epoch": 17.45,
1481
+ "learning_rate": 1.3226837060702877e-06,
1482
+ "loss": 0.6396,
1483
+ "step": 192
1484
+ },
1485
+ {
1486
+ "epoch": 17.55,
1487
+ "learning_rate": 1.3130990415335465e-06,
1488
+ "loss": 0.6567,
1489
+ "step": 193
1490
+ },
1491
+ {
1492
+ "epoch": 17.64,
1493
+ "learning_rate": 1.303514376996805e-06,
1494
+ "loss": 0.6538,
1495
+ "step": 194
1496
+ },
1497
+ {
1498
+ "epoch": 17.73,
1499
+ "learning_rate": 1.2939297124600638e-06,
1500
+ "loss": 0.6654,
1501
+ "step": 195
1502
+ },
1503
+ {
1504
+ "epoch": 17.82,
1505
+ "learning_rate": 1.2843450479233228e-06,
1506
+ "loss": 0.6637,
1507
+ "step": 196
1508
+ },
1509
+ {
1510
+ "epoch": 17.91,
1511
+ "learning_rate": 1.2747603833865816e-06,
1512
+ "loss": 0.6417,
1513
+ "step": 197
1514
+ },
1515
+ {
1516
+ "epoch": 18.0,
1517
+ "learning_rate": 1.2651757188498402e-06,
1518
+ "loss": 0.6707,
1519
+ "step": 198
1520
+ },
1521
+ {
1522
+ "epoch": 18.09,
1523
+ "learning_rate": 1.255591054313099e-06,
1524
+ "loss": 0.6229,
1525
+ "step": 199
1526
+ },
1527
+ {
1528
+ "epoch": 18.18,
1529
+ "learning_rate": 1.2460063897763578e-06,
1530
+ "loss": 0.6815,
1531
+ "step": 200
1532
+ },
1533
+ {
1534
+ "epoch": 18.18,
1535
+ "eval_accuracy_safe": 0.6484207848080771,
1536
+ "eval_accuracy_unlabeled": NaN,
1537
+ "eval_accuracy_unsafe": 0.9178010760554833,
1538
+ "eval_iou_safe": 0.2593923131195133,
1539
+ "eval_iou_unlabeled": 0.0,
1540
+ "eval_iou_unsafe": 0.908185465668198,
1541
+ "eval_loss": 0.5992904305458069,
1542
+ "eval_mean_accuracy": 0.7831109304317803,
1543
+ "eval_mean_iou": 0.3891925929292371,
1544
+ "eval_overall_accuracy": 0.9098440141820195,
1545
+ "eval_runtime": 9.7351,
1546
+ "eval_samples_per_second": 6.882,
1547
+ "eval_steps_per_second": 0.514,
1548
+ "step": 200
1549
+ },
1550
+ {
1551
+ "epoch": 18.27,
1552
+ "learning_rate": 1.2364217252396168e-06,
1553
+ "loss": 0.6677,
1554
+ "step": 201
1555
+ },
1556
+ {
1557
+ "epoch": 18.36,
1558
+ "learning_rate": 1.2268370607028754e-06,
1559
+ "loss": 0.6658,
1560
+ "step": 202
1561
+ },
1562
+ {
1563
+ "epoch": 18.45,
1564
+ "learning_rate": 1.2172523961661342e-06,
1565
+ "loss": 0.649,
1566
+ "step": 203
1567
+ },
1568
+ {
1569
+ "epoch": 18.55,
1570
+ "learning_rate": 1.207667731629393e-06,
1571
+ "loss": 0.6342,
1572
+ "step": 204
1573
+ },
1574
+ {
1575
+ "epoch": 18.64,
1576
+ "learning_rate": 1.198083067092652e-06,
1577
+ "loss": 0.6441,
1578
+ "step": 205
1579
+ },
1580
+ {
1581
+ "epoch": 18.73,
1582
+ "learning_rate": 1.1884984025559105e-06,
1583
+ "loss": 0.6429,
1584
+ "step": 206
1585
+ },
1586
+ {
1587
+ "epoch": 18.82,
1588
+ "learning_rate": 1.1789137380191693e-06,
1589
+ "loss": 0.6155,
1590
+ "step": 207
1591
+ },
1592
+ {
1593
+ "epoch": 18.91,
1594
+ "learning_rate": 1.1693290734824281e-06,
1595
+ "loss": 0.6347,
1596
+ "step": 208
1597
+ },
1598
+ {
1599
+ "epoch": 19.0,
1600
+ "learning_rate": 1.159744408945687e-06,
1601
+ "loss": 0.6611,
1602
+ "step": 209
1603
+ },
1604
+ {
1605
+ "epoch": 19.09,
1606
+ "learning_rate": 1.1501597444089457e-06,
1607
+ "loss": 0.6398,
1608
+ "step": 210
1609
+ },
1610
+ {
1611
+ "epoch": 19.09,
1612
+ "eval_accuracy_safe": 0.6413602877398313,
1613
+ "eval_accuracy_unlabeled": NaN,
1614
+ "eval_accuracy_unsafe": 0.9258418644556835,
1615
+ "eval_iou_safe": 0.26823363821482293,
1616
+ "eval_iou_unlabeled": 0.0,
1617
+ "eval_iou_unsafe": 0.9159351131912487,
1618
+ "eval_loss": 0.5784907341003418,
1619
+ "eval_mean_accuracy": 0.7836010760977574,
1620
+ "eval_mean_iou": 0.39472291713535723,
1621
+ "eval_overall_accuracy": 0.9174387348231985,
1622
+ "eval_runtime": 11.2723,
1623
+ "eval_samples_per_second": 5.944,
1624
+ "eval_steps_per_second": 0.444,
1625
+ "step": 210
1626
+ },
1627
+ {
1628
+ "epoch": 19.18,
1629
+ "learning_rate": 1.1405750798722045e-06,
1630
+ "loss": 0.6403,
1631
+ "step": 211
1632
+ },
1633
+ {
1634
+ "epoch": 19.27,
1635
+ "learning_rate": 1.1309904153354633e-06,
1636
+ "loss": 0.6271,
1637
+ "step": 212
1638
+ },
1639
+ {
1640
+ "epoch": 19.36,
1641
+ "learning_rate": 1.121405750798722e-06,
1642
+ "loss": 0.679,
1643
+ "step": 213
1644
+ },
1645
+ {
1646
+ "epoch": 19.45,
1647
+ "learning_rate": 1.1118210862619809e-06,
1648
+ "loss": 0.6239,
1649
+ "step": 214
1650
+ },
1651
+ {
1652
+ "epoch": 19.55,
1653
+ "learning_rate": 1.1022364217252397e-06,
1654
+ "loss": 0.6527,
1655
+ "step": 215
1656
+ },
1657
+ {
1658
+ "epoch": 19.64,
1659
+ "learning_rate": 1.0926517571884984e-06,
1660
+ "loss": 0.6228,
1661
+ "step": 216
1662
+ },
1663
+ {
1664
+ "epoch": 19.73,
1665
+ "learning_rate": 1.0830670926517572e-06,
1666
+ "loss": 0.6227,
1667
+ "step": 217
1668
+ },
1669
+ {
1670
+ "epoch": 19.82,
1671
+ "learning_rate": 1.073482428115016e-06,
1672
+ "loss": 0.6347,
1673
+ "step": 218
1674
+ },
1675
+ {
1676
+ "epoch": 19.91,
1677
+ "learning_rate": 1.0638977635782748e-06,
1678
+ "loss": 0.6374,
1679
+ "step": 219
1680
+ },
1681
+ {
1682
+ "epoch": 20.0,
1683
+ "learning_rate": 1.0543130990415336e-06,
1684
+ "loss": 0.5845,
1685
+ "step": 220
1686
+ },
1687
+ {
1688
+ "epoch": 20.0,
1689
+ "eval_accuracy_safe": 0.6426151017151052,
1690
+ "eval_accuracy_unlabeled": NaN,
1691
+ "eval_accuracy_unsafe": 0.9286315640516787,
1692
+ "eval_iou_safe": 0.26982054857603477,
1693
+ "eval_iou_unlabeled": 0.0,
1694
+ "eval_iou_unsafe": 0.9187221572756564,
1695
+ "eval_loss": 0.5641139149665833,
1696
+ "eval_mean_accuracy": 0.7856233328833919,
1697
+ "eval_mean_iou": 0.39618090195056377,
1698
+ "eval_overall_accuracy": 0.9201830963590252,
1699
+ "eval_runtime": 9.4874,
1700
+ "eval_samples_per_second": 7.062,
1701
+ "eval_steps_per_second": 0.527,
1702
+ "step": 220
1703
+ },
1704
+ {
1705
+ "epoch": 20.09,
1706
+ "learning_rate": 1.0447284345047924e-06,
1707
+ "loss": 0.606,
1708
+ "step": 221
1709
+ },
1710
+ {
1711
+ "epoch": 20.18,
1712
+ "learning_rate": 1.0351437699680512e-06,
1713
+ "loss": 0.6491,
1714
+ "step": 222
1715
+ },
1716
+ {
1717
+ "epoch": 20.27,
1718
+ "learning_rate": 1.02555910543131e-06,
1719
+ "loss": 0.6396,
1720
+ "step": 223
1721
+ },
1722
+ {
1723
+ "epoch": 20.36,
1724
+ "learning_rate": 1.0159744408945688e-06,
1725
+ "loss": 0.617,
1726
+ "step": 224
1727
+ },
1728
+ {
1729
+ "epoch": 20.45,
1730
+ "learning_rate": 1.0063897763578276e-06,
1731
+ "loss": 0.614,
1732
+ "step": 225
1733
+ },
1734
+ {
1735
+ "epoch": 20.55,
1736
+ "learning_rate": 9.968051118210861e-07,
1737
+ "loss": 0.6281,
1738
+ "step": 226
1739
+ },
1740
+ {
1741
+ "epoch": 20.64,
1742
+ "learning_rate": 9.872204472843452e-07,
1743
+ "loss": 0.6374,
1744
+ "step": 227
1745
+ },
1746
+ {
1747
+ "epoch": 20.73,
1748
+ "learning_rate": 9.77635782747604e-07,
1749
+ "loss": 0.6394,
1750
+ "step": 228
1751
+ },
1752
+ {
1753
+ "epoch": 20.82,
1754
+ "learning_rate": 9.680511182108625e-07,
1755
+ "loss": 0.6351,
1756
+ "step": 229
1757
+ },
1758
+ {
1759
+ "epoch": 20.91,
1760
+ "learning_rate": 9.584664536741213e-07,
1761
+ "loss": 0.6062,
1762
+ "step": 230
1763
+ },
1764
+ {
1765
+ "epoch": 20.91,
1766
+ "eval_accuracy_safe": 0.6519963300064379,
1767
+ "eval_accuracy_unlabeled": NaN,
1768
+ "eval_accuracy_unsafe": 0.9252195649054266,
1769
+ "eval_iou_safe": 0.2640576051310034,
1770
+ "eval_iou_unlabeled": 0.0,
1771
+ "eval_iou_unsafe": 0.9156001170929594,
1772
+ "eval_loss": 0.5693235397338867,
1773
+ "eval_mean_accuracy": 0.7886079474559322,
1774
+ "eval_mean_iou": 0.3932192407413209,
1775
+ "eval_overall_accuracy": 0.9171489886383513,
1776
+ "eval_runtime": 11.0762,
1777
+ "eval_samples_per_second": 6.049,
1778
+ "eval_steps_per_second": 0.451,
1779
+ "step": 230
1780
+ },
1781
+ {
1782
+ "epoch": 21.0,
1783
+ "learning_rate": 9.488817891373802e-07,
1784
+ "loss": 0.6456,
1785
+ "step": 231
1786
+ },
1787
+ {
1788
+ "epoch": 21.09,
1789
+ "learning_rate": 9.39297124600639e-07,
1790
+ "loss": 0.6055,
1791
+ "step": 232
1792
+ },
1793
+ {
1794
+ "epoch": 21.18,
1795
+ "learning_rate": 9.297124600638977e-07,
1796
+ "loss": 0.6134,
1797
+ "step": 233
1798
+ },
1799
+ {
1800
+ "epoch": 21.27,
1801
+ "learning_rate": 9.201277955271566e-07,
1802
+ "loss": 0.5718,
1803
+ "step": 234
1804
+ },
1805
+ {
1806
+ "epoch": 21.36,
1807
+ "learning_rate": 9.105431309904154e-07,
1808
+ "loss": 0.5939,
1809
+ "step": 235
1810
+ },
1811
+ {
1812
+ "epoch": 21.45,
1813
+ "learning_rate": 9.009584664536742e-07,
1814
+ "loss": 0.5917,
1815
+ "step": 236
1816
+ },
1817
+ {
1818
+ "epoch": 21.55,
1819
+ "learning_rate": 8.913738019169329e-07,
1820
+ "loss": 0.599,
1821
+ "step": 237
1822
+ },
1823
+ {
1824
+ "epoch": 21.64,
1825
+ "learning_rate": 8.817891373801916e-07,
1826
+ "loss": 0.6239,
1827
+ "step": 238
1828
+ },
1829
+ {
1830
+ "epoch": 21.73,
1831
+ "learning_rate": 8.722044728434505e-07,
1832
+ "loss": 0.5946,
1833
+ "step": 239
1834
+ },
1835
+ {
1836
+ "epoch": 21.82,
1837
+ "learning_rate": 8.626198083067093e-07,
1838
+ "loss": 0.6071,
1839
+ "step": 240
1840
+ },
1841
+ {
1842
+ "epoch": 21.82,
1843
+ "eval_accuracy_safe": 0.6591840432380754,
1844
+ "eval_accuracy_unlabeled": NaN,
1845
+ "eval_accuracy_unsafe": 0.9282916959179331,
1846
+ "eval_iou_safe": 0.267531459702011,
1847
+ "eval_iou_unlabeled": 0.0,
1848
+ "eval_iou_unsafe": 0.9188227497665283,
1849
+ "eval_loss": 0.5627052187919617,
1850
+ "eval_mean_accuracy": 0.7937378695780043,
1851
+ "eval_mean_iou": 0.39545140315617977,
1852
+ "eval_overall_accuracy": 0.9203426873506005,
1853
+ "eval_runtime": 9.7383,
1854
+ "eval_samples_per_second": 6.88,
1855
+ "eval_steps_per_second": 0.513,
1856
+ "step": 240
1857
+ },
1858
+ {
1859
+ "epoch": 21.91,
1860
+ "learning_rate": 8.53035143769968e-07,
1861
+ "loss": 0.5784,
1862
+ "step": 241
1863
+ },
1864
+ {
1865
+ "epoch": 22.0,
1866
+ "learning_rate": 8.434504792332268e-07,
1867
+ "loss": 0.6049,
1868
+ "step": 242
1869
+ },
1870
+ {
1871
+ "epoch": 22.09,
1872
+ "learning_rate": 8.338658146964857e-07,
1873
+ "loss": 0.5871,
1874
+ "step": 243
1875
+ },
1876
+ {
1877
+ "epoch": 22.18,
1878
+ "learning_rate": 8.242811501597445e-07,
1879
+ "loss": 0.5894,
1880
+ "step": 244
1881
+ },
1882
+ {
1883
+ "epoch": 22.27,
1884
+ "learning_rate": 8.146964856230032e-07,
1885
+ "loss": 0.5801,
1886
+ "step": 245
1887
+ },
1888
+ {
1889
+ "epoch": 22.36,
1890
+ "learning_rate": 8.05111821086262e-07,
1891
+ "loss": 0.5719,
1892
+ "step": 246
1893
+ },
1894
+ {
1895
+ "epoch": 22.45,
1896
+ "learning_rate": 7.955271565495208e-07,
1897
+ "loss": 0.5979,
1898
+ "step": 247
1899
+ },
1900
+ {
1901
+ "epoch": 22.55,
1902
+ "learning_rate": 7.859424920127797e-07,
1903
+ "loss": 0.5855,
1904
+ "step": 248
1905
+ },
1906
+ {
1907
+ "epoch": 22.64,
1908
+ "learning_rate": 7.763578274760382e-07,
1909
+ "loss": 0.5975,
1910
+ "step": 249
1911
+ },
1912
+ {
1913
+ "epoch": 22.73,
1914
+ "learning_rate": 7.667731629392971e-07,
1915
+ "loss": 0.6209,
1916
+ "step": 250
1917
+ },
1918
+ {
1919
+ "epoch": 22.73,
1920
+ "eval_accuracy_safe": 0.6618690752926936,
1921
+ "eval_accuracy_unlabeled": NaN,
1922
+ "eval_accuracy_unsafe": 0.9299528432231069,
1923
+ "eval_iou_safe": 0.2724302598559697,
1924
+ "eval_iou_unlabeled": 0.0,
1925
+ "eval_iou_unsafe": 0.9205411497943506,
1926
+ "eval_loss": 0.5631816983222961,
1927
+ "eval_mean_accuracy": 0.7959109592579002,
1928
+ "eval_mean_iou": 0.39765713655010676,
1929
+ "eval_overall_accuracy": 0.9220340785695545,
1930
+ "eval_runtime": 10.1606,
1931
+ "eval_samples_per_second": 6.594,
1932
+ "eval_steps_per_second": 0.492,
1933
+ "step": 250
1934
+ },
1935
+ {
1936
+ "epoch": 22.82,
1937
+ "learning_rate": 7.571884984025559e-07,
1938
+ "loss": 0.5852,
1939
+ "step": 251
1940
+ },
1941
+ {
1942
+ "epoch": 22.91,
1943
+ "learning_rate": 7.476038338658147e-07,
1944
+ "loss": 0.5775,
1945
+ "step": 252
1946
+ },
1947
+ {
1948
+ "epoch": 23.0,
1949
+ "learning_rate": 7.380191693290735e-07,
1950
+ "loss": 0.6365,
1951
+ "step": 253
1952
+ },
1953
+ {
1954
+ "epoch": 23.09,
1955
+ "learning_rate": 7.284345047923323e-07,
1956
+ "loss": 0.6243,
1957
+ "step": 254
1958
+ },
1959
+ {
1960
+ "epoch": 23.18,
1961
+ "learning_rate": 7.188498402555911e-07,
1962
+ "loss": 0.5995,
1963
+ "step": 255
1964
+ },
1965
+ {
1966
+ "epoch": 23.27,
1967
+ "learning_rate": 7.092651757188499e-07,
1968
+ "loss": 0.6019,
1969
+ "step": 256
1970
+ },
1971
+ {
1972
+ "epoch": 23.36,
1973
+ "learning_rate": 6.996805111821087e-07,
1974
+ "loss": 0.5883,
1975
+ "step": 257
1976
+ },
1977
+ {
1978
+ "epoch": 23.45,
1979
+ "learning_rate": 6.900958466453674e-07,
1980
+ "loss": 0.589,
1981
+ "step": 258
1982
+ },
1983
+ {
1984
+ "epoch": 23.55,
1985
+ "learning_rate": 6.805111821086263e-07,
1986
+ "loss": 0.5717,
1987
+ "step": 259
1988
+ },
1989
+ {
1990
+ "epoch": 23.64,
1991
+ "learning_rate": 6.709265175718849e-07,
1992
+ "loss": 0.5609,
1993
+ "step": 260
1994
+ },
1995
+ {
1996
+ "epoch": 23.64,
1997
+ "eval_accuracy_safe": 0.6504639534928547,
1998
+ "eval_accuracy_unlabeled": NaN,
1999
+ "eval_accuracy_unsafe": 0.9378781128324656,
2000
+ "eval_iou_safe": 0.2868443063281154,
2001
+ "eval_iou_unlabeled": 0.0,
2002
+ "eval_iou_unsafe": 0.9280609954701114,
2003
+ "eval_loss": 0.5416346192359924,
2004
+ "eval_mean_accuracy": 0.7941710331626601,
2005
+ "eval_mean_iou": 0.40496843393274223,
2006
+ "eval_overall_accuracy": 0.9293883594114389,
2007
+ "eval_runtime": 9.5225,
2008
+ "eval_samples_per_second": 7.036,
2009
+ "eval_steps_per_second": 0.525,
2010
+ "step": 260
2011
+ },
2012
+ {
2013
+ "epoch": 23.73,
2014
+ "learning_rate": 6.613418530351438e-07,
2015
+ "loss": 0.5557,
2016
+ "step": 261
2017
+ },
2018
+ {
2019
+ "epoch": 23.82,
2020
+ "learning_rate": 6.517571884984025e-07,
2021
+ "loss": 0.5968,
2022
+ "step": 262
2023
+ },
2024
+ {
2025
+ "epoch": 23.91,
2026
+ "learning_rate": 6.421725239616614e-07,
2027
+ "loss": 0.5673,
2028
+ "step": 263
2029
+ },
2030
+ {
2031
+ "epoch": 24.0,
2032
+ "learning_rate": 6.325878594249201e-07,
2033
+ "loss": 0.6091,
2034
+ "step": 264
2035
+ },
2036
+ {
2037
+ "epoch": 24.09,
2038
+ "learning_rate": 6.230031948881789e-07,
2039
+ "loss": 0.5776,
2040
+ "step": 265
2041
+ },
2042
+ {
2043
+ "epoch": 24.18,
2044
+ "learning_rate": 6.134185303514377e-07,
2045
+ "loss": 0.5562,
2046
+ "step": 266
2047
+ },
2048
+ {
2049
+ "epoch": 24.27,
2050
+ "learning_rate": 6.038338658146965e-07,
2051
+ "loss": 0.5863,
2052
+ "step": 267
2053
+ },
2054
+ {
2055
+ "epoch": 24.36,
2056
+ "learning_rate": 5.942492012779553e-07,
2057
+ "loss": 0.5565,
2058
+ "step": 268
2059
+ },
2060
+ {
2061
+ "epoch": 24.45,
2062
+ "learning_rate": 5.846645367412141e-07,
2063
+ "loss": 0.5858,
2064
+ "step": 269
2065
+ },
2066
+ {
2067
+ "epoch": 24.55,
2068
+ "learning_rate": 5.750798722044729e-07,
2069
+ "loss": 0.5752,
2070
+ "step": 270
2071
+ },
2072
+ {
2073
+ "epoch": 24.55,
2074
+ "eval_accuracy_safe": 0.6412195789530495,
2075
+ "eval_accuracy_unlabeled": NaN,
2076
+ "eval_accuracy_unsafe": 0.945148932410419,
2077
+ "eval_iou_safe": 0.2982960328042603,
2078
+ "eval_iou_unlabeled": 0.0,
2079
+ "eval_iou_unsafe": 0.9349957034087992,
2080
+ "eval_loss": 0.5140887498855591,
2081
+ "eval_mean_accuracy": 0.7931842556817342,
2082
+ "eval_mean_iou": 0.41109724540435316,
2083
+ "eval_overall_accuracy": 0.9361713466359608,
2084
+ "eval_runtime": 10.0336,
2085
+ "eval_samples_per_second": 6.678,
2086
+ "eval_steps_per_second": 0.498,
2087
+ "step": 270
2088
+ },
2089
+ {
2090
+ "epoch": 24.64,
2091
+ "learning_rate": 5.654952076677316e-07,
2092
+ "loss": 0.5881,
2093
+ "step": 271
2094
+ },
2095
+ {
2096
+ "epoch": 24.73,
2097
+ "learning_rate": 5.559105431309904e-07,
2098
+ "loss": 0.6124,
2099
+ "step": 272
2100
+ },
2101
+ {
2102
+ "epoch": 24.82,
2103
+ "learning_rate": 5.463258785942492e-07,
2104
+ "loss": 0.5648,
2105
+ "step": 273
2106
+ },
2107
+ {
2108
+ "epoch": 24.91,
2109
+ "learning_rate": 5.36741214057508e-07,
2110
+ "loss": 0.578,
2111
+ "step": 274
2112
+ },
2113
+ {
2114
+ "epoch": 25.0,
2115
+ "learning_rate": 5.271565495207668e-07,
2116
+ "loss": 0.5605,
2117
+ "step": 275
2118
+ },
2119
+ {
2120
+ "epoch": 25.09,
2121
+ "learning_rate": 5.175718849840256e-07,
2122
+ "loss": 0.588,
2123
+ "step": 276
2124
+ },
2125
+ {
2126
+ "epoch": 25.18,
2127
+ "learning_rate": 5.079872204472844e-07,
2128
+ "loss": 0.5814,
2129
+ "step": 277
2130
+ },
2131
+ {
2132
+ "epoch": 25.27,
2133
+ "learning_rate": 4.984025559105431e-07,
2134
+ "loss": 0.5671,
2135
+ "step": 278
2136
+ },
2137
+ {
2138
+ "epoch": 25.36,
2139
+ "learning_rate": 4.88817891373802e-07,
2140
+ "loss": 0.5237,
2141
+ "step": 279
2142
+ },
2143
+ {
2144
+ "epoch": 25.45,
2145
+ "learning_rate": 4.792332268370607e-07,
2146
+ "loss": 0.6004,
2147
+ "step": 280
2148
+ },
2149
+ {
2150
+ "epoch": 25.45,
2151
+ "eval_accuracy_safe": 0.6491917918589365,
2152
+ "eval_accuracy_unlabeled": NaN,
2153
+ "eval_accuracy_unsafe": 0.9412261630289883,
2154
+ "eval_iou_safe": 0.2907094372975922,
2155
+ "eval_iou_unlabeled": 0.0,
2156
+ "eval_iou_unsafe": 0.9313366391036164,
2157
+ "eval_loss": 0.5255351662635803,
2158
+ "eval_mean_accuracy": 0.7952089774439624,
2159
+ "eval_mean_iou": 0.4073486921337362,
2160
+ "eval_overall_accuracy": 0.9325999359586346,
2161
+ "eval_runtime": 9.8685,
2162
+ "eval_samples_per_second": 6.789,
2163
+ "eval_steps_per_second": 0.507,
2164
+ "step": 280
2165
+ },
2166
+ {
2167
+ "epoch": 25.55,
2168
+ "learning_rate": 4.696485623003195e-07,
2169
+ "loss": 0.5482,
2170
+ "step": 281
2171
+ },
2172
+ {
2173
+ "epoch": 25.64,
2174
+ "learning_rate": 4.600638977635783e-07,
2175
+ "loss": 0.5764,
2176
+ "step": 282
2177
+ },
2178
+ {
2179
+ "epoch": 25.73,
2180
+ "learning_rate": 4.504792332268371e-07,
2181
+ "loss": 0.5608,
2182
+ "step": 283
2183
+ },
2184
+ {
2185
+ "epoch": 25.82,
2186
+ "learning_rate": 4.408945686900958e-07,
2187
+ "loss": 0.5698,
2188
+ "step": 284
2189
+ },
2190
+ {
2191
+ "epoch": 25.91,
2192
+ "learning_rate": 4.3130990415335466e-07,
2193
+ "loss": 0.5502,
2194
+ "step": 285
2195
+ },
2196
+ {
2197
+ "epoch": 26.0,
2198
+ "learning_rate": 4.217252396166134e-07,
2199
+ "loss": 0.5975,
2200
+ "step": 286
2201
+ },
2202
+ {
2203
+ "epoch": 26.09,
2204
+ "learning_rate": 4.1214057507987225e-07,
2205
+ "loss": 0.5736,
2206
+ "step": 287
2207
+ },
2208
+ {
2209
+ "epoch": 26.18,
2210
+ "learning_rate": 4.02555910543131e-07,
2211
+ "loss": 0.5498,
2212
+ "step": 288
2213
+ },
2214
+ {
2215
+ "epoch": 26.27,
2216
+ "learning_rate": 3.9297124600638983e-07,
2217
+ "loss": 0.5682,
2218
+ "step": 289
2219
+ },
2220
+ {
2221
+ "epoch": 26.36,
2222
+ "learning_rate": 3.8338658146964857e-07,
2223
+ "loss": 0.5524,
2224
+ "step": 290
2225
+ },
2226
+ {
2227
+ "epoch": 26.36,
2228
+ "eval_accuracy_safe": 0.6587715544658655,
2229
+ "eval_accuracy_unlabeled": NaN,
2230
+ "eval_accuracy_unsafe": 0.9386905578378355,
2231
+ "eval_iou_safe": 0.28676309565062713,
2232
+ "eval_iou_unlabeled": 0.0,
2233
+ "eval_iou_unsafe": 0.9290998927343179,
2234
+ "eval_loss": 0.5313962697982788,
2235
+ "eval_mean_accuracy": 0.7987310561518506,
2236
+ "eval_mean_iou": 0.4052876627949817,
2237
+ "eval_overall_accuracy": 0.9304221993062034,
2238
+ "eval_runtime": 9.5415,
2239
+ "eval_samples_per_second": 7.022,
2240
+ "eval_steps_per_second": 0.524,
2241
+ "step": 290
2242
+ },
2243
+ {
2244
+ "epoch": 26.45,
2245
+ "learning_rate": 3.7380191693290736e-07,
2246
+ "loss": 0.5519,
2247
+ "step": 291
2248
+ },
2249
+ {
2250
+ "epoch": 26.55,
2251
+ "learning_rate": 3.6421725239616615e-07,
2252
+ "loss": 0.5424,
2253
+ "step": 292
2254
+ },
2255
+ {
2256
+ "epoch": 26.64,
2257
+ "learning_rate": 3.5463258785942494e-07,
2258
+ "loss": 0.583,
2259
+ "step": 293
2260
+ },
2261
+ {
2262
+ "epoch": 26.73,
2263
+ "learning_rate": 3.450479233226837e-07,
2264
+ "loss": 0.5798,
2265
+ "step": 294
2266
+ },
2267
+ {
2268
+ "epoch": 26.82,
2269
+ "learning_rate": 3.3546325878594247e-07,
2270
+ "loss": 0.5284,
2271
+ "step": 295
2272
+ },
2273
+ {
2274
+ "epoch": 26.91,
2275
+ "learning_rate": 3.2587859424920126e-07,
2276
+ "loss": 0.5681,
2277
+ "step": 296
2278
+ },
2279
+ {
2280
+ "epoch": 27.0,
2281
+ "learning_rate": 3.1629392971246005e-07,
2282
+ "loss": 0.6352,
2283
+ "step": 297
2284
+ },
2285
+ {
2286
+ "epoch": 27.09,
2287
+ "learning_rate": 3.0670926517571884e-07,
2288
+ "loss": 0.5651,
2289
+ "step": 298
2290
+ },
2291
+ {
2292
+ "epoch": 27.18,
2293
+ "learning_rate": 2.9712460063897763e-07,
2294
+ "loss": 0.5707,
2295
+ "step": 299
2296
+ },
2297
+ {
2298
+ "epoch": 27.27,
2299
+ "learning_rate": 2.875399361022364e-07,
2300
+ "loss": 0.5758,
2301
+ "step": 300
2302
+ },
2303
+ {
2304
+ "epoch": 27.27,
2305
+ "eval_accuracy_safe": 0.6544115095932552,
2306
+ "eval_accuracy_unlabeled": NaN,
2307
+ "eval_accuracy_unsafe": 0.9423355893036522,
2308
+ "eval_iou_safe": 0.291325116977104,
2309
+ "eval_iou_unlabeled": 0.0,
2310
+ "eval_iou_unsafe": 0.9325746804551616,
2311
+ "eval_loss": 0.526845395565033,
2312
+ "eval_mean_accuracy": 0.7983735494484537,
2313
+ "eval_mean_iou": 0.40796659914408856,
2314
+ "eval_overall_accuracy": 0.9338307736524895,
2315
+ "eval_runtime": 10.1793,
2316
+ "eval_samples_per_second": 6.582,
2317
+ "eval_steps_per_second": 0.491,
2318
+ "step": 300
2319
+ },
2320
+ {
2321
+ "epoch": 27.36,
2322
+ "learning_rate": 2.779552715654952e-07,
2323
+ "loss": 0.5541,
2324
+ "step": 301
2325
+ },
2326
+ {
2327
+ "epoch": 27.45,
2328
+ "learning_rate": 2.68370607028754e-07,
2329
+ "loss": 0.5143,
2330
+ "step": 302
2331
+ },
2332
+ {
2333
+ "epoch": 27.55,
2334
+ "learning_rate": 2.587859424920128e-07,
2335
+ "loss": 0.5392,
2336
+ "step": 303
2337
+ },
2338
+ {
2339
+ "epoch": 27.64,
2340
+ "learning_rate": 2.4920127795527154e-07,
2341
+ "loss": 0.5803,
2342
+ "step": 304
2343
+ },
2344
+ {
2345
+ "epoch": 27.73,
2346
+ "learning_rate": 2.3961661341853033e-07,
2347
+ "loss": 0.5733,
2348
+ "step": 305
2349
+ },
2350
+ {
2351
+ "epoch": 27.82,
2352
+ "learning_rate": 2.3003194888178915e-07,
2353
+ "loss": 0.5799,
2354
+ "step": 306
2355
+ },
2356
+ {
2357
+ "epoch": 27.91,
2358
+ "learning_rate": 2.204472843450479e-07,
2359
+ "loss": 0.5737,
2360
+ "step": 307
2361
+ },
2362
+ {
2363
+ "epoch": 28.0,
2364
+ "learning_rate": 2.108626198083067e-07,
2365
+ "loss": 0.507,
2366
+ "step": 308
2367
+ },
2368
+ {
2369
+ "epoch": 28.09,
2370
+ "learning_rate": 2.012779552715655e-07,
2371
+ "loss": 0.5913,
2372
+ "step": 309
2373
+ },
2374
+ {
2375
+ "epoch": 28.18,
2376
+ "learning_rate": 1.9169329073482428e-07,
2377
+ "loss": 0.5598,
2378
+ "step": 310
2379
+ },
2380
+ {
2381
+ "epoch": 28.18,
2382
+ "eval_accuracy_safe": 0.6604831901187737,
2383
+ "eval_accuracy_unlabeled": NaN,
2384
+ "eval_accuracy_unsafe": 0.9407892567641855,
2385
+ "eval_iou_safe": 0.2896690945241332,
2386
+ "eval_iou_unlabeled": 0.0,
2387
+ "eval_iou_unsafe": 0.9312167321135931,
2388
+ "eval_loss": 0.5239936709403992,
2389
+ "eval_mean_accuracy": 0.8006362234414796,
2390
+ "eval_mean_iou": 0.4069619422125754,
2391
+ "eval_overall_accuracy": 0.9325094650040812,
2392
+ "eval_runtime": 9.6243,
2393
+ "eval_samples_per_second": 6.962,
2394
+ "eval_steps_per_second": 0.52,
2395
+ "step": 310
2396
+ },
2397
+ {
2398
+ "epoch": 28.27,
2399
+ "learning_rate": 1.8210862619808307e-07,
2400
+ "loss": 0.5394,
2401
+ "step": 311
2402
+ },
2403
+ {
2404
+ "epoch": 28.36,
2405
+ "learning_rate": 1.7252396166134184e-07,
2406
+ "loss": 0.5312,
2407
+ "step": 312
2408
+ },
2409
+ {
2410
+ "epoch": 28.45,
2411
+ "learning_rate": 1.6293929712460063e-07,
2412
+ "loss": 0.5313,
2413
+ "step": 313
2414
+ },
2415
+ {
2416
+ "epoch": 28.55,
2417
+ "learning_rate": 1.5335463258785942e-07,
2418
+ "loss": 0.5188,
2419
+ "step": 314
2420
+ },
2421
+ {
2422
+ "epoch": 28.64,
2423
+ "learning_rate": 1.437699680511182e-07,
2424
+ "loss": 0.5497,
2425
+ "step": 315
2426
+ },
2427
+ {
2428
+ "epoch": 28.73,
2429
+ "learning_rate": 1.34185303514377e-07,
2430
+ "loss": 0.5908,
2431
+ "step": 316
2432
+ },
2433
+ {
2434
+ "epoch": 28.82,
2435
+ "learning_rate": 1.2460063897763577e-07,
2436
+ "loss": 0.56,
2437
+ "step": 317
2438
+ },
2439
+ {
2440
+ "epoch": 28.91,
2441
+ "learning_rate": 1.1501597444089457e-07,
2442
+ "loss": 0.5792,
2443
+ "step": 318
2444
+ },
2445
+ {
2446
+ "epoch": 29.0,
2447
+ "learning_rate": 1.0543130990415335e-07,
2448
+ "loss": 0.6318,
2449
+ "step": 319
2450
+ },
2451
+ {
2452
+ "epoch": 29.09,
2453
+ "learning_rate": 9.584664536741214e-08,
2454
+ "loss": 0.5505,
2455
+ "step": 320
2456
+ },
2457
+ {
2458
+ "epoch": 29.09,
2459
+ "eval_accuracy_safe": 0.6582414871183997,
2460
+ "eval_accuracy_unlabeled": NaN,
2461
+ "eval_accuracy_unsafe": 0.9420817295738547,
2462
+ "eval_iou_safe": 0.29588640634788055,
2463
+ "eval_iou_unlabeled": 0.0,
2464
+ "eval_iou_unsafe": 0.9324414181256692,
2465
+ "eval_loss": 0.5165032744407654,
2466
+ "eval_mean_accuracy": 0.8001616083461272,
2467
+ "eval_mean_iou": 0.4094426081578499,
2468
+ "eval_overall_accuracy": 0.933697543927093,
2469
+ "eval_runtime": 11.4418,
2470
+ "eval_samples_per_second": 5.856,
2471
+ "eval_steps_per_second": 0.437,
2472
+ "step": 320
2473
  }
2474
  ],
2475
  "max_steps": 330,
2476
  "num_train_epochs": 30,
2477
+ "total_flos": 1.7886913543164396e+18,
2478
  "trial_name": null,
2479
  "trial_params": null
2480
  }
{checkpoint-120 β†’ checkpoint-320}/training_args.bin RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77f03bab7ef5a9db57b2529dde5273404861bcaa585ecaa39364ff26b054db34
3
  size 338796489
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8f1820205b4b98713df2a49ff37a9a65771547246a6b06bb8594ee68aa08012
3
  size 338796489
runs/Feb07_22-15-06_robovision.csres.utexas.edu/events.out.tfevents.1707365713.robovision.csres.utexas.edu.742362.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54dbe9f470077caea550152fabd91fe321d013bf31799bcd93a3c229d0e10a36
3
- size 70030
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b353ecb08ab497af3d7949b83ce4cc388c189b4180d30d01d6d55877b293d3cf
3
+ size 79434