nielsr HF staff commited on
Commit
8937053
1 Parent(s): 398eb8d

End of training

Browse files
all_results.json CHANGED
@@ -1,84 +1,84 @@
1
  {
2
- "epoch": 50.0,
3
  "eval_accuracy_construction-bridge": 0.0,
4
- "eval_accuracy_construction-building": 0.923248608581478,
5
  "eval_accuracy_construction-door": 0.0,
6
- "eval_accuracy_construction-fenceguardrail": 0.09433107330840278,
7
  "eval_accuracy_construction-stairs": 0.0,
8
  "eval_accuracy_construction-tunnel": NaN,
9
- "eval_accuracy_construction-wall": 0.21464674476906634,
10
- "eval_accuracy_flat-crosswalk": 0.3228431325584535,
11
- "eval_accuracy_flat-curb": 0.3171838475268673,
12
- "eval_accuracy_flat-cyclinglane": 0.7303143809670815,
13
- "eval_accuracy_flat-parkingdriveway": 0.27434110103060105,
14
  "eval_accuracy_flat-railtrack": NaN,
15
- "eval_accuracy_flat-road": 0.6562864431018484,
16
- "eval_accuracy_flat-sidewalk": 0.9295361346748208,
17
- "eval_accuracy_human-person": 0.010889394661161983,
18
  "eval_accuracy_human-rider": 0.0,
19
- "eval_accuracy_nature-terrain": 0.7748158286891488,
20
- "eval_accuracy_nature-vegetation": 0.9083438657394087,
21
- "eval_accuracy_object-pole": 0.2119288699124848,
22
  "eval_accuracy_object-trafficlight": 0.0,
23
  "eval_accuracy_object-trafficsign": 0.0,
24
- "eval_accuracy_sky": 0.8846353126324072,
25
  "eval_accuracy_unlabeled": NaN,
26
  "eval_accuracy_vehicle-bicycle": 0.0,
27
  "eval_accuracy_vehicle-bus": 0.0,
28
- "eval_accuracy_vehicle-car": 0.9388154884849852,
29
  "eval_accuracy_vehicle-caravan": 0.0,
30
  "eval_accuracy_vehicle-cartrailer": 0.0,
31
  "eval_accuracy_vehicle-motorcycle": 0.0,
32
- "eval_accuracy_vehicle-tramtrain": 0.0,
33
  "eval_accuracy_vehicle-truck": 0.0,
34
  "eval_accuracy_void-dynamic": 0.0,
35
  "eval_accuracy_void-ground": 0.0,
36
- "eval_accuracy_void-static": 0.17566618866656386,
37
  "eval_accuracy_void-unclear": 0.0,
38
  "eval_iou_construction-bridge": 0.0,
39
- "eval_iou_construction-building": 0.6151782821349004,
40
  "eval_iou_construction-door": 0.0,
41
- "eval_iou_construction-fenceguardrail": 0.09239785150765831,
42
  "eval_iou_construction-stairs": 0.0,
43
  "eval_iou_construction-tunnel": NaN,
44
- "eval_iou_construction-wall": 0.1796009958723711,
45
- "eval_iou_flat-crosswalk": 0.26608723430220454,
46
- "eval_iou_flat-curb": 0.19206793691107385,
47
- "eval_iou_flat-cyclinglane": 0.6165186094558613,
48
- "eval_iou_flat-parkingdriveway": 0.22540000014154912,
49
  "eval_iou_flat-railtrack": NaN,
50
- "eval_iou_flat-road": 0.5341623036040656,
51
- "eval_iou_flat-sidewalk": 0.8035619780040725,
52
- "eval_iou_human-person": 0.010872092613600332,
53
  "eval_iou_human-rider": 0.0,
54
- "eval_iou_nature-terrain": 0.646685749747382,
55
- "eval_iou_nature-vegetation": 0.7900638904880851,
56
- "eval_iou_object-pole": 0.14375182721824295,
57
  "eval_iou_object-trafficlight": 0.0,
58
  "eval_iou_object-trafficsign": 0.0,
59
- "eval_iou_sky": 0.8389204690587999,
60
  "eval_iou_unlabeled": NaN,
61
  "eval_iou_vehicle-bicycle": 0.0,
62
  "eval_iou_vehicle-bus": 0.0,
63
- "eval_iou_vehicle-car": 0.7190160819570569,
64
  "eval_iou_vehicle-caravan": 0.0,
65
  "eval_iou_vehicle-cartrailer": 0.0,
66
  "eval_iou_vehicle-motorcycle": 0.0,
67
- "eval_iou_vehicle-tramtrain": 0.0,
68
  "eval_iou_vehicle-truck": 0.0,
69
  "eval_iou_void-dynamic": 0.0,
70
  "eval_iou_void-ground": 0.0,
71
- "eval_iou_void-static": 0.09915330318294081,
72
  "eval_iou_void-unclear": 0.0,
73
- "eval_loss": 0.7689843773841858,
74
- "eval_mean_accuracy": 0.26149457547827437,
75
- "eval_mean_iou": 0.21166995644374575,
76
- "eval_overall_accuracy": 0.7839745993658742,
77
- "eval_runtime": 140.2555,
78
- "eval_samples_per_second": 1.069,
79
- "eval_steps_per_second": 0.071,
80
- "train_loss": 0.9338362375895183,
81
- "train_runtime": 1300.5624,
82
- "train_samples_per_second": 32.678,
83
- "train_steps_per_second": 2.076
84
  }
 
1
  {
2
+ "epoch": 18.52,
3
  "eval_accuracy_construction-bridge": 0.0,
4
+ "eval_accuracy_construction-building": 0.8696130299150018,
5
  "eval_accuracy_construction-door": 0.0,
6
+ "eval_accuracy_construction-fenceguardrail": 0.0,
7
  "eval_accuracy_construction-stairs": 0.0,
8
  "eval_accuracy_construction-tunnel": NaN,
9
+ "eval_accuracy_construction-wall": 0.003668217029526036,
10
+ "eval_accuracy_flat-crosswalk": 0.0018557628622486598,
11
+ "eval_accuracy_flat-curb": 0.12767179695127617,
12
+ "eval_accuracy_flat-cyclinglane": 0.790813348290863,
13
+ "eval_accuracy_flat-parkingdriveway": 0.1034764257101185,
14
  "eval_accuracy_flat-railtrack": NaN,
15
+ "eval_accuracy_flat-road": 0.6270179782365589,
16
+ "eval_accuracy_flat-sidewalk": 0.9313179571967581,
17
+ "eval_accuracy_human-person": 0.0,
18
  "eval_accuracy_human-rider": 0.0,
19
+ "eval_accuracy_nature-terrain": 0.7721406421014229,
20
+ "eval_accuracy_nature-vegetation": 0.9034924242863521,
21
+ "eval_accuracy_object-pole": 0.0048094393262509885,
22
  "eval_accuracy_object-trafficlight": 0.0,
23
  "eval_accuracy_object-trafficsign": 0.0,
24
+ "eval_accuracy_sky": 0.8740045100333971,
25
  "eval_accuracy_unlabeled": NaN,
26
  "eval_accuracy_vehicle-bicycle": 0.0,
27
  "eval_accuracy_vehicle-bus": 0.0,
28
+ "eval_accuracy_vehicle-car": 0.8866936750042469,
29
  "eval_accuracy_vehicle-caravan": 0.0,
30
  "eval_accuracy_vehicle-cartrailer": 0.0,
31
  "eval_accuracy_vehicle-motorcycle": 0.0,
32
+ "eval_accuracy_vehicle-tramtrain": NaN,
33
  "eval_accuracy_vehicle-truck": 0.0,
34
  "eval_accuracy_void-dynamic": 0.0,
35
  "eval_accuracy_void-ground": 0.0,
36
+ "eval_accuracy_void-static": 0.0,
37
  "eval_accuracy_void-unclear": 0.0,
38
  "eval_iou_construction-bridge": 0.0,
39
+ "eval_iou_construction-building": 0.5254073493770961,
40
  "eval_iou_construction-door": 0.0,
41
+ "eval_iou_construction-fenceguardrail": 0.0,
42
  "eval_iou_construction-stairs": 0.0,
43
  "eval_iou_construction-tunnel": NaN,
44
+ "eval_iou_construction-wall": 0.003613796876006998,
45
+ "eval_iou_flat-crosswalk": 0.0018557628622486598,
46
+ "eval_iou_flat-curb": 0.09914351771584731,
47
+ "eval_iou_flat-cyclinglane": 0.543396562537026,
48
+ "eval_iou_flat-parkingdriveway": 0.08473532362172038,
49
  "eval_iou_flat-railtrack": NaN,
50
+ "eval_iou_flat-road": 0.48147359145471436,
51
+ "eval_iou_flat-sidewalk": 0.7837101825318907,
52
+ "eval_iou_human-person": 0.0,
53
  "eval_iou_human-rider": 0.0,
54
+ "eval_iou_nature-terrain": 0.5919753566336926,
55
+ "eval_iou_nature-vegetation": 0.7441744730399532,
56
+ "eval_iou_object-pole": 0.004807428163287731,
57
  "eval_iou_object-trafficlight": 0.0,
58
  "eval_iou_object-trafficsign": 0.0,
59
+ "eval_iou_sky": 0.8242789743401755,
60
  "eval_iou_unlabeled": NaN,
61
  "eval_iou_vehicle-bicycle": 0.0,
62
  "eval_iou_vehicle-bus": 0.0,
63
+ "eval_iou_vehicle-car": 0.5682343005687291,
64
  "eval_iou_vehicle-caravan": 0.0,
65
  "eval_iou_vehicle-cartrailer": 0.0,
66
  "eval_iou_vehicle-motorcycle": 0.0,
67
+ "eval_iou_vehicle-tramtrain": NaN,
68
  "eval_iou_vehicle-truck": 0.0,
69
  "eval_iou_void-dynamic": 0.0,
70
  "eval_iou_void-ground": 0.0,
71
+ "eval_iou_void-static": 0.0,
72
  "eval_iou_void-unclear": 0.0,
73
+ "eval_loss": 1.002479910850525,
74
+ "eval_mean_accuracy": 0.22247016796593616,
75
+ "eval_mean_iou": 0.16957440708781898,
76
+ "eval_overall_accuracy": 0.7429234629999191,
77
+ "eval_runtime": 135.2466,
78
+ "eval_samples_per_second": 1.109,
79
+ "eval_steps_per_second": 0.074,
80
+ "train_loss": 1.3263815078735353,
81
+ "train_runtime": 482.7688,
82
+ "train_samples_per_second": 33.142,
83
+ "train_steps_per_second": 2.071
84
  }
eval_results.json CHANGED
@@ -1,80 +1,80 @@
1
  {
2
- "epoch": 50.0,
3
  "eval_accuracy_construction-bridge": 0.0,
4
- "eval_accuracy_construction-building": 0.923248608581478,
5
  "eval_accuracy_construction-door": 0.0,
6
- "eval_accuracy_construction-fenceguardrail": 0.09433107330840278,
7
  "eval_accuracy_construction-stairs": 0.0,
8
  "eval_accuracy_construction-tunnel": NaN,
9
- "eval_accuracy_construction-wall": 0.21464674476906634,
10
- "eval_accuracy_flat-crosswalk": 0.3228431325584535,
11
- "eval_accuracy_flat-curb": 0.3171838475268673,
12
- "eval_accuracy_flat-cyclinglane": 0.7303143809670815,
13
- "eval_accuracy_flat-parkingdriveway": 0.27434110103060105,
14
  "eval_accuracy_flat-railtrack": NaN,
15
- "eval_accuracy_flat-road": 0.6562864431018484,
16
- "eval_accuracy_flat-sidewalk": 0.9295361346748208,
17
- "eval_accuracy_human-person": 0.010889394661161983,
18
  "eval_accuracy_human-rider": 0.0,
19
- "eval_accuracy_nature-terrain": 0.7748158286891488,
20
- "eval_accuracy_nature-vegetation": 0.9083438657394087,
21
- "eval_accuracy_object-pole": 0.2119288699124848,
22
  "eval_accuracy_object-trafficlight": 0.0,
23
  "eval_accuracy_object-trafficsign": 0.0,
24
- "eval_accuracy_sky": 0.8846353126324072,
25
  "eval_accuracy_unlabeled": NaN,
26
  "eval_accuracy_vehicle-bicycle": 0.0,
27
  "eval_accuracy_vehicle-bus": 0.0,
28
- "eval_accuracy_vehicle-car": 0.9388154884849852,
29
  "eval_accuracy_vehicle-caravan": 0.0,
30
  "eval_accuracy_vehicle-cartrailer": 0.0,
31
  "eval_accuracy_vehicle-motorcycle": 0.0,
32
- "eval_accuracy_vehicle-tramtrain": 0.0,
33
  "eval_accuracy_vehicle-truck": 0.0,
34
  "eval_accuracy_void-dynamic": 0.0,
35
  "eval_accuracy_void-ground": 0.0,
36
- "eval_accuracy_void-static": 0.17566618866656386,
37
  "eval_accuracy_void-unclear": 0.0,
38
  "eval_iou_construction-bridge": 0.0,
39
- "eval_iou_construction-building": 0.6151782821349004,
40
  "eval_iou_construction-door": 0.0,
41
- "eval_iou_construction-fenceguardrail": 0.09239785150765831,
42
  "eval_iou_construction-stairs": 0.0,
43
  "eval_iou_construction-tunnel": NaN,
44
- "eval_iou_construction-wall": 0.1796009958723711,
45
- "eval_iou_flat-crosswalk": 0.26608723430220454,
46
- "eval_iou_flat-curb": 0.19206793691107385,
47
- "eval_iou_flat-cyclinglane": 0.6165186094558613,
48
- "eval_iou_flat-parkingdriveway": 0.22540000014154912,
49
  "eval_iou_flat-railtrack": NaN,
50
- "eval_iou_flat-road": 0.5341623036040656,
51
- "eval_iou_flat-sidewalk": 0.8035619780040725,
52
- "eval_iou_human-person": 0.010872092613600332,
53
  "eval_iou_human-rider": 0.0,
54
- "eval_iou_nature-terrain": 0.646685749747382,
55
- "eval_iou_nature-vegetation": 0.7900638904880851,
56
- "eval_iou_object-pole": 0.14375182721824295,
57
  "eval_iou_object-trafficlight": 0.0,
58
  "eval_iou_object-trafficsign": 0.0,
59
- "eval_iou_sky": 0.8389204690587999,
60
  "eval_iou_unlabeled": NaN,
61
  "eval_iou_vehicle-bicycle": 0.0,
62
  "eval_iou_vehicle-bus": 0.0,
63
- "eval_iou_vehicle-car": 0.7190160819570569,
64
  "eval_iou_vehicle-caravan": 0.0,
65
  "eval_iou_vehicle-cartrailer": 0.0,
66
  "eval_iou_vehicle-motorcycle": 0.0,
67
- "eval_iou_vehicle-tramtrain": 0.0,
68
  "eval_iou_vehicle-truck": 0.0,
69
  "eval_iou_void-dynamic": 0.0,
70
  "eval_iou_void-ground": 0.0,
71
- "eval_iou_void-static": 0.09915330318294081,
72
  "eval_iou_void-unclear": 0.0,
73
- "eval_loss": 0.7689843773841858,
74
- "eval_mean_accuracy": 0.26149457547827437,
75
- "eval_mean_iou": 0.21166995644374575,
76
- "eval_overall_accuracy": 0.7839745993658742,
77
- "eval_runtime": 140.2555,
78
- "eval_samples_per_second": 1.069,
79
- "eval_steps_per_second": 0.071
80
  }
 
1
  {
2
+ "epoch": 18.52,
3
  "eval_accuracy_construction-bridge": 0.0,
4
+ "eval_accuracy_construction-building": 0.8696130299150018,
5
  "eval_accuracy_construction-door": 0.0,
6
+ "eval_accuracy_construction-fenceguardrail": 0.0,
7
  "eval_accuracy_construction-stairs": 0.0,
8
  "eval_accuracy_construction-tunnel": NaN,
9
+ "eval_accuracy_construction-wall": 0.003668217029526036,
10
+ "eval_accuracy_flat-crosswalk": 0.0018557628622486598,
11
+ "eval_accuracy_flat-curb": 0.12767179695127617,
12
+ "eval_accuracy_flat-cyclinglane": 0.790813348290863,
13
+ "eval_accuracy_flat-parkingdriveway": 0.1034764257101185,
14
  "eval_accuracy_flat-railtrack": NaN,
15
+ "eval_accuracy_flat-road": 0.6270179782365589,
16
+ "eval_accuracy_flat-sidewalk": 0.9313179571967581,
17
+ "eval_accuracy_human-person": 0.0,
18
  "eval_accuracy_human-rider": 0.0,
19
+ "eval_accuracy_nature-terrain": 0.7721406421014229,
20
+ "eval_accuracy_nature-vegetation": 0.9034924242863521,
21
+ "eval_accuracy_object-pole": 0.0048094393262509885,
22
  "eval_accuracy_object-trafficlight": 0.0,
23
  "eval_accuracy_object-trafficsign": 0.0,
24
+ "eval_accuracy_sky": 0.8740045100333971,
25
  "eval_accuracy_unlabeled": NaN,
26
  "eval_accuracy_vehicle-bicycle": 0.0,
27
  "eval_accuracy_vehicle-bus": 0.0,
28
+ "eval_accuracy_vehicle-car": 0.8866936750042469,
29
  "eval_accuracy_vehicle-caravan": 0.0,
30
  "eval_accuracy_vehicle-cartrailer": 0.0,
31
  "eval_accuracy_vehicle-motorcycle": 0.0,
32
+ "eval_accuracy_vehicle-tramtrain": NaN,
33
  "eval_accuracy_vehicle-truck": 0.0,
34
  "eval_accuracy_void-dynamic": 0.0,
35
  "eval_accuracy_void-ground": 0.0,
36
+ "eval_accuracy_void-static": 0.0,
37
  "eval_accuracy_void-unclear": 0.0,
38
  "eval_iou_construction-bridge": 0.0,
39
+ "eval_iou_construction-building": 0.5254073493770961,
40
  "eval_iou_construction-door": 0.0,
41
+ "eval_iou_construction-fenceguardrail": 0.0,
42
  "eval_iou_construction-stairs": 0.0,
43
  "eval_iou_construction-tunnel": NaN,
44
+ "eval_iou_construction-wall": 0.003613796876006998,
45
+ "eval_iou_flat-crosswalk": 0.0018557628622486598,
46
+ "eval_iou_flat-curb": 0.09914351771584731,
47
+ "eval_iou_flat-cyclinglane": 0.543396562537026,
48
+ "eval_iou_flat-parkingdriveway": 0.08473532362172038,
49
  "eval_iou_flat-railtrack": NaN,
50
+ "eval_iou_flat-road": 0.48147359145471436,
51
+ "eval_iou_flat-sidewalk": 0.7837101825318907,
52
+ "eval_iou_human-person": 0.0,
53
  "eval_iou_human-rider": 0.0,
54
+ "eval_iou_nature-terrain": 0.5919753566336926,
55
+ "eval_iou_nature-vegetation": 0.7441744730399532,
56
+ "eval_iou_object-pole": 0.004807428163287731,
57
  "eval_iou_object-trafficlight": 0.0,
58
  "eval_iou_object-trafficsign": 0.0,
59
+ "eval_iou_sky": 0.8242789743401755,
60
  "eval_iou_unlabeled": NaN,
61
  "eval_iou_vehicle-bicycle": 0.0,
62
  "eval_iou_vehicle-bus": 0.0,
63
+ "eval_iou_vehicle-car": 0.5682343005687291,
64
  "eval_iou_vehicle-caravan": 0.0,
65
  "eval_iou_vehicle-cartrailer": 0.0,
66
  "eval_iou_vehicle-motorcycle": 0.0,
67
+ "eval_iou_vehicle-tramtrain": NaN,
68
  "eval_iou_vehicle-truck": 0.0,
69
  "eval_iou_void-dynamic": 0.0,
70
  "eval_iou_void-ground": 0.0,
71
+ "eval_iou_void-static": 0.0,
72
  "eval_iou_void-unclear": 0.0,
73
+ "eval_loss": 1.002479910850525,
74
+ "eval_mean_accuracy": 0.22247016796593616,
75
+ "eval_mean_iou": 0.16957440708781898,
76
+ "eval_overall_accuracy": 0.7429234629999191,
77
+ "eval_runtime": 135.2466,
78
+ "eval_samples_per_second": 1.109,
79
+ "eval_steps_per_second": 0.074
80
  }
runs/Apr20_08-53-58_brutasse/events.out.tfevents.1650445475.brutasse.3277.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d691e8357c9e63fce2c331338a95a9d790dc52b115e2371f65b986de3909a08
3
+ size 5039
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 50.0,
3
- "train_loss": 0.9338362375895183,
4
- "train_runtime": 1300.5624,
5
- "train_samples_per_second": 32.678,
6
- "train_steps_per_second": 2.076
7
  }
 
1
  {
2
+ "epoch": 18.52,
3
+ "train_loss": 1.3263815078735353,
4
+ "train_runtime": 482.7688,
5
+ "train_samples_per_second": 33.142,
6
+ "train_steps_per_second": 2.071
7
  }
trainer_state.json CHANGED
@@ -1,187 +1,85 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 50.0,
5
- "global_step": 2700,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 1.85,
12
- "learning_rate": 4.814814814814815e-05,
13
- "loss": 2.6107,
14
  "step": 100
15
  },
16
  {
17
  "epoch": 3.7,
18
- "learning_rate": 4.62962962962963e-05,
19
- "loss": 1.8688,
20
  "step": 200
21
  },
22
  {
23
  "epoch": 5.56,
24
- "learning_rate": 4.4444444444444447e-05,
25
- "loss": 1.5544,
26
  "step": 300
27
  },
28
  {
29
  "epoch": 7.41,
30
- "learning_rate": 4.259259259259259e-05,
31
- "loss": 1.3367,
32
  "step": 400
33
  },
34
  {
35
  "epoch": 9.26,
36
- "learning_rate": 4.074074074074074e-05,
37
- "loss": 1.2102,
38
  "step": 500
39
  },
40
  {
41
  "epoch": 11.11,
42
- "learning_rate": 3.888888888888889e-05,
43
- "loss": 1.1085,
44
  "step": 600
45
  },
46
  {
47
  "epoch": 12.96,
48
- "learning_rate": 3.7037037037037037e-05,
49
- "loss": 1.0013,
50
  "step": 700
51
  },
52
  {
53
  "epoch": 14.81,
54
- "learning_rate": 3.518518518518519e-05,
55
- "loss": 0.9601,
56
  "step": 800
57
  },
58
  {
59
  "epoch": 16.67,
60
- "learning_rate": 3.3333333333333335e-05,
61
- "loss": 0.9108,
62
  "step": 900
63
  },
64
  {
65
  "epoch": 18.52,
66
- "learning_rate": 3.148148148148148e-05,
67
- "loss": 0.8639,
68
  "step": 1000
69
  },
70
  {
71
- "epoch": 20.37,
72
- "learning_rate": 2.962962962962963e-05,
73
- "loss": 0.8091,
74
- "step": 1100
75
- },
76
- {
77
- "epoch": 22.22,
78
- "learning_rate": 2.777777777777778e-05,
79
- "loss": 0.8038,
80
- "step": 1200
81
- },
82
- {
83
- "epoch": 24.07,
84
- "learning_rate": 2.5925925925925925e-05,
85
- "loss": 0.7915,
86
- "step": 1300
87
- },
88
- {
89
- "epoch": 25.93,
90
- "learning_rate": 2.4074074074074074e-05,
91
- "loss": 0.7648,
92
- "step": 1400
93
- },
94
- {
95
- "epoch": 27.78,
96
- "learning_rate": 2.2222222222222223e-05,
97
- "loss": 0.7557,
98
- "step": 1500
99
- },
100
- {
101
- "epoch": 29.63,
102
- "learning_rate": 2.037037037037037e-05,
103
- "loss": 0.7004,
104
- "step": 1600
105
- },
106
- {
107
- "epoch": 31.48,
108
- "learning_rate": 1.8518518518518518e-05,
109
- "loss": 0.6927,
110
- "step": 1700
111
- },
112
- {
113
- "epoch": 33.33,
114
- "learning_rate": 1.6666666666666667e-05,
115
- "loss": 0.6847,
116
- "step": 1800
117
- },
118
- {
119
- "epoch": 35.19,
120
- "learning_rate": 1.4814814814814815e-05,
121
- "loss": 0.6828,
122
- "step": 1900
123
- },
124
- {
125
- "epoch": 37.04,
126
- "learning_rate": 1.2962962962962962e-05,
127
- "loss": 0.6526,
128
- "step": 2000
129
- },
130
- {
131
- "epoch": 38.89,
132
- "learning_rate": 1.1111111111111112e-05,
133
- "loss": 0.6612,
134
- "step": 2100
135
- },
136
- {
137
- "epoch": 40.74,
138
- "learning_rate": 9.259259259259259e-06,
139
- "loss": 0.6528,
140
- "step": 2200
141
- },
142
- {
143
- "epoch": 42.59,
144
- "learning_rate": 7.4074074074074075e-06,
145
- "loss": 0.6264,
146
- "step": 2300
147
- },
148
- {
149
- "epoch": 44.44,
150
- "learning_rate": 5.555555555555556e-06,
151
- "loss": 0.6403,
152
- "step": 2400
153
- },
154
- {
155
- "epoch": 46.3,
156
- "learning_rate": 3.7037037037037037e-06,
157
- "loss": 0.6413,
158
- "step": 2500
159
- },
160
- {
161
- "epoch": 48.15,
162
- "learning_rate": 1.8518518518518519e-06,
163
- "loss": 0.6121,
164
- "step": 2600
165
- },
166
- {
167
- "epoch": 50.0,
168
- "learning_rate": 0.0,
169
- "loss": 0.6161,
170
- "step": 2700
171
- },
172
- {
173
- "epoch": 50.0,
174
- "step": 2700,
175
- "total_flos": 7.4663889076224e+17,
176
- "train_loss": 0.9338362375895183,
177
- "train_runtime": 1300.5624,
178
- "train_samples_per_second": 32.678,
179
- "train_steps_per_second": 2.076
180
  }
181
  ],
182
- "max_steps": 2700,
183
- "num_train_epochs": 50,
184
- "total_flos": 7.4663889076224e+17,
185
  "trial_name": null,
186
  "trial_params": null
187
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 18.51851851851852,
5
+ "global_step": 1000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 1.85,
12
+ "learning_rate": 5.401e-05,
13
+ "loss": 2.5377,
14
  "step": 100
15
  },
16
  {
17
  "epoch": 3.7,
18
+ "learning_rate": 4.8020000000000004e-05,
19
+ "loss": 1.7685,
20
  "step": 200
21
  },
22
  {
23
  "epoch": 5.56,
24
+ "learning_rate": 4.203e-05,
25
+ "loss": 1.4614,
26
  "step": 300
27
  },
28
  {
29
  "epoch": 7.41,
30
+ "learning_rate": 3.604e-05,
31
+ "loss": 1.282,
32
  "step": 400
33
  },
34
  {
35
  "epoch": 9.26,
36
+ "learning_rate": 3.0050000000000002e-05,
37
+ "loss": 1.157,
38
  "step": 500
39
  },
40
  {
41
  "epoch": 11.11,
42
+ "learning_rate": 2.406e-05,
43
+ "loss": 1.0986,
44
  "step": 600
45
  },
46
  {
47
  "epoch": 12.96,
48
+ "learning_rate": 1.807e-05,
49
+ "loss": 1.0388,
50
  "step": 700
51
  },
52
  {
53
  "epoch": 14.81,
54
+ "learning_rate": 1.2079999999999998e-05,
55
+ "loss": 0.9946,
56
  "step": 800
57
  },
58
  {
59
  "epoch": 16.67,
60
+ "learning_rate": 6.0899999999999984e-06,
61
+ "loss": 0.9791,
62
  "step": 900
63
  },
64
  {
65
  "epoch": 18.52,
66
+ "learning_rate": 1e-07,
67
+ "loss": 0.9462,
68
  "step": 1000
69
  },
70
  {
71
+ "epoch": 18.52,
72
+ "step": 1000,
73
+ "total_flos": 2.7666045298173542e+17,
74
+ "train_loss": 1.3263815078735353,
75
+ "train_runtime": 482.7688,
76
+ "train_samples_per_second": 33.142,
77
+ "train_steps_per_second": 2.071
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
78
  }
79
  ],
80
+ "max_steps": 1000,
81
+ "num_train_epochs": 19,
82
+ "total_flos": 2.7666045298173542e+17,
83
  "trial_name": null,
84
  "trial_params": null
85
  }