Update training_history.json - Run 20251104_144102
Browse files
weights/David-decoupled-cantor_scale/20251104_144102/training_history.json
CHANGED
|
@@ -3,80 +3,93 @@
|
|
| 3 |
1,
|
| 4 |
2,
|
| 5 |
3,
|
| 6 |
-
4
|
|
|
|
| 7 |
],
|
| 8 |
"train_loss": [
|
| 9 |
1.8473644912409581,
|
| 10 |
1.2349187319534949,
|
| 11 |
1.0967776605571407,
|
| 12 |
-
0.9883316958422095
|
|
|
|
| 13 |
],
|
| 14 |
"train_acc": [
|
| 15 |
83.50909756495444,
|
| 16 |
87.53558279287556,
|
| 17 |
88.92135061237137,
|
| 18 |
-
90.1239260767722
|
|
|
|
| 19 |
],
|
| 20 |
"val_acc": [
|
| 21 |
84.296,
|
| 22 |
84.784,
|
| 23 |
85.094,
|
| 24 |
-
85.114
|
|
|
|
| 25 |
],
|
| 26 |
"scale_accs": {
|
| 27 |
"384": [
|
| 28 |
82.254,
|
| 29 |
83.082,
|
| 30 |
83.518,
|
| 31 |
-
83.574
|
|
|
|
| 32 |
],
|
| 33 |
"512": [
|
| 34 |
82.682,
|
| 35 |
83.472,
|
| 36 |
84.012,
|
| 37 |
-
84.268
|
|
|
|
| 38 |
],
|
| 39 |
"768": [
|
| 40 |
83.39,
|
| 41 |
84.056,
|
| 42 |
84.434,
|
| 43 |
-
84.538
|
|
|
|
| 44 |
],
|
| 45 |
"1024": [
|
| 46 |
83.314,
|
| 47 |
83.934,
|
| 48 |
84.376,
|
| 49 |
-
84.428
|
|
|
|
| 50 |
],
|
| 51 |
"1280": [
|
| 52 |
83.256,
|
| 53 |
83.656,
|
| 54 |
84.022,
|
| 55 |
-
84.308
|
|
|
|
| 56 |
],
|
| 57 |
"1536": [
|
| 58 |
83.196,
|
| 59 |
83.854,
|
| 60 |
84.16,
|
| 61 |
-
84.14
|
|
|
|
| 62 |
],
|
| 63 |
"1792": [
|
| 64 |
83.188,
|
| 65 |
83.842,
|
| 66 |
84.126,
|
| 67 |
-
83.91
|
|
|
|
| 68 |
],
|
| 69 |
"2048": [
|
| 70 |
83.254,
|
| 71 |
84.048,
|
| 72 |
84.176,
|
| 73 |
-
84.008
|
|
|
|
| 74 |
]
|
| 75 |
},
|
| 76 |
"lr": [
|
| 77 |
0.0009755527298894294,
|
| 78 |
0.0009046039886902864,
|
| 79 |
0.0007940987335200904,
|
| 80 |
-
0.0006548539886902864
|
|
|
|
| 81 |
]
|
| 82 |
}
|
|
|
|
| 3 |
1,
|
| 4 |
2,
|
| 5 |
3,
|
| 6 |
+
4,
|
| 7 |
+
5
|
| 8 |
],
|
| 9 |
"train_loss": [
|
| 10 |
1.8473644912409581,
|
| 11 |
1.2349187319534949,
|
| 12 |
1.0967776605571407,
|
| 13 |
+
0.9883316958422095,
|
| 14 |
+
0.8936501936678214
|
| 15 |
],
|
| 16 |
"train_acc": [
|
| 17 |
83.50909756495444,
|
| 18 |
87.53558279287556,
|
| 19 |
88.92135061237137,
|
| 20 |
+
90.1239260767722,
|
| 21 |
+
91.28685019205146
|
| 22 |
],
|
| 23 |
"val_acc": [
|
| 24 |
84.296,
|
| 25 |
84.784,
|
| 26 |
85.094,
|
| 27 |
+
85.114,
|
| 28 |
+
85.25
|
| 29 |
],
|
| 30 |
"scale_accs": {
|
| 31 |
"384": [
|
| 32 |
82.254,
|
| 33 |
83.082,
|
| 34 |
83.518,
|
| 35 |
+
83.574,
|
| 36 |
+
83.992
|
| 37 |
],
|
| 38 |
"512": [
|
| 39 |
82.682,
|
| 40 |
83.472,
|
| 41 |
84.012,
|
| 42 |
+
84.268,
|
| 43 |
+
84.384
|
| 44 |
],
|
| 45 |
"768": [
|
| 46 |
83.39,
|
| 47 |
84.056,
|
| 48 |
84.434,
|
| 49 |
+
84.538,
|
| 50 |
+
84.716
|
| 51 |
],
|
| 52 |
"1024": [
|
| 53 |
83.314,
|
| 54 |
83.934,
|
| 55 |
84.376,
|
| 56 |
+
84.428,
|
| 57 |
+
84.668
|
| 58 |
],
|
| 59 |
"1280": [
|
| 60 |
83.256,
|
| 61 |
83.656,
|
| 62 |
84.022,
|
| 63 |
+
84.308,
|
| 64 |
+
84.458
|
| 65 |
],
|
| 66 |
"1536": [
|
| 67 |
83.196,
|
| 68 |
83.854,
|
| 69 |
84.16,
|
| 70 |
+
84.14,
|
| 71 |
+
84.162
|
| 72 |
],
|
| 73 |
"1792": [
|
| 74 |
83.188,
|
| 75 |
83.842,
|
| 76 |
84.126,
|
| 77 |
+
83.91,
|
| 78 |
+
84.038
|
| 79 |
],
|
| 80 |
"2048": [
|
| 81 |
83.254,
|
| 82 |
84.048,
|
| 83 |
84.176,
|
| 84 |
+
84.008,
|
| 85 |
+
84.234
|
| 86 |
]
|
| 87 |
},
|
| 88 |
"lr": [
|
| 89 |
0.0009755527298894294,
|
| 90 |
0.0009046039886902864,
|
| 91 |
0.0007940987335200904,
|
| 92 |
+
0.0006548539886902864,
|
| 93 |
+
0.0005005000000000001
|
| 94 |
]
|
| 95 |
}
|