File size: 3,970 Bytes
7ba5ff3 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 |
[
{
"loss": 2.1632102966308593,
"learning_rate": 1.0000000000000002e-06,
"epoch": 0.2127659574468085,
"total_flos": 4181675520000,
"step": 10
},
{
"loss": 1.9698543548583984,
"learning_rate": 2.0000000000000003e-06,
"epoch": 0.425531914893617,
"total_flos": 8363351040000,
"step": 20
},
{
"loss": 1.5943157196044921,
"learning_rate": 3e-06,
"epoch": 0.6382978723404256,
"total_flos": 12545026560000,
"step": 30
},
{
"loss": 1.1324241638183594,
"learning_rate": 4.000000000000001e-06,
"epoch": 0.851063829787234,
"total_flos": 16726702080000,
"step": 40
},
{
"loss": 0.7799140930175781,
"learning_rate": 5e-06,
"epoch": 1.0638297872340425,
"total_flos": 20620887408000,
"step": 50
},
{
"loss": 0.5984169006347656,
"learning_rate": 6e-06,
"epoch": 1.2765957446808511,
"total_flos": 24802562928000,
"step": 60
},
{
"loss": 0.4769012451171875,
"learning_rate": 7.000000000000001e-06,
"epoch": 1.4893617021276595,
"total_flos": 28984238448000,
"step": 70
},
{
"loss": 0.3644599914550781,
"learning_rate": 8.000000000000001e-06,
"epoch": 1.702127659574468,
"total_flos": 33165913968000,
"step": 80
},
{
"loss": 0.29639739990234376,
"learning_rate": 9e-06,
"epoch": 1.9148936170212765,
"total_flos": 37347589488000,
"step": 90
},
{
"loss": 0.26825637817382814,
"learning_rate": 1e-05,
"epoch": 2.127659574468085,
"total_flos": 41241774816000,
"step": 100
},
{
"loss": 0.19923171997070313,
"learning_rate": 1.1000000000000001e-05,
"epoch": 2.3404255319148937,
"total_flos": 45423450336000,
"step": 110
},
{
"loss": 0.19310073852539061,
"learning_rate": 1.2e-05,
"epoch": 2.5531914893617023,
"total_flos": 49605125856000,
"step": 120
},
{
"loss": 0.15804977416992189,
"learning_rate": 1.3000000000000001e-05,
"epoch": 2.7659574468085104,
"total_flos": 53786801376000,
"step": 130
},
{
"loss": 0.17403030395507812,
"learning_rate": 1.4000000000000001e-05,
"epoch": 2.978723404255319,
"total_flos": 57968476896000,
"step": 140
},
{
"loss": 0.11231231689453125,
"learning_rate": 1.5e-05,
"epoch": 3.1914893617021276,
"total_flos": 61862662224000,
"step": 150
},
{
"loss": 0.0972991943359375,
"learning_rate": 1.6000000000000003e-05,
"epoch": 3.404255319148936,
"total_flos": 66044337744000,
"step": 160
},
{
"loss": 0.09285507202148438,
"learning_rate": 1.7000000000000003e-05,
"epoch": 3.617021276595745,
"total_flos": 70226013264000,
"step": 170
},
{
"loss": 0.10490646362304687,
"learning_rate": 1.8e-05,
"epoch": 3.829787234042553,
"total_flos": 74407688784000,
"step": 180
},
{
"loss": 0.08623809814453125,
"learning_rate": 1.9e-05,
"epoch": 4.042553191489362,
"total_flos": 78301874112000,
"step": 190
},
{
"loss": 0.05904541015625,
"learning_rate": 2e-05,
"epoch": 4.25531914893617,
"total_flos": 82483549632000,
"step": 200
},
{
"loss": 0.052008056640625,
"learning_rate": 2.1e-05,
"epoch": 4.468085106382979,
"total_flos": 86665225152000,
"step": 210
},
{
"loss": 0.06222076416015625,
"learning_rate": 2.2000000000000003e-05,
"epoch": 4.680851063829787,
"total_flos": 90846900672000,
"step": 220
},
{
"loss": 0.05680923461914063,
"learning_rate": 2.3000000000000003e-05,
"epoch": 4.8936170212765955,
"total_flos": 95028576192000,
"step": 230
},
{
"eval_loss": 0.0899211324525602,
"eval_accuracy_score": 0.974121282348397,
"eval_precision": 0.9776031434184675,
"eval_recall": 0.9749216300940439,
"eval_f1": 0.9762605454188739,
"epoch": 5.0,
"total_flos": 96831923760000,
"step": 235
}
] |