diff --git "a/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" "b/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" --- "a/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" +++ "b/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 2.7226, "train/learning_rate": 2.1101543942992875e-05, "train/epoch": 6.73, "train/global_step": 6000, "_runtime": 35174, "_timestamp": 1646982413, "_step": 6003, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 0.0, 3.0, 3.0, 4.0, 8.0, 9.0, 17.0, 17.0, 13.0, 12.0, 22.0, 27.0, 29.0, 29.0, 32.0, 34.0, 26.0, 43.0, 38.0, 41.0, 34.0, 43.0, 55.0, 34.0, 32.0, 42.0, 43.0, 41.0, 28.0, 29.0, 45.0, 29.0, 29.0, 13.0, 18.0, 22.0, 15.0, 11.0, 8.0, 8.0, 5.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-14.104436874389648, -13.784018516540527, -13.463600158691406, -13.143182754516602, -12.82276439666748, -12.50234603881836, -12.181928634643555, -11.861510276794434, -11.541091918945312, -11.220673561096191, -10.90025520324707, -10.579837799072266, -10.259419441223145, -9.939001083374023, -9.618583679199219, -9.298165321350098, -8.977746963500977, -8.657328605651855, -8.336910247802734, -8.01649284362793, -7.696074485778809, -7.3756561279296875, -7.055238246917725, -6.734820365905762, -6.414402008056641, -6.0939836502075195, -5.773565769195557, -5.453147888183594, -5.132729530334473, -4.812311172485352, -4.491893291473389, -4.171475410461426, -3.851058006286621, -3.530639886856079, -3.210221767425537, -2.889803647994995, -2.569385528564453, -2.248967409133911, -1.9285492897033691, -1.6081311702728271, -1.2877130508422852, -0.9672949314117432, -0.6468768119812012, -0.3264586925506592, -0.0060405731201171875, 0.3143775463104248, 0.6347956657409668, 0.9552137851715088, 1.2756319046020508, 1.5960500240325928, 1.9164681434631348, 2.2368862628936768, 2.5573043823242188, 2.8777225017547607, 3.1981406211853027, 3.5185587406158447, 3.8389768600463867, 4.159395217895508, 4.479813098907471, 4.800230979919434, 5.120649337768555, 5.441067695617676, 5.761485576629639, 6.081903457641602, 6.402321815490723]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 3.0, 3.0, 14.0, 14.0, 18.0, 15.0, 15.0, 13.0, 23.0, 34.0, 23.0, 25.0, 41.0, 31.0, 33.0, 35.0, 33.0, 46.0, 30.0, 35.0, 44.0, 40.0, 25.0, 22.0, 37.0, 32.0, 24.0, 31.0, 24.0, 25.0, 22.0, 20.0, 28.0, 16.0, 17.0, 21.0, 13.0, 9.0, 19.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0], "bins": [-10.389012336730957, -10.077750205993652, -9.766488075256348, -9.455225944519043, -9.143962860107422, -8.832700729370117, -8.521438598632812, -8.210176467895508, -7.898914337158203, -7.587652206420898, -7.276390075683594, -6.965127468109131, -6.653865337371826, -6.3426032066345215, -6.031340599060059, -5.720078468322754, -5.408816337585449, -5.0975542068481445, -4.78629207611084, -4.475029468536377, -4.163767337799072, -3.8525052070617676, -3.541242837905884, -3.22998046875, -2.9187183380126953, -2.6074562072753906, -2.296193838119507, -1.9849315881729126, -1.6736693382263184, -1.3624070882797241, -1.0511448383331299, -0.7398824691772461, -0.4286203384399414, -0.11735808849334717, 0.19390416145324707, 0.5051664113998413, 0.8164286613464355, 1.1276909112930298, 1.438953161239624, 1.7502155303955078, 2.0614776611328125, 2.372739791870117, 2.684002161026001, 2.9952645301818848, 3.3065266609191895, 3.617788791656494, 3.929051160812378, 4.240313529968262, 4.551575660705566, 4.862837791442871, 5.174099922180176, 5.485362529754639, 5.796624660491943, 6.107886791229248, 6.419149398803711, 6.730411529541016, 7.04167366027832, 7.352935791015625, 7.66419792175293, 7.975460529327393, 8.286722183227539, 8.59798526763916, 8.909247398376465, 9.22050952911377, 9.531771659851074]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 6.0, 9.0, 5.0, 12.0, 20.0, 53.0, 82.0, 134.0, 225.0, 347.0, 588.0, 854.0, 1408.0, 2314.0, 3799.0, 6163.0, 9889.0, 15410.0, 24360.0, 38350.0, 59343.0, 90629.0, 135415.0, 196980.0, 275513.0, 363914.0, 445566.0, 492764.0, 485901.0, 427128.0, 340018.0, 252449.0, 176690.0, 121570.0, 80241.0, 52873.0, 33876.0, 21700.0, 14103.0, 8800.0, 5519.0, 3470.0, 2257.0, 1314.0, 878.0, 512.0, 303.0, 206.0, 131.0, 86.0, 54.0, 22.0, 16.0, 12.0, 10.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-8.3828125, -8.1197509765625, -7.856689453125, -7.5936279296875, -7.33056640625, -7.0675048828125, -6.804443359375, -6.5413818359375, -6.2783203125, -6.0152587890625, -5.752197265625, -5.4891357421875, -5.22607421875, -4.9630126953125, -4.699951171875, -4.4368896484375, -4.173828125, -3.9107666015625, -3.647705078125, -3.3846435546875, -3.12158203125, -2.8585205078125, -2.595458984375, -2.3323974609375, -2.0693359375, -1.8062744140625, -1.543212890625, -1.2801513671875, -1.01708984375, -0.7540283203125, -0.490966796875, -0.2279052734375, 0.03515625, 0.2982177734375, 0.561279296875, 0.8243408203125, 1.08740234375, 1.3504638671875, 1.613525390625, 1.8765869140625, 2.1396484375, 2.4027099609375, 2.665771484375, 2.9288330078125, 3.19189453125, 3.4549560546875, 3.718017578125, 3.9810791015625, 4.244140625, 4.5072021484375, 4.770263671875, 5.0333251953125, 5.29638671875, 5.5594482421875, 5.822509765625, 6.0855712890625, 6.3486328125, 6.6116943359375, 6.874755859375, 7.1378173828125, 7.40087890625, 7.6639404296875, 7.927001953125, 8.1900634765625, 8.453125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 2.0, 1.0, 3.0, 9.0, 10.0, 14.0, 5.0, 6.0, 12.0, 11.0, 20.0, 16.0, 25.0, 17.0, 31.0, 31.0, 27.0, 33.0, 37.0, 32.0, 29.0, 35.0, 42.0, 42.0, 25.0, 30.0, 38.0, 31.0, 32.0, 24.0, 30.0, 26.0, 17.0, 32.0, 19.0, 21.0, 27.0, 16.0, 19.0, 18.0, 26.0, 16.0, 14.0, 9.0, 8.0, 8.0, 6.0, 9.0, 0.0, 3.0, 4.0, 0.0, 4.0, 0.0, 3.0, 1.0, 1.0], "bins": [-7.421875, -7.18927001953125, -6.9566650390625, -6.72406005859375, -6.491455078125, -6.25885009765625, -6.0262451171875, -5.79364013671875, -5.56103515625, -5.32843017578125, -5.0958251953125, -4.86322021484375, -4.630615234375, -4.39801025390625, -4.1654052734375, -3.93280029296875, -3.7001953125, -3.46759033203125, -3.2349853515625, -3.00238037109375, -2.769775390625, -2.53717041015625, -2.3045654296875, -2.07196044921875, -1.83935546875, -1.60675048828125, -1.3741455078125, -1.14154052734375, -0.908935546875, -0.67633056640625, -0.4437255859375, -0.21112060546875, 0.021484375, 0.25408935546875, 0.4866943359375, 0.71929931640625, 0.951904296875, 1.18450927734375, 1.4171142578125, 1.64971923828125, 1.88232421875, 2.11492919921875, 2.3475341796875, 2.58013916015625, 2.812744140625, 3.04534912109375, 3.2779541015625, 3.51055908203125, 3.7431640625, 3.97576904296875, 4.2083740234375, 4.44097900390625, 4.673583984375, 4.90618896484375, 5.1387939453125, 5.37139892578125, 5.60400390625, 5.83660888671875, 6.0692138671875, 6.30181884765625, 6.534423828125, 6.76702880859375, 6.9996337890625, 7.23223876953125, 7.46484375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 9.0, 18.0, 33.0, 56.0, 75.0, 157.0, 219.0, 397.0, 636.0, 1143.0, 1765.0, 3004.0, 4931.0, 8007.0, 13234.0, 21243.0, 33629.0, 52129.0, 79303.0, 115602.0, 165230.0, 227527.0, 298698.0, 366861.0, 420312.0, 442428.0, 431101.0, 384272.0, 317623.0, 247247.0, 181209.0, 129345.0, 88518.0, 58480.0, 37524.0, 23685.0, 15016.0, 9460.0, 5649.0, 3477.0, 2079.0, 1244.0, 712.0, 398.0, 253.0, 154.0, 79.0, 51.0, 30.0, 18.0, 11.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.8515625, -7.6033935546875, -7.355224609375, -7.1070556640625, -6.85888671875, -6.6107177734375, -6.362548828125, -6.1143798828125, -5.8662109375, -5.6180419921875, -5.369873046875, -5.1217041015625, -4.87353515625, -4.6253662109375, -4.377197265625, -4.1290283203125, -3.880859375, -3.6326904296875, -3.384521484375, -3.1363525390625, -2.88818359375, -2.6400146484375, -2.391845703125, -2.1436767578125, -1.8955078125, -1.6473388671875, -1.399169921875, -1.1510009765625, -0.90283203125, -0.6546630859375, -0.406494140625, -0.1583251953125, 0.08984375, 0.3380126953125, 0.586181640625, 0.8343505859375, 1.08251953125, 1.3306884765625, 1.578857421875, 1.8270263671875, 2.0751953125, 2.3233642578125, 2.571533203125, 2.8197021484375, 3.06787109375, 3.3160400390625, 3.564208984375, 3.8123779296875, 4.060546875, 4.3087158203125, 4.556884765625, 4.8050537109375, 5.05322265625, 5.3013916015625, 5.549560546875, 5.7977294921875, 6.0458984375, 6.2940673828125, 6.542236328125, 6.7904052734375, 7.03857421875, 7.2867431640625, 7.534912109375, 7.7830810546875, 8.03125]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 15.0, 19.0, 18.0, 23.0, 36.0, 37.0, 48.0, 75.0, 86.0, 88.0, 104.0, 128.0, 152.0, 181.0, 166.0, 181.0, 199.0, 203.0, 226.0, 218.0, 200.0, 220.0, 192.0, 167.0, 162.0, 159.0, 134.0, 110.0, 97.0, 73.0, 71.0, 70.0, 42.0, 37.0, 29.0, 22.0, 22.0, 9.0, 16.0, 7.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.17578125, -4.04339599609375, -3.9110107421875, -3.77862548828125, -3.646240234375, -3.51385498046875, -3.3814697265625, -3.24908447265625, -3.11669921875, -2.98431396484375, -2.8519287109375, -2.71954345703125, -2.587158203125, -2.45477294921875, -2.3223876953125, -2.19000244140625, -2.0576171875, -1.92523193359375, -1.7928466796875, -1.66046142578125, -1.528076171875, -1.39569091796875, -1.2633056640625, -1.13092041015625, -0.99853515625, -0.86614990234375, -0.7337646484375, -0.60137939453125, -0.468994140625, -0.33660888671875, -0.2042236328125, -0.07183837890625, 0.060546875, 0.19293212890625, 0.3253173828125, 0.45770263671875, 0.590087890625, 0.72247314453125, 0.8548583984375, 0.98724365234375, 1.11962890625, 1.25201416015625, 1.3843994140625, 1.51678466796875, 1.649169921875, 1.78155517578125, 1.9139404296875, 2.04632568359375, 2.1787109375, 2.31109619140625, 2.4434814453125, 2.57586669921875, 2.708251953125, 2.84063720703125, 2.9730224609375, 3.10540771484375, 3.23779296875, 3.37017822265625, 3.5025634765625, 3.63494873046875, 3.767333984375, 3.89971923828125, 4.0321044921875, 4.16448974609375, 4.296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 9.0, 4.0, 8.0, 3.0, 8.0, 11.0, 15.0, 12.0, 20.0, 18.0, 25.0, 21.0, 24.0, 16.0, 30.0, 23.0, 36.0, 37.0, 36.0, 32.0, 46.0, 45.0, 43.0, 50.0, 43.0, 42.0, 36.0, 41.0, 39.0, 34.0, 27.0, 24.0, 25.0, 15.0, 16.0, 13.0, 16.0, 10.0, 11.0, 3.0, 8.0, 4.0, 5.0, 6.0, 3.0, 7.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-10.4581937789917, -10.15226936340332, -9.846344947814941, -9.540420532226562, -9.234496116638184, -8.928571701049805, -8.622647285461426, -8.316722869873047, -8.010798454284668, -7.704874038696289, -7.39894962310791, -7.093025207519531, -6.787100791931152, -6.481176376342773, -6.1752519607543945, -5.869327545166016, -5.563403129577637, -5.257478713989258, -4.951554298400879, -4.6456298828125, -4.339705467224121, -4.033781051635742, -3.7278566360473633, -3.4219322204589844, -3.1160078048706055, -2.8100833892822266, -2.5041589736938477, -2.1982345581054688, -1.8923101425170898, -1.586385726928711, -1.280461311340332, -0.9745368957519531, -0.6686115264892578, -0.3626871109008789, -0.0567626953125, 0.2491617202758789, 0.5550861358642578, 0.8610105514526367, 1.1669349670410156, 1.4728593826293945, 1.7787837982177734, 2.0847082138061523, 2.3906326293945312, 2.69655704498291, 3.002481460571289, 3.308405876159668, 3.614330291748047, 3.920254707336426, 4.226179122924805, 4.532103538513184, 4.8380279541015625, 5.143952369689941, 5.44987678527832, 5.755801200866699, 6.061725616455078, 6.367650032043457, 6.673574447631836, 6.979498863220215, 7.285423278808594, 7.591347694396973, 7.897272109985352, 8.20319652557373, 8.50912094116211, 8.815045356750488, 9.120969772338867]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 2.0, 4.0, 6.0, 11.0, 7.0, 6.0, 14.0, 19.0, 14.0, 13.0, 13.0, 34.0, 29.0, 29.0, 35.0, 33.0, 40.0, 29.0, 36.0, 40.0, 41.0, 40.0, 38.0, 38.0, 35.0, 33.0, 34.0, 28.0, 27.0, 31.0, 27.0, 34.0, 20.0, 19.0, 12.0, 16.0, 18.0, 13.0, 23.0, 16.0, 6.0, 8.0, 4.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.67910385131836, -9.376543045043945, -9.073982238769531, -8.771421432495117, -8.468860626220703, -8.166299819946289, -7.863739013671875, -7.561178207397461, -7.258617401123047, -6.956056594848633, -6.653495788574219, -6.350934982299805, -6.048374176025391, -5.745813369750977, -5.4432525634765625, -5.140691757202148, -4.838130950927734, -4.53557014465332, -4.233009338378906, -3.930448532104492, -3.627887725830078, -3.325326919555664, -3.02276611328125, -2.720205307006836, -2.417644500732422, -2.115083694458008, -1.8125228881835938, -1.5099620819091797, -1.2074012756347656, -0.9048404693603516, -0.6022796630859375, -0.29971885681152344, 0.002841949462890625, 0.3054027557373047, 0.6079635620117188, 0.9105243682861328, 1.2130851745605469, 1.515645980834961, 1.818206787109375, 2.120767593383789, 2.423328399658203, 2.725889205932617, 3.0284500122070312, 3.3310108184814453, 3.6335716247558594, 3.9361324310302734, 4.2386932373046875, 4.541254043579102, 4.843814849853516, 5.14637565612793, 5.448936462402344, 5.751497268676758, 6.054058074951172, 6.356618881225586, 6.6591796875, 6.961740493774414, 7.264301300048828, 7.566862106323242, 7.869422912597656, 8.17198371887207, 8.474544525146484, 8.777105331420898, 9.079666137695312, 9.382226943969727, 9.68478775024414]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 9.0, 14.0, 29.0, 30.0, 50.0, 68.0, 89.0, 122.0, 197.0, 266.0, 383.0, 546.0, 743.0, 1092.0, 1534.0, 2316.0, 3716.0, 5647.0, 9073.0, 14827.0, 25097.0, 43585.0, 76493.0, 133669.0, 208879.0, 206369.0, 130781.0, 75500.0, 42937.0, 24386.0, 14628.0, 8903.0, 5510.0, 3581.0, 2332.0, 1605.0, 1081.0, 715.0, 493.0, 365.0, 253.0, 162.0, 143.0, 97.0, 73.0, 43.0, 39.0, 26.0, 22.0, 13.0, 6.0, 5.0, 6.0, 2.0, 1.0], "bins": [-5.9609375, -5.7855224609375, -5.610107421875, -5.4346923828125, -5.25927734375, -5.0838623046875, -4.908447265625, -4.7330322265625, -4.5576171875, -4.3822021484375, -4.206787109375, -4.0313720703125, -3.85595703125, -3.6805419921875, -3.505126953125, -3.3297119140625, -3.154296875, -2.9788818359375, -2.803466796875, -2.6280517578125, -2.45263671875, -2.2772216796875, -2.101806640625, -1.9263916015625, -1.7509765625, -1.5755615234375, -1.400146484375, -1.2247314453125, -1.04931640625, -0.8739013671875, -0.698486328125, -0.5230712890625, -0.34765625, -0.1722412109375, 0.003173828125, 0.1785888671875, 0.35400390625, 0.5294189453125, 0.704833984375, 0.8802490234375, 1.0556640625, 1.2310791015625, 1.406494140625, 1.5819091796875, 1.75732421875, 1.9327392578125, 2.108154296875, 2.2835693359375, 2.458984375, 2.6343994140625, 2.809814453125, 2.9852294921875, 3.16064453125, 3.3360595703125, 3.511474609375, 3.6868896484375, 3.8623046875, 4.0377197265625, 4.213134765625, 4.3885498046875, 4.56396484375, 4.7393798828125, 4.914794921875, 5.0902099609375, 5.265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 3.0, 4.0, 6.0, 12.0, 6.0, 7.0, 13.0, 18.0, 15.0, 11.0, 16.0, 36.0, 26.0, 29.0, 33.0, 33.0, 36.0, 35.0, 32.0, 42.0, 39.0, 46.0, 32.0, 36.0, 39.0, 29.0, 35.0, 26.0, 31.0, 28.0, 29.0, 32.0, 22.0, 20.0, 13.0, 18.0, 14.0, 14.0, 21.0, 17.0, 8.0, 6.0, 7.0, 7.0, 2.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.53125, -9.2353515625, -8.939453125, -8.6435546875, -8.34765625, -8.0517578125, -7.755859375, -7.4599609375, -7.1640625, -6.8681640625, -6.572265625, -6.2763671875, -5.98046875, -5.6845703125, -5.388671875, -5.0927734375, -4.796875, -4.5009765625, -4.205078125, -3.9091796875, -3.61328125, -3.3173828125, -3.021484375, -2.7255859375, -2.4296875, -2.1337890625, -1.837890625, -1.5419921875, -1.24609375, -0.9501953125, -0.654296875, -0.3583984375, -0.0625, 0.2333984375, 0.529296875, 0.8251953125, 1.12109375, 1.4169921875, 1.712890625, 2.0087890625, 2.3046875, 2.6005859375, 2.896484375, 3.1923828125, 3.48828125, 3.7841796875, 4.080078125, 4.3759765625, 4.671875, 4.9677734375, 5.263671875, 5.5595703125, 5.85546875, 6.1513671875, 6.447265625, 6.7431640625, 7.0390625, 7.3349609375, 7.630859375, 7.9267578125, 8.22265625, 8.5185546875, 8.814453125, 9.1103515625, 9.40625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 7.0, 13.0, 14.0, 12.0, 17.0, 35.0, 41.0, 67.0, 108.0, 133.0, 203.0, 298.0, 458.0, 702.0, 1123.0, 1909.0, 3400.0, 6616.0, 13928.0, 37788.0, 148093.0, 535589.0, 213666.0, 49833.0, 17287.0, 7653.0, 3859.0, 2137.0, 1273.0, 793.0, 493.0, 298.0, 189.0, 157.0, 108.0, 85.0, 52.0, 41.0, 18.0, 21.0, 10.0, 6.0, 6.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.9375, -9.641845703125, -9.34619140625, -9.050537109375, -8.7548828125, -8.459228515625, -8.16357421875, -7.867919921875, -7.572265625, -7.276611328125, -6.98095703125, -6.685302734375, -6.3896484375, -6.093994140625, -5.79833984375, -5.502685546875, -5.20703125, -4.911376953125, -4.61572265625, -4.320068359375, -4.0244140625, -3.728759765625, -3.43310546875, -3.137451171875, -2.841796875, -2.546142578125, -2.25048828125, -1.954833984375, -1.6591796875, -1.363525390625, -1.06787109375, -0.772216796875, -0.4765625, -0.180908203125, 0.11474609375, 0.410400390625, 0.7060546875, 1.001708984375, 1.29736328125, 1.593017578125, 1.888671875, 2.184326171875, 2.47998046875, 2.775634765625, 3.0712890625, 3.366943359375, 3.66259765625, 3.958251953125, 4.25390625, 4.549560546875, 4.84521484375, 5.140869140625, 5.4365234375, 5.732177734375, 6.02783203125, 6.323486328125, 6.619140625, 6.914794921875, 7.21044921875, 7.506103515625, 7.8017578125, 8.097412109375, 8.39306640625, 8.688720703125, 8.984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 8.0, 15.0, 10.0, 9.0, 15.0, 15.0, 23.0, 25.0, 17.0, 22.0, 22.0, 29.0, 33.0, 30.0, 23.0, 32.0, 30.0, 34.0, 36.0, 23.0, 35.0, 50.0, 50.0, 35.0, 40.0, 24.0, 25.0, 40.0, 24.0, 30.0, 23.0, 27.0, 21.0, 22.0, 20.0, 16.0, 15.0, 8.0, 9.0, 4.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 4.0], "bins": [-6.69140625, -6.49725341796875, -6.3031005859375, -6.10894775390625, -5.914794921875, -5.72064208984375, -5.5264892578125, -5.33233642578125, -5.13818359375, -4.94403076171875, -4.7498779296875, -4.55572509765625, -4.361572265625, -4.16741943359375, -3.9732666015625, -3.77911376953125, -3.5849609375, -3.39080810546875, -3.1966552734375, -3.00250244140625, -2.808349609375, -2.61419677734375, -2.4200439453125, -2.22589111328125, -2.03173828125, -1.83758544921875, -1.6434326171875, -1.44927978515625, -1.255126953125, -1.06097412109375, -0.8668212890625, -0.67266845703125, -0.478515625, -0.28436279296875, -0.0902099609375, 0.10394287109375, 0.298095703125, 0.49224853515625, 0.6864013671875, 0.88055419921875, 1.07470703125, 1.26885986328125, 1.4630126953125, 1.65716552734375, 1.851318359375, 2.04547119140625, 2.2396240234375, 2.43377685546875, 2.6279296875, 2.82208251953125, 3.0162353515625, 3.21038818359375, 3.404541015625, 3.59869384765625, 3.7928466796875, 3.98699951171875, 4.18115234375, 4.37530517578125, 4.5694580078125, 4.76361083984375, 4.957763671875, 5.15191650390625, 5.3460693359375, 5.54022216796875, 5.734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 9.0, 8.0, 11.0, 19.0, 22.0, 33.0, 37.0, 69.0, 112.0, 116.0, 179.0, 307.0, 414.0, 705.0, 1282.0, 2404.0, 5193.0, 13920.0, 61526.0, 726875.0, 194492.0, 25282.0, 7996.0, 3359.0, 1613.0, 947.0, 542.0, 342.0, 222.0, 164.0, 95.0, 84.0, 50.0, 30.0, 35.0, 19.0, 13.0, 16.0, 5.0, 2.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4140625, -6.22393798828125, -6.0338134765625, -5.84368896484375, -5.653564453125, -5.46343994140625, -5.2733154296875, -5.08319091796875, -4.89306640625, -4.70294189453125, -4.5128173828125, -4.32269287109375, -4.132568359375, -3.94244384765625, -3.7523193359375, -3.56219482421875, -3.3720703125, -3.18194580078125, -2.9918212890625, -2.80169677734375, -2.611572265625, -2.42144775390625, -2.2313232421875, -2.04119873046875, -1.85107421875, -1.66094970703125, -1.4708251953125, -1.28070068359375, -1.090576171875, -0.90045166015625, -0.7103271484375, -0.52020263671875, -0.330078125, -0.13995361328125, 0.0501708984375, 0.24029541015625, 0.430419921875, 0.62054443359375, 0.8106689453125, 1.00079345703125, 1.19091796875, 1.38104248046875, 1.5711669921875, 1.76129150390625, 1.951416015625, 2.14154052734375, 2.3316650390625, 2.52178955078125, 2.7119140625, 2.90203857421875, 3.0921630859375, 3.28228759765625, 3.472412109375, 3.66253662109375, 3.8526611328125, 4.04278564453125, 4.23291015625, 4.42303466796875, 4.6131591796875, 4.80328369140625, 4.993408203125, 5.18353271484375, 5.3736572265625, 5.56378173828125, 5.75390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 8.0, 8.0, 9.0, 31.0, 31.0, 67.0, 130.0, 207.0, 207.0, 143.0, 81.0, 38.0, 14.0, 9.0, 6.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0007839202880859375, -0.0007601827383041382, -0.0007364451885223389, -0.0007127076387405396, -0.0006889700889587402, -0.0006652325391769409, -0.0006414949893951416, -0.0006177574396133423, -0.000594019889831543, -0.0005702823400497437, -0.0005465447902679443, -0.000522807240486145, -0.0004990696907043457, -0.0004753321409225464, -0.00045159459114074707, -0.00042785704135894775, -0.00040411949157714844, -0.0003803819417953491, -0.0003566443920135498, -0.0003329068422317505, -0.00030916929244995117, -0.00028543174266815186, -0.00026169419288635254, -0.00023795664310455322, -0.0002142190933227539, -0.0001904815435409546, -0.00016674399375915527, -0.00014300644397735596, -0.00011926889419555664, -9.553134441375732e-05, -7.179379463195801e-05, -4.805624485015869e-05, -2.4318695068359375e-05, -5.811452865600586e-07, 2.3156404495239258e-05, 4.6893954277038574e-05, 7.063150405883789e-05, 9.436905384063721e-05, 0.00011810660362243652, 0.00014184415340423584, 0.00016558170318603516, 0.00018931925296783447, 0.0002130568027496338, 0.0002367943525314331, 0.0002605319023132324, 0.00028426945209503174, 0.00030800700187683105, 0.00033174455165863037, 0.0003554821014404297, 0.000379219651222229, 0.0004029572010040283, 0.00042669475078582764, 0.00045043230056762695, 0.00047416985034942627, 0.0004979074001312256, 0.0005216449499130249, 0.0005453824996948242, 0.0005691200494766235, 0.0005928575992584229, 0.0006165951490402222, 0.0006403326988220215, 0.0006640702486038208, 0.0006878077983856201, 0.0007115453481674194, 0.0007352828979492188]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 4.0, 4.0, 11.0, 14.0, 15.0, 18.0, 32.0, 58.0, 77.0, 112.0, 182.0, 241.0, 352.0, 463.0, 772.0, 1204.0, 1992.0, 3574.0, 6789.0, 15402.0, 38476.0, 105845.0, 298430.0, 351526.0, 137010.0, 48183.0, 19131.0, 8445.0, 4118.0, 2192.0, 1262.0, 847.0, 529.0, 367.0, 281.0, 174.0, 129.0, 84.0, 57.0, 52.0, 27.0, 19.0, 23.0, 5.0, 5.0, 8.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.91796875, -4.76947021484375, -4.6209716796875, -4.47247314453125, -4.323974609375, -4.17547607421875, -4.0269775390625, -3.87847900390625, -3.72998046875, -3.58148193359375, -3.4329833984375, -3.28448486328125, -3.135986328125, -2.98748779296875, -2.8389892578125, -2.69049072265625, -2.5419921875, -2.39349365234375, -2.2449951171875, -2.09649658203125, -1.947998046875, -1.79949951171875, -1.6510009765625, -1.50250244140625, -1.35400390625, -1.20550537109375, -1.0570068359375, -0.90850830078125, -0.760009765625, -0.61151123046875, -0.4630126953125, -0.31451416015625, -0.166015625, -0.01751708984375, 0.1309814453125, 0.27947998046875, 0.427978515625, 0.57647705078125, 0.7249755859375, 0.87347412109375, 1.02197265625, 1.17047119140625, 1.3189697265625, 1.46746826171875, 1.615966796875, 1.76446533203125, 1.9129638671875, 2.06146240234375, 2.2099609375, 2.35845947265625, 2.5069580078125, 2.65545654296875, 2.803955078125, 2.95245361328125, 3.1009521484375, 3.24945068359375, 3.39794921875, 3.54644775390625, 3.6949462890625, 3.84344482421875, 3.991943359375, 4.14044189453125, 4.2889404296875, 4.43743896484375, 4.5859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 4.0, 9.0, 8.0, 20.0, 21.0, 28.0, 30.0, 43.0, 86.0, 133.0, 145.0, 127.0, 91.0, 67.0, 51.0, 32.0, 15.0, 21.0, 20.0, 9.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.208984375, -1.1601715087890625, -1.111358642578125, -1.0625457763671875, -1.01373291015625, -0.9649200439453125, -0.916107177734375, -0.8672943115234375, -0.8184814453125, -0.7696685791015625, -0.720855712890625, -0.6720428466796875, -0.62322998046875, -0.5744171142578125, -0.525604248046875, -0.4767913818359375, -0.427978515625, -0.3791656494140625, -0.330352783203125, -0.2815399169921875, -0.23272705078125, -0.1839141845703125, -0.135101318359375, -0.0862884521484375, -0.0374755859375, 0.0113372802734375, 0.060150146484375, 0.1089630126953125, 0.15777587890625, 0.2065887451171875, 0.255401611328125, 0.3042144775390625, 0.35302734375, 0.4018402099609375, 0.450653076171875, 0.4994659423828125, 0.54827880859375, 0.5970916748046875, 0.645904541015625, 0.6947174072265625, 0.7435302734375, 0.7923431396484375, 0.841156005859375, 0.8899688720703125, 0.93878173828125, 0.9875946044921875, 1.036407470703125, 1.0852203369140625, 1.134033203125, 1.1828460693359375, 1.231658935546875, 1.2804718017578125, 1.32928466796875, 1.3780975341796875, 1.426910400390625, 1.4757232666015625, 1.5245361328125, 1.5733489990234375, 1.622161865234375, 1.6709747314453125, 1.71978759765625, 1.7686004638671875, 1.817413330078125, 1.8662261962890625, 1.9150390625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 8.0, 6.0, 9.0, 8.0, 16.0, 12.0, 12.0, 22.0, 16.0, 27.0, 13.0, 22.0, 30.0, 27.0, 26.0, 33.0, 41.0, 44.0, 33.0, 38.0, 47.0, 53.0, 39.0, 39.0, 42.0, 44.0, 40.0, 37.0, 27.0, 23.0, 18.0, 16.0, 23.0, 14.0, 18.0, 13.0, 13.0, 7.0, 7.0, 5.0, 6.0, 7.0, 2.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0], "bins": [-10.455994606018066, -10.153267860412598, -9.850540161132812, -9.547813415527344, -9.245086669921875, -8.94235897064209, -8.639632225036621, -8.336904525756836, -8.034177780151367, -7.73145055770874, -7.428723335266113, -7.1259965896606445, -6.823269367218018, -6.520542144775391, -6.217815399169922, -5.915088176727295, -5.612360954284668, -5.309633731842041, -5.006906509399414, -4.704179763793945, -4.401452541351318, -4.098725318908691, -3.7959983348846436, -3.4932713508605957, -3.1905441284179688, -2.887816905975342, -2.585089921951294, -2.282362937927246, -1.9796357154846191, -1.6769086122512817, -1.3741815090179443, -1.0714545249938965, -0.7687263488769531, -0.4659992456436157, -0.16327214241027832, 0.13945496082305908, 0.4421820640563965, 0.7449091672897339, 1.0476362705230713, 1.3503632545471191, 1.653090476989746, 1.9558175802230835, 2.258544683456421, 2.5612716674804688, 2.8639988899230957, 3.1667261123657227, 3.4694530963897705, 3.7721800804138184, 4.074907302856445, 4.377634525299072, 4.680361747741699, 4.983088493347168, 5.285815715789795, 5.588542938232422, 5.891269683837891, 6.193996906280518, 6.4967241287231445, 6.7994513511657715, 7.102178573608398, 7.404905319213867, 7.707632541656494, 8.010359764099121, 8.31308650970459, 8.615814208984375, 8.918540954589844]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 4.0, 11.0, 5.0, 8.0, 10.0, 13.0, 18.0, 14.0, 16.0, 24.0, 27.0, 30.0, 28.0, 31.0, 45.0, 33.0, 40.0, 35.0, 35.0, 44.0, 35.0, 47.0, 31.0, 32.0, 28.0, 35.0, 38.0, 27.0, 23.0, 35.0, 20.0, 26.0, 13.0, 19.0, 17.0, 17.0, 16.0, 18.0, 5.0, 6.0, 10.0, 4.0, 4.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.74306869506836, -9.444079399108887, -9.145090103149414, -8.846100807189941, -8.547111511230469, -8.248123168945312, -7.94913387298584, -7.650144577026367, -7.3511552810668945, -7.052165985107422, -6.753176689147949, -6.454187870025635, -6.155198574066162, -5.8562092781066895, -5.557220458984375, -5.258231163024902, -4.95924186706543, -4.660252571105957, -4.361263275146484, -4.06227445602417, -3.7632851600646973, -3.4642958641052246, -3.165306806564331, -2.8663177490234375, -2.567328453063965, -2.268339157104492, -1.9693500995635986, -1.6703609228134155, -1.3713717460632324, -1.0723825693130493, -0.7733933925628662, -0.47440433502197266, -0.1754150390625, 0.1235741376876831, 0.4225633144378662, 0.7215524911880493, 1.0205416679382324, 1.3195308446884155, 1.6185200214385986, 1.9175090789794922, 2.216498374938965, 2.5154876708984375, 2.814476728439331, 3.1134657859802246, 3.4124550819396973, 3.71144437789917, 4.010433197021484, 4.309422492980957, 4.60841178894043, 4.907401084899902, 5.206390380859375, 5.5053791999816895, 5.804368495941162, 6.103357791900635, 6.402346611022949, 6.701335906982422, 7.0003252029418945, 7.299314498901367, 7.59830379486084, 7.897292613983154, 8.196281433105469, 8.495270729064941, 8.794260025024414, 9.093249320983887, 9.39223861694336]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 9.0, 16.0, 10.0, 30.0, 25.0, 64.0, 104.0, 134.0, 209.0, 295.0, 524.0, 749.0, 1161.0, 1717.0, 2736.0, 3963.0, 5911.0, 8534.0, 12299.0, 17430.0, 23644.0, 32368.0, 42054.0, 52726.0, 63289.0, 74079.0, 82335.0, 86679.0, 87579.0, 83937.0, 76728.0, 66606.0, 55593.0, 44150.0, 34272.0, 25810.0, 18718.0, 13346.0, 9431.0, 6451.0, 4269.0, 2897.0, 1919.0, 1316.0, 866.0, 545.0, 364.0, 229.0, 170.0, 87.0, 83.0, 34.0, 19.0, 23.0, 12.0, 9.0, 3.0, 5.0], "bins": [-7.91796875, -7.6859130859375, -7.453857421875, -7.2218017578125, -6.98974609375, -6.7576904296875, -6.525634765625, -6.2935791015625, -6.0615234375, -5.8294677734375, -5.597412109375, -5.3653564453125, -5.13330078125, -4.9012451171875, -4.669189453125, -4.4371337890625, -4.205078125, -3.9730224609375, -3.740966796875, -3.5089111328125, -3.27685546875, -3.0447998046875, -2.812744140625, -2.5806884765625, -2.3486328125, -2.1165771484375, -1.884521484375, -1.6524658203125, -1.42041015625, -1.1883544921875, -0.956298828125, -0.7242431640625, -0.4921875, -0.2601318359375, -0.028076171875, 0.2039794921875, 0.43603515625, 0.6680908203125, 0.900146484375, 1.1322021484375, 1.3642578125, 1.5963134765625, 1.828369140625, 2.0604248046875, 2.29248046875, 2.5245361328125, 2.756591796875, 2.9886474609375, 3.220703125, 3.4527587890625, 3.684814453125, 3.9168701171875, 4.14892578125, 4.3809814453125, 4.613037109375, 4.8450927734375, 5.0771484375, 5.3092041015625, 5.541259765625, 5.7733154296875, 6.00537109375, 6.2374267578125, 6.469482421875, 6.7015380859375, 6.93359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 4.0, 5.0, 5.0, 9.0, 9.0, 6.0, 9.0, 13.0, 17.0, 15.0, 13.0, 26.0, 26.0, 28.0, 30.0, 34.0, 38.0, 34.0, 41.0, 37.0, 35.0, 42.0, 37.0, 41.0, 36.0, 32.0, 29.0, 34.0, 40.0, 27.0, 20.0, 35.0, 23.0, 23.0, 18.0, 20.0, 15.0, 18.0, 13.0, 20.0, 6.0, 8.0, 8.0, 5.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.4921875, -9.2020263671875, -8.911865234375, -8.6217041015625, -8.33154296875, -8.0413818359375, -7.751220703125, -7.4610595703125, -7.1708984375, -6.8807373046875, -6.590576171875, -6.3004150390625, -6.01025390625, -5.7200927734375, -5.429931640625, -5.1397705078125, -4.849609375, -4.5594482421875, -4.269287109375, -3.9791259765625, -3.68896484375, -3.3988037109375, -3.108642578125, -2.8184814453125, -2.5283203125, -2.2381591796875, -1.947998046875, -1.6578369140625, -1.36767578125, -1.0775146484375, -0.787353515625, -0.4971923828125, -0.20703125, 0.0831298828125, 0.373291015625, 0.6634521484375, 0.95361328125, 1.2437744140625, 1.533935546875, 1.8240966796875, 2.1142578125, 2.4044189453125, 2.694580078125, 2.9847412109375, 3.27490234375, 3.5650634765625, 3.855224609375, 4.1453857421875, 4.435546875, 4.7257080078125, 5.015869140625, 5.3060302734375, 5.59619140625, 5.8863525390625, 6.176513671875, 6.4666748046875, 6.7568359375, 7.0469970703125, 7.337158203125, 7.6273193359375, 7.91748046875, 8.2076416015625, 8.497802734375, 8.7879638671875, 9.078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 7.0, 8.0, 7.0, 12.0, 32.0, 46.0, 82.0, 134.0, 219.0, 319.0, 649.0, 970.0, 1634.0, 2841.0, 4766.0, 7680.0, 12283.0, 19030.0, 29181.0, 42539.0, 60000.0, 78688.0, 97339.0, 110114.0, 115314.0, 109942.0, 96624.0, 78316.0, 59234.0, 42081.0, 28578.0, 18756.0, 12053.0, 7550.0, 4492.0, 2773.0, 1646.0, 993.0, 684.0, 394.0, 217.0, 130.0, 82.0, 39.0, 26.0, 26.0, 12.0, 3.0, 8.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.7734375, -10.4417724609375, -10.110107421875, -9.7784423828125, -9.44677734375, -9.1151123046875, -8.783447265625, -8.4517822265625, -8.1201171875, -7.7884521484375, -7.456787109375, -7.1251220703125, -6.79345703125, -6.4617919921875, -6.130126953125, -5.7984619140625, -5.466796875, -5.1351318359375, -4.803466796875, -4.4718017578125, -4.14013671875, -3.8084716796875, -3.476806640625, -3.1451416015625, -2.8134765625, -2.4818115234375, -2.150146484375, -1.8184814453125, -1.48681640625, -1.1551513671875, -0.823486328125, -0.4918212890625, -0.16015625, 0.1715087890625, 0.503173828125, 0.8348388671875, 1.16650390625, 1.4981689453125, 1.829833984375, 2.1614990234375, 2.4931640625, 2.8248291015625, 3.156494140625, 3.4881591796875, 3.81982421875, 4.1514892578125, 4.483154296875, 4.8148193359375, 5.146484375, 5.4781494140625, 5.809814453125, 6.1414794921875, 6.47314453125, 6.8048095703125, 7.136474609375, 7.4681396484375, 7.7998046875, 8.1314697265625, 8.463134765625, 8.7947998046875, 9.12646484375, 9.4581298828125, 9.789794921875, 10.1214599609375, 10.453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 7.0, 6.0, 3.0, 15.0, 8.0, 15.0, 13.0, 14.0, 20.0, 23.0, 28.0, 29.0, 38.0, 29.0, 31.0, 42.0, 46.0, 53.0, 35.0, 38.0, 33.0, 36.0, 43.0, 27.0, 48.0, 35.0, 39.0, 33.0, 33.0, 27.0, 23.0, 23.0, 11.0, 23.0, 11.0, 7.0, 7.0, 12.0, 6.0, 7.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.75390625, -6.54119873046875, -6.3284912109375, -6.11578369140625, -5.903076171875, -5.69036865234375, -5.4776611328125, -5.26495361328125, -5.05224609375, -4.83953857421875, -4.6268310546875, -4.41412353515625, -4.201416015625, -3.98870849609375, -3.7760009765625, -3.56329345703125, -3.3505859375, -3.13787841796875, -2.9251708984375, -2.71246337890625, -2.499755859375, -2.28704833984375, -2.0743408203125, -1.86163330078125, -1.64892578125, -1.43621826171875, -1.2235107421875, -1.01080322265625, -0.798095703125, -0.58538818359375, -0.3726806640625, -0.15997314453125, 0.052734375, 0.26544189453125, 0.4781494140625, 0.69085693359375, 0.903564453125, 1.11627197265625, 1.3289794921875, 1.54168701171875, 1.75439453125, 1.96710205078125, 2.1798095703125, 2.39251708984375, 2.605224609375, 2.81793212890625, 3.0306396484375, 3.24334716796875, 3.4560546875, 3.66876220703125, 3.8814697265625, 4.09417724609375, 4.306884765625, 4.51959228515625, 4.7322998046875, 4.94500732421875, 5.15771484375, 5.37042236328125, 5.5831298828125, 5.79583740234375, 6.008544921875, 6.22125244140625, 6.4339599609375, 6.64666748046875, 6.859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 0.0, 7.0, 12.0, 14.0, 25.0, 33.0, 50.0, 72.0, 111.0, 178.0, 286.0, 449.0, 675.0, 1174.0, 1789.0, 2920.0, 4696.0, 7919.0, 12719.0, 21007.0, 32963.0, 51622.0, 76936.0, 104877.0, 130370.0, 140888.0, 131122.0, 107062.0, 77524.0, 52492.0, 33711.0, 21307.0, 12976.0, 7872.0, 4802.0, 2918.0, 1795.0, 1164.0, 707.0, 472.0, 307.0, 184.0, 126.0, 72.0, 52.0, 40.0, 28.0, 14.0, 8.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -4.039794921875, -3.91162109375, -3.783447265625, -3.6552734375, -3.527099609375, -3.39892578125, -3.270751953125, -3.142578125, -3.014404296875, -2.88623046875, -2.758056640625, -2.6298828125, -2.501708984375, -2.37353515625, -2.245361328125, -2.1171875, -1.989013671875, -1.86083984375, -1.732666015625, -1.6044921875, -1.476318359375, -1.34814453125, -1.219970703125, -1.091796875, -0.963623046875, -0.83544921875, -0.707275390625, -0.5791015625, -0.450927734375, -0.32275390625, -0.194580078125, -0.06640625, 0.061767578125, 0.18994140625, 0.318115234375, 0.4462890625, 0.574462890625, 0.70263671875, 0.830810546875, 0.958984375, 1.087158203125, 1.21533203125, 1.343505859375, 1.4716796875, 1.599853515625, 1.72802734375, 1.856201171875, 1.984375, 2.112548828125, 2.24072265625, 2.368896484375, 2.4970703125, 2.625244140625, 2.75341796875, 2.881591796875, 3.009765625, 3.137939453125, 3.26611328125, 3.394287109375, 3.5224609375, 3.650634765625, 3.77880859375, 3.906982421875, 4.03515625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 6.0, 7.0, 12.0, 10.0, 15.0, 18.0, 17.0, 21.0, 29.0, 24.0, 40.0, 41.0, 43.0, 40.0, 46.0, 52.0, 40.0, 53.0, 70.0, 48.0, 67.0, 51.0, 41.0, 37.0, 25.0, 29.0, 20.0, 23.0, 11.0, 12.0, 8.0, 8.0, 5.0, 4.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00048279762268066406, -0.0004680268466472626, -0.0004532560706138611, -0.0004384852945804596, -0.0004237145185470581, -0.0004089437425136566, -0.0003941729664802551, -0.00037940219044685364, -0.00036463141441345215, -0.00034986063838005066, -0.00033508986234664917, -0.0003203190863132477, -0.0003055483102798462, -0.0002907775342464447, -0.0002760067582130432, -0.0002612359821796417, -0.00024646520614624023, -0.00023169443011283875, -0.00021692365407943726, -0.00020215287804603577, -0.00018738210201263428, -0.0001726113259792328, -0.0001578405499458313, -0.0001430697739124298, -0.00012829899787902832, -0.00011352822184562683, -9.875744581222534e-05, -8.398666977882385e-05, -6.921589374542236e-05, -5.4445117712020874e-05, -3.9674341678619385e-05, -2.4903565645217896e-05, -1.0132789611816406e-05, 4.637986421585083e-06, 1.9408762454986572e-05, 3.417953848838806e-05, 4.895031452178955e-05, 6.372109055519104e-05, 7.849186658859253e-05, 9.326264262199402e-05, 0.00010803341865539551, 0.000122804194688797, 0.00013757497072219849, 0.00015234574675559998, 0.00016711652278900146, 0.00018188729882240295, 0.00019665807485580444, 0.00021142885088920593, 0.00022619962692260742, 0.0002409704029560089, 0.0002557411789894104, 0.0002705119550228119, 0.0002852827310562134, 0.00030005350708961487, 0.00031482428312301636, 0.00032959505915641785, 0.00034436583518981934, 0.0003591366112232208, 0.0003739073872566223, 0.0003886781632900238, 0.0004034489393234253, 0.0004182197153568268, 0.00043299049139022827, 0.00044776126742362976, 0.00046253204345703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 8.0, 4.0, 10.0, 7.0, 24.0, 24.0, 50.0, 78.0, 91.0, 170.0, 190.0, 337.0, 480.0, 755.0, 1154.0, 1808.0, 2806.0, 4717.0, 7686.0, 12605.0, 20573.0, 33186.0, 52089.0, 76455.0, 106052.0, 129966.0, 139483.0, 131100.0, 105919.0, 78610.0, 52912.0, 34141.0, 21215.0, 12934.0, 7942.0, 4803.0, 2901.0, 1819.0, 1215.0, 737.0, 496.0, 321.0, 229.0, 155.0, 103.0, 67.0, 49.0, 37.0, 25.0, 10.0, 7.0, 8.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.88671875, -3.763427734375, -3.64013671875, -3.516845703125, -3.3935546875, -3.270263671875, -3.14697265625, -3.023681640625, -2.900390625, -2.777099609375, -2.65380859375, -2.530517578125, -2.4072265625, -2.283935546875, -2.16064453125, -2.037353515625, -1.9140625, -1.790771484375, -1.66748046875, -1.544189453125, -1.4208984375, -1.297607421875, -1.17431640625, -1.051025390625, -0.927734375, -0.804443359375, -0.68115234375, -0.557861328125, -0.4345703125, -0.311279296875, -0.18798828125, -0.064697265625, 0.05859375, 0.181884765625, 0.30517578125, 0.428466796875, 0.5517578125, 0.675048828125, 0.79833984375, 0.921630859375, 1.044921875, 1.168212890625, 1.29150390625, 1.414794921875, 1.5380859375, 1.661376953125, 1.78466796875, 1.907958984375, 2.03125, 2.154541015625, 2.27783203125, 2.401123046875, 2.5244140625, 2.647705078125, 2.77099609375, 2.894287109375, 3.017578125, 3.140869140625, 3.26416015625, 3.387451171875, 3.5107421875, 3.634033203125, 3.75732421875, 3.880615234375, 4.00390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 6.0, 13.0, 9.0, 10.0, 18.0, 19.0, 26.0, 21.0, 31.0, 38.0, 48.0, 46.0, 66.0, 76.0, 49.0, 55.0, 57.0, 41.0, 58.0, 48.0, 38.0, 36.0, 31.0, 31.0, 25.0, 17.0, 12.0, 9.0, 13.0, 13.0, 5.0, 9.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.959197998046875, -1.89495849609375, -1.830718994140625, -1.7664794921875, -1.702239990234375, -1.63800048828125, -1.573760986328125, -1.509521484375, -1.445281982421875, -1.38104248046875, -1.316802978515625, -1.2525634765625, -1.188323974609375, -1.12408447265625, -1.059844970703125, -0.99560546875, -0.931365966796875, -0.86712646484375, -0.802886962890625, -0.7386474609375, -0.674407958984375, -0.61016845703125, -0.545928955078125, -0.481689453125, -0.417449951171875, -0.35321044921875, -0.288970947265625, -0.2247314453125, -0.160491943359375, -0.09625244140625, -0.032012939453125, 0.0322265625, 0.096466064453125, 0.16070556640625, 0.224945068359375, 0.2891845703125, 0.353424072265625, 0.41766357421875, 0.481903076171875, 0.546142578125, 0.610382080078125, 0.67462158203125, 0.738861083984375, 0.8031005859375, 0.867340087890625, 0.93157958984375, 0.995819091796875, 1.06005859375, 1.124298095703125, 1.18853759765625, 1.252777099609375, 1.3170166015625, 1.381256103515625, 1.44549560546875, 1.509735107421875, 1.573974609375, 1.638214111328125, 1.70245361328125, 1.766693115234375, 1.8309326171875, 1.895172119140625, 1.95941162109375, 2.023651123046875, 2.087890625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 2.0, 11.0, 9.0, 12.0, 8.0, 16.0, 9.0, 18.0, 22.0, 19.0, 37.0, 32.0, 27.0, 21.0, 36.0, 31.0, 37.0, 31.0, 46.0, 33.0, 54.0, 47.0, 39.0, 41.0, 43.0, 40.0, 30.0, 38.0, 31.0, 26.0, 21.0, 15.0, 17.0, 13.0, 14.0, 13.0, 12.0, 6.0, 9.0, 9.0, 4.0, 4.0, 4.0, 1.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.584078788757324, -9.281476020812988, -8.978874206542969, -8.676271438598633, -8.373669624328613, -8.071066856384277, -7.7684645652771, -7.465862274169922, -7.163259983062744, -6.860657691955566, -6.558055400848389, -6.255453109741211, -5.952850341796875, -5.6502485275268555, -5.3476457595825195, -5.045043468475342, -4.742441177368164, -4.439838886260986, -4.137236595153809, -3.8346340656280518, -3.532031774520874, -3.2294294834136963, -2.9268269538879395, -2.6242246627807617, -2.321622371673584, -2.0190200805664062, -1.716417670249939, -1.4138152599334717, -1.111212968826294, -0.8086106777191162, -0.5060082674026489, -0.20340585708618164, 0.0991973876953125, 0.401799738407135, 0.7044020891189575, 1.0070044994354248, 1.3096067905426025, 1.6122090816497803, 1.9148114919662476, 2.217413902282715, 2.5200161933898926, 2.8226184844970703, 3.125220775604248, 3.427823305130005, 3.7304255962371826, 4.033027648925781, 4.335630416870117, 4.638232707977295, 4.940834999084473, 5.24343729019165, 5.546039581298828, 5.848641872406006, 6.151244163513184, 6.4538469314575195, 6.756449222564697, 7.059051513671875, 7.361653804779053, 7.6642560958862305, 7.966858386993408, 8.269460678100586, 8.572063446044922, 8.874665260314941, 9.177268028259277, 9.479869842529297, 9.782472610473633]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 7.0, 10.0, 8.0, 7.0, 10.0, 13.0, 16.0, 13.0, 18.0, 26.0, 18.0, 23.0, 25.0, 35.0, 32.0, 39.0, 41.0, 43.0, 44.0, 52.0, 32.0, 45.0, 51.0, 35.0, 35.0, 36.0, 33.0, 37.0, 31.0, 24.0, 21.0, 24.0, 18.0, 22.0, 13.0, 14.0, 9.0, 7.0, 7.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.64548397064209, -10.315455436706543, -9.985426902770996, -9.655397415161133, -9.325368881225586, -8.995340347290039, -8.665311813354492, -8.335283279418945, -8.005254745483398, -7.675226211547852, -7.3451972007751465, -7.0151686668396, -6.6851396560668945, -6.355111122131348, -6.025082588195801, -5.695054054260254, -5.365024566650391, -5.034996032714844, -4.704967021942139, -4.374938488006592, -4.044909477233887, -3.71488094329834, -3.384852409362793, -3.054823637008667, -2.724794864654541, -2.394766092300415, -2.064737319946289, -1.7347087860107422, -1.4046800136566162, -1.0746512413024902, -0.7446225881576538, -0.4145939350128174, -0.084564208984375, 0.2454645037651062, 0.5754932165145874, 0.9055219292640686, 1.2355506420135498, 1.5655794143676758, 1.8956080675125122, 2.2256367206573486, 2.5556654930114746, 2.8856942653656006, 3.2157230377197266, 3.5457515716552734, 3.8757803440093994, 4.205809116363525, 4.535837650299072, 4.865866661071777, 5.195895195007324, 5.525923728942871, 5.855952739715576, 6.185981273651123, 6.516010284423828, 6.846038818359375, 7.176067352294922, 7.506095886230469, 7.836124897003174, 8.166153907775879, 8.496182441711426, 8.826210975646973, 9.15623950958252, 9.486268997192383, 9.81629753112793, 10.146326065063477, 10.476354598999023]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [4.0, 8.0, 6.0, 12.0, 23.0, 25.0, 40.0, 54.0, 97.0, 168.0, 274.0, 428.0, 567.0, 878.0, 1337.0, 2225.0, 3411.0, 5107.0, 7816.0, 12059.0, 18320.0, 27599.0, 42260.0, 62912.0, 92310.0, 133517.0, 186631.0, 253182.0, 326801.0, 393902.0, 439139.0, 446920.0, 414939.0, 354020.0, 280631.0, 211098.0, 152485.0, 106177.0, 72942.0, 49233.0, 32260.0, 21848.0, 13912.0, 9353.0, 6115.0, 3919.0, 2552.0, 1720.0, 1110.0, 721.0, 427.0, 305.0, 186.0, 110.0, 73.0, 53.0, 34.0, 24.0, 10.0, 8.0, 0.0, 4.0, 1.0, 2.0], "bins": [-7.45703125, -7.21795654296875, -6.9788818359375, -6.73980712890625, -6.500732421875, -6.26165771484375, -6.0225830078125, -5.78350830078125, -5.54443359375, -5.30535888671875, -5.0662841796875, -4.82720947265625, -4.588134765625, -4.34906005859375, -4.1099853515625, -3.87091064453125, -3.6318359375, -3.39276123046875, -3.1536865234375, -2.91461181640625, -2.675537109375, -2.43646240234375, -2.1973876953125, -1.95831298828125, -1.71923828125, -1.48016357421875, -1.2410888671875, -1.00201416015625, -0.762939453125, -0.52386474609375, -0.2847900390625, -0.04571533203125, 0.193359375, 0.43243408203125, 0.6715087890625, 0.91058349609375, 1.149658203125, 1.38873291015625, 1.6278076171875, 1.86688232421875, 2.10595703125, 2.34503173828125, 2.5841064453125, 2.82318115234375, 3.062255859375, 3.30133056640625, 3.5404052734375, 3.77947998046875, 4.0185546875, 4.25762939453125, 4.4967041015625, 4.73577880859375, 4.974853515625, 5.21392822265625, 5.4530029296875, 5.69207763671875, 5.93115234375, 6.17022705078125, 6.4093017578125, 6.64837646484375, 6.887451171875, 7.12652587890625, 7.3656005859375, 7.60467529296875, 7.84375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 5.0, 7.0, 3.0, 16.0, 11.0, 14.0, 11.0, 13.0, 20.0, 24.0, 20.0, 23.0, 28.0, 33.0, 32.0, 34.0, 37.0, 46.0, 37.0, 53.0, 32.0, 38.0, 40.0, 47.0, 36.0, 33.0, 43.0, 23.0, 30.0, 28.0, 27.0, 23.0, 21.0, 18.0, 14.0, 16.0, 11.0, 7.0, 7.0, 6.0, 8.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.7265625, -8.4583740234375, -8.190185546875, -7.9219970703125, -7.65380859375, -7.3856201171875, -7.117431640625, -6.8492431640625, -6.5810546875, -6.3128662109375, -6.044677734375, -5.7764892578125, -5.50830078125, -5.2401123046875, -4.971923828125, -4.7037353515625, -4.435546875, -4.1673583984375, -3.899169921875, -3.6309814453125, -3.36279296875, -3.0946044921875, -2.826416015625, -2.5582275390625, -2.2900390625, -2.0218505859375, -1.753662109375, -1.4854736328125, -1.21728515625, -0.9490966796875, -0.680908203125, -0.4127197265625, -0.14453125, 0.1236572265625, 0.391845703125, 0.6600341796875, 0.92822265625, 1.1964111328125, 1.464599609375, 1.7327880859375, 2.0009765625, 2.2691650390625, 2.537353515625, 2.8055419921875, 3.07373046875, 3.3419189453125, 3.610107421875, 3.8782958984375, 4.146484375, 4.4146728515625, 4.682861328125, 4.9510498046875, 5.21923828125, 5.4874267578125, 5.755615234375, 6.0238037109375, 6.2919921875, 6.5601806640625, 6.828369140625, 7.0965576171875, 7.36474609375, 7.6329345703125, 7.901123046875, 8.1693115234375, 8.4375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 8.0, 9.0, 18.0, 29.0, 49.0, 76.0, 141.0, 216.0, 361.0, 617.0, 1046.0, 1672.0, 2845.0, 4583.0, 7457.0, 11930.0, 19071.0, 29816.0, 45279.0, 68769.0, 100653.0, 142537.0, 194644.0, 256983.0, 320425.0, 375054.0, 413644.0, 421271.0, 397908.0, 348375.0, 286333.0, 222656.0, 166025.0, 118230.0, 81797.0, 55477.0, 36400.0, 23242.0, 14591.0, 9244.0, 5832.0, 3534.0, 2188.0, 1288.0, 776.0, 533.0, 254.0, 146.0, 115.0, 50.0, 45.0, 16.0, 15.0, 13.0, 5.0, 1.0, 2.0, 1.0], "bins": [-8.0625, -7.81988525390625, -7.5772705078125, -7.33465576171875, -7.092041015625, -6.84942626953125, -6.6068115234375, -6.36419677734375, -6.12158203125, -5.87896728515625, -5.6363525390625, -5.39373779296875, -5.151123046875, -4.90850830078125, -4.6658935546875, -4.42327880859375, -4.1806640625, -3.93804931640625, -3.6954345703125, -3.45281982421875, -3.210205078125, -2.96759033203125, -2.7249755859375, -2.48236083984375, -2.23974609375, -1.99713134765625, -1.7545166015625, -1.51190185546875, -1.269287109375, -1.02667236328125, -0.7840576171875, -0.54144287109375, -0.298828125, -0.05621337890625, 0.1864013671875, 0.42901611328125, 0.671630859375, 0.91424560546875, 1.1568603515625, 1.39947509765625, 1.64208984375, 1.88470458984375, 2.1273193359375, 2.36993408203125, 2.612548828125, 2.85516357421875, 3.0977783203125, 3.34039306640625, 3.5830078125, 3.82562255859375, 4.0682373046875, 4.31085205078125, 4.553466796875, 4.79608154296875, 5.0386962890625, 5.28131103515625, 5.52392578125, 5.76654052734375, 6.0091552734375, 6.25177001953125, 6.494384765625, 6.73699951171875, 6.9796142578125, 7.22222900390625, 7.46484375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 9.0, 6.0, 8.0, 9.0, 13.0, 20.0, 17.0, 15.0, 31.0, 49.0, 42.0, 44.0, 50.0, 75.0, 76.0, 83.0, 102.0, 110.0, 138.0, 132.0, 159.0, 169.0, 183.0, 194.0, 193.0, 180.0, 179.0, 179.0, 160.0, 163.0, 182.0, 145.0, 121.0, 129.0, 111.0, 94.0, 82.0, 86.0, 70.0, 44.0, 34.0, 39.0, 25.0, 20.0, 22.0, 20.0, 16.0, 13.0, 11.0, 4.0, 4.0, 3.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0], "bins": [-3.6640625, -3.548553466796875, -3.43304443359375, -3.317535400390625, -3.2020263671875, -3.086517333984375, -2.97100830078125, -2.855499267578125, -2.739990234375, -2.624481201171875, -2.50897216796875, -2.393463134765625, -2.2779541015625, -2.162445068359375, -2.04693603515625, -1.931427001953125, -1.81591796875, -1.700408935546875, -1.58489990234375, -1.469390869140625, -1.3538818359375, -1.238372802734375, -1.12286376953125, -1.007354736328125, -0.891845703125, -0.776336669921875, -0.66082763671875, -0.545318603515625, -0.4298095703125, -0.314300537109375, -0.19879150390625, -0.083282470703125, 0.0322265625, 0.147735595703125, 0.26324462890625, 0.378753662109375, 0.4942626953125, 0.609771728515625, 0.72528076171875, 0.840789794921875, 0.956298828125, 1.071807861328125, 1.18731689453125, 1.302825927734375, 1.4183349609375, 1.533843994140625, 1.64935302734375, 1.764862060546875, 1.88037109375, 1.995880126953125, 2.11138916015625, 2.226898193359375, 2.3424072265625, 2.457916259765625, 2.57342529296875, 2.688934326171875, 2.804443359375, 2.919952392578125, 3.03546142578125, 3.150970458984375, 3.2664794921875, 3.381988525390625, 3.49749755859375, 3.613006591796875, 3.728515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 7.0, 6.0, 6.0, 9.0, 13.0, 16.0, 25.0, 23.0, 19.0, 28.0, 25.0, 30.0, 28.0, 34.0, 39.0, 53.0, 46.0, 51.0, 46.0, 48.0, 44.0, 36.0, 35.0, 43.0, 35.0, 30.0, 32.0, 43.0, 30.0, 14.0, 13.0, 20.0, 16.0, 9.0, 8.0, 14.0, 5.0, 6.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.409661293029785, -10.067312240600586, -9.724963188171387, -9.382614135742188, -9.040265083312988, -8.697916030883789, -8.355566024780273, -8.01321792602539, -7.670868396759033, -7.328519344329834, -6.986170291900635, -6.643820762634277, -6.301471710205078, -5.959122657775879, -5.61677360534668, -5.2744245529174805, -4.932075500488281, -4.589726448059082, -4.247377395629883, -3.9050281047821045, -3.5626790523529053, -3.220329999923706, -2.8779807090759277, -2.5356316566467285, -2.1932826042175293, -1.85093355178833, -1.5085843801498413, -1.1662352085113525, -0.8238861560821533, -0.4815371036529541, -0.13918781280517578, 0.20316123962402344, 0.5455093383789062, 0.8878584504127502, 1.2302075624465942, 1.572556734085083, 1.9149057865142822, 2.2572548389434814, 2.5996041297912598, 2.941953182220459, 3.284302234649658, 3.6266512870788574, 3.9690003395080566, 4.311349868774414, 4.653698921203613, 4.9960479736328125, 5.338397026062012, 5.680746078491211, 6.02309513092041, 6.365444183349609, 6.707793235778809, 7.050142288208008, 7.392491340637207, 7.734840393066406, 8.077190399169922, 8.419538497924805, 8.76188850402832, 9.10423755645752, 9.446586608886719, 9.788935661315918, 10.131284713745117, 10.473633766174316, 10.815982818603516, 11.158332824707031, 11.500680923461914]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 11.0, 9.0, 7.0, 9.0, 9.0, 13.0, 14.0, 11.0, 13.0, 13.0, 21.0, 22.0, 27.0, 29.0, 28.0, 43.0, 38.0, 30.0, 40.0, 42.0, 32.0, 42.0, 26.0, 47.0, 38.0, 36.0, 41.0, 32.0, 35.0, 27.0, 33.0, 19.0, 26.0, 25.0, 12.0, 10.0, 17.0, 11.0, 15.0, 9.0, 4.0, 10.0, 6.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.375836372375488, -9.074422836303711, -8.773009300231934, -8.471595764160156, -8.170182228088379, -7.868768692016602, -7.567354679107666, -7.265941143035889, -6.964527606964111, -6.663114070892334, -6.361700534820557, -6.060286998748779, -5.758872985839844, -5.457459449768066, -5.156045913696289, -4.854632377624512, -4.553218841552734, -4.251805305480957, -3.9503917694091797, -3.6489779949188232, -3.347564458847046, -3.0461509227752686, -2.744737148284912, -2.4433236122131348, -2.1419100761413574, -1.84049654006958, -1.5390828847885132, -1.2376692295074463, -0.936255693435669, -0.6348421573638916, -0.3334285020828247, -0.03201484680175781, 0.2693977355957031, 0.5708113312721252, 0.8722249269485474, 1.1736385822296143, 1.4750521183013916, 1.776465654373169, 2.0778794288635254, 2.3792929649353027, 2.68070650100708, 2.9821200370788574, 3.2835335731506348, 3.584947347640991, 3.8863608837127686, 4.187774658203125, 4.489188194274902, 4.79060173034668, 5.092015266418457, 5.393428802490234, 5.694842338562012, 5.996255874633789, 6.297669410705566, 6.599082946777344, 6.900496959686279, 7.201910495758057, 7.503324031829834, 7.804737567901611, 8.106151580810547, 8.407565116882324, 8.708978652954102, 9.010392189025879, 9.311805725097656, 9.613219261169434, 9.914632797241211]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 7.0, 10.0, 14.0, 23.0, 35.0, 41.0, 50.0, 94.0, 131.0, 194.0, 269.0, 408.0, 628.0, 1006.0, 1616.0, 2706.0, 4399.0, 7418.0, 12953.0, 23002.0, 41927.0, 74379.0, 127960.0, 192461.0, 206557.0, 147292.0, 88160.0, 49369.0, 27927.0, 15379.0, 8789.0, 5104.0, 3062.0, 1864.0, 1137.0, 743.0, 463.0, 323.0, 198.0, 127.0, 112.0, 64.0, 45.0, 25.0, 26.0, 14.0, 13.0, 13.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.91015625, -5.726318359375, -5.54248046875, -5.358642578125, -5.1748046875, -4.990966796875, -4.80712890625, -4.623291015625, -4.439453125, -4.255615234375, -4.07177734375, -3.887939453125, -3.7041015625, -3.520263671875, -3.33642578125, -3.152587890625, -2.96875, -2.784912109375, -2.60107421875, -2.417236328125, -2.2333984375, -2.049560546875, -1.86572265625, -1.681884765625, -1.498046875, -1.314208984375, -1.13037109375, -0.946533203125, -0.7626953125, -0.578857421875, -0.39501953125, -0.211181640625, -0.02734375, 0.156494140625, 0.34033203125, 0.524169921875, 0.7080078125, 0.891845703125, 1.07568359375, 1.259521484375, 1.443359375, 1.627197265625, 1.81103515625, 1.994873046875, 2.1787109375, 2.362548828125, 2.54638671875, 2.730224609375, 2.9140625, 3.097900390625, 3.28173828125, 3.465576171875, 3.6494140625, 3.833251953125, 4.01708984375, 4.200927734375, 4.384765625, 4.568603515625, 4.75244140625, 4.936279296875, 5.1201171875, 5.303955078125, 5.48779296875, 5.671630859375, 5.85546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 0.0, 2.0, 8.0, 7.0, 11.0, 6.0, 11.0, 11.0, 12.0, 15.0, 13.0, 12.0, 18.0, 20.0, 27.0, 28.0, 26.0, 33.0, 44.0, 36.0, 32.0, 43.0, 38.0, 35.0, 32.0, 45.0, 36.0, 38.0, 32.0, 38.0, 43.0, 17.0, 39.0, 23.0, 20.0, 32.0, 17.0, 10.0, 16.0, 10.0, 9.0, 18.0, 3.0, 10.0, 6.0, 4.0, 6.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.40625, -9.1070556640625, -8.807861328125, -8.5086669921875, -8.20947265625, -7.9102783203125, -7.611083984375, -7.3118896484375, -7.0126953125, -6.7135009765625, -6.414306640625, -6.1151123046875, -5.81591796875, -5.5167236328125, -5.217529296875, -4.9183349609375, -4.619140625, -4.3199462890625, -4.020751953125, -3.7215576171875, -3.42236328125, -3.1231689453125, -2.823974609375, -2.5247802734375, -2.2255859375, -1.9263916015625, -1.627197265625, -1.3280029296875, -1.02880859375, -0.7296142578125, -0.430419921875, -0.1312255859375, 0.16796875, 0.4671630859375, 0.766357421875, 1.0655517578125, 1.36474609375, 1.6639404296875, 1.963134765625, 2.2623291015625, 2.5615234375, 2.8607177734375, 3.159912109375, 3.4591064453125, 3.75830078125, 4.0574951171875, 4.356689453125, 4.6558837890625, 4.955078125, 5.2542724609375, 5.553466796875, 5.8526611328125, 6.15185546875, 6.4510498046875, 6.750244140625, 7.0494384765625, 7.3486328125, 7.6478271484375, 7.947021484375, 8.2462158203125, 8.54541015625, 8.8446044921875, 9.143798828125, 9.4429931640625, 9.7421875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 4.0, 6.0, 4.0, 12.0, 13.0, 22.0, 29.0, 24.0, 44.0, 54.0, 107.0, 106.0, 187.0, 204.0, 344.0, 448.0, 735.0, 1104.0, 1696.0, 2875.0, 5255.0, 10107.0, 21708.0, 52899.0, 138308.0, 326922.0, 287885.0, 113979.0, 44023.0, 18713.0, 8803.0, 4702.0, 2608.0, 1580.0, 932.0, 636.0, 462.0, 267.0, 193.0, 143.0, 117.0, 84.0, 62.0, 32.0, 28.0, 20.0, 21.0, 13.0, 12.0, 7.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 3.0], "bins": [-6.21875, -6.02972412109375, -5.8406982421875, -5.65167236328125, -5.462646484375, -5.27362060546875, -5.0845947265625, -4.89556884765625, -4.70654296875, -4.51751708984375, -4.3284912109375, -4.13946533203125, -3.950439453125, -3.76141357421875, -3.5723876953125, -3.38336181640625, -3.1943359375, -3.00531005859375, -2.8162841796875, -2.62725830078125, -2.438232421875, -2.24920654296875, -2.0601806640625, -1.87115478515625, -1.68212890625, -1.49310302734375, -1.3040771484375, -1.11505126953125, -0.926025390625, -0.73699951171875, -0.5479736328125, -0.35894775390625, -0.169921875, 0.01910400390625, 0.2081298828125, 0.39715576171875, 0.586181640625, 0.77520751953125, 0.9642333984375, 1.15325927734375, 1.34228515625, 1.53131103515625, 1.7203369140625, 1.90936279296875, 2.098388671875, 2.28741455078125, 2.4764404296875, 2.66546630859375, 2.8544921875, 3.04351806640625, 3.2325439453125, 3.42156982421875, 3.610595703125, 3.79962158203125, 3.9886474609375, 4.17767333984375, 4.36669921875, 4.55572509765625, 4.7447509765625, 4.93377685546875, 5.122802734375, 5.31182861328125, 5.5008544921875, 5.68988037109375, 5.87890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 4.0, 6.0, 3.0, 8.0, 8.0, 12.0, 9.0, 14.0, 9.0, 25.0, 14.0, 27.0, 28.0, 32.0, 27.0, 43.0, 39.0, 37.0, 27.0, 28.0, 44.0, 38.0, 40.0, 41.0, 39.0, 44.0, 32.0, 30.0, 29.0, 32.0, 25.0, 41.0, 29.0, 19.0, 20.0, 17.0, 15.0, 10.0, 12.0, 13.0, 7.0, 7.0, 5.0, 1.0, 6.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0], "bins": [-7.19140625, -6.98876953125, -6.7861328125, -6.58349609375, -6.380859375, -6.17822265625, -5.9755859375, -5.77294921875, -5.5703125, -5.36767578125, -5.1650390625, -4.96240234375, -4.759765625, -4.55712890625, -4.3544921875, -4.15185546875, -3.94921875, -3.74658203125, -3.5439453125, -3.34130859375, -3.138671875, -2.93603515625, -2.7333984375, -2.53076171875, -2.328125, -2.12548828125, -1.9228515625, -1.72021484375, -1.517578125, -1.31494140625, -1.1123046875, -0.90966796875, -0.70703125, -0.50439453125, -0.3017578125, -0.09912109375, 0.103515625, 0.30615234375, 0.5087890625, 0.71142578125, 0.9140625, 1.11669921875, 1.3193359375, 1.52197265625, 1.724609375, 1.92724609375, 2.1298828125, 2.33251953125, 2.53515625, 2.73779296875, 2.9404296875, 3.14306640625, 3.345703125, 3.54833984375, 3.7509765625, 3.95361328125, 4.15625, 4.35888671875, 4.5615234375, 4.76416015625, 4.966796875, 5.16943359375, 5.3720703125, 5.57470703125, 5.77734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 4.0, 15.0, 16.0, 16.0, 36.0, 45.0, 73.0, 88.0, 141.0, 216.0, 353.0, 627.0, 1022.0, 2215.0, 5910.0, 27348.0, 898733.0, 95816.0, 9461.0, 3174.0, 1345.0, 744.0, 397.0, 254.0, 151.0, 100.0, 69.0, 51.0, 38.0, 27.0, 20.0, 10.0, 6.0, 4.0, 11.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3046875, -10.924072265625, -10.54345703125, -10.162841796875, -9.7822265625, -9.401611328125, -9.02099609375, -8.640380859375, -8.259765625, -7.879150390625, -7.49853515625, -7.117919921875, -6.7373046875, -6.356689453125, -5.97607421875, -5.595458984375, -5.21484375, -4.834228515625, -4.45361328125, -4.072998046875, -3.6923828125, -3.311767578125, -2.93115234375, -2.550537109375, -2.169921875, -1.789306640625, -1.40869140625, -1.028076171875, -0.6474609375, -0.266845703125, 0.11376953125, 0.494384765625, 0.875, 1.255615234375, 1.63623046875, 2.016845703125, 2.3974609375, 2.778076171875, 3.15869140625, 3.539306640625, 3.919921875, 4.300537109375, 4.68115234375, 5.061767578125, 5.4423828125, 5.822998046875, 6.20361328125, 6.584228515625, 6.96484375, 7.345458984375, 7.72607421875, 8.106689453125, 8.4873046875, 8.867919921875, 9.24853515625, 9.629150390625, 10.009765625, 10.390380859375, 10.77099609375, 11.151611328125, 11.5322265625, 11.912841796875, 12.29345703125, 12.674072265625, 13.0546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 13.0, 19.0, 30.0, 83.0, 133.0, 215.0, 216.0, 131.0, 80.0, 33.0, 17.0, 13.0, 3.0, 2.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001346588134765625, -0.001316666603088379, -0.0012867450714111328, -0.0012568235397338867, -0.0012269020080566406, -0.0011969804763793945, -0.0011670589447021484, -0.0011371374130249023, -0.0011072158813476562, -0.0010772943496704102, -0.001047372817993164, -0.001017451286315918, -0.0009875297546386719, -0.0009576082229614258, -0.0009276866912841797, -0.0008977651596069336, -0.0008678436279296875, -0.0008379220962524414, -0.0008080005645751953, -0.0007780790328979492, -0.0007481575012207031, -0.000718235969543457, -0.0006883144378662109, -0.0006583929061889648, -0.0006284713745117188, -0.0005985498428344727, -0.0005686283111572266, -0.0005387067794799805, -0.0005087852478027344, -0.0004788637161254883, -0.0004489421844482422, -0.0004190206527709961, -0.00038909912109375, -0.0003591775894165039, -0.0003292560577392578, -0.0002993345260620117, -0.0002694129943847656, -0.00023949146270751953, -0.00020956993103027344, -0.00017964839935302734, -0.00014972686767578125, -0.00011980533599853516, -8.988380432128906e-05, -5.996227264404297e-05, -3.0040740966796875e-05, -1.1920928955078125e-07, 2.9802322387695312e-05, 5.9723854064941406e-05, 8.96453857421875e-05, 0.0001195669174194336, 0.0001494884490966797, 0.00017940998077392578, 0.00020933151245117188, 0.00023925304412841797, 0.00026917457580566406, 0.00029909610748291016, 0.00032901763916015625, 0.00035893917083740234, 0.00038886070251464844, 0.00041878223419189453, 0.0004487037658691406, 0.0004786252975463867, 0.0005085468292236328, 0.0005384683609008789, 0.000568389892578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 9.0, 7.0, 15.0, 12.0, 25.0, 30.0, 36.0, 54.0, 72.0, 118.0, 139.0, 233.0, 317.0, 459.0, 677.0, 1049.0, 1704.0, 2889.0, 5776.0, 14047.0, 48201.0, 312295.0, 532760.0, 89563.0, 20836.0, 7673.0, 3705.0, 2063.0, 1281.0, 787.0, 517.0, 358.0, 273.0, 166.0, 105.0, 79.0, 50.0, 45.0, 34.0, 27.0, 21.0, 15.0, 15.0, 9.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.203125, -8.92578125, -8.6484375, -8.37109375, -8.09375, -7.81640625, -7.5390625, -7.26171875, -6.984375, -6.70703125, -6.4296875, -6.15234375, -5.875, -5.59765625, -5.3203125, -5.04296875, -4.765625, -4.48828125, -4.2109375, -3.93359375, -3.65625, -3.37890625, -3.1015625, -2.82421875, -2.546875, -2.26953125, -1.9921875, -1.71484375, -1.4375, -1.16015625, -0.8828125, -0.60546875, -0.328125, -0.05078125, 0.2265625, 0.50390625, 0.78125, 1.05859375, 1.3359375, 1.61328125, 1.890625, 2.16796875, 2.4453125, 2.72265625, 3.0, 3.27734375, 3.5546875, 3.83203125, 4.109375, 4.38671875, 4.6640625, 4.94140625, 5.21875, 5.49609375, 5.7734375, 6.05078125, 6.328125, 6.60546875, 6.8828125, 7.16015625, 7.4375, 7.71484375, 7.9921875, 8.26953125, 8.546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 10.0, 10.0, 12.0, 18.0, 15.0, 35.0, 33.0, 64.0, 83.0, 123.0, 129.0, 146.0, 93.0, 63.0, 51.0, 39.0, 20.0, 14.0, 11.0, 7.0, 1.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.083984375, -2.0205078125, -1.95703125, -1.8935546875, -1.830078125, -1.7666015625, -1.703125, -1.6396484375, -1.576171875, -1.5126953125, -1.44921875, -1.3857421875, -1.322265625, -1.2587890625, -1.1953125, -1.1318359375, -1.068359375, -1.0048828125, -0.94140625, -0.8779296875, -0.814453125, -0.7509765625, -0.6875, -0.6240234375, -0.560546875, -0.4970703125, -0.43359375, -0.3701171875, -0.306640625, -0.2431640625, -0.1796875, -0.1162109375, -0.052734375, 0.0107421875, 0.07421875, 0.1376953125, 0.201171875, 0.2646484375, 0.328125, 0.3916015625, 0.455078125, 0.5185546875, 0.58203125, 0.6455078125, 0.708984375, 0.7724609375, 0.8359375, 0.8994140625, 0.962890625, 1.0263671875, 1.08984375, 1.1533203125, 1.216796875, 1.2802734375, 1.34375, 1.4072265625, 1.470703125, 1.5341796875, 1.59765625, 1.6611328125, 1.724609375, 1.7880859375, 1.8515625, 1.9150390625, 1.978515625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 1.0, 7.0, 7.0, 7.0, 12.0, 17.0, 19.0, 21.0, 18.0, 36.0, 30.0, 40.0, 32.0, 42.0, 43.0, 42.0, 50.0, 43.0, 55.0, 56.0, 47.0, 40.0, 40.0, 31.0, 34.0, 42.0, 34.0, 32.0, 15.0, 22.0, 12.0, 18.0, 17.0, 5.0, 5.0, 11.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.436753273010254, -10.071313858032227, -9.7058744430542, -9.340435028076172, -8.974996566772461, -8.609557151794434, -8.244117736816406, -7.878678321838379, -7.51323938369751, -7.147799968719482, -6.782361030578613, -6.416921615600586, -6.051482200622559, -5.6860432624816895, -5.320603847503662, -4.955164909362793, -4.589725494384766, -4.224286079406738, -3.858847141265869, -3.493407726287842, -3.1279685497283936, -2.7625293731689453, -2.397089958190918, -2.0316507816314697, -1.6662116050720215, -1.3007724285125732, -0.9353331327438354, -0.5698938369750977, -0.20445466041564941, 0.16098451614379883, 0.5264239311218262, 0.8918631076812744, 1.2573022842407227, 1.622741460800171, 1.9881807565689087, 2.3536200523376465, 2.7190592288970947, 3.084498405456543, 3.4499378204345703, 3.8153769969940186, 4.180816173553467, 4.546255588531494, 4.911694526672363, 5.277133941650391, 5.642573356628418, 6.008012294769287, 6.3734517097473145, 6.738890647888184, 7.104330062866211, 7.469769477844238, 7.835208415985107, 8.200647354125977, 8.566086769104004, 8.931526184082031, 9.296965599060059, 9.662405014038086, 10.027843475341797, 10.393282890319824, 10.758722305297852, 11.124160766601562, 11.48960018157959, 11.855039596557617, 12.220479011535645, 12.585918426513672, 12.9513578414917]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 10.0, 6.0, 6.0, 10.0, 9.0, 21.0, 10.0, 9.0, 17.0, 18.0, 20.0, 25.0, 33.0, 26.0, 34.0, 34.0, 45.0, 35.0, 40.0, 28.0, 41.0, 38.0, 34.0, 45.0, 32.0, 31.0, 39.0, 34.0, 37.0, 32.0, 17.0, 24.0, 27.0, 13.0, 10.0, 20.0, 12.0, 11.0, 13.0, 8.0, 7.0, 7.0, 6.0, 2.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.277950286865234, -8.9810209274292, -8.684091567993164, -8.387163162231445, -8.09023380279541, -7.793304443359375, -7.49637508392334, -7.199445724487305, -6.902516841888428, -6.605587482452393, -6.308658599853516, -6.0117292404174805, -5.714799880981445, -5.417870998382568, -5.120941638946533, -4.824012756347656, -4.527083396911621, -4.230154037475586, -3.933225154876709, -3.636295795440674, -3.3393666744232178, -3.0424375534057617, -2.7455081939697266, -2.4485790729522705, -2.1516499519348145, -1.8547208309173584, -1.5577915906906128, -1.2608623504638672, -0.9639332294464111, -0.6670041084289551, -0.3700748682022095, -0.07314562797546387, 0.2237834930419922, 0.520712673664093, 0.8176418542861938, 1.1145710945129395, 1.4115002155303955, 1.7084293365478516, 2.0053586959838867, 2.3022878170013428, 2.599216938018799, 2.896146059036255, 3.193075180053711, 3.490004539489746, 3.786933660507202, 4.083862781524658, 4.380792140960693, 4.67772102355957, 4.9746503829956055, 5.271579742431641, 5.568508625030518, 5.865437984466553, 6.16236686706543, 6.459296226501465, 6.7562255859375, 7.053154945373535, 7.350083827972412, 7.647013187408447, 7.943942070007324, 8.24087142944336, 8.537800788879395, 8.83473014831543, 9.131658554077148, 9.428587913513184, 9.725517272949219]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 10.0, 19.0, 41.0, 64.0, 87.0, 140.0, 201.0, 308.0, 512.0, 808.0, 1218.0, 1875.0, 2797.0, 4252.0, 6347.0, 9439.0, 13961.0, 19428.0, 27074.0, 36860.0, 48352.0, 60769.0, 72483.0, 83123.0, 90918.0, 93244.0, 90123.0, 82869.0, 71880.0, 59426.0, 47097.0, 36006.0, 26697.0, 19235.0, 13383.0, 9374.0, 6214.0, 4206.0, 2739.0, 1805.0, 1174.0, 717.0, 465.0, 279.0, 189.0, 122.0, 81.0, 54.0, 35.0, 17.0, 15.0, 9.0, 6.0, 7.0, 0.0, 1.0], "bins": [-8.484375, -8.2308349609375, -7.977294921875, -7.7237548828125, -7.47021484375, -7.2166748046875, -6.963134765625, -6.7095947265625, -6.4560546875, -6.2025146484375, -5.948974609375, -5.6954345703125, -5.44189453125, -5.1883544921875, -4.934814453125, -4.6812744140625, -4.427734375, -4.1741943359375, -3.920654296875, -3.6671142578125, -3.41357421875, -3.1600341796875, -2.906494140625, -2.6529541015625, -2.3994140625, -2.1458740234375, -1.892333984375, -1.6387939453125, -1.38525390625, -1.1317138671875, -0.878173828125, -0.6246337890625, -0.37109375, -0.1175537109375, 0.135986328125, 0.3895263671875, 0.64306640625, 0.8966064453125, 1.150146484375, 1.4036865234375, 1.6572265625, 1.9107666015625, 2.164306640625, 2.4178466796875, 2.67138671875, 2.9249267578125, 3.178466796875, 3.4320068359375, 3.685546875, 3.9390869140625, 4.192626953125, 4.4461669921875, 4.69970703125, 4.9532470703125, 5.206787109375, 5.4603271484375, 5.7138671875, 5.9674072265625, 6.220947265625, 6.4744873046875, 6.72802734375, 6.9815673828125, 7.235107421875, 7.4886474609375, 7.7421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 11.0, 8.0, 6.0, 9.0, 10.0, 14.0, 14.0, 11.0, 14.0, 19.0, 18.0, 30.0, 27.0, 24.0, 30.0, 43.0, 37.0, 39.0, 38.0, 30.0, 33.0, 36.0, 40.0, 44.0, 37.0, 30.0, 35.0, 36.0, 30.0, 42.0, 21.0, 22.0, 28.0, 15.0, 11.0, 16.0, 14.0, 12.0, 13.0, 6.0, 12.0, 2.0, 9.0, 3.0, 3.0, 6.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-9.0, -8.7154541015625, -8.430908203125, -8.1463623046875, -7.86181640625, -7.5772705078125, -7.292724609375, -7.0081787109375, -6.7236328125, -6.4390869140625, -6.154541015625, -5.8699951171875, -5.58544921875, -5.3009033203125, -5.016357421875, -4.7318115234375, -4.447265625, -4.1627197265625, -3.878173828125, -3.5936279296875, -3.30908203125, -3.0245361328125, -2.739990234375, -2.4554443359375, -2.1708984375, -1.8863525390625, -1.601806640625, -1.3172607421875, -1.03271484375, -0.7481689453125, -0.463623046875, -0.1790771484375, 0.10546875, 0.3900146484375, 0.674560546875, 0.9591064453125, 1.24365234375, 1.5281982421875, 1.812744140625, 2.0972900390625, 2.3818359375, 2.6663818359375, 2.950927734375, 3.2354736328125, 3.52001953125, 3.8045654296875, 4.089111328125, 4.3736572265625, 4.658203125, 4.9427490234375, 5.227294921875, 5.5118408203125, 5.79638671875, 6.0809326171875, 6.365478515625, 6.6500244140625, 6.9345703125, 7.2191162109375, 7.503662109375, 7.7882080078125, 8.07275390625, 8.3572998046875, 8.641845703125, 8.9263916015625, 9.2109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 7.0, 8.0, 11.0, 27.0, 38.0, 60.0, 90.0, 140.0, 240.0, 327.0, 567.0, 819.0, 1365.0, 2220.0, 3527.0, 5717.0, 8914.0, 13969.0, 21477.0, 32081.0, 46422.0, 63612.0, 83237.0, 100286.0, 112366.0, 114792.0, 106842.0, 91504.0, 72886.0, 54192.0, 37753.0, 25989.0, 17100.0, 11247.0, 6954.0, 4423.0, 2669.0, 1777.0, 1032.0, 679.0, 406.0, 295.0, 172.0, 120.0, 77.0, 52.0, 32.0, 15.0, 9.0, 8.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.8828125, -10.545166015625, -10.20751953125, -9.869873046875, -9.5322265625, -9.194580078125, -8.85693359375, -8.519287109375, -8.181640625, -7.843994140625, -7.50634765625, -7.168701171875, -6.8310546875, -6.493408203125, -6.15576171875, -5.818115234375, -5.48046875, -5.142822265625, -4.80517578125, -4.467529296875, -4.1298828125, -3.792236328125, -3.45458984375, -3.116943359375, -2.779296875, -2.441650390625, -2.10400390625, -1.766357421875, -1.4287109375, -1.091064453125, -0.75341796875, -0.415771484375, -0.078125, 0.259521484375, 0.59716796875, 0.934814453125, 1.2724609375, 1.610107421875, 1.94775390625, 2.285400390625, 2.623046875, 2.960693359375, 3.29833984375, 3.635986328125, 3.9736328125, 4.311279296875, 4.64892578125, 4.986572265625, 5.32421875, 5.661865234375, 5.99951171875, 6.337158203125, 6.6748046875, 7.012451171875, 7.35009765625, 7.687744140625, 8.025390625, 8.363037109375, 8.70068359375, 9.038330078125, 9.3759765625, 9.713623046875, 10.05126953125, 10.388916015625, 10.7265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 4.0, 4.0, 6.0, 12.0, 13.0, 15.0, 9.0, 22.0, 14.0, 24.0, 24.0, 19.0, 28.0, 34.0, 34.0, 31.0, 32.0, 33.0, 48.0, 34.0, 46.0, 44.0, 40.0, 36.0, 36.0, 26.0, 36.0, 27.0, 33.0, 31.0, 29.0, 28.0, 19.0, 17.0, 19.0, 14.0, 12.0, 8.0, 10.0, 8.0, 9.0, 7.0, 5.0, 4.0, 1.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.609375, -6.41082763671875, -6.2122802734375, -6.01373291015625, -5.815185546875, -5.61663818359375, -5.4180908203125, -5.21954345703125, -5.02099609375, -4.82244873046875, -4.6239013671875, -4.42535400390625, -4.226806640625, -4.02825927734375, -3.8297119140625, -3.63116455078125, -3.4326171875, -3.23406982421875, -3.0355224609375, -2.83697509765625, -2.638427734375, -2.43988037109375, -2.2413330078125, -2.04278564453125, -1.84423828125, -1.64569091796875, -1.4471435546875, -1.24859619140625, -1.050048828125, -0.85150146484375, -0.6529541015625, -0.45440673828125, -0.255859375, -0.05731201171875, 0.1412353515625, 0.33978271484375, 0.538330078125, 0.73687744140625, 0.9354248046875, 1.13397216796875, 1.33251953125, 1.53106689453125, 1.7296142578125, 1.92816162109375, 2.126708984375, 2.32525634765625, 2.5238037109375, 2.72235107421875, 2.9208984375, 3.11944580078125, 3.3179931640625, 3.51654052734375, 3.715087890625, 3.91363525390625, 4.1121826171875, 4.31072998046875, 4.50927734375, 4.70782470703125, 4.9063720703125, 5.10491943359375, 5.303466796875, 5.50201416015625, 5.7005615234375, 5.89910888671875, 6.09765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 11.0, 9.0, 23.0, 34.0, 44.0, 73.0, 121.0, 178.0, 260.0, 402.0, 665.0, 1144.0, 1770.0, 2723.0, 4445.0, 7170.0, 11722.0, 18839.0, 29577.0, 46539.0, 69226.0, 96975.0, 121857.0, 137063.0, 133228.0, 112702.0, 85818.0, 60054.0, 39432.0, 24937.0, 15793.0, 9864.0, 5961.0, 3645.0, 2306.0, 1480.0, 899.0, 551.0, 348.0, 263.0, 143.0, 87.0, 71.0, 41.0, 26.0, 9.0, 11.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.2421875, -4.10882568359375, -3.9754638671875, -3.84210205078125, -3.708740234375, -3.57537841796875, -3.4420166015625, -3.30865478515625, -3.17529296875, -3.04193115234375, -2.9085693359375, -2.77520751953125, -2.641845703125, -2.50848388671875, -2.3751220703125, -2.24176025390625, -2.1083984375, -1.97503662109375, -1.8416748046875, -1.70831298828125, -1.574951171875, -1.44158935546875, -1.3082275390625, -1.17486572265625, -1.04150390625, -0.90814208984375, -0.7747802734375, -0.64141845703125, -0.508056640625, -0.37469482421875, -0.2413330078125, -0.10797119140625, 0.025390625, 0.15875244140625, 0.2921142578125, 0.42547607421875, 0.558837890625, 0.69219970703125, 0.8255615234375, 0.95892333984375, 1.09228515625, 1.22564697265625, 1.3590087890625, 1.49237060546875, 1.625732421875, 1.75909423828125, 1.8924560546875, 2.02581787109375, 2.1591796875, 2.29254150390625, 2.4259033203125, 2.55926513671875, 2.692626953125, 2.82598876953125, 2.9593505859375, 3.09271240234375, 3.22607421875, 3.35943603515625, 3.4927978515625, 3.62615966796875, 3.759521484375, 3.89288330078125, 4.0262451171875, 4.15960693359375, 4.29296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 10.0, 5.0, 15.0, 14.0, 13.0, 18.0, 25.0, 25.0, 42.0, 59.0, 49.0, 43.0, 40.0, 58.0, 62.0, 51.0, 76.0, 60.0, 44.0, 41.0, 36.0, 44.0, 33.0, 29.0, 29.0, 21.0, 13.0, 11.0, 3.0, 7.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005974769592285156, -0.0005784407258033752, -0.0005594044923782349, -0.0005403682589530945, -0.0005213320255279541, -0.0005022957921028137, -0.00048325955867767334, -0.00046422332525253296, -0.0004451870918273926, -0.0004261508584022522, -0.0004071146249771118, -0.00038807839155197144, -0.00036904215812683105, -0.0003500059247016907, -0.0003309696912765503, -0.0003119334578514099, -0.00029289722442626953, -0.00027386099100112915, -0.00025482475757598877, -0.0002357885241508484, -0.000216752290725708, -0.00019771605730056763, -0.00017867982387542725, -0.00015964359045028687, -0.00014060735702514648, -0.0001215711236000061, -0.00010253489017486572, -8.349865674972534e-05, -6.446242332458496e-05, -4.542618989944458e-05, -2.63899564743042e-05, -7.353723049163818e-06, 1.1682510375976562e-05, 3.071874380111694e-05, 4.9754977226257324e-05, 6.87912106513977e-05, 8.782744407653809e-05, 0.00010686367750167847, 0.00012589991092681885, 0.00014493614435195923, 0.0001639723777770996, 0.00018300861120224, 0.00020204484462738037, 0.00022108107805252075, 0.00024011731147766113, 0.0002591535449028015, 0.0002781897783279419, 0.0002972260117530823, 0.00031626224517822266, 0.00033529847860336304, 0.0003543347120285034, 0.0003733709454536438, 0.0003924071788787842, 0.00041144341230392456, 0.00043047964572906494, 0.0004495158791542053, 0.0004685521125793457, 0.0004875883460044861, 0.0005066245794296265, 0.0005256608128547668, 0.0005446970462799072, 0.0005637332797050476, 0.000582769513130188, 0.0006018057465553284, 0.0006208419799804688]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 13.0, 17.0, 24.0, 31.0, 44.0, 65.0, 111.0, 158.0, 252.0, 423.0, 732.0, 1226.0, 2093.0, 3628.0, 6381.0, 11637.0, 19699.0, 34005.0, 56310.0, 86398.0, 120801.0, 148074.0, 153431.0, 133179.0, 101518.0, 67611.0, 42225.0, 24844.0, 14331.0, 8210.0, 4678.0, 2620.0, 1487.0, 881.0, 515.0, 351.0, 183.0, 124.0, 91.0, 46.0, 21.0, 29.0, 15.0, 12.0, 11.0, 7.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.85546875, -4.7047119140625, -4.553955078125, -4.4031982421875, -4.25244140625, -4.1016845703125, -3.950927734375, -3.8001708984375, -3.6494140625, -3.4986572265625, -3.347900390625, -3.1971435546875, -3.04638671875, -2.8956298828125, -2.744873046875, -2.5941162109375, -2.443359375, -2.2926025390625, -2.141845703125, -1.9910888671875, -1.84033203125, -1.6895751953125, -1.538818359375, -1.3880615234375, -1.2373046875, -1.0865478515625, -0.935791015625, -0.7850341796875, -0.63427734375, -0.4835205078125, -0.332763671875, -0.1820068359375, -0.03125, 0.1195068359375, 0.270263671875, 0.4210205078125, 0.57177734375, 0.7225341796875, 0.873291015625, 1.0240478515625, 1.1748046875, 1.3255615234375, 1.476318359375, 1.6270751953125, 1.77783203125, 1.9285888671875, 2.079345703125, 2.2301025390625, 2.380859375, 2.5316162109375, 2.682373046875, 2.8331298828125, 2.98388671875, 3.1346435546875, 3.285400390625, 3.4361572265625, 3.5869140625, 3.7376708984375, 3.888427734375, 4.0391845703125, 4.18994140625, 4.3406982421875, 4.491455078125, 4.6422119140625, 4.79296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 12.0, 5.0, 12.0, 14.0, 11.0, 19.0, 25.0, 27.0, 27.0, 29.0, 34.0, 34.0, 41.0, 47.0, 48.0, 40.0, 56.0, 46.0, 58.0, 54.0, 50.0, 43.0, 29.0, 33.0, 26.0, 41.0, 23.0, 19.0, 11.0, 23.0, 12.0, 4.0, 11.0, 8.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.439453125, -1.3881683349609375, -1.336883544921875, -1.2855987548828125, -1.23431396484375, -1.1830291748046875, -1.131744384765625, -1.0804595947265625, -1.0291748046875, -0.9778900146484375, -0.926605224609375, -0.8753204345703125, -0.82403564453125, -0.7727508544921875, -0.721466064453125, -0.6701812744140625, -0.618896484375, -0.5676116943359375, -0.516326904296875, -0.4650421142578125, -0.41375732421875, -0.3624725341796875, -0.311187744140625, -0.2599029541015625, -0.2086181640625, -0.1573333740234375, -0.106048583984375, -0.0547637939453125, -0.00347900390625, 0.0478057861328125, 0.099090576171875, 0.1503753662109375, 0.20166015625, 0.2529449462890625, 0.304229736328125, 0.3555145263671875, 0.40679931640625, 0.4580841064453125, 0.509368896484375, 0.5606536865234375, 0.6119384765625, 0.6632232666015625, 0.714508056640625, 0.7657928466796875, 0.81707763671875, 0.8683624267578125, 0.919647216796875, 0.9709320068359375, 1.022216796875, 1.0735015869140625, 1.124786376953125, 1.1760711669921875, 1.22735595703125, 1.2786407470703125, 1.329925537109375, 1.3812103271484375, 1.4324951171875, 1.4837799072265625, 1.535064697265625, 1.5863494873046875, 1.63763427734375, 1.6889190673828125, 1.740203857421875, 1.7914886474609375, 1.8427734375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 12.0, 8.0, 6.0, 13.0, 14.0, 14.0, 21.0, 21.0, 34.0, 35.0, 36.0, 39.0, 47.0, 43.0, 41.0, 53.0, 43.0, 57.0, 57.0, 50.0, 32.0, 36.0, 40.0, 37.0, 32.0, 26.0, 21.0, 23.0, 19.0, 14.0, 11.0, 19.0, 13.0, 6.0, 7.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.24126148223877, -10.870044708251953, -10.498828887939453, -10.127612113952637, -9.75639533996582, -9.38517951965332, -9.013962745666504, -8.642745971679688, -8.271530151367188, -7.900313854217529, -7.529097080230713, -7.157880783081055, -6.786664009094238, -6.41544771194458, -6.044231414794922, -5.6730146408081055, -5.301797866821289, -4.930581569671631, -4.5593647956848145, -4.188148498535156, -3.816931962966919, -3.4457154273986816, -3.0744991302490234, -2.703282594680786, -2.332066059112549, -1.9608495235443115, -1.5896331071853638, -1.218416690826416, -0.8472001552581787, -0.4759836196899414, -0.1047673225402832, 0.2664492130279541, 0.6376657485961914, 1.0088822841644287, 1.3800987005233765, 1.7513151168823242, 2.1225316524505615, 2.493748188018799, 2.864964485168457, 3.2361810207366943, 3.6073975563049316, 3.978614091873169, 4.349830627441406, 4.7210469245910645, 5.092263221740723, 5.463479995727539, 5.834696292877197, 6.2059125900268555, 6.577129364013672, 6.94834566116333, 7.3195624351501465, 7.690778732299805, 8.061995506286621, 8.433212280273438, 8.804428100585938, 9.175644874572754, 9.54686164855957, 9.918078422546387, 10.289294242858887, 10.660511016845703, 11.03172779083252, 11.402944564819336, 11.774160385131836, 12.145377159118652, 12.516592979431152]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 10.0, 10.0, 12.0, 8.0, 9.0, 12.0, 20.0, 14.0, 27.0, 26.0, 30.0, 39.0, 42.0, 33.0, 22.0, 36.0, 32.0, 43.0, 39.0, 47.0, 38.0, 38.0, 43.0, 47.0, 39.0, 31.0, 26.0, 38.0, 28.0, 31.0, 19.0, 23.0, 13.0, 13.0, 12.0, 10.0, 3.0, 11.0, 2.0, 7.0, 5.0, 8.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-11.42354679107666, -11.083907127380371, -10.744266510009766, -10.404626846313477, -10.064986228942871, -9.725346565246582, -9.385705947875977, -9.046066284179688, -8.706426620483398, -8.36678695678711, -8.027146339416504, -7.687506675720215, -7.347866058349609, -7.00822639465332, -6.668586254119873, -6.328946113586426, -5.98930549621582, -5.649665355682373, -5.310025215148926, -4.970385551452637, -4.630744934082031, -4.291105270385742, -3.951465129852295, -3.6118249893188477, -3.2721848487854004, -2.932544708251953, -2.592904567718506, -2.2532646656036377, -1.9136245250701904, -1.5739843845367432, -1.234344482421875, -0.8947043418884277, -0.5550642013549805, -0.21542412042617798, 0.12421596050262451, 0.4638559818267822, 0.8034961223602295, 1.1431362628936768, 1.482776165008545, 1.8224163055419922, 2.1620564460754395, 2.5016965866088867, 2.841336727142334, 3.180976629257202, 3.5206167697906494, 3.8602569103240967, 4.199896812438965, 4.539536952972412, 4.879177093505859, 5.218817234039307, 5.558457374572754, 5.898097038269043, 6.237737655639648, 6.5773773193359375, 6.917017459869385, 7.256657600402832, 7.596297740936279, 7.935937881469727, 8.275577545166016, 8.615218162536621, 8.95485782623291, 9.294498443603516, 9.634138107299805, 9.973777770996094, 10.3134183883667]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 11.0, 13.0, 25.0, 42.0, 51.0, 97.0, 129.0, 230.0, 347.0, 595.0, 866.0, 1443.0, 2376.0, 3671.0, 5884.0, 9457.0, 14870.0, 23456.0, 36857.0, 56913.0, 86738.0, 128732.0, 185494.0, 257788.0, 337411.0, 414545.0, 464928.0, 470876.0, 431344.0, 360255.0, 278020.0, 203408.0, 142787.0, 96658.0, 63999.0, 41802.0, 26756.0, 17041.0, 10714.0, 6634.0, 4237.0, 2559.0, 1572.0, 1009.0, 616.0, 377.0, 253.0, 160.0, 104.0, 60.0, 29.0, 16.0, 13.0, 10.0, 2.0, 2.0, 1.0, 2.0], "bins": [-8.671875, -8.41015625, -8.1484375, -7.88671875, -7.625, -7.36328125, -7.1015625, -6.83984375, -6.578125, -6.31640625, -6.0546875, -5.79296875, -5.53125, -5.26953125, -5.0078125, -4.74609375, -4.484375, -4.22265625, -3.9609375, -3.69921875, -3.4375, -3.17578125, -2.9140625, -2.65234375, -2.390625, -2.12890625, -1.8671875, -1.60546875, -1.34375, -1.08203125, -0.8203125, -0.55859375, -0.296875, -0.03515625, 0.2265625, 0.48828125, 0.75, 1.01171875, 1.2734375, 1.53515625, 1.796875, 2.05859375, 2.3203125, 2.58203125, 2.84375, 3.10546875, 3.3671875, 3.62890625, 3.890625, 4.15234375, 4.4140625, 4.67578125, 4.9375, 5.19921875, 5.4609375, 5.72265625, 5.984375, 6.24609375, 6.5078125, 6.76953125, 7.03125, 7.29296875, 7.5546875, 7.81640625, 8.078125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 12.0, 9.0, 12.0, 7.0, 15.0, 12.0, 17.0, 18.0, 27.0, 30.0, 27.0, 34.0, 41.0, 30.0, 35.0, 27.0, 35.0, 42.0, 35.0, 46.0, 35.0, 41.0, 50.0, 40.0, 38.0, 36.0, 28.0, 28.0, 28.0, 32.0, 20.0, 21.0, 15.0, 14.0, 10.0, 6.0, 14.0, 4.0, 4.0, 4.0, 9.0, 3.0, 4.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-9.5546875, -9.2685546875, -8.982421875, -8.6962890625, -8.41015625, -8.1240234375, -7.837890625, -7.5517578125, -7.265625, -6.9794921875, -6.693359375, -6.4072265625, -6.12109375, -5.8349609375, -5.548828125, -5.2626953125, -4.9765625, -4.6904296875, -4.404296875, -4.1181640625, -3.83203125, -3.5458984375, -3.259765625, -2.9736328125, -2.6875, -2.4013671875, -2.115234375, -1.8291015625, -1.54296875, -1.2568359375, -0.970703125, -0.6845703125, -0.3984375, -0.1123046875, 0.173828125, 0.4599609375, 0.74609375, 1.0322265625, 1.318359375, 1.6044921875, 1.890625, 2.1767578125, 2.462890625, 2.7490234375, 3.03515625, 3.3212890625, 3.607421875, 3.8935546875, 4.1796875, 4.4658203125, 4.751953125, 5.0380859375, 5.32421875, 5.6103515625, 5.896484375, 6.1826171875, 6.46875, 6.7548828125, 7.041015625, 7.3271484375, 7.61328125, 7.8994140625, 8.185546875, 8.4716796875, 8.7578125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 7.0, 23.0, 19.0, 38.0, 64.0, 122.0, 197.0, 359.0, 580.0, 963.0, 1613.0, 2550.0, 4320.0, 7034.0, 11207.0, 18142.0, 28218.0, 43002.0, 64437.0, 94963.0, 135095.0, 184974.0, 244419.0, 306901.0, 363970.0, 403786.0, 416469.0, 399596.0, 356484.0, 298383.0, 235917.0, 177947.0, 129253.0, 90460.0, 60982.0, 41329.0, 26208.0, 16835.0, 10499.0, 6573.0, 4072.0, 2510.0, 1528.0, 918.0, 567.0, 310.0, 197.0, 120.0, 53.0, 26.0, 27.0, 10.0, 5.0, 5.0, 1.0, 2.0, 1.0], "bins": [-8.4296875, -8.17755126953125, -7.9254150390625, -7.67327880859375, -7.421142578125, -7.16900634765625, -6.9168701171875, -6.66473388671875, -6.41259765625, -6.16046142578125, -5.9083251953125, -5.65618896484375, -5.404052734375, -5.15191650390625, -4.8997802734375, -4.64764404296875, -4.3955078125, -4.14337158203125, -3.8912353515625, -3.63909912109375, -3.386962890625, -3.13482666015625, -2.8826904296875, -2.63055419921875, -2.37841796875, -2.12628173828125, -1.8741455078125, -1.62200927734375, -1.369873046875, -1.11773681640625, -0.8656005859375, -0.61346435546875, -0.361328125, -0.10919189453125, 0.1429443359375, 0.39508056640625, 0.647216796875, 0.89935302734375, 1.1514892578125, 1.40362548828125, 1.65576171875, 1.90789794921875, 2.1600341796875, 2.41217041015625, 2.664306640625, 2.91644287109375, 3.1685791015625, 3.42071533203125, 3.6728515625, 3.92498779296875, 4.1771240234375, 4.42926025390625, 4.681396484375, 4.93353271484375, 5.1856689453125, 5.43780517578125, 5.68994140625, 5.94207763671875, 6.1942138671875, 6.44635009765625, 6.698486328125, 6.95062255859375, 7.2027587890625, 7.45489501953125, 7.70703125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 6.0, 8.0, 5.0, 8.0, 14.0, 14.0, 16.0, 37.0, 21.0, 34.0, 38.0, 73.0, 57.0, 77.0, 96.0, 100.0, 97.0, 153.0, 175.0, 153.0, 171.0, 157.0, 182.0, 211.0, 204.0, 242.0, 178.0, 194.0, 194.0, 169.0, 142.0, 119.0, 122.0, 99.0, 98.0, 89.0, 55.0, 70.0, 53.0, 35.0, 28.0, 25.0, 24.0, 15.0, 7.0, 3.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.10546875, -3.9705810546875, -3.835693359375, -3.7008056640625, -3.56591796875, -3.4310302734375, -3.296142578125, -3.1612548828125, -3.0263671875, -2.8914794921875, -2.756591796875, -2.6217041015625, -2.48681640625, -2.3519287109375, -2.217041015625, -2.0821533203125, -1.947265625, -1.8123779296875, -1.677490234375, -1.5426025390625, -1.40771484375, -1.2728271484375, -1.137939453125, -1.0030517578125, -0.8681640625, -0.7332763671875, -0.598388671875, -0.4635009765625, -0.32861328125, -0.1937255859375, -0.058837890625, 0.0760498046875, 0.2109375, 0.3458251953125, 0.480712890625, 0.6156005859375, 0.75048828125, 0.8853759765625, 1.020263671875, 1.1551513671875, 1.2900390625, 1.4249267578125, 1.559814453125, 1.6947021484375, 1.82958984375, 1.9644775390625, 2.099365234375, 2.2342529296875, 2.369140625, 2.5040283203125, 2.638916015625, 2.7738037109375, 2.90869140625, 3.0435791015625, 3.178466796875, 3.3133544921875, 3.4482421875, 3.5831298828125, 3.718017578125, 3.8529052734375, 3.98779296875, 4.1226806640625, 4.257568359375, 4.3924560546875, 4.52734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 4.0, 3.0, 4.0, 6.0, 4.0, 9.0, 17.0, 13.0, 19.0, 20.0, 19.0, 25.0, 37.0, 33.0, 25.0, 47.0, 40.0, 56.0, 39.0, 49.0, 38.0, 42.0, 41.0, 39.0, 41.0, 33.0, 38.0, 38.0, 38.0, 27.0, 36.0, 18.0, 22.0, 11.0, 17.0, 16.0, 12.0, 9.0, 5.0, 6.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.316300392150879, -9.949918746948242, -9.583538055419922, -9.217156410217285, -8.850774765014648, -8.484393119812012, -8.118011474609375, -7.751630783081055, -7.385249137878418, -7.018867492675781, -6.652486324310303, -6.286105155944824, -5.9197235107421875, -5.553341865539551, -5.186960697174072, -4.820579528808594, -4.454197883605957, -4.08781623840332, -3.721435070037842, -3.355053663253784, -2.9886722564697266, -2.622290849685669, -2.2559094429016113, -1.8895280361175537, -1.523146629333496, -1.1567652225494385, -0.7903838157653809, -0.42400240898132324, -0.057621002197265625, 0.308760404586792, 0.6751418113708496, 1.0415232181549072, 1.4079046249389648, 1.7742860317230225, 2.14066743850708, 2.5070488452911377, 2.8734302520751953, 3.239811658859253, 3.6061930656433105, 3.972574472427368, 4.338955879211426, 4.7053375244140625, 5.071718692779541, 5.4380998611450195, 5.804481506347656, 6.170863151550293, 6.5372443199157715, 6.90362548828125, 7.270007133483887, 7.636388778686523, 8.002769470214844, 8.36915111541748, 8.735532760620117, 9.101914405822754, 9.46829605102539, 9.834676742553711, 10.201058387756348, 10.567440032958984, 10.933820724487305, 11.300202369689941, 11.666584014892578, 12.032965660095215, 12.399347305297852, 12.765727996826172, 13.132109642028809]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 3.0, 4.0, 11.0, 15.0, 17.0, 13.0, 15.0, 24.0, 18.0, 20.0, 30.0, 29.0, 39.0, 43.0, 39.0, 38.0, 45.0, 43.0, 47.0, 40.0, 39.0, 29.0, 44.0, 32.0, 43.0, 36.0, 27.0, 35.0, 28.0, 14.0, 25.0, 23.0, 14.0, 14.0, 12.0, 13.0, 9.0, 7.0, 9.0, 5.0, 2.0, 1.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-12.262622833251953, -11.906577110290527, -11.550531387329102, -11.19448471069336, -10.838438987731934, -10.482393264770508, -10.126346588134766, -9.77030086517334, -9.414255142211914, -9.058209419250488, -8.702163696289062, -8.34611701965332, -7.9900712966918945, -7.634025573730469, -7.277979373931885, -6.921933174133301, -6.565887451171875, -6.209841728210449, -5.853795528411865, -5.497749328613281, -5.1417036056518555, -4.78565788269043, -4.429611682891846, -4.073565483093262, -3.717519760131836, -3.361473798751831, -3.005427837371826, -2.6493818759918213, -2.2933359146118164, -1.9372899532318115, -1.5812439918518066, -1.2251980304718018, -0.8691530227661133, -0.5131070613861084, -0.15706110000610352, 0.19898486137390137, 0.5550308227539062, 0.9110767841339111, 1.267122745513916, 1.623168706893921, 1.9792146682739258, 2.3352606296539307, 2.6913065910339355, 3.0473525524139404, 3.4033985137939453, 3.75944447517395, 4.115490436553955, 4.471536636352539, 4.827582359313965, 5.183628082275391, 5.539674282073975, 5.895720481872559, 6.251766204833984, 6.60781192779541, 6.963858127593994, 7.319904327392578, 7.675950050354004, 8.03199577331543, 8.388042449951172, 8.744088172912598, 9.100133895874023, 9.45617961883545, 9.812225341796875, 10.168272018432617, 10.524317741394043]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 6.0, 8.0, 8.0, 10.0, 14.0, 18.0, 34.0, 38.0, 43.0, 81.0, 116.0, 132.0, 222.0, 321.0, 457.0, 685.0, 1020.0, 1467.0, 2257.0, 3382.0, 5095.0, 7898.0, 12325.0, 20359.0, 33789.0, 57878.0, 97281.0, 154349.0, 198757.0, 170044.0, 111096.0, 66275.0, 39641.0, 23321.0, 14127.0, 9015.0, 5655.0, 3589.0, 2463.0, 1585.0, 1132.0, 803.0, 516.0, 373.0, 268.0, 169.0, 131.0, 111.0, 56.0, 54.0, 34.0, 17.0, 17.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.31640625, -5.15350341796875, -4.9906005859375, -4.82769775390625, -4.664794921875, -4.50189208984375, -4.3389892578125, -4.17608642578125, -4.01318359375, -3.85028076171875, -3.6873779296875, -3.52447509765625, -3.361572265625, -3.19866943359375, -3.0357666015625, -2.87286376953125, -2.7099609375, -2.54705810546875, -2.3841552734375, -2.22125244140625, -2.058349609375, -1.89544677734375, -1.7325439453125, -1.56964111328125, -1.40673828125, -1.24383544921875, -1.0809326171875, -0.91802978515625, -0.755126953125, -0.59222412109375, -0.4293212890625, -0.26641845703125, -0.103515625, 0.05938720703125, 0.2222900390625, 0.38519287109375, 0.548095703125, 0.71099853515625, 0.8739013671875, 1.03680419921875, 1.19970703125, 1.36260986328125, 1.5255126953125, 1.68841552734375, 1.851318359375, 2.01422119140625, 2.1771240234375, 2.34002685546875, 2.5029296875, 2.66583251953125, 2.8287353515625, 2.99163818359375, 3.154541015625, 3.31744384765625, 3.4803466796875, 3.64324951171875, 3.80615234375, 3.96905517578125, 4.1319580078125, 4.29486083984375, 4.457763671875, 4.62066650390625, 4.7835693359375, 4.94647216796875, 5.109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 8.0, 16.0, 12.0, 12.0, 16.0, 20.0, 23.0, 20.0, 21.0, 30.0, 34.0, 42.0, 41.0, 34.0, 44.0, 41.0, 44.0, 46.0, 36.0, 39.0, 36.0, 37.0, 33.0, 43.0, 30.0, 31.0, 41.0, 19.0, 15.0, 27.0, 18.0, 14.0, 11.0, 12.0, 12.0, 9.0, 8.0, 8.0, 5.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.9375, -11.5865478515625, -11.235595703125, -10.8846435546875, -10.53369140625, -10.1827392578125, -9.831787109375, -9.4808349609375, -9.1298828125, -8.7789306640625, -8.427978515625, -8.0770263671875, -7.72607421875, -7.3751220703125, -7.024169921875, -6.6732177734375, -6.322265625, -5.9713134765625, -5.620361328125, -5.2694091796875, -4.91845703125, -4.5675048828125, -4.216552734375, -3.8656005859375, -3.5146484375, -3.1636962890625, -2.812744140625, -2.4617919921875, -2.11083984375, -1.7598876953125, -1.408935546875, -1.0579833984375, -0.70703125, -0.3560791015625, -0.005126953125, 0.3458251953125, 0.69677734375, 1.0477294921875, 1.398681640625, 1.7496337890625, 2.1005859375, 2.4515380859375, 2.802490234375, 3.1534423828125, 3.50439453125, 3.8553466796875, 4.206298828125, 4.5572509765625, 4.908203125, 5.2591552734375, 5.610107421875, 5.9610595703125, 6.31201171875, 6.6629638671875, 7.013916015625, 7.3648681640625, 7.7158203125, 8.0667724609375, 8.417724609375, 8.7686767578125, 9.11962890625, 9.4705810546875, 9.821533203125, 10.1724853515625, 10.5234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 22.0, 25.0, 36.0, 56.0, 83.0, 144.0, 188.0, 326.0, 462.0, 830.0, 1301.0, 2196.0, 3970.0, 7421.0, 14936.0, 32547.0, 78668.0, 202586.0, 356511.0, 202194.0, 79099.0, 32790.0, 15048.0, 7425.0, 3954.0, 2275.0, 1346.0, 725.0, 500.0, 332.0, 193.0, 113.0, 86.0, 38.0, 37.0, 23.0, 21.0, 10.0, 9.0, 3.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.72271728515625, -4.5626220703125, -4.40252685546875, -4.242431640625, -4.08233642578125, -3.9222412109375, -3.76214599609375, -3.60205078125, -3.44195556640625, -3.2818603515625, -3.12176513671875, -2.961669921875, -2.80157470703125, -2.6414794921875, -2.48138427734375, -2.3212890625, -2.16119384765625, -2.0010986328125, -1.84100341796875, -1.680908203125, -1.52081298828125, -1.3607177734375, -1.20062255859375, -1.04052734375, -0.88043212890625, -0.7203369140625, -0.56024169921875, -0.400146484375, -0.24005126953125, -0.0799560546875, 0.08013916015625, 0.240234375, 0.40032958984375, 0.5604248046875, 0.72052001953125, 0.880615234375, 1.04071044921875, 1.2008056640625, 1.36090087890625, 1.52099609375, 1.68109130859375, 1.8411865234375, 2.00128173828125, 2.161376953125, 2.32147216796875, 2.4815673828125, 2.64166259765625, 2.8017578125, 2.96185302734375, 3.1219482421875, 3.28204345703125, 3.442138671875, 3.60223388671875, 3.7623291015625, 3.92242431640625, 4.08251953125, 4.24261474609375, 4.4027099609375, 4.56280517578125, 4.722900390625, 4.88299560546875, 5.0430908203125, 5.20318603515625, 5.36328125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 5.0, 6.0, 8.0, 7.0, 5.0, 11.0, 11.0, 11.0, 12.0, 18.0, 27.0, 28.0, 26.0, 27.0, 31.0, 49.0, 27.0, 36.0, 49.0, 48.0, 29.0, 35.0, 39.0, 41.0, 38.0, 45.0, 31.0, 35.0, 35.0, 29.0, 21.0, 36.0, 31.0, 19.0, 20.0, 12.0, 16.0, 3.0, 14.0, 9.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-7.5859375, -7.362548828125, -7.13916015625, -6.915771484375, -6.6923828125, -6.468994140625, -6.24560546875, -6.022216796875, -5.798828125, -5.575439453125, -5.35205078125, -5.128662109375, -4.9052734375, -4.681884765625, -4.45849609375, -4.235107421875, -4.01171875, -3.788330078125, -3.56494140625, -3.341552734375, -3.1181640625, -2.894775390625, -2.67138671875, -2.447998046875, -2.224609375, -2.001220703125, -1.77783203125, -1.554443359375, -1.3310546875, -1.107666015625, -0.88427734375, -0.660888671875, -0.4375, -0.214111328125, 0.00927734375, 0.232666015625, 0.4560546875, 0.679443359375, 0.90283203125, 1.126220703125, 1.349609375, 1.572998046875, 1.79638671875, 2.019775390625, 2.2431640625, 2.466552734375, 2.68994140625, 2.913330078125, 3.13671875, 3.360107421875, 3.58349609375, 3.806884765625, 4.0302734375, 4.253662109375, 4.47705078125, 4.700439453125, 4.923828125, 5.147216796875, 5.37060546875, 5.593994140625, 5.8173828125, 6.040771484375, 6.26416015625, 6.487548828125, 6.7109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 2.0, 8.0, 10.0, 14.0, 25.0, 30.0, 45.0, 74.0, 96.0, 158.0, 212.0, 316.0, 546.0, 925.0, 1699.0, 3254.0, 7532.0, 24364.0, 190477.0, 726873.0, 66921.0, 14132.0, 5105.0, 2415.0, 1263.0, 705.0, 442.0, 291.0, 183.0, 128.0, 92.0, 65.0, 44.0, 25.0, 23.0, 16.0, 10.0, 8.0, 5.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.7265625, -6.5115966796875, -6.296630859375, -6.0816650390625, -5.86669921875, -5.6517333984375, -5.436767578125, -5.2218017578125, -5.0068359375, -4.7918701171875, -4.576904296875, -4.3619384765625, -4.14697265625, -3.9320068359375, -3.717041015625, -3.5020751953125, -3.287109375, -3.0721435546875, -2.857177734375, -2.6422119140625, -2.42724609375, -2.2122802734375, -1.997314453125, -1.7823486328125, -1.5673828125, -1.3524169921875, -1.137451171875, -0.9224853515625, -0.70751953125, -0.4925537109375, -0.277587890625, -0.0626220703125, 0.15234375, 0.3673095703125, 0.582275390625, 0.7972412109375, 1.01220703125, 1.2271728515625, 1.442138671875, 1.6571044921875, 1.8720703125, 2.0870361328125, 2.302001953125, 2.5169677734375, 2.73193359375, 2.9468994140625, 3.161865234375, 3.3768310546875, 3.591796875, 3.8067626953125, 4.021728515625, 4.2366943359375, 4.45166015625, 4.6666259765625, 4.881591796875, 5.0965576171875, 5.3115234375, 5.5264892578125, 5.741455078125, 5.9564208984375, 6.17138671875, 6.3863525390625, 6.601318359375, 6.8162841796875, 7.03125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 7.0, 7.0, 12.0, 18.0, 12.0, 27.0, 55.0, 61.0, 98.0, 131.0, 129.0, 137.0, 91.0, 46.0, 38.0, 24.0, 20.0, 25.0, 8.0, 8.0, 10.0, 4.0, 6.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006456375122070312, -0.0006262585520744324, -0.0006068795919418335, -0.0005875006318092346, -0.0005681216716766357, -0.0005487427115440369, -0.000529363751411438, -0.0005099847912788391, -0.0004906058311462402, -0.00047122687101364136, -0.0004518479108810425, -0.0004324689507484436, -0.0004130899906158447, -0.00039371103048324585, -0.00037433207035064697, -0.0003549531102180481, -0.0003355741500854492, -0.00031619518995285034, -0.00029681622982025146, -0.0002774372696876526, -0.0002580583095550537, -0.00023867934942245483, -0.00021930038928985596, -0.00019992142915725708, -0.0001805424690246582, -0.00016116350889205933, -0.00014178454875946045, -0.00012240558862686157, -0.0001030266284942627, -8.364766836166382e-05, -6.426870822906494e-05, -4.4889748096466064e-05, -2.5510787963867188e-05, -6.1318278312683105e-06, 1.3247132301330566e-05, 3.262609243392944e-05, 5.200505256652832e-05, 7.13840126991272e-05, 9.076297283172607e-05, 0.00011014193296432495, 0.00012952089309692383, 0.0001488998532295227, 0.00016827881336212158, 0.00018765777349472046, 0.00020703673362731934, 0.0002264156937599182, 0.0002457946538925171, 0.00026517361402511597, 0.00028455257415771484, 0.0003039315342903137, 0.0003233104944229126, 0.0003426894545555115, 0.00036206841468811035, 0.00038144737482070923, 0.0004008263349533081, 0.000420205295085907, 0.00043958425521850586, 0.00045896321535110474, 0.0004783421754837036, 0.0004977211356163025, 0.0005171000957489014, 0.0005364790558815002, 0.0005558580160140991, 0.000575236976146698, 0.0005946159362792969]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 8.0, 10.0, 19.0, 22.0, 28.0, 62.0, 76.0, 94.0, 185.0, 272.0, 398.0, 560.0, 881.0, 1265.0, 2019.0, 2961.0, 4611.0, 7274.0, 12562.0, 23117.0, 48703.0, 122724.0, 313398.0, 295086.0, 112852.0, 45513.0, 21793.0, 11900.0, 7151.0, 4469.0, 2946.0, 1886.0, 1262.0, 820.0, 541.0, 365.0, 265.0, 151.0, 102.0, 52.0, 48.0, 36.0, 17.0, 24.0, 9.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.44140625, -4.29315185546875, -4.1448974609375, -3.99664306640625, -3.848388671875, -3.70013427734375, -3.5518798828125, -3.40362548828125, -3.25537109375, -3.10711669921875, -2.9588623046875, -2.81060791015625, -2.662353515625, -2.51409912109375, -2.3658447265625, -2.21759033203125, -2.0693359375, -1.92108154296875, -1.7728271484375, -1.62457275390625, -1.476318359375, -1.32806396484375, -1.1798095703125, -1.03155517578125, -0.88330078125, -0.73504638671875, -0.5867919921875, -0.43853759765625, -0.290283203125, -0.14202880859375, 0.0062255859375, 0.15447998046875, 0.302734375, 0.45098876953125, 0.5992431640625, 0.74749755859375, 0.895751953125, 1.04400634765625, 1.1922607421875, 1.34051513671875, 1.48876953125, 1.63702392578125, 1.7852783203125, 1.93353271484375, 2.081787109375, 2.23004150390625, 2.3782958984375, 2.52655029296875, 2.6748046875, 2.82305908203125, 2.9713134765625, 3.11956787109375, 3.267822265625, 3.41607666015625, 3.5643310546875, 3.71258544921875, 3.86083984375, 4.00909423828125, 4.1573486328125, 4.30560302734375, 4.453857421875, 4.60211181640625, 4.7503662109375, 4.89862060546875, 5.046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 5.0, 3.0, 3.0, 7.0, 4.0, 5.0, 12.0, 3.0, 9.0, 20.0, 20.0, 26.0, 38.0, 49.0, 67.0, 105.0, 121.0, 119.0, 95.0, 74.0, 45.0, 32.0, 22.0, 19.0, 12.0, 13.0, 6.0, 6.0, 7.0, 8.0, 4.0, 9.0, 4.0, 2.0, 4.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.841796875, -1.7859039306640625, -1.730010986328125, -1.6741180419921875, -1.61822509765625, -1.5623321533203125, -1.506439208984375, -1.4505462646484375, -1.3946533203125, -1.3387603759765625, -1.282867431640625, -1.2269744873046875, -1.17108154296875, -1.1151885986328125, -1.059295654296875, -1.0034027099609375, -0.947509765625, -0.8916168212890625, -0.835723876953125, -0.7798309326171875, -0.72393798828125, -0.6680450439453125, -0.612152099609375, -0.5562591552734375, -0.5003662109375, -0.4444732666015625, -0.388580322265625, -0.3326873779296875, -0.27679443359375, -0.2209014892578125, -0.165008544921875, -0.1091156005859375, -0.05322265625, 0.0026702880859375, 0.058563232421875, 0.1144561767578125, 0.17034912109375, 0.2262420654296875, 0.282135009765625, 0.3380279541015625, 0.3939208984375, 0.4498138427734375, 0.505706787109375, 0.5615997314453125, 0.61749267578125, 0.6733856201171875, 0.729278564453125, 0.7851715087890625, 0.841064453125, 0.8969573974609375, 0.952850341796875, 1.0087432861328125, 1.06463623046875, 1.1205291748046875, 1.176422119140625, 1.2323150634765625, 1.2882080078125, 1.3441009521484375, 1.399993896484375, 1.4558868408203125, 1.51177978515625, 1.5676727294921875, 1.623565673828125, 1.6794586181640625, 1.7353515625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 7.0, 3.0, 13.0, 17.0, 9.0, 19.0, 15.0, 25.0, 29.0, 34.0, 29.0, 41.0, 46.0, 55.0, 53.0, 48.0, 46.0, 44.0, 41.0, 35.0, 52.0, 40.0, 38.0, 35.0, 33.0, 36.0, 30.0, 20.0, 14.0, 25.0, 13.0, 12.0, 13.0, 2.0, 5.0, 5.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.796053886413574, -10.41100788116455, -10.025961875915527, -9.640915870666504, -9.25586986541748, -8.87082290649414, -8.485776901245117, -8.100730895996094, -7.71568489074707, -7.330638885498047, -6.945592880249023, -6.560546875, -6.175500392913818, -5.790454387664795, -5.4054083824157715, -5.02036190032959, -4.635316371917725, -4.250270366668701, -3.8652241230010986, -3.480178117752075, -3.0951318740844727, -2.710085868835449, -2.325039863586426, -1.9399936199188232, -1.5549476146697998, -1.1699014902114868, -0.7848554253578186, -0.3998093605041504, -0.014763236045837402, 0.3702828884124756, 0.755328893661499, 1.1403751373291016, 1.525421142578125, 1.910467267036438, 2.295513391494751, 2.6805593967437744, 3.065605640411377, 3.4506516456604004, 3.835697650909424, 4.2207441329956055, 4.605790138244629, 4.990836143493652, 5.375882148742676, 5.760928153991699, 6.145974636077881, 6.531020641326904, 6.916066646575928, 7.301113128662109, 7.686158657073975, 8.071205139160156, 8.45625114440918, 8.841297149658203, 9.226343154907227, 9.61138916015625, 9.996435165405273, 10.381481170654297, 10.76652717590332, 11.151573181152344, 11.536619186401367, 11.92166519165039, 12.306711196899414, 12.691757202148438, 13.076803207397461, 13.4618501663208, 13.846896171569824]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 12.0, 9.0, 11.0, 14.0, 9.0, 20.0, 26.0, 20.0, 24.0, 33.0, 30.0, 39.0, 48.0, 33.0, 34.0, 46.0, 37.0, 49.0, 49.0, 37.0, 37.0, 35.0, 38.0, 42.0, 37.0, 34.0, 29.0, 23.0, 20.0, 22.0, 16.0, 12.0, 19.0, 11.0, 10.0, 11.0, 7.0, 7.0, 6.0, 1.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.813156127929688, -12.449249267578125, -12.085343360900879, -11.721437454223633, -11.35753059387207, -10.993623733520508, -10.629717826843262, -10.265811920166016, -9.901905059814453, -9.53799819946289, -9.174092292785645, -8.810186386108398, -8.446279525756836, -8.082372665405273, -7.718466758728027, -7.354560375213623, -6.990653991699219, -6.6267476081848145, -6.26284122467041, -5.898934841156006, -5.535028457641602, -5.171122074127197, -4.807215690612793, -4.443309307098389, -4.079402923583984, -3.71549654006958, -3.351590156555176, -2.9876837730407715, -2.623777389526367, -2.259871006011963, -1.8959646224975586, -1.5320582389831543, -1.1681509017944336, -0.8042445182800293, -0.440338134765625, -0.0764317512512207, 0.2874746322631836, 0.6513810157775879, 1.0152873992919922, 1.3791937828063965, 1.7431001663208008, 2.107006549835205, 2.4709129333496094, 2.8348193168640137, 3.198725700378418, 3.5626320838928223, 3.9265384674072266, 4.290444850921631, 4.654351234436035, 5.0182576179504395, 5.382164001464844, 5.746070384979248, 6.109976768493652, 6.473883152008057, 6.837789535522461, 7.201695919036865, 7.5656023025512695, 7.929508686065674, 8.293415069580078, 8.65732192993164, 9.021227836608887, 9.385133743286133, 9.749040603637695, 10.112947463989258, 10.476853370666504]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 7.0, 8.0, 11.0, 6.0, 26.0, 36.0, 58.0, 78.0, 147.0, 199.0, 311.0, 570.0, 866.0, 1416.0, 2376.0, 3947.0, 6219.0, 9496.0, 14930.0, 23251.0, 34320.0, 48084.0, 65046.0, 82407.0, 97682.0, 107500.0, 109967.0, 103440.0, 89887.0, 73227.0, 55358.0, 40207.0, 27646.0, 18034.0, 11901.0, 7498.0, 4729.0, 2876.0, 1841.0, 1102.0, 684.0, 448.0, 261.0, 175.0, 100.0, 69.0, 45.0, 28.0, 15.0, 11.0, 3.0, 5.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.375, -9.0648193359375, -8.754638671875, -8.4444580078125, -8.13427734375, -7.8240966796875, -7.513916015625, -7.2037353515625, -6.8935546875, -6.5833740234375, -6.273193359375, -5.9630126953125, -5.65283203125, -5.3426513671875, -5.032470703125, -4.7222900390625, -4.412109375, -4.1019287109375, -3.791748046875, -3.4815673828125, -3.17138671875, -2.8612060546875, -2.551025390625, -2.2408447265625, -1.9306640625, -1.6204833984375, -1.310302734375, -1.0001220703125, -0.68994140625, -0.3797607421875, -0.069580078125, 0.2406005859375, 0.55078125, 0.8609619140625, 1.171142578125, 1.4813232421875, 1.79150390625, 2.1016845703125, 2.411865234375, 2.7220458984375, 3.0322265625, 3.3424072265625, 3.652587890625, 3.9627685546875, 4.27294921875, 4.5831298828125, 4.893310546875, 5.2034912109375, 5.513671875, 5.8238525390625, 6.134033203125, 6.4442138671875, 6.75439453125, 7.0645751953125, 7.374755859375, 7.6849365234375, 7.9951171875, 8.3052978515625, 8.615478515625, 8.9256591796875, 9.23583984375, 9.5460205078125, 9.856201171875, 10.1663818359375, 10.4765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 6.0, 10.0, 10.0, 9.0, 16.0, 16.0, 19.0, 21.0, 25.0, 24.0, 31.0, 33.0, 37.0, 48.0, 37.0, 33.0, 48.0, 35.0, 50.0, 40.0, 42.0, 34.0, 39.0, 42.0, 36.0, 33.0, 33.0, 27.0, 26.0, 20.0, 18.0, 17.0, 16.0, 15.0, 10.0, 11.0, 10.0, 8.0, 8.0, 4.0, 0.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1015625, -11.7554931640625, -11.409423828125, -11.0633544921875, -10.71728515625, -10.3712158203125, -10.025146484375, -9.6790771484375, -9.3330078125, -8.9869384765625, -8.640869140625, -8.2947998046875, -7.94873046875, -7.6026611328125, -7.256591796875, -6.9105224609375, -6.564453125, -6.2183837890625, -5.872314453125, -5.5262451171875, -5.18017578125, -4.8341064453125, -4.488037109375, -4.1419677734375, -3.7958984375, -3.4498291015625, -3.103759765625, -2.7576904296875, -2.41162109375, -2.0655517578125, -1.719482421875, -1.3734130859375, -1.02734375, -0.6812744140625, -0.335205078125, 0.0108642578125, 0.35693359375, 0.7030029296875, 1.049072265625, 1.3951416015625, 1.7412109375, 2.0872802734375, 2.433349609375, 2.7794189453125, 3.12548828125, 3.4715576171875, 3.817626953125, 4.1636962890625, 4.509765625, 4.8558349609375, 5.201904296875, 5.5479736328125, 5.89404296875, 6.2401123046875, 6.586181640625, 6.9322509765625, 7.2783203125, 7.6243896484375, 7.970458984375, 8.3165283203125, 8.66259765625, 9.0086669921875, 9.354736328125, 9.7008056640625, 10.046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 5.0, 8.0, 8.0, 16.0, 20.0, 32.0, 56.0, 68.0, 124.0, 202.0, 301.0, 488.0, 789.0, 1278.0, 2123.0, 3349.0, 5397.0, 9014.0, 14292.0, 22458.0, 33978.0, 49539.0, 68166.0, 88267.0, 104977.0, 115340.0, 115666.0, 106627.0, 89329.0, 69445.0, 50503.0, 34883.0, 23044.0, 14934.0, 9170.0, 5577.0, 3427.0, 2057.0, 1371.0, 837.0, 520.0, 304.0, 193.0, 133.0, 76.0, 60.0, 43.0, 25.0, 16.0, 10.0, 7.0, 0.0, 4.0, 3.0, 1.0, 2.0, 2.0], "bins": [-11.1328125, -10.7957763671875, -10.458740234375, -10.1217041015625, -9.78466796875, -9.4476318359375, -9.110595703125, -8.7735595703125, -8.4365234375, -8.0994873046875, -7.762451171875, -7.4254150390625, -7.08837890625, -6.7513427734375, -6.414306640625, -6.0772705078125, -5.740234375, -5.4031982421875, -5.066162109375, -4.7291259765625, -4.39208984375, -4.0550537109375, -3.718017578125, -3.3809814453125, -3.0439453125, -2.7069091796875, -2.369873046875, -2.0328369140625, -1.69580078125, -1.3587646484375, -1.021728515625, -0.6846923828125, -0.34765625, -0.0106201171875, 0.326416015625, 0.6634521484375, 1.00048828125, 1.3375244140625, 1.674560546875, 2.0115966796875, 2.3486328125, 2.6856689453125, 3.022705078125, 3.3597412109375, 3.69677734375, 4.0338134765625, 4.370849609375, 4.7078857421875, 5.044921875, 5.3819580078125, 5.718994140625, 6.0560302734375, 6.39306640625, 6.7301025390625, 7.067138671875, 7.4041748046875, 7.7412109375, 8.0782470703125, 8.415283203125, 8.7523193359375, 9.08935546875, 9.4263916015625, 9.763427734375, 10.1004638671875, 10.4375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 9.0, 5.0, 11.0, 12.0, 20.0, 22.0, 25.0, 15.0, 32.0, 30.0, 35.0, 34.0, 39.0, 44.0, 40.0, 36.0, 32.0, 58.0, 43.0, 48.0, 38.0, 33.0, 28.0, 40.0, 44.0, 40.0, 31.0, 19.0, 27.0, 21.0, 15.0, 13.0, 13.0, 12.0, 16.0, 3.0, 4.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.80859375, -7.5697021484375, -7.330810546875, -7.0919189453125, -6.85302734375, -6.6141357421875, -6.375244140625, -6.1363525390625, -5.8974609375, -5.6585693359375, -5.419677734375, -5.1807861328125, -4.94189453125, -4.7030029296875, -4.464111328125, -4.2252197265625, -3.986328125, -3.7474365234375, -3.508544921875, -3.2696533203125, -3.03076171875, -2.7918701171875, -2.552978515625, -2.3140869140625, -2.0751953125, -1.8363037109375, -1.597412109375, -1.3585205078125, -1.11962890625, -0.8807373046875, -0.641845703125, -0.4029541015625, -0.1640625, 0.0748291015625, 0.313720703125, 0.5526123046875, 0.79150390625, 1.0303955078125, 1.269287109375, 1.5081787109375, 1.7470703125, 1.9859619140625, 2.224853515625, 2.4637451171875, 2.70263671875, 2.9415283203125, 3.180419921875, 3.4193115234375, 3.658203125, 3.8970947265625, 4.135986328125, 4.3748779296875, 4.61376953125, 4.8526611328125, 5.091552734375, 5.3304443359375, 5.5693359375, 5.8082275390625, 6.047119140625, 6.2860107421875, 6.52490234375, 6.7637939453125, 7.002685546875, 7.2415771484375, 7.48046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 8.0, 15.0, 19.0, 22.0, 37.0, 39.0, 64.0, 96.0, 133.0, 201.0, 335.0, 451.0, 717.0, 1156.0, 1912.0, 2985.0, 5123.0, 8514.0, 15091.0, 27037.0, 48088.0, 81693.0, 125855.0, 165203.0, 173426.0, 145353.0, 100606.0, 61519.0, 35479.0, 19758.0, 11035.0, 6494.0, 3713.0, 2306.0, 1415.0, 909.0, 592.0, 385.0, 228.0, 169.0, 112.0, 79.0, 66.0, 27.0, 28.0, 17.0, 8.0, 15.0, 7.0, 4.0, 5.0, 2.0, 3.0, 3.0], "bins": [-6.3671875, -6.18115234375, -5.9951171875, -5.80908203125, -5.623046875, -5.43701171875, -5.2509765625, -5.06494140625, -4.87890625, -4.69287109375, -4.5068359375, -4.32080078125, -4.134765625, -3.94873046875, -3.7626953125, -3.57666015625, -3.390625, -3.20458984375, -3.0185546875, -2.83251953125, -2.646484375, -2.46044921875, -2.2744140625, -2.08837890625, -1.90234375, -1.71630859375, -1.5302734375, -1.34423828125, -1.158203125, -0.97216796875, -0.7861328125, -0.60009765625, -0.4140625, -0.22802734375, -0.0419921875, 0.14404296875, 0.330078125, 0.51611328125, 0.7021484375, 0.88818359375, 1.07421875, 1.26025390625, 1.4462890625, 1.63232421875, 1.818359375, 2.00439453125, 2.1904296875, 2.37646484375, 2.5625, 2.74853515625, 2.9345703125, 3.12060546875, 3.306640625, 3.49267578125, 3.6787109375, 3.86474609375, 4.05078125, 4.23681640625, 4.4228515625, 4.60888671875, 4.794921875, 4.98095703125, 5.1669921875, 5.35302734375, 5.5390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 11.0, 10.0, 12.0, 22.0, 22.0, 22.0, 27.0, 36.0, 39.0, 39.0, 46.0, 60.0, 52.0, 59.0, 60.0, 56.0, 50.0, 48.0, 48.0, 26.0, 44.0, 40.0, 30.0, 29.0, 20.0, 14.0, 16.0, 7.0, 5.0, 11.0, 7.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006170272827148438, -0.0005972012877464294, -0.0005773752927780151, -0.0005575492978096008, -0.0005377233028411865, -0.0005178973078727722, -0.0004980713129043579, -0.0004782453179359436, -0.0004584193229675293, -0.000438593327999115, -0.0004187673330307007, -0.0003989413380622864, -0.00037911534309387207, -0.00035928934812545776, -0.00033946335315704346, -0.00031963735818862915, -0.00029981136322021484, -0.00027998536825180054, -0.00026015937328338623, -0.00024033337831497192, -0.00022050738334655762, -0.0002006813883781433, -0.000180855393409729, -0.0001610293984413147, -0.0001412034034729004, -0.00012137740850448608, -0.00010155141353607178, -8.172541856765747e-05, -6.189942359924316e-05, -4.207342863082886e-05, -2.224743366241455e-05, -2.421438694000244e-06, 1.7404556274414062e-05, 3.723055124282837e-05, 5.7056546211242676e-05, 7.688254117965698e-05, 9.670853614807129e-05, 0.0001165345311164856, 0.0001363605260848999, 0.0001561865210533142, 0.00017601251602172852, 0.00019583851099014282, 0.00021566450595855713, 0.00023549050092697144, 0.00025531649589538574, 0.00027514249086380005, 0.00029496848583221436, 0.00031479448080062866, 0.00033462047576904297, 0.0003544464707374573, 0.0003742724657058716, 0.0003940984606742859, 0.0004139244556427002, 0.0004337504506111145, 0.0004535764455795288, 0.0004734024405479431, 0.0004932284355163574, 0.0005130544304847717, 0.000532880425453186, 0.0005527064204216003, 0.0005725324153900146, 0.000592358410358429, 0.0006121844053268433, 0.0006320104002952576, 0.0006518363952636719]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 7.0, 13.0, 9.0, 14.0, 16.0, 26.0, 41.0, 55.0, 84.0, 112.0, 171.0, 241.0, 378.0, 541.0, 769.0, 1159.0, 1583.0, 2500.0, 3877.0, 6207.0, 10221.0, 16968.0, 27827.0, 45225.0, 71560.0, 104428.0, 134548.0, 149909.0, 141547.0, 113135.0, 79985.0, 51585.0, 32303.0, 19578.0, 11718.0, 7162.0, 4566.0, 2770.0, 1813.0, 1225.0, 794.0, 574.0, 411.0, 258.0, 171.0, 132.0, 96.0, 73.0, 55.0, 42.0, 26.0, 19.0, 11.0, 11.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0], "bins": [-5.4921875, -5.318603515625, -5.14501953125, -4.971435546875, -4.7978515625, -4.624267578125, -4.45068359375, -4.277099609375, -4.103515625, -3.929931640625, -3.75634765625, -3.582763671875, -3.4091796875, -3.235595703125, -3.06201171875, -2.888427734375, -2.71484375, -2.541259765625, -2.36767578125, -2.194091796875, -2.0205078125, -1.846923828125, -1.67333984375, -1.499755859375, -1.326171875, -1.152587890625, -0.97900390625, -0.805419921875, -0.6318359375, -0.458251953125, -0.28466796875, -0.111083984375, 0.0625, 0.236083984375, 0.40966796875, 0.583251953125, 0.7568359375, 0.930419921875, 1.10400390625, 1.277587890625, 1.451171875, 1.624755859375, 1.79833984375, 1.971923828125, 2.1455078125, 2.319091796875, 2.49267578125, 2.666259765625, 2.83984375, 3.013427734375, 3.18701171875, 3.360595703125, 3.5341796875, 3.707763671875, 3.88134765625, 4.054931640625, 4.228515625, 4.402099609375, 4.57568359375, 4.749267578125, 4.9228515625, 5.096435546875, 5.27001953125, 5.443603515625, 5.6171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 8.0, 10.0, 14.0, 14.0, 16.0, 22.0, 30.0, 28.0, 34.0, 55.0, 57.0, 70.0, 69.0, 73.0, 63.0, 71.0, 50.0, 52.0, 66.0, 39.0, 42.0, 22.0, 21.0, 16.0, 15.0, 8.0, 9.0, 6.0, 4.0, 0.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.53125, -2.448883056640625, -2.36651611328125, -2.284149169921875, -2.2017822265625, -2.119415283203125, -2.03704833984375, -1.954681396484375, -1.872314453125, -1.789947509765625, -1.70758056640625, -1.625213623046875, -1.5428466796875, -1.460479736328125, -1.37811279296875, -1.295745849609375, -1.21337890625, -1.131011962890625, -1.04864501953125, -0.966278076171875, -0.8839111328125, -0.801544189453125, -0.71917724609375, -0.636810302734375, -0.554443359375, -0.472076416015625, -0.38970947265625, -0.307342529296875, -0.2249755859375, -0.142608642578125, -0.06024169921875, 0.022125244140625, 0.1044921875, 0.186859130859375, 0.26922607421875, 0.351593017578125, 0.4339599609375, 0.516326904296875, 0.59869384765625, 0.681060791015625, 0.763427734375, 0.845794677734375, 0.92816162109375, 1.010528564453125, 1.0928955078125, 1.175262451171875, 1.25762939453125, 1.339996337890625, 1.42236328125, 1.504730224609375, 1.58709716796875, 1.669464111328125, 1.7518310546875, 1.834197998046875, 1.91656494140625, 1.998931884765625, 2.081298828125, 2.163665771484375, 2.24603271484375, 2.328399658203125, 2.4107666015625, 2.493133544921875, 2.57550048828125, 2.657867431640625, 2.740234375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 3.0, 5.0, 8.0, 8.0, 12.0, 5.0, 17.0, 15.0, 29.0, 24.0, 21.0, 26.0, 35.0, 43.0, 47.0, 40.0, 44.0, 49.0, 36.0, 50.0, 47.0, 37.0, 35.0, 44.0, 42.0, 34.0, 34.0, 26.0, 32.0, 25.0, 28.0, 20.0, 24.0, 8.0, 9.0, 9.0, 6.0, 3.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.549898147583008, -10.191729545593262, -9.833560943603516, -9.475393295288086, -9.11722469329834, -8.759056091308594, -8.400887489318848, -8.042718887329102, -7.684550762176514, -7.326382160186768, -6.96821403503418, -6.610045433044434, -6.2518768310546875, -5.8937087059021, -5.5355401039123535, -5.177371978759766, -4.8192033767700195, -4.461034774780273, -4.1028666496276855, -3.7446980476379395, -3.3865296840667725, -3.0283613204956055, -2.6701927185058594, -2.3120243549346924, -1.9538559913635254, -1.5956876277923584, -1.2375191450119019, -0.8793506622314453, -0.5211822986602783, -0.16301393508911133, 0.19515466690063477, 0.5533230304718018, 0.9114904403686523, 1.2696588039398193, 1.6278272867202759, 1.9859957695007324, 2.3441641330718994, 2.7023324966430664, 3.0605010986328125, 3.4186694622039795, 3.7768378257751465, 4.135006427764893, 4.4931745529174805, 4.851343154907227, 5.209511756896973, 5.5676798820495605, 5.925848484039307, 6.2840166091918945, 6.642185211181641, 7.000353813171387, 7.358521938323975, 7.716690540313721, 8.074858665466309, 8.433027267456055, 8.7911958694458, 9.149364471435547, 9.507532119750977, 9.865700721740723, 10.223869323730469, 10.582036972045898, 10.940205574035645, 11.29837417602539, 11.656542778015137, 12.014711380004883, 12.372879981994629]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 3.0, 5.0, 5.0, 7.0, 18.0, 11.0, 20.0, 14.0, 24.0, 35.0, 29.0, 23.0, 36.0, 29.0, 36.0, 43.0, 56.0, 42.0, 32.0, 41.0, 51.0, 48.0, 45.0, 35.0, 34.0, 26.0, 36.0, 32.0, 30.0, 27.0, 19.0, 18.0, 17.0, 12.0, 21.0, 9.0, 6.0, 7.0, 7.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-13.709505081176758, -13.33723258972168, -12.964960098266602, -12.592687606811523, -12.220415115356445, -11.848142623901367, -11.475870132446289, -11.103597640991211, -10.731325149536133, -10.359052658081055, -9.986780166625977, -9.614507675170898, -9.24223518371582, -8.869962692260742, -8.497690200805664, -8.125417709350586, -7.753144264221191, -7.380871772766113, -7.008599281311035, -6.636326789855957, -6.264054298400879, -5.891781806945801, -5.5195088386535645, -5.147236347198486, -4.774963855743408, -4.40269136428833, -4.030418872833252, -3.6581461429595947, -3.2858736515045166, -2.9136011600494385, -2.5413284301757812, -2.169055938720703, -1.7967844009399414, -1.4245119094848633, -1.0522392988204956, -0.6799666881561279, -0.3076941967010498, 0.06457829475402832, 0.43685102462768555, 0.8091235160827637, 1.1813960075378418, 1.55366849899292, 1.9259411096572876, 2.2982137203216553, 2.6704862117767334, 3.0427587032318115, 3.4150314331054688, 3.787303924560547, 4.159576416015625, 4.531848907470703, 4.904121398925781, 5.276393890380859, 5.6486663818359375, 6.020938873291016, 6.393211841583252, 6.76548433303833, 7.137756824493408, 7.510029315948486, 7.8823018074035645, 8.2545747756958, 8.626847267150879, 8.999119758605957, 9.371392250061035, 9.743664741516113, 10.115937232971191]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 11.0, 10.0, 23.0, 38.0, 62.0, 91.0, 146.0, 238.0, 420.0, 724.0, 1148.0, 2005.0, 3293.0, 5302.0, 9013.0, 14774.0, 23587.0, 37705.0, 58117.0, 90957.0, 135359.0, 195405.0, 271458.0, 352605.0, 428961.0, 472991.0, 472024.0, 426246.0, 352805.0, 268685.0, 194300.0, 133283.0, 89167.0, 57700.0, 36628.0, 23087.0, 14293.0, 8588.0, 5308.0, 3144.0, 1855.0, 1119.0, 661.0, 376.0, 256.0, 131.0, 69.0, 56.0, 29.0, 14.0, 12.0, 6.0, 3.0, 1.0, 1.0, 1.0], "bins": [-9.3125, -9.0384521484375, -8.764404296875, -8.4903564453125, -8.21630859375, -7.9422607421875, -7.668212890625, -7.3941650390625, -7.1201171875, -6.8460693359375, -6.572021484375, -6.2979736328125, -6.02392578125, -5.7498779296875, -5.475830078125, -5.2017822265625, -4.927734375, -4.6536865234375, -4.379638671875, -4.1055908203125, -3.83154296875, -3.5574951171875, -3.283447265625, -3.0093994140625, -2.7353515625, -2.4613037109375, -2.187255859375, -1.9132080078125, -1.63916015625, -1.3651123046875, -1.091064453125, -0.8170166015625, -0.54296875, -0.2689208984375, 0.005126953125, 0.2791748046875, 0.55322265625, 0.8272705078125, 1.101318359375, 1.3753662109375, 1.6494140625, 1.9234619140625, 2.197509765625, 2.4715576171875, 2.74560546875, 3.0196533203125, 3.293701171875, 3.5677490234375, 3.841796875, 4.1158447265625, 4.389892578125, 4.6639404296875, 4.93798828125, 5.2120361328125, 5.486083984375, 5.7601318359375, 6.0341796875, 6.3082275390625, 6.582275390625, 6.8563232421875, 7.13037109375, 7.4044189453125, 7.678466796875, 7.9525146484375, 8.2265625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 7.0, 8.0, 9.0, 12.0, 18.0, 13.0, 25.0, 25.0, 33.0, 26.0, 24.0, 39.0, 33.0, 38.0, 40.0, 51.0, 44.0, 38.0, 41.0, 40.0, 51.0, 43.0, 40.0, 30.0, 23.0, 37.0, 32.0, 30.0, 18.0, 18.0, 15.0, 15.0, 20.0, 16.0, 11.0, 4.0, 8.0, 7.0, 3.0, 4.0, 6.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-11.4609375, -11.145263671875, -10.82958984375, -10.513916015625, -10.1982421875, -9.882568359375, -9.56689453125, -9.251220703125, -8.935546875, -8.619873046875, -8.30419921875, -7.988525390625, -7.6728515625, -7.357177734375, -7.04150390625, -6.725830078125, -6.41015625, -6.094482421875, -5.77880859375, -5.463134765625, -5.1474609375, -4.831787109375, -4.51611328125, -4.200439453125, -3.884765625, -3.569091796875, -3.25341796875, -2.937744140625, -2.6220703125, -2.306396484375, -1.99072265625, -1.675048828125, -1.359375, -1.043701171875, -0.72802734375, -0.412353515625, -0.0966796875, 0.218994140625, 0.53466796875, 0.850341796875, 1.166015625, 1.481689453125, 1.79736328125, 2.113037109375, 2.4287109375, 2.744384765625, 3.06005859375, 3.375732421875, 3.69140625, 4.007080078125, 4.32275390625, 4.638427734375, 4.9541015625, 5.269775390625, 5.58544921875, 5.901123046875, 6.216796875, 6.532470703125, 6.84814453125, 7.163818359375, 7.4794921875, 7.795166015625, 8.11083984375, 8.426513671875, 8.7421875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 6.0, 14.0, 18.0, 32.0, 46.0, 97.0, 137.0, 231.0, 362.0, 663.0, 1011.0, 1727.0, 2769.0, 4569.0, 7138.0, 11590.0, 18281.0, 28356.0, 42404.0, 63441.0, 92574.0, 130143.0, 176899.0, 232033.0, 290523.0, 343948.0, 383431.0, 400492.0, 391579.0, 358237.0, 308882.0, 249979.0, 195120.0, 144438.0, 103793.0, 71738.0, 49058.0, 32290.0, 20886.0, 13386.0, 8525.0, 5275.0, 3292.0, 1858.0, 1240.0, 724.0, 414.0, 254.0, 163.0, 94.0, 46.0, 42.0, 19.0, 9.0, 11.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-8.046875, -7.792724609375, -7.53857421875, -7.284423828125, -7.0302734375, -6.776123046875, -6.52197265625, -6.267822265625, -6.013671875, -5.759521484375, -5.50537109375, -5.251220703125, -4.9970703125, -4.742919921875, -4.48876953125, -4.234619140625, -3.98046875, -3.726318359375, -3.47216796875, -3.218017578125, -2.9638671875, -2.709716796875, -2.45556640625, -2.201416015625, -1.947265625, -1.693115234375, -1.43896484375, -1.184814453125, -0.9306640625, -0.676513671875, -0.42236328125, -0.168212890625, 0.0859375, 0.340087890625, 0.59423828125, 0.848388671875, 1.1025390625, 1.356689453125, 1.61083984375, 1.864990234375, 2.119140625, 2.373291015625, 2.62744140625, 2.881591796875, 3.1357421875, 3.389892578125, 3.64404296875, 3.898193359375, 4.15234375, 4.406494140625, 4.66064453125, 4.914794921875, 5.1689453125, 5.423095703125, 5.67724609375, 5.931396484375, 6.185546875, 6.439697265625, 6.69384765625, 6.947998046875, 7.2021484375, 7.456298828125, 7.71044921875, 7.964599609375, 8.21875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 10.0, 15.0, 23.0, 25.0, 35.0, 39.0, 47.0, 49.0, 75.0, 67.0, 79.0, 115.0, 132.0, 153.0, 158.0, 180.0, 203.0, 198.0, 200.0, 213.0, 219.0, 216.0, 167.0, 188.0, 178.0, 169.0, 155.0, 124.0, 107.0, 85.0, 93.0, 57.0, 54.0, 47.0, 43.0, 37.0, 22.0, 18.0, 25.0, 14.0, 12.0, 4.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.81640625, -4.6710205078125, -4.525634765625, -4.3802490234375, -4.23486328125, -4.0894775390625, -3.944091796875, -3.7987060546875, -3.6533203125, -3.5079345703125, -3.362548828125, -3.2171630859375, -3.07177734375, -2.9263916015625, -2.781005859375, -2.6356201171875, -2.490234375, -2.3448486328125, -2.199462890625, -2.0540771484375, -1.90869140625, -1.7633056640625, -1.617919921875, -1.4725341796875, -1.3271484375, -1.1817626953125, -1.036376953125, -0.8909912109375, -0.74560546875, -0.6002197265625, -0.454833984375, -0.3094482421875, -0.1640625, -0.0186767578125, 0.126708984375, 0.2720947265625, 0.41748046875, 0.5628662109375, 0.708251953125, 0.8536376953125, 0.9990234375, 1.1444091796875, 1.289794921875, 1.4351806640625, 1.58056640625, 1.7259521484375, 1.871337890625, 2.0167236328125, 2.162109375, 2.3074951171875, 2.452880859375, 2.5982666015625, 2.74365234375, 2.8890380859375, 3.034423828125, 3.1798095703125, 3.3251953125, 3.4705810546875, 3.615966796875, 3.7613525390625, 3.90673828125, 4.0521240234375, 4.197509765625, 4.3428955078125, 4.48828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 5.0, 7.0, 7.0, 11.0, 8.0, 17.0, 26.0, 27.0, 21.0, 19.0, 38.0, 27.0, 52.0, 36.0, 70.0, 40.0, 32.0, 39.0, 38.0, 51.0, 42.0, 38.0, 51.0, 32.0, 34.0, 23.0, 31.0, 35.0, 23.0, 19.0, 18.0, 11.0, 8.0, 9.0, 12.0, 10.0, 7.0, 8.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.796188354492188, -9.425966262817383, -9.055744171142578, -8.685522079467773, -8.315299987792969, -7.945078372955322, -7.574856758117676, -7.204634666442871, -6.834412574768066, -6.464190483093262, -6.093968391418457, -5.7237467765808105, -5.353524684906006, -4.983302593231201, -4.613080978393555, -4.24285888671875, -3.8726367950439453, -3.5024147033691406, -3.132192850112915, -2.7619709968566895, -2.3917489051818848, -2.02152681350708, -1.6513049602508545, -1.281083106994629, -0.9108610153198242, -0.5406390428543091, -0.17041707038879395, 0.1998049020767212, 0.5700268745422363, 0.9402488470077515, 1.3104708194732666, 1.6806926727294922, 2.0509138107299805, 2.421135902404785, 2.7913577556610107, 3.1615796089172363, 3.531801700592041, 3.9020237922668457, 4.272245407104492, 4.642467498779297, 5.012689590454102, 5.382911682128906, 5.753133773803711, 6.123355388641357, 6.493577480316162, 6.863799571990967, 7.234021186828613, 7.604243278503418, 7.974465370178223, 8.344687461853027, 8.714909553527832, 9.085131645202637, 9.455352783203125, 9.82557487487793, 10.195796966552734, 10.566019058227539, 10.936241149902344, 11.306463241577148, 11.676685333251953, 12.046907424926758, 12.417129516601562, 12.78735065460205, 13.157572746276855, 13.52779483795166, 13.898016929626465]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 3.0, 6.0, 3.0, 7.0, 7.0, 9.0, 12.0, 12.0, 14.0, 23.0, 18.0, 20.0, 28.0, 29.0, 31.0, 23.0, 40.0, 35.0, 45.0, 39.0, 31.0, 35.0, 48.0, 40.0, 41.0, 49.0, 43.0, 35.0, 27.0, 38.0, 36.0, 26.0, 20.0, 23.0, 20.0, 13.0, 20.0, 10.0, 9.0, 11.0, 8.0, 6.0, 4.0, 2.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-12.916873931884766, -12.552591323852539, -12.188308715820312, -11.82402515411377, -11.459742546081543, -11.095459938049316, -10.731176376342773, -10.366893768310547, -10.00261116027832, -9.638328552246094, -9.274045944213867, -8.909762382507324, -8.545479774475098, -8.181197166442871, -7.816914081573486, -7.452630996704102, -7.088348388671875, -6.724065780639648, -6.359782695770264, -5.995499610900879, -5.631217002868652, -5.266934394836426, -4.902651309967041, -4.538368225097656, -4.17408561706543, -3.809802770614624, -3.4455199241638184, -3.0812370777130127, -2.716954231262207, -2.3526713848114014, -1.9883885383605957, -1.62410569190979, -1.2598237991333008, -0.8955409526824951, -0.5312581062316895, -0.1669752597808838, 0.19730758666992188, 0.5615904331207275, 0.9258732795715332, 1.2901561260223389, 1.6544389724731445, 2.01872181892395, 2.383004665374756, 2.7472875118255615, 3.111570358276367, 3.475853204727173, 3.8401360511779785, 4.204419136047363, 4.56870174407959, 4.932984352111816, 5.297267436981201, 5.661550521850586, 6.0258331298828125, 6.390115737915039, 6.754398822784424, 7.118681907653809, 7.482964515686035, 7.847247123718262, 8.211530685424805, 8.575813293457031, 8.940095901489258, 9.304378509521484, 9.668661117553711, 10.032944679260254, 10.39722728729248]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 7.0, 9.0, 8.0, 23.0, 22.0, 33.0, 43.0, 57.0, 79.0, 124.0, 171.0, 258.0, 390.0, 542.0, 839.0, 1230.0, 1906.0, 2953.0, 4522.0, 7345.0, 11421.0, 18451.0, 29690.0, 47336.0, 75033.0, 113991.0, 157178.0, 173175.0, 139698.0, 96155.0, 61618.0, 38727.0, 24055.0, 14999.0, 9490.0, 5973.0, 3754.0, 2405.0, 1560.0, 1079.0, 737.0, 471.0, 326.0, 198.0, 133.0, 101.0, 93.0, 46.0, 42.0, 29.0, 10.0, 9.0, 7.0, 8.0, 1.0, 5.0, 2.0, 0.0, 1.0], "bins": [-4.42578125, -4.2886962890625, -4.151611328125, -4.0145263671875, -3.87744140625, -3.7403564453125, -3.603271484375, -3.4661865234375, -3.3291015625, -3.1920166015625, -3.054931640625, -2.9178466796875, -2.78076171875, -2.6436767578125, -2.506591796875, -2.3695068359375, -2.232421875, -2.0953369140625, -1.958251953125, -1.8211669921875, -1.68408203125, -1.5469970703125, -1.409912109375, -1.2728271484375, -1.1357421875, -0.9986572265625, -0.861572265625, -0.7244873046875, -0.58740234375, -0.4503173828125, -0.313232421875, -0.1761474609375, -0.0390625, 0.0980224609375, 0.235107421875, 0.3721923828125, 0.50927734375, 0.6463623046875, 0.783447265625, 0.9205322265625, 1.0576171875, 1.1947021484375, 1.331787109375, 1.4688720703125, 1.60595703125, 1.7430419921875, 1.880126953125, 2.0172119140625, 2.154296875, 2.2913818359375, 2.428466796875, 2.5655517578125, 2.70263671875, 2.8397216796875, 2.976806640625, 3.1138916015625, 3.2509765625, 3.3880615234375, 3.525146484375, 3.6622314453125, 3.79931640625, 3.9364013671875, 4.073486328125, 4.2105712890625, 4.34765625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 8.0, 8.0, 8.0, 11.0, 13.0, 13.0, 23.0, 18.0, 19.0, 27.0, 30.0, 32.0, 23.0, 41.0, 34.0, 39.0, 45.0, 30.0, 37.0, 50.0, 38.0, 43.0, 47.0, 44.0, 34.0, 26.0, 36.0, 41.0, 23.0, 20.0, 23.0, 20.0, 14.0, 21.0, 8.0, 10.0, 9.0, 10.0, 5.0, 4.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-12.78125, -12.419677734375, -12.05810546875, -11.696533203125, -11.3349609375, -10.973388671875, -10.61181640625, -10.250244140625, -9.888671875, -9.527099609375, -9.16552734375, -8.803955078125, -8.4423828125, -8.080810546875, -7.71923828125, -7.357666015625, -6.99609375, -6.634521484375, -6.27294921875, -5.911376953125, -5.5498046875, -5.188232421875, -4.82666015625, -4.465087890625, -4.103515625, -3.741943359375, -3.38037109375, -3.018798828125, -2.6572265625, -2.295654296875, -1.93408203125, -1.572509765625, -1.2109375, -0.849365234375, -0.48779296875, -0.126220703125, 0.2353515625, 0.596923828125, 0.95849609375, 1.320068359375, 1.681640625, 2.043212890625, 2.40478515625, 2.766357421875, 3.1279296875, 3.489501953125, 3.85107421875, 4.212646484375, 4.57421875, 4.935791015625, 5.29736328125, 5.658935546875, 6.0205078125, 6.382080078125, 6.74365234375, 7.105224609375, 7.466796875, 7.828369140625, 8.18994140625, 8.551513671875, 8.9130859375, 9.274658203125, 9.63623046875, 9.997802734375, 10.359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 6.0, 12.0, 15.0, 24.0, 23.0, 43.0, 57.0, 72.0, 117.0, 170.0, 223.0, 327.0, 457.0, 678.0, 1022.0, 1495.0, 2265.0, 3871.0, 6095.0, 10322.0, 18469.0, 33923.0, 65423.0, 128342.0, 227256.0, 241836.0, 144525.0, 73877.0, 37846.0, 20128.0, 11393.0, 6710.0, 4068.0, 2512.0, 1564.0, 1082.0, 687.0, 520.0, 323.0, 245.0, 155.0, 105.0, 72.0, 62.0, 36.0, 37.0, 20.0, 19.0, 5.0, 8.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-3.740234375, -3.61993408203125, -3.4996337890625, -3.37933349609375, -3.259033203125, -3.13873291015625, -3.0184326171875, -2.89813232421875, -2.77783203125, -2.65753173828125, -2.5372314453125, -2.41693115234375, -2.296630859375, -2.17633056640625, -2.0560302734375, -1.93572998046875, -1.8154296875, -1.69512939453125, -1.5748291015625, -1.45452880859375, -1.334228515625, -1.21392822265625, -1.0936279296875, -0.97332763671875, -0.85302734375, -0.73272705078125, -0.6124267578125, -0.49212646484375, -0.371826171875, -0.25152587890625, -0.1312255859375, -0.01092529296875, 0.109375, 0.22967529296875, 0.3499755859375, 0.47027587890625, 0.590576171875, 0.71087646484375, 0.8311767578125, 0.95147705078125, 1.07177734375, 1.19207763671875, 1.3123779296875, 1.43267822265625, 1.552978515625, 1.67327880859375, 1.7935791015625, 1.91387939453125, 2.0341796875, 2.15447998046875, 2.2747802734375, 2.39508056640625, 2.515380859375, 2.63568115234375, 2.7559814453125, 2.87628173828125, 2.99658203125, 3.11688232421875, 3.2371826171875, 3.35748291015625, 3.477783203125, 3.59808349609375, 3.7183837890625, 3.83868408203125, 3.958984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 7.0, 2.0, 8.0, 7.0, 8.0, 11.0, 15.0, 14.0, 16.0, 26.0, 23.0, 29.0, 24.0, 29.0, 22.0, 31.0, 40.0, 32.0, 33.0, 39.0, 38.0, 46.0, 33.0, 34.0, 40.0, 34.0, 45.0, 47.0, 33.0, 25.0, 31.0, 24.0, 28.0, 21.0, 20.0, 14.0, 17.0, 9.0, 18.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.484375, -6.259033203125, -6.03369140625, -5.808349609375, -5.5830078125, -5.357666015625, -5.13232421875, -4.906982421875, -4.681640625, -4.456298828125, -4.23095703125, -4.005615234375, -3.7802734375, -3.554931640625, -3.32958984375, -3.104248046875, -2.87890625, -2.653564453125, -2.42822265625, -2.202880859375, -1.9775390625, -1.752197265625, -1.52685546875, -1.301513671875, -1.076171875, -0.850830078125, -0.62548828125, -0.400146484375, -0.1748046875, 0.050537109375, 0.27587890625, 0.501220703125, 0.7265625, 0.951904296875, 1.17724609375, 1.402587890625, 1.6279296875, 1.853271484375, 2.07861328125, 2.303955078125, 2.529296875, 2.754638671875, 2.97998046875, 3.205322265625, 3.4306640625, 3.656005859375, 3.88134765625, 4.106689453125, 4.33203125, 4.557373046875, 4.78271484375, 5.008056640625, 5.2333984375, 5.458740234375, 5.68408203125, 5.909423828125, 6.134765625, 6.360107421875, 6.58544921875, 6.810791015625, 7.0361328125, 7.261474609375, 7.48681640625, 7.712158203125, 7.9375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 10.0, 7.0, 11.0, 18.0, 16.0, 29.0, 31.0, 58.0, 63.0, 71.0, 108.0, 181.0, 249.0, 400.0, 679.0, 1192.0, 2361.0, 5183.0, 13291.0, 41139.0, 181612.0, 559176.0, 178724.0, 40390.0, 12924.0, 4983.0, 2377.0, 1186.0, 709.0, 462.0, 283.0, 181.0, 143.0, 93.0, 66.0, 42.0, 38.0, 25.0, 13.0, 10.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.912109375, -2.81964111328125, -2.7271728515625, -2.63470458984375, -2.542236328125, -2.44976806640625, -2.3572998046875, -2.26483154296875, -2.17236328125, -2.07989501953125, -1.9874267578125, -1.89495849609375, -1.802490234375, -1.71002197265625, -1.6175537109375, -1.52508544921875, -1.4326171875, -1.34014892578125, -1.2476806640625, -1.15521240234375, -1.062744140625, -0.97027587890625, -0.8778076171875, -0.78533935546875, -0.69287109375, -0.60040283203125, -0.5079345703125, -0.41546630859375, -0.322998046875, -0.23052978515625, -0.1380615234375, -0.04559326171875, 0.046875, 0.13934326171875, 0.2318115234375, 0.32427978515625, 0.416748046875, 0.50921630859375, 0.6016845703125, 0.69415283203125, 0.78662109375, 0.87908935546875, 0.9715576171875, 1.06402587890625, 1.156494140625, 1.24896240234375, 1.3414306640625, 1.43389892578125, 1.5263671875, 1.61883544921875, 1.7113037109375, 1.80377197265625, 1.896240234375, 1.98870849609375, 2.0811767578125, 2.17364501953125, 2.26611328125, 2.35858154296875, 2.4510498046875, 2.54351806640625, 2.635986328125, 2.72845458984375, 2.8209228515625, 2.91339111328125, 3.005859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 6.0, 9.0, 14.0, 17.0, 14.0, 26.0, 25.0, 34.0, 34.0, 49.0, 65.0, 87.0, 74.0, 72.0, 74.0, 71.0, 66.0, 50.0, 48.0, 36.0, 21.0, 26.0, 9.0, 10.0, 9.0, 6.0, 7.0, 10.0, 6.0, 5.0, 4.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0003323554992675781, -0.0003235321491956711, -0.00031470879912376404, -0.000305885449051857, -0.00029706209897994995, -0.0002882387489080429, -0.00027941539883613586, -0.0002705920487642288, -0.0002617686986923218, -0.00025294534862041473, -0.0002441219985485077, -0.00023529864847660065, -0.0002264752984046936, -0.00021765194833278656, -0.00020882859826087952, -0.00020000524818897247, -0.00019118189811706543, -0.00018235854804515839, -0.00017353519797325134, -0.0001647118479013443, -0.00015588849782943726, -0.0001470651477575302, -0.00013824179768562317, -0.00012941844761371613, -0.00012059509754180908, -0.00011177174746990204, -0.000102948397397995, -9.412504732608795e-05, -8.530169725418091e-05, -7.647834718227386e-05, -6.765499711036682e-05, -5.883164703845978e-05, -5.0008296966552734e-05, -4.118494689464569e-05, -3.236159682273865e-05, -2.3538246750831604e-05, -1.471489667892456e-05, -5.891546607017517e-06, 2.9318034648895264e-06, 1.175515353679657e-05, 2.0578503608703613e-05, 2.9401853680610657e-05, 3.82252037525177e-05, 4.7048553824424744e-05, 5.587190389633179e-05, 6.469525396823883e-05, 7.351860404014587e-05, 8.234195411205292e-05, 9.116530418395996e-05, 9.9988654255867e-05, 0.00010881200432777405, 0.00011763535439968109, 0.00012645870447158813, 0.00013528205454349518, 0.00014410540461540222, 0.00015292875468730927, 0.0001617521047592163, 0.00017057545483112335, 0.0001793988049030304, 0.00018822215497493744, 0.00019704550504684448, 0.00020586885511875153, 0.00021469220519065857, 0.0002235155552625656, 0.00023233890533447266]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 7.0, 4.0, 3.0, 6.0, 12.0, 16.0, 30.0, 35.0, 48.0, 86.0, 112.0, 214.0, 338.0, 446.0, 728.0, 1120.0, 1852.0, 3200.0, 6076.0, 13608.0, 39459.0, 135158.0, 378952.0, 314440.0, 99691.0, 29801.0, 10818.0, 4993.0, 2766.0, 1622.0, 1036.0, 655.0, 427.0, 267.0, 169.0, 122.0, 81.0, 48.0, 34.0, 30.0, 15.0, 9.0, 13.0, 9.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.29296875, -4.1539306640625, -4.014892578125, -3.8758544921875, -3.73681640625, -3.5977783203125, -3.458740234375, -3.3197021484375, -3.1806640625, -3.0416259765625, -2.902587890625, -2.7635498046875, -2.62451171875, -2.4854736328125, -2.346435546875, -2.2073974609375, -2.068359375, -1.9293212890625, -1.790283203125, -1.6512451171875, -1.51220703125, -1.3731689453125, -1.234130859375, -1.0950927734375, -0.9560546875, -0.8170166015625, -0.677978515625, -0.5389404296875, -0.39990234375, -0.2608642578125, -0.121826171875, 0.0172119140625, 0.15625, 0.2952880859375, 0.434326171875, 0.5733642578125, 0.71240234375, 0.8514404296875, 0.990478515625, 1.1295166015625, 1.2685546875, 1.4075927734375, 1.546630859375, 1.6856689453125, 1.82470703125, 1.9637451171875, 2.102783203125, 2.2418212890625, 2.380859375, 2.5198974609375, 2.658935546875, 2.7979736328125, 2.93701171875, 3.0760498046875, 3.215087890625, 3.3541259765625, 3.4931640625, 3.6322021484375, 3.771240234375, 3.9102783203125, 4.04931640625, 4.1883544921875, 4.327392578125, 4.4664306640625, 4.60546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 3.0, 7.0, 12.0, 15.0, 18.0, 28.0, 34.0, 49.0, 75.0, 83.0, 87.0, 91.0, 86.0, 79.0, 75.0, 55.0, 59.0, 38.0, 29.0, 22.0, 10.0, 7.0, 8.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.169921875, -1.1318511962890625, -1.093780517578125, -1.0557098388671875, -1.01763916015625, -0.9795684814453125, -0.941497802734375, -0.9034271240234375, -0.8653564453125, -0.8272857666015625, -0.789215087890625, -0.7511444091796875, -0.71307373046875, -0.6750030517578125, -0.636932373046875, -0.5988616943359375, -0.560791015625, -0.5227203369140625, -0.484649658203125, -0.4465789794921875, -0.40850830078125, -0.3704376220703125, -0.332366943359375, -0.2942962646484375, -0.2562255859375, -0.2181549072265625, -0.180084228515625, -0.1420135498046875, -0.10394287109375, -0.0658721923828125, -0.027801513671875, 0.0102691650390625, 0.04833984375, 0.0864105224609375, 0.124481201171875, 0.1625518798828125, 0.20062255859375, 0.2386932373046875, 0.276763916015625, 0.3148345947265625, 0.3529052734375, 0.3909759521484375, 0.429046630859375, 0.4671173095703125, 0.50518798828125, 0.5432586669921875, 0.581329345703125, 0.6194000244140625, 0.657470703125, 0.6955413818359375, 0.733612060546875, 0.7716827392578125, 0.80975341796875, 0.8478240966796875, 0.885894775390625, 0.9239654541015625, 0.9620361328125, 1.0001068115234375, 1.038177490234375, 1.0762481689453125, 1.11431884765625, 1.1523895263671875, 1.190460205078125, 1.2285308837890625, 1.2666015625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 8.0, 2.0, 9.0, 10.0, 8.0, 6.0, 21.0, 24.0, 24.0, 27.0, 31.0, 32.0, 42.0, 41.0, 60.0, 52.0, 44.0, 42.0, 45.0, 51.0, 41.0, 47.0, 48.0, 39.0, 34.0, 25.0, 35.0, 27.0, 24.0, 21.0, 9.0, 14.0, 11.0, 13.0, 9.0, 6.0, 9.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.889636039733887, -10.494866371154785, -10.10009765625, -9.705327987670898, -9.310558319091797, -8.915788650512695, -8.521018981933594, -8.126250267028809, -7.731480598449707, -7.3367109298706055, -6.941941738128662, -6.547172546386719, -6.152402877807617, -5.757633209228516, -5.362864017486572, -4.968094825744629, -4.573325157165527, -4.178555488586426, -3.7837862968444824, -3.38901686668396, -2.9942474365234375, -2.599478006362915, -2.2047085762023926, -1.8099391460418701, -1.4151697158813477, -1.0204002857208252, -0.6256308555603027, -0.23086142539978027, 0.1639080047607422, 0.5586774349212646, 0.9534468650817871, 1.3482162952423096, 1.742985725402832, 2.1377551555633545, 2.532524585723877, 2.9272940158843994, 3.322063446044922, 3.7168328762054443, 4.111602306365967, 4.50637149810791, 4.901141166687012, 5.295910835266113, 5.690680027008057, 6.08544921875, 6.480218887329102, 6.874988555908203, 7.2697577476501465, 7.66452693939209, 8.059296607971191, 8.454066276550293, 8.848834991455078, 9.24360466003418, 9.638374328613281, 10.033143997192383, 10.427913665771484, 10.82268238067627, 11.217452049255371, 11.612221717834473, 12.006990432739258, 12.40176010131836, 12.796529769897461, 13.191299438476562, 13.586069107055664, 13.98083782196045, 14.37560749053955]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 5.0, 7.0, 11.0, 9.0, 9.0, 18.0, 18.0, 21.0, 22.0, 30.0, 17.0, 32.0, 26.0, 28.0, 33.0, 50.0, 38.0, 33.0, 32.0, 44.0, 39.0, 46.0, 47.0, 44.0, 36.0, 33.0, 31.0, 36.0, 27.0, 30.0, 19.0, 16.0, 18.0, 17.0, 14.0, 9.0, 14.0, 10.0, 7.0, 5.0, 4.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.343374252319336, -11.988327026367188, -11.633280754089355, -11.278233528137207, -10.923187255859375, -10.568140029907227, -10.213092803955078, -9.85804557800293, -9.502999305725098, -9.14795207977295, -8.792905807495117, -8.437858581542969, -8.08281135559082, -7.727765083312988, -7.37271785736084, -7.01767110824585, -6.662624359130859, -6.307577610015869, -5.952530860900879, -5.5974836349487305, -5.24243688583374, -4.88739013671875, -4.532342910766602, -4.177296161651611, -3.822249412536621, -3.467202663421631, -3.1121556758880615, -2.757108688354492, -2.402061939239502, -2.0470151901245117, -1.6919682025909424, -1.336921215057373, -0.9818744659423828, -0.626827597618103, -0.27178072929382324, 0.08326613903045654, 0.43831300735473633, 0.7933598756790161, 1.148406744003296, 1.5034537315368652, 1.8585004806518555, 2.2135472297668457, 2.568594217300415, 2.9236412048339844, 3.2786879539489746, 3.633734703063965, 3.988781690597534, 4.3438286781311035, 4.698875427246094, 5.053922176361084, 5.408968925476074, 5.764016151428223, 6.119062900543213, 6.474109649658203, 6.829156875610352, 7.184203624725342, 7.539250373840332, 7.894297122955322, 8.249343872070312, 8.604391098022461, 8.95943832397461, 9.314484596252441, 9.66953182220459, 10.024578094482422, 10.37962532043457]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 16.0, 27.0, 49.0, 56.0, 85.0, 160.0, 255.0, 417.0, 618.0, 1025.0, 1655.0, 2357.0, 3586.0, 5660.0, 8262.0, 12233.0, 17581.0, 24830.0, 33247.0, 43717.0, 56159.0, 68185.0, 79825.0, 87926.0, 92490.0, 90889.0, 86058.0, 75990.0, 63867.0, 51877.0, 40038.0, 30171.0, 21958.0, 15518.0, 10634.0, 7334.0, 4880.0, 3242.0, 2038.0, 1376.0, 808.0, 523.0, 351.0, 216.0, 149.0, 87.0, 47.0, 36.0, 20.0, 9.0, 8.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.59375, -8.32373046875, -8.0537109375, -7.78369140625, -7.513671875, -7.24365234375, -6.9736328125, -6.70361328125, -6.43359375, -6.16357421875, -5.8935546875, -5.62353515625, -5.353515625, -5.08349609375, -4.8134765625, -4.54345703125, -4.2734375, -4.00341796875, -3.7333984375, -3.46337890625, -3.193359375, -2.92333984375, -2.6533203125, -2.38330078125, -2.11328125, -1.84326171875, -1.5732421875, -1.30322265625, -1.033203125, -0.76318359375, -0.4931640625, -0.22314453125, 0.046875, 0.31689453125, 0.5869140625, 0.85693359375, 1.126953125, 1.39697265625, 1.6669921875, 1.93701171875, 2.20703125, 2.47705078125, 2.7470703125, 3.01708984375, 3.287109375, 3.55712890625, 3.8271484375, 4.09716796875, 4.3671875, 4.63720703125, 4.9072265625, 5.17724609375, 5.447265625, 5.71728515625, 5.9873046875, 6.25732421875, 6.52734375, 6.79736328125, 7.0673828125, 7.33740234375, 7.607421875, 7.87744140625, 8.1474609375, 8.41748046875, 8.6875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 8.0, 7.0, 13.0, 5.0, 13.0, 15.0, 20.0, 22.0, 24.0, 26.0, 22.0, 30.0, 28.0, 25.0, 39.0, 45.0, 41.0, 32.0, 34.0, 49.0, 34.0, 43.0, 46.0, 47.0, 34.0, 35.0, 30.0, 33.0, 26.0, 29.0, 19.0, 16.0, 19.0, 17.0, 13.0, 7.0, 16.0, 9.0, 11.0, 0.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.8203125, -11.4791259765625, -11.137939453125, -10.7967529296875, -10.45556640625, -10.1143798828125, -9.773193359375, -9.4320068359375, -9.0908203125, -8.7496337890625, -8.408447265625, -8.0672607421875, -7.72607421875, -7.3848876953125, -7.043701171875, -6.7025146484375, -6.361328125, -6.0201416015625, -5.678955078125, -5.3377685546875, -4.99658203125, -4.6553955078125, -4.314208984375, -3.9730224609375, -3.6318359375, -3.2906494140625, -2.949462890625, -2.6082763671875, -2.26708984375, -1.9259033203125, -1.584716796875, -1.2435302734375, -0.90234375, -0.5611572265625, -0.219970703125, 0.1212158203125, 0.46240234375, 0.8035888671875, 1.144775390625, 1.4859619140625, 1.8271484375, 2.1683349609375, 2.509521484375, 2.8507080078125, 3.19189453125, 3.5330810546875, 3.874267578125, 4.2154541015625, 4.556640625, 4.8978271484375, 5.239013671875, 5.5802001953125, 5.92138671875, 6.2625732421875, 6.603759765625, 6.9449462890625, 7.2861328125, 7.6273193359375, 7.968505859375, 8.3096923828125, 8.65087890625, 8.9920654296875, 9.333251953125, 9.6744384765625, 10.015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 7.0, 12.0, 20.0, 33.0, 45.0, 92.0, 118.0, 172.0, 311.0, 431.0, 732.0, 1184.0, 1857.0, 2950.0, 4570.0, 7258.0, 11258.0, 16628.0, 24728.0, 34658.0, 47970.0, 62463.0, 78716.0, 92359.0, 102262.0, 104211.0, 99125.0, 88046.0, 72977.0, 57240.0, 42779.0, 30514.0, 21556.0, 14642.0, 9527.0, 6307.0, 3908.0, 2562.0, 1686.0, 1003.0, 606.0, 375.0, 228.0, 149.0, 88.0, 70.0, 48.0, 27.0, 13.0, 13.0, 10.0, 3.0, 7.0, 3.0, 1.0, 0.0, 3.0], "bins": [-10.2265625, -9.91015625, -9.59375, -9.27734375, -8.9609375, -8.64453125, -8.328125, -8.01171875, -7.6953125, -7.37890625, -7.0625, -6.74609375, -6.4296875, -6.11328125, -5.796875, -5.48046875, -5.1640625, -4.84765625, -4.53125, -4.21484375, -3.8984375, -3.58203125, -3.265625, -2.94921875, -2.6328125, -2.31640625, -2.0, -1.68359375, -1.3671875, -1.05078125, -0.734375, -0.41796875, -0.1015625, 0.21484375, 0.53125, 0.84765625, 1.1640625, 1.48046875, 1.796875, 2.11328125, 2.4296875, 2.74609375, 3.0625, 3.37890625, 3.6953125, 4.01171875, 4.328125, 4.64453125, 4.9609375, 5.27734375, 5.59375, 5.91015625, 6.2265625, 6.54296875, 6.859375, 7.17578125, 7.4921875, 7.80859375, 8.125, 8.44140625, 8.7578125, 9.07421875, 9.390625, 9.70703125, 10.0234375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 6.0, 2.0, 4.0, 2.0, 1.0, 3.0, 7.0, 9.0, 4.0, 6.0, 10.0, 16.0, 11.0, 15.0, 17.0, 27.0, 20.0, 26.0, 31.0, 21.0, 25.0, 39.0, 31.0, 34.0, 42.0, 39.0, 46.0, 48.0, 39.0, 42.0, 35.0, 34.0, 34.0, 38.0, 31.0, 29.0, 31.0, 18.0, 19.0, 24.0, 19.0, 18.0, 7.0, 10.0, 10.0, 8.0, 10.0, 4.0, 1.0, 3.0, 6.0, 3.0, 0.0, 0.0, 1.0, 4.0], "bins": [-7.57421875, -7.3570556640625, -7.139892578125, -6.9227294921875, -6.70556640625, -6.4884033203125, -6.271240234375, -6.0540771484375, -5.8369140625, -5.6197509765625, -5.402587890625, -5.1854248046875, -4.96826171875, -4.7510986328125, -4.533935546875, -4.3167724609375, -4.099609375, -3.8824462890625, -3.665283203125, -3.4481201171875, -3.23095703125, -3.0137939453125, -2.796630859375, -2.5794677734375, -2.3623046875, -2.1451416015625, -1.927978515625, -1.7108154296875, -1.49365234375, -1.2764892578125, -1.059326171875, -0.8421630859375, -0.625, -0.4078369140625, -0.190673828125, 0.0264892578125, 0.24365234375, 0.4608154296875, 0.677978515625, 0.8951416015625, 1.1123046875, 1.3294677734375, 1.546630859375, 1.7637939453125, 1.98095703125, 2.1981201171875, 2.415283203125, 2.6324462890625, 2.849609375, 3.0667724609375, 3.283935546875, 3.5010986328125, 3.71826171875, 3.9354248046875, 4.152587890625, 4.3697509765625, 4.5869140625, 4.8040771484375, 5.021240234375, 5.2384033203125, 5.45556640625, 5.6727294921875, 5.889892578125, 6.1070556640625, 6.32421875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 7.0, 8.0, 22.0, 10.0, 25.0, 53.0, 82.0, 132.0, 196.0, 296.0, 538.0, 848.0, 1445.0, 2445.0, 4290.0, 7173.0, 12460.0, 21749.0, 37846.0, 63504.0, 99514.0, 139234.0, 164451.0, 157228.0, 124570.0, 85212.0, 52534.0, 30599.0, 17775.0, 10161.0, 5804.0, 3292.0, 1995.0, 1144.0, 768.0, 418.0, 280.0, 149.0, 113.0, 62.0, 45.0, 26.0, 20.0, 11.0, 11.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.56640625, -6.36627197265625, -6.1661376953125, -5.96600341796875, -5.765869140625, -5.56573486328125, -5.3656005859375, -5.16546630859375, -4.96533203125, -4.76519775390625, -4.5650634765625, -4.36492919921875, -4.164794921875, -3.96466064453125, -3.7645263671875, -3.56439208984375, -3.3642578125, -3.16412353515625, -2.9639892578125, -2.76385498046875, -2.563720703125, -2.36358642578125, -2.1634521484375, -1.96331787109375, -1.76318359375, -1.56304931640625, -1.3629150390625, -1.16278076171875, -0.962646484375, -0.76251220703125, -0.5623779296875, -0.36224365234375, -0.162109375, 0.03802490234375, 0.2381591796875, 0.43829345703125, 0.638427734375, 0.83856201171875, 1.0386962890625, 1.23883056640625, 1.43896484375, 1.63909912109375, 1.8392333984375, 2.03936767578125, 2.239501953125, 2.43963623046875, 2.6397705078125, 2.83990478515625, 3.0400390625, 3.24017333984375, 3.4403076171875, 3.64044189453125, 3.840576171875, 4.04071044921875, 4.2408447265625, 4.44097900390625, 4.64111328125, 4.84124755859375, 5.0413818359375, 5.24151611328125, 5.441650390625, 5.64178466796875, 5.8419189453125, 6.04205322265625, 6.2421875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 12.0, 4.0, 14.0, 10.0, 18.0, 14.0, 17.0, 25.0, 36.0, 40.0, 45.0, 62.0, 53.0, 59.0, 54.0, 54.0, 72.0, 49.0, 52.0, 60.0, 46.0, 35.0, 37.0, 33.0, 24.0, 18.0, 12.0, 8.0, 12.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006799697875976562, -0.000657007098197937, -0.0006340444087982178, -0.0006110817193984985, -0.0005881190299987793, -0.0005651563405990601, -0.0005421936511993408, -0.0005192309617996216, -0.0004962682723999023, -0.0004733055830001831, -0.00045034289360046387, -0.00042738020420074463, -0.0004044175148010254, -0.00038145482540130615, -0.0003584921360015869, -0.0003355294466018677, -0.00031256675720214844, -0.0002896040678024292, -0.00026664137840270996, -0.00024367868900299072, -0.00022071599960327148, -0.00019775331020355225, -0.000174790620803833, -0.00015182793140411377, -0.00012886524200439453, -0.00010590255260467529, -8.293986320495605e-05, -5.9977173805236816e-05, -3.701448440551758e-05, -1.405179500579834e-05, 8.910894393920898e-06, 3.187358379364014e-05, 5.4836273193359375e-05, 7.779896259307861e-05, 0.00010076165199279785, 0.0001237243413925171, 0.00014668703079223633, 0.00016964972019195557, 0.0001926124095916748, 0.00021557509899139404, 0.00023853778839111328, 0.0002615004777908325, 0.00028446316719055176, 0.000307425856590271, 0.00033038854598999023, 0.00035335123538970947, 0.0003763139247894287, 0.00039927661418914795, 0.0004222393035888672, 0.0004452019929885864, 0.00046816468238830566, 0.0004911273717880249, 0.0005140900611877441, 0.0005370527505874634, 0.0005600154399871826, 0.0005829781293869019, 0.0006059408187866211, 0.0006289035081863403, 0.0006518661975860596, 0.0006748288869857788, 0.000697791576385498, 0.0007207542657852173, 0.0007437169551849365, 0.0007666796445846558, 0.000789642333984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 6.0, 6.0, 9.0, 14.0, 12.0, 19.0, 26.0, 44.0, 80.0, 102.0, 156.0, 224.0, 353.0, 527.0, 773.0, 1101.0, 1704.0, 2712.0, 3864.0, 5752.0, 9017.0, 13286.0, 20235.0, 29314.0, 42088.0, 58878.0, 77802.0, 96614.0, 111110.0, 115647.0, 109753.0, 93687.0, 74805.0, 55949.0, 39776.0, 27371.0, 18900.0, 12435.0, 8169.0, 5330.0, 3615.0, 2423.0, 1527.0, 1107.0, 758.0, 500.0, 309.0, 239.0, 147.0, 100.0, 76.0, 36.0, 28.0, 15.0, 15.0, 10.0, 7.0, 3.0, 1.0, 4.0], "bins": [-5.16796875, -5.0133056640625, -4.858642578125, -4.7039794921875, -4.54931640625, -4.3946533203125, -4.239990234375, -4.0853271484375, -3.9306640625, -3.7760009765625, -3.621337890625, -3.4666748046875, -3.31201171875, -3.1573486328125, -3.002685546875, -2.8480224609375, -2.693359375, -2.5386962890625, -2.384033203125, -2.2293701171875, -2.07470703125, -1.9200439453125, -1.765380859375, -1.6107177734375, -1.4560546875, -1.3013916015625, -1.146728515625, -0.9920654296875, -0.83740234375, -0.6827392578125, -0.528076171875, -0.3734130859375, -0.21875, -0.0640869140625, 0.090576171875, 0.2452392578125, 0.39990234375, 0.5545654296875, 0.709228515625, 0.8638916015625, 1.0185546875, 1.1732177734375, 1.327880859375, 1.4825439453125, 1.63720703125, 1.7918701171875, 1.946533203125, 2.1011962890625, 2.255859375, 2.4105224609375, 2.565185546875, 2.7198486328125, 2.87451171875, 3.0291748046875, 3.183837890625, 3.3385009765625, 3.4931640625, 3.6478271484375, 3.802490234375, 3.9571533203125, 4.11181640625, 4.2664794921875, 4.421142578125, 4.5758056640625, 4.73046875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 8.0, 3.0, 5.0, 9.0, 7.0, 15.0, 15.0, 20.0, 28.0, 25.0, 25.0, 47.0, 67.0, 52.0, 62.0, 58.0, 47.0, 57.0, 62.0, 52.0, 50.0, 59.0, 42.0, 27.0, 35.0, 30.0, 27.0, 11.0, 12.0, 3.0, 11.0, 6.0, 7.0, 3.0, 3.0, 3.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5625, -2.479766845703125, -2.39703369140625, -2.314300537109375, -2.2315673828125, -2.148834228515625, -2.06610107421875, -1.983367919921875, -1.900634765625, -1.817901611328125, -1.73516845703125, -1.652435302734375, -1.5697021484375, -1.486968994140625, -1.40423583984375, -1.321502685546875, -1.23876953125, -1.156036376953125, -1.07330322265625, -0.990570068359375, -0.9078369140625, -0.825103759765625, -0.74237060546875, -0.659637451171875, -0.576904296875, -0.494171142578125, -0.41143798828125, -0.328704833984375, -0.2459716796875, -0.163238525390625, -0.08050537109375, 0.002227783203125, 0.0849609375, 0.167694091796875, 0.25042724609375, 0.333160400390625, 0.4158935546875, 0.498626708984375, 0.58135986328125, 0.664093017578125, 0.746826171875, 0.829559326171875, 0.91229248046875, 0.995025634765625, 1.0777587890625, 1.160491943359375, 1.24322509765625, 1.325958251953125, 1.40869140625, 1.491424560546875, 1.57415771484375, 1.656890869140625, 1.7396240234375, 1.822357177734375, 1.90509033203125, 1.987823486328125, 2.070556640625, 2.153289794921875, 2.23602294921875, 2.318756103515625, 2.4014892578125, 2.484222412109375, 2.56695556640625, 2.649688720703125, 2.732421875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 7.0, 8.0, 8.0, 14.0, 16.0, 19.0, 16.0, 25.0, 30.0, 35.0, 47.0, 44.0, 47.0, 43.0, 46.0, 55.0, 47.0, 42.0, 48.0, 41.0, 44.0, 31.0, 40.0, 40.0, 34.0, 35.0, 24.0, 19.0, 19.0, 14.0, 10.0, 10.0, 8.0, 9.0, 9.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.368993759155273, -11.959609985351562, -11.550226211547852, -11.14084243774414, -10.731457710266113, -10.322073936462402, -9.912690162658691, -9.50330638885498, -9.093921661376953, -8.684537887573242, -8.275154113769531, -7.865769863128662, -7.456385612487793, -7.047001838684082, -6.637618064880371, -6.22823429107666, -5.818850517272949, -5.409466743469238, -5.000082492828369, -4.590698719024658, -4.181314468383789, -3.771930694580078, -3.362546920776367, -2.953162908554077, -2.543778896331787, -2.134394884109497, -1.7250109910964966, -1.315627098083496, -0.906243085861206, -0.496859073638916, -0.08747529983520508, 0.32190871238708496, 0.731292724609375, 1.140676736831665, 1.5500606298446655, 1.959444522857666, 2.368828535079956, 2.778212547302246, 3.187596321105957, 3.596980333328247, 4.006364345550537, 4.415748119354248, 4.825132369995117, 5.234516143798828, 5.643899917602539, 6.053284168243408, 6.462667942047119, 6.872052192687988, 7.281435966491699, 7.69081974029541, 8.100203514099121, 8.509588241577148, 8.91897201538086, 9.32835578918457, 9.737739562988281, 10.147123336791992, 10.556507110595703, 10.965890884399414, 11.375274658203125, 11.784658432006836, 12.194043159484863, 12.603426933288574, 13.012810707092285, 13.422194480895996, 13.831579208374023]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 3.0, 11.0, 8.0, 5.0, 14.0, 18.0, 20.0, 23.0, 24.0, 36.0, 35.0, 35.0, 37.0, 42.0, 42.0, 48.0, 44.0, 57.0, 53.0, 56.0, 48.0, 38.0, 35.0, 39.0, 38.0, 22.0, 28.0, 35.0, 23.0, 14.0, 24.0, 13.0, 6.0, 5.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.965024948120117, -13.537736892700195, -13.110448837280273, -12.683160781860352, -12.25587272644043, -11.828584671020508, -11.401296615600586, -10.974007606506348, -10.546719551086426, -10.119431495666504, -9.692143440246582, -9.26485538482666, -8.837567329406738, -8.4102783203125, -7.982990741729736, -7.555702209472656, -7.128414630889893, -6.701126575469971, -6.273838520050049, -5.846549987792969, -5.419261932373047, -4.991973876953125, -4.564685821533203, -4.137397766113281, -3.7101094722747803, -3.2828214168548584, -2.8555331230163574, -2.4282450675964355, -2.0009570121765137, -1.5736687183380127, -1.1463806629180908, -0.7190923690795898, -0.29180431365966797, 0.13548383116722107, 0.5627719759941101, 0.9900600910186768, 1.4173482656478882, 1.8446364402770996, 2.2719244956970215, 2.6992127895355225, 3.1265008449554443, 3.553788900375366, 3.981077194213867, 4.408365249633789, 4.835653305053711, 5.262941360473633, 5.690229415893555, 6.117517948150635, 6.544806003570557, 6.9720940589904785, 7.3993821144104, 7.8266706466674805, 8.253958702087402, 8.681246757507324, 9.108534812927246, 9.535822868347168, 9.96311092376709, 10.390398979187012, 10.817687034606934, 11.244975090026855, 11.672263145446777, 12.099552154541016, 12.526840209960938, 12.95412826538086, 13.381416320800781]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 14.0, 17.0, 22.0, 52.0, 63.0, 105.0, 184.0, 337.0, 575.0, 958.0, 1596.0, 2704.0, 4492.0, 7342.0, 12132.0, 19630.0, 31213.0, 49315.0, 76229.0, 114950.0, 168497.0, 237115.0, 315857.0, 394843.0, 453211.0, 473471.0, 448485.0, 384095.0, 304956.0, 225718.0, 160778.0, 109162.0, 72660.0, 46438.0, 29431.0, 18422.0, 11475.0, 7060.0, 4316.0, 2550.0, 1620.0, 889.0, 514.0, 333.0, 193.0, 115.0, 76.0, 41.0, 15.0, 9.0, 12.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.6875, -8.4111328125, -8.134765625, -7.8583984375, -7.58203125, -7.3056640625, -7.029296875, -6.7529296875, -6.4765625, -6.2001953125, -5.923828125, -5.6474609375, -5.37109375, -5.0947265625, -4.818359375, -4.5419921875, -4.265625, -3.9892578125, -3.712890625, -3.4365234375, -3.16015625, -2.8837890625, -2.607421875, -2.3310546875, -2.0546875, -1.7783203125, -1.501953125, -1.2255859375, -0.94921875, -0.6728515625, -0.396484375, -0.1201171875, 0.15625, 0.4326171875, 0.708984375, 0.9853515625, 1.26171875, 1.5380859375, 1.814453125, 2.0908203125, 2.3671875, 2.6435546875, 2.919921875, 3.1962890625, 3.47265625, 3.7490234375, 4.025390625, 4.3017578125, 4.578125, 4.8544921875, 5.130859375, 5.4072265625, 5.68359375, 5.9599609375, 6.236328125, 6.5126953125, 6.7890625, 7.0654296875, 7.341796875, 7.6181640625, 7.89453125, 8.1708984375, 8.447265625, 8.7236328125, 9.0]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 2.0, 4.0, 8.0, 8.0, 12.0, 14.0, 18.0, 23.0, 20.0, 24.0, 32.0, 35.0, 41.0, 34.0, 44.0, 36.0, 46.0, 48.0, 51.0, 63.0, 49.0, 39.0, 46.0, 40.0, 35.0, 34.0, 30.0, 31.0, 25.0, 21.0, 20.0, 19.0, 13.0, 6.0, 9.0, 6.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.90625, -11.5421142578125, -11.177978515625, -10.8138427734375, -10.44970703125, -10.0855712890625, -9.721435546875, -9.3572998046875, -8.9931640625, -8.6290283203125, -8.264892578125, -7.9007568359375, -7.53662109375, -7.1724853515625, -6.808349609375, -6.4442138671875, -6.080078125, -5.7159423828125, -5.351806640625, -4.9876708984375, -4.62353515625, -4.2593994140625, -3.895263671875, -3.5311279296875, -3.1669921875, -2.8028564453125, -2.438720703125, -2.0745849609375, -1.71044921875, -1.3463134765625, -0.982177734375, -0.6180419921875, -0.25390625, 0.1102294921875, 0.474365234375, 0.8385009765625, 1.20263671875, 1.5667724609375, 1.930908203125, 2.2950439453125, 2.6591796875, 3.0233154296875, 3.387451171875, 3.7515869140625, 4.11572265625, 4.4798583984375, 4.843994140625, 5.2081298828125, 5.572265625, 5.9364013671875, 6.300537109375, 6.6646728515625, 7.02880859375, 7.3929443359375, 7.757080078125, 8.1212158203125, 8.4853515625, 8.8494873046875, 9.213623046875, 9.5777587890625, 9.94189453125, 10.3060302734375, 10.670166015625, 11.0343017578125, 11.3984375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 11.0, 18.0, 33.0, 58.0, 102.0, 175.0, 295.0, 540.0, 952.0, 1692.0, 2819.0, 4957.0, 8156.0, 14014.0, 22604.0, 36342.0, 56284.0, 86574.0, 128548.0, 181626.0, 246114.0, 315442.0, 380038.0, 424431.0, 438355.0, 419185.0, 370619.0, 304805.0, 236253.0, 172269.0, 121053.0, 81694.0, 52205.0, 33859.0, 21337.0, 12623.0, 7586.0, 4514.0, 2542.0, 1570.0, 845.0, 512.0, 270.0, 148.0, 98.0, 60.0, 24.0, 21.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0], "bins": [-9.9375, -9.6488037109375, -9.360107421875, -9.0714111328125, -8.78271484375, -8.4940185546875, -8.205322265625, -7.9166259765625, -7.6279296875, -7.3392333984375, -7.050537109375, -6.7618408203125, -6.47314453125, -6.1844482421875, -5.895751953125, -5.6070556640625, -5.318359375, -5.0296630859375, -4.740966796875, -4.4522705078125, -4.16357421875, -3.8748779296875, -3.586181640625, -3.2974853515625, -3.0087890625, -2.7200927734375, -2.431396484375, -2.1427001953125, -1.85400390625, -1.5653076171875, -1.276611328125, -0.9879150390625, -0.69921875, -0.4105224609375, -0.121826171875, 0.1668701171875, 0.45556640625, 0.7442626953125, 1.032958984375, 1.3216552734375, 1.6103515625, 1.8990478515625, 2.187744140625, 2.4764404296875, 2.76513671875, 3.0538330078125, 3.342529296875, 3.6312255859375, 3.919921875, 4.2086181640625, 4.497314453125, 4.7860107421875, 5.07470703125, 5.3634033203125, 5.652099609375, 5.9407958984375, 6.2294921875, 6.5181884765625, 6.806884765625, 7.0955810546875, 7.38427734375, 7.6729736328125, 7.961669921875, 8.2503662109375, 8.5390625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 3.0, 6.0, 4.0, 7.0, 4.0, 15.0, 17.0, 26.0, 32.0, 35.0, 51.0, 45.0, 58.0, 56.0, 103.0, 101.0, 117.0, 156.0, 154.0, 158.0, 161.0, 175.0, 178.0, 189.0, 203.0, 209.0, 196.0, 217.0, 155.0, 196.0, 141.0, 154.0, 104.0, 114.0, 103.0, 78.0, 61.0, 57.0, 43.0, 40.0, 37.0, 27.0, 22.0, 19.0, 15.0, 11.0, 4.0, 8.0, 4.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.29296875, -4.153564453125, -4.01416015625, -3.874755859375, -3.7353515625, -3.595947265625, -3.45654296875, -3.317138671875, -3.177734375, -3.038330078125, -2.89892578125, -2.759521484375, -2.6201171875, -2.480712890625, -2.34130859375, -2.201904296875, -2.0625, -1.923095703125, -1.78369140625, -1.644287109375, -1.5048828125, -1.365478515625, -1.22607421875, -1.086669921875, -0.947265625, -0.807861328125, -0.66845703125, -0.529052734375, -0.3896484375, -0.250244140625, -0.11083984375, 0.028564453125, 0.16796875, 0.307373046875, 0.44677734375, 0.586181640625, 0.7255859375, 0.864990234375, 1.00439453125, 1.143798828125, 1.283203125, 1.422607421875, 1.56201171875, 1.701416015625, 1.8408203125, 1.980224609375, 2.11962890625, 2.259033203125, 2.3984375, 2.537841796875, 2.67724609375, 2.816650390625, 2.9560546875, 3.095458984375, 3.23486328125, 3.374267578125, 3.513671875, 3.653076171875, 3.79248046875, 3.931884765625, 4.0712890625, 4.210693359375, 4.35009765625, 4.489501953125, 4.62890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 3.0, 4.0, 4.0, 7.0, 9.0, 4.0, 14.0, 22.0, 20.0, 14.0, 20.0, 28.0, 32.0, 32.0, 39.0, 43.0, 46.0, 34.0, 36.0, 44.0, 40.0, 38.0, 48.0, 36.0, 40.0, 45.0, 35.0, 34.0, 30.0, 34.0, 21.0, 20.0, 14.0, 13.0, 22.0, 10.0, 10.0, 12.0, 10.0, 7.0, 4.0, 5.0, 1.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-11.752127647399902, -11.386536598205566, -11.02094554901123, -10.655354499816895, -10.289764404296875, -9.924173355102539, -9.558582305908203, -9.192991256713867, -8.827400207519531, -8.461809158325195, -8.09621810913086, -7.730627536773682, -7.365036487579346, -6.99944543838501, -6.633854866027832, -6.268263816833496, -5.90267276763916, -5.537081718444824, -5.171490669250488, -4.8059000968933105, -4.440309047698975, -4.074717998504639, -3.709127187728882, -3.343536376953125, -2.977945327758789, -2.612354278564453, -2.2467634677886963, -1.88117253780365, -1.5155816078186035, -1.1499906778335571, -0.7843997478485107, -0.4188089370727539, -0.05321693420410156, 0.3123739957809448, 0.6779649257659912, 1.0435558557510376, 1.409146785736084, 1.7747377157211304, 2.1403286457061768, 2.5059194564819336, 2.8715105056762695, 3.2371015548706055, 3.6026923656463623, 3.968283176422119, 4.333874225616455, 4.699465274810791, 5.065055847167969, 5.430646896362305, 5.796237945556641, 6.161828994750977, 6.5274200439453125, 6.89301061630249, 7.258601665496826, 7.624192714691162, 7.98978328704834, 8.355374336242676, 8.720965385437012, 9.086556434631348, 9.452147483825684, 9.81773853302002, 10.183328628540039, 10.548919677734375, 10.914510726928711, 11.280101776123047, 11.645692825317383]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 11.0, 8.0, 9.0, 7.0, 16.0, 22.0, 19.0, 25.0, 19.0, 26.0, 29.0, 29.0, 30.0, 36.0, 59.0, 33.0, 47.0, 38.0, 45.0, 40.0, 38.0, 42.0, 46.0, 40.0, 35.0, 39.0, 19.0, 32.0, 28.0, 19.0, 21.0, 12.0, 19.0, 12.0, 18.0, 9.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.673048973083496, -10.298126220703125, -9.923202514648438, -9.548279762268066, -9.173356056213379, -8.798433303833008, -8.42350959777832, -8.04858684539795, -7.67366361618042, -7.298740386962891, -6.923817157745361, -6.548893928527832, -6.173971176147461, -5.799047470092773, -5.424124717712402, -5.049201488494873, -4.674278259277344, -4.2993550300598145, -3.924431800842285, -3.549508810043335, -3.1745855808258057, -2.7996623516082764, -2.424739360809326, -2.049816131591797, -1.6748929023742676, -1.2999696731567383, -0.9250465631484985, -0.5501234531402588, -0.1752002239227295, 0.1997230052947998, 0.57464599609375, 0.9495692253112793, 1.324493408203125, 1.6994166374206543, 2.0743398666381836, 2.449262857437134, 2.824186086654663, 3.1991093158721924, 3.5740323066711426, 3.948955535888672, 4.323878765106201, 4.6988019943237305, 5.07372522354126, 5.448648452758789, 5.82357120513916, 6.198494911193848, 6.573417663574219, 6.948340892791748, 7.323264122009277, 7.698187351226807, 8.073110580444336, 8.448033332824707, 8.822957038879395, 9.197879791259766, 9.572803497314453, 9.947726249694824, 10.322649002075195, 10.697571754455566, 11.072495460510254, 11.447418212890625, 11.822341918945312, 12.197264671325684, 12.572187423706055, 12.947111129760742, 13.32203483581543]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 7.0, 1.0, 5.0, 4.0, 12.0, 11.0, 22.0, 20.0, 32.0, 54.0, 65.0, 112.0, 155.0, 208.0, 310.0, 450.0, 636.0, 945.0, 1510.0, 2305.0, 3648.0, 5515.0, 8432.0, 13644.0, 21602.0, 34547.0, 55758.0, 89922.0, 140696.0, 185234.0, 170190.0, 117499.0, 72995.0, 45247.0, 27758.0, 17429.0, 11145.0, 7075.0, 4585.0, 2941.0, 1963.0, 1299.0, 804.0, 545.0, 380.0, 248.0, 173.0, 122.0, 92.0, 62.0, 65.0, 25.0, 21.0, 15.0, 11.0, 9.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.923828125, -3.796356201171875, -3.66888427734375, -3.541412353515625, -3.4139404296875, -3.286468505859375, -3.15899658203125, -3.031524658203125, -2.904052734375, -2.776580810546875, -2.64910888671875, -2.521636962890625, -2.3941650390625, -2.266693115234375, -2.13922119140625, -2.011749267578125, -1.88427734375, -1.756805419921875, -1.62933349609375, -1.501861572265625, -1.3743896484375, -1.246917724609375, -1.11944580078125, -0.991973876953125, -0.864501953125, -0.737030029296875, -0.60955810546875, -0.482086181640625, -0.3546142578125, -0.227142333984375, -0.09967041015625, 0.027801513671875, 0.1552734375, 0.282745361328125, 0.41021728515625, 0.537689208984375, 0.6651611328125, 0.792633056640625, 0.92010498046875, 1.047576904296875, 1.175048828125, 1.302520751953125, 1.42999267578125, 1.557464599609375, 1.6849365234375, 1.812408447265625, 1.93988037109375, 2.067352294921875, 2.19482421875, 2.322296142578125, 2.44976806640625, 2.577239990234375, 2.7047119140625, 2.832183837890625, 2.95965576171875, 3.087127685546875, 3.214599609375, 3.342071533203125, 3.46954345703125, 3.597015380859375, 3.7244873046875, 3.851959228515625, 3.97943115234375, 4.106903076171875, 4.234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 4.0, 11.0, 8.0, 10.0, 4.0, 19.0, 24.0, 17.0, 25.0, 18.0, 26.0, 28.0, 30.0, 31.0, 40.0, 53.0, 37.0, 44.0, 38.0, 46.0, 42.0, 36.0, 42.0, 47.0, 37.0, 36.0, 43.0, 17.0, 31.0, 30.0, 16.0, 20.0, 13.0, 20.0, 13.0, 17.0, 9.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.609375, -10.2357177734375, -9.862060546875, -9.4884033203125, -9.11474609375, -8.7410888671875, -8.367431640625, -7.9937744140625, -7.6201171875, -7.2464599609375, -6.872802734375, -6.4991455078125, -6.12548828125, -5.7518310546875, -5.378173828125, -5.0045166015625, -4.630859375, -4.2572021484375, -3.883544921875, -3.5098876953125, -3.13623046875, -2.7625732421875, -2.388916015625, -2.0152587890625, -1.6416015625, -1.2679443359375, -0.894287109375, -0.5206298828125, -0.14697265625, 0.2266845703125, 0.600341796875, 0.9739990234375, 1.34765625, 1.7213134765625, 2.094970703125, 2.4686279296875, 2.84228515625, 3.2159423828125, 3.589599609375, 3.9632568359375, 4.3369140625, 4.7105712890625, 5.084228515625, 5.4578857421875, 5.83154296875, 6.2052001953125, 6.578857421875, 6.9525146484375, 7.326171875, 7.6998291015625, 8.073486328125, 8.4471435546875, 8.82080078125, 9.1944580078125, 9.568115234375, 9.9417724609375, 10.3154296875, 10.6890869140625, 11.062744140625, 11.4364013671875, 11.81005859375, 12.1837158203125, 12.557373046875, 12.9310302734375, 13.3046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 6.0, 5.0, 12.0, 20.0, 23.0, 30.0, 50.0, 64.0, 90.0, 132.0, 211.0, 297.0, 400.0, 653.0, 964.0, 1497.0, 2394.0, 4014.0, 7198.0, 13382.0, 27502.0, 62777.0, 160610.0, 334359.0, 249446.0, 99055.0, 41184.0, 18807.0, 9579.0, 5324.0, 3015.0, 1892.0, 1199.0, 764.0, 521.0, 346.0, 249.0, 164.0, 90.0, 77.0, 46.0, 35.0, 13.0, 20.0, 15.0, 7.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-5.31640625, -5.154052734375, -4.99169921875, -4.829345703125, -4.6669921875, -4.504638671875, -4.34228515625, -4.179931640625, -4.017578125, -3.855224609375, -3.69287109375, -3.530517578125, -3.3681640625, -3.205810546875, -3.04345703125, -2.881103515625, -2.71875, -2.556396484375, -2.39404296875, -2.231689453125, -2.0693359375, -1.906982421875, -1.74462890625, -1.582275390625, -1.419921875, -1.257568359375, -1.09521484375, -0.932861328125, -0.7705078125, -0.608154296875, -0.44580078125, -0.283447265625, -0.12109375, 0.041259765625, 0.20361328125, 0.365966796875, 0.5283203125, 0.690673828125, 0.85302734375, 1.015380859375, 1.177734375, 1.340087890625, 1.50244140625, 1.664794921875, 1.8271484375, 1.989501953125, 2.15185546875, 2.314208984375, 2.4765625, 2.638916015625, 2.80126953125, 2.963623046875, 3.1259765625, 3.288330078125, 3.45068359375, 3.613037109375, 3.775390625, 3.937744140625, 4.10009765625, 4.262451171875, 4.4248046875, 4.587158203125, 4.74951171875, 4.911865234375, 5.07421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 6.0, 6.0, 6.0, 8.0, 12.0, 13.0, 11.0, 8.0, 9.0, 19.0, 18.0, 26.0, 21.0, 20.0, 33.0, 35.0, 29.0, 27.0, 32.0, 42.0, 39.0, 46.0, 35.0, 35.0, 38.0, 48.0, 41.0, 35.0, 23.0, 35.0, 28.0, 29.0, 23.0, 19.0, 21.0, 19.0, 22.0, 18.0, 13.0, 12.0, 8.0, 9.0, 11.0, 4.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.109375, -6.88604736328125, -6.6627197265625, -6.43939208984375, -6.216064453125, -5.99273681640625, -5.7694091796875, -5.54608154296875, -5.32275390625, -5.09942626953125, -4.8760986328125, -4.65277099609375, -4.429443359375, -4.20611572265625, -3.9827880859375, -3.75946044921875, -3.5361328125, -3.31280517578125, -3.0894775390625, -2.86614990234375, -2.642822265625, -2.41949462890625, -2.1961669921875, -1.97283935546875, -1.74951171875, -1.52618408203125, -1.3028564453125, -1.07952880859375, -0.856201171875, -0.63287353515625, -0.4095458984375, -0.18621826171875, 0.037109375, 0.26043701171875, 0.4837646484375, 0.70709228515625, 0.930419921875, 1.15374755859375, 1.3770751953125, 1.60040283203125, 1.82373046875, 2.04705810546875, 2.2703857421875, 2.49371337890625, 2.717041015625, 2.94036865234375, 3.1636962890625, 3.38702392578125, 3.6103515625, 3.83367919921875, 4.0570068359375, 4.28033447265625, 4.503662109375, 4.72698974609375, 4.9503173828125, 5.17364501953125, 5.39697265625, 5.62030029296875, 5.8436279296875, 6.06695556640625, 6.290283203125, 6.51361083984375, 6.7369384765625, 6.96026611328125, 7.18359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 9.0, 9.0, 13.0, 18.0, 29.0, 37.0, 45.0, 67.0, 107.0, 131.0, 213.0, 304.0, 458.0, 678.0, 1105.0, 1905.0, 3205.0, 5922.0, 11680.0, 28949.0, 89626.0, 372991.0, 382214.0, 92436.0, 29762.0, 12243.0, 5861.0, 3339.0, 1924.0, 1125.0, 666.0, 462.0, 330.0, 228.0, 150.0, 98.0, 72.0, 48.0, 28.0, 24.0, 14.0, 10.0, 8.0, 5.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.40234375, -2.322296142578125, -2.24224853515625, -2.162200927734375, -2.0821533203125, -2.002105712890625, -1.92205810546875, -1.842010498046875, -1.761962890625, -1.681915283203125, -1.60186767578125, -1.521820068359375, -1.4417724609375, -1.361724853515625, -1.28167724609375, -1.201629638671875, -1.12158203125, -1.041534423828125, -0.96148681640625, -0.881439208984375, -0.8013916015625, -0.721343994140625, -0.64129638671875, -0.561248779296875, -0.481201171875, -0.401153564453125, -0.32110595703125, -0.241058349609375, -0.1610107421875, -0.080963134765625, -0.00091552734375, 0.079132080078125, 0.1591796875, 0.239227294921875, 0.31927490234375, 0.399322509765625, 0.4793701171875, 0.559417724609375, 0.63946533203125, 0.719512939453125, 0.799560546875, 0.879608154296875, 0.95965576171875, 1.039703369140625, 1.1197509765625, 1.199798583984375, 1.27984619140625, 1.359893798828125, 1.43994140625, 1.519989013671875, 1.60003662109375, 1.680084228515625, 1.7601318359375, 1.840179443359375, 1.92022705078125, 2.000274658203125, 2.080322265625, 2.160369873046875, 2.24041748046875, 2.320465087890625, 2.4005126953125, 2.480560302734375, 2.56060791015625, 2.640655517578125, 2.720703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 0.0, 5.0, 13.0, 12.0, 27.0, 29.0, 60.0, 68.0, 120.0, 159.0, 178.0, 127.0, 74.0, 44.0, 31.0, 24.0, 5.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007534027099609375, -0.0007335394620895386, -0.0007136762142181396, -0.0006938129663467407, -0.0006739497184753418, -0.0006540864706039429, -0.0006342232227325439, -0.000614359974861145, -0.0005944967269897461, -0.0005746334791183472, -0.0005547702312469482, -0.0005349069833755493, -0.0005150437355041504, -0.0004951804876327515, -0.00047531723976135254, -0.0004554539918899536, -0.0004355907440185547, -0.00041572749614715576, -0.00039586424827575684, -0.0003760010004043579, -0.000356137752532959, -0.00033627450466156006, -0.00031641125679016113, -0.0002965480089187622, -0.0002766847610473633, -0.00025682151317596436, -0.00023695826530456543, -0.0002170950174331665, -0.00019723176956176758, -0.00017736852169036865, -0.00015750527381896973, -0.0001376420259475708, -0.00011777877807617188, -9.791553020477295e-05, -7.805228233337402e-05, -5.81890344619751e-05, -3.832578659057617e-05, -1.8462538719177246e-05, 1.4007091522216797e-06, 2.1263957023620605e-05, 4.112720489501953e-05, 6.099045276641846e-05, 8.085370063781738e-05, 0.00010071694850921631, 0.00012058019638061523, 0.00014044344425201416, 0.00016030669212341309, 0.000180169939994812, 0.00020003318786621094, 0.00021989643573760986, 0.0002397596836090088, 0.0002596229314804077, 0.00027948617935180664, 0.00029934942722320557, 0.0003192126750946045, 0.0003390759229660034, 0.00035893917083740234, 0.00037880241870880127, 0.0003986656665802002, 0.0004185289144515991, 0.00043839216232299805, 0.00045825541019439697, 0.0004781186580657959, 0.0004979819059371948, 0.0005178451538085938]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 9.0, 20.0, 23.0, 38.0, 48.0, 64.0, 108.0, 161.0, 233.0, 319.0, 423.0, 643.0, 918.0, 1456.0, 2217.0, 3476.0, 5437.0, 8732.0, 14285.0, 23550.0, 39339.0, 66598.0, 112433.0, 177447.0, 207007.0, 151934.0, 92477.0, 54991.0, 32252.0, 19640.0, 11754.0, 7255.0, 4576.0, 2923.0, 1945.0, 1184.0, 826.0, 559.0, 407.0, 274.0, 169.0, 131.0, 91.0, 61.0, 45.0, 33.0, 15.0, 13.0, 8.0, 4.0, 1.0, 1.0, 3.0], "bins": [-2.384765625, -2.317230224609375, -2.24969482421875, -2.182159423828125, -2.1146240234375, -2.047088623046875, -1.97955322265625, -1.912017822265625, -1.844482421875, -1.776947021484375, -1.70941162109375, -1.641876220703125, -1.5743408203125, -1.506805419921875, -1.43927001953125, -1.371734619140625, -1.30419921875, -1.236663818359375, -1.16912841796875, -1.101593017578125, -1.0340576171875, -0.966522216796875, -0.89898681640625, -0.831451416015625, -0.763916015625, -0.696380615234375, -0.62884521484375, -0.561309814453125, -0.4937744140625, -0.426239013671875, -0.35870361328125, -0.291168212890625, -0.2236328125, -0.156097412109375, -0.08856201171875, -0.021026611328125, 0.0465087890625, 0.114044189453125, 0.18157958984375, 0.249114990234375, 0.316650390625, 0.384185791015625, 0.45172119140625, 0.519256591796875, 0.5867919921875, 0.654327392578125, 0.72186279296875, 0.789398193359375, 0.85693359375, 0.924468994140625, 0.99200439453125, 1.059539794921875, 1.1270751953125, 1.194610595703125, 1.26214599609375, 1.329681396484375, 1.397216796875, 1.464752197265625, 1.53228759765625, 1.599822998046875, 1.6673583984375, 1.734893798828125, 1.80242919921875, 1.869964599609375, 1.9375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 12.0, 5.0, 9.0, 12.0, 21.0, 14.0, 14.0, 24.0, 37.0, 48.0, 44.0, 50.0, 85.0, 86.0, 83.0, 85.0, 69.0, 58.0, 43.0, 31.0, 26.0, 22.0, 22.0, 15.0, 15.0, 10.0, 11.0, 2.0, 5.0, 6.0, 8.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97265625, -0.9411468505859375, -0.909637451171875, -0.8781280517578125, -0.84661865234375, -0.8151092529296875, -0.783599853515625, -0.7520904541015625, -0.7205810546875, -0.6890716552734375, -0.657562255859375, -0.6260528564453125, -0.59454345703125, -0.5630340576171875, -0.531524658203125, -0.5000152587890625, -0.468505859375, -0.4369964599609375, -0.405487060546875, -0.3739776611328125, -0.34246826171875, -0.3109588623046875, -0.279449462890625, -0.2479400634765625, -0.2164306640625, -0.1849212646484375, -0.153411865234375, -0.1219024658203125, -0.09039306640625, -0.0588836669921875, -0.027374267578125, 0.0041351318359375, 0.03564453125, 0.0671539306640625, 0.098663330078125, 0.1301727294921875, 0.16168212890625, 0.1931915283203125, 0.224700927734375, 0.2562103271484375, 0.2877197265625, 0.3192291259765625, 0.350738525390625, 0.3822479248046875, 0.41375732421875, 0.4452667236328125, 0.476776123046875, 0.5082855224609375, 0.539794921875, 0.5713043212890625, 0.602813720703125, 0.6343231201171875, 0.66583251953125, 0.6973419189453125, 0.728851318359375, 0.7603607177734375, 0.7918701171875, 0.8233795166015625, 0.854888916015625, 0.8863983154296875, 0.91790771484375, 0.9494171142578125, 0.980926513671875, 1.0124359130859375, 1.0439453125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 12.0, 11.0, 17.0, 25.0, 17.0, 15.0, 23.0, 35.0, 34.0, 40.0, 37.0, 51.0, 39.0, 37.0, 43.0, 31.0, 46.0, 36.0, 42.0, 48.0, 41.0, 42.0, 26.0, 25.0, 28.0, 29.0, 23.0, 17.0, 19.0, 17.0, 9.0, 11.0, 14.0, 7.0, 5.0, 3.0, 4.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0], "bins": [-12.539216995239258, -12.17225456237793, -11.805293083190918, -11.43833065032959, -11.071369171142578, -10.70440673828125, -10.337444305419922, -9.970481872558594, -9.603520393371582, -9.236557960510254, -8.869596481323242, -8.502634048461914, -8.135671615600586, -7.768710136413574, -7.401747703552246, -7.034785747528076, -6.667823791503906, -6.300861835479736, -5.933899879455566, -5.566937446594238, -5.199975490570068, -4.833013534545898, -4.46605110168457, -4.0990891456604, -3.7321271896362305, -3.3651652336120605, -2.9982030391693115, -2.6312408447265625, -2.2642788887023926, -1.897316813468933, -1.5303547382354736, -1.1633925437927246, -0.7964305877685547, -0.4294685125350952, -0.06250643730163574, 0.30445563793182373, 0.6714177131652832, 1.0383797883987427, 1.4053418636322021, 1.7723040580749512, 2.139266014099121, 2.506227970123291, 2.87319016456604, 3.240152359008789, 3.607114315032959, 3.974076271057129, 4.341038703918457, 4.708000659942627, 5.074962615966797, 5.441924571990967, 5.808886528015137, 6.175848960876465, 6.542810916900635, 6.909772872924805, 7.276735305786133, 7.643697261810303, 8.010659217834473, 8.3776216506958, 8.744583129882812, 9.11154556274414, 9.478507995605469, 9.84546947479248, 10.212431907653809, 10.57939338684082, 10.946355819702148]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 5.0, 4.0, 5.0, 11.0, 7.0, 8.0, 13.0, 15.0, 17.0, 23.0, 27.0, 19.0, 24.0, 29.0, 28.0, 36.0, 47.0, 44.0, 44.0, 41.0, 48.0, 39.0, 38.0, 42.0, 41.0, 44.0, 45.0, 25.0, 37.0, 25.0, 38.0, 20.0, 21.0, 21.0, 16.0, 14.0, 14.0, 12.0, 8.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.687249183654785, -10.307353019714355, -9.927456855773926, -9.547560691833496, -9.167664527893066, -8.787768363952637, -8.40787124633789, -8.027975082397461, -7.6480793952941895, -7.26818323135376, -6.88828706741333, -6.508390426635742, -6.1284942626953125, -5.748598098754883, -5.368701934814453, -4.988805770874023, -4.608909606933594, -4.229013442993164, -3.8491172790527344, -3.4692208766937256, -3.089324712753296, -2.709428548812866, -2.3295321464538574, -1.9496359825134277, -1.569739818572998, -1.1898436546325684, -0.8099473714828491, -0.4300510883331299, -0.050154924392700195, 0.3297412395477295, 0.7096376419067383, 1.089533805847168, 1.4694290161132812, 1.849325180053711, 2.2292213439941406, 2.6091177463531494, 2.989013910293579, 3.368910074234009, 3.7488064765930176, 4.128702640533447, 4.508598804473877, 4.888494968414307, 5.268391132354736, 5.648287773132324, 6.028183937072754, 6.408080101013184, 6.787976264953613, 7.167872428894043, 7.547768592834473, 7.927664756774902, 8.307560920715332, 8.687457084655762, 9.067353248596191, 9.447249412536621, 9.827146530151367, 10.207042694091797, 10.586938858032227, 10.966835021972656, 11.346731185913086, 11.726627349853516, 12.106523513793945, 12.486419677734375, 12.866315841674805, 13.246212005615234, 13.626108169555664]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 11.0, 13.0, 19.0, 25.0, 39.0, 53.0, 74.0, 108.0, 186.0, 265.0, 467.0, 811.0, 1214.0, 1977.0, 3418.0, 5458.0, 8712.0, 13782.0, 20896.0, 30913.0, 43796.0, 59539.0, 76691.0, 91955.0, 103898.0, 108897.0, 104075.0, 93807.0, 77975.0, 61346.0, 45324.0, 32315.0, 21757.0, 14217.0, 9284.0, 5886.0, 3668.0, 2145.0, 1353.0, 808.0, 522.0, 305.0, 212.0, 115.0, 71.0, 56.0, 33.0, 26.0, 18.0, 8.0, 6.0, 7.0, 4.0, 2.0, 1.0], "bins": [-11.203125, -10.87890625, -10.5546875, -10.23046875, -9.90625, -9.58203125, -9.2578125, -8.93359375, -8.609375, -8.28515625, -7.9609375, -7.63671875, -7.3125, -6.98828125, -6.6640625, -6.33984375, -6.015625, -5.69140625, -5.3671875, -5.04296875, -4.71875, -4.39453125, -4.0703125, -3.74609375, -3.421875, -3.09765625, -2.7734375, -2.44921875, -2.125, -1.80078125, -1.4765625, -1.15234375, -0.828125, -0.50390625, -0.1796875, 0.14453125, 0.46875, 0.79296875, 1.1171875, 1.44140625, 1.765625, 2.08984375, 2.4140625, 2.73828125, 3.0625, 3.38671875, 3.7109375, 4.03515625, 4.359375, 4.68359375, 5.0078125, 5.33203125, 5.65625, 5.98046875, 6.3046875, 6.62890625, 6.953125, 7.27734375, 7.6015625, 7.92578125, 8.25, 8.57421875, 8.8984375, 9.22265625, 9.546875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 10.0, 7.0, 9.0, 13.0, 13.0, 19.0, 26.0, 23.0, 17.0, 30.0, 23.0, 30.0, 37.0, 46.0, 48.0, 39.0, 44.0, 48.0, 38.0, 39.0, 42.0, 35.0, 49.0, 45.0, 25.0, 38.0, 27.0, 34.0, 20.0, 21.0, 24.0, 12.0, 16.0, 15.0, 11.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3125, -9.9461669921875, -9.579833984375, -9.2135009765625, -8.84716796875, -8.4808349609375, -8.114501953125, -7.7481689453125, -7.3818359375, -7.0155029296875, -6.649169921875, -6.2828369140625, -5.91650390625, -5.5501708984375, -5.183837890625, -4.8175048828125, -4.451171875, -4.0848388671875, -3.718505859375, -3.3521728515625, -2.98583984375, -2.6195068359375, -2.253173828125, -1.8868408203125, -1.5205078125, -1.1541748046875, -0.787841796875, -0.4215087890625, -0.05517578125, 0.3111572265625, 0.677490234375, 1.0438232421875, 1.41015625, 1.7764892578125, 2.142822265625, 2.5091552734375, 2.87548828125, 3.2418212890625, 3.608154296875, 3.9744873046875, 4.3408203125, 4.7071533203125, 5.073486328125, 5.4398193359375, 5.80615234375, 6.1724853515625, 6.538818359375, 6.9051513671875, 7.271484375, 7.6378173828125, 8.004150390625, 8.3704833984375, 8.73681640625, 9.1031494140625, 9.469482421875, 9.8358154296875, 10.2021484375, 10.5684814453125, 10.934814453125, 11.3011474609375, 11.66748046875, 12.0338134765625, 12.400146484375, 12.7664794921875, 13.1328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 13.0, 23.0, 30.0, 50.0, 51.0, 94.0, 176.0, 245.0, 473.0, 756.0, 1221.0, 2062.0, 3409.0, 5653.0, 9222.0, 14325.0, 21971.0, 33208.0, 47064.0, 64107.0, 82762.0, 99171.0, 110079.0, 112245.0, 104931.0, 91195.0, 73872.0, 55841.0, 39707.0, 26912.0, 18086.0, 11511.0, 6990.0, 4323.0, 2704.0, 1595.0, 940.0, 588.0, 364.0, 202.0, 145.0, 82.0, 58.0, 29.0, 19.0, 15.0, 12.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.21875, -10.88134765625, -10.5439453125, -10.20654296875, -9.869140625, -9.53173828125, -9.1943359375, -8.85693359375, -8.51953125, -8.18212890625, -7.8447265625, -7.50732421875, -7.169921875, -6.83251953125, -6.4951171875, -6.15771484375, -5.8203125, -5.48291015625, -5.1455078125, -4.80810546875, -4.470703125, -4.13330078125, -3.7958984375, -3.45849609375, -3.12109375, -2.78369140625, -2.4462890625, -2.10888671875, -1.771484375, -1.43408203125, -1.0966796875, -0.75927734375, -0.421875, -0.08447265625, 0.2529296875, 0.59033203125, 0.927734375, 1.26513671875, 1.6025390625, 1.93994140625, 2.27734375, 2.61474609375, 2.9521484375, 3.28955078125, 3.626953125, 3.96435546875, 4.3017578125, 4.63916015625, 4.9765625, 5.31396484375, 5.6513671875, 5.98876953125, 6.326171875, 6.66357421875, 7.0009765625, 7.33837890625, 7.67578125, 8.01318359375, 8.3505859375, 8.68798828125, 9.025390625, 9.36279296875, 9.7001953125, 10.03759765625, 10.375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 5.0, 9.0, 11.0, 16.0, 15.0, 20.0, 17.0, 20.0, 23.0, 22.0, 25.0, 26.0, 35.0, 38.0, 38.0, 31.0, 53.0, 42.0, 51.0, 49.0, 48.0, 40.0, 40.0, 33.0, 35.0, 33.0, 26.0, 25.0, 29.0, 21.0, 5.0, 20.0, 15.0, 12.0, 19.0, 11.0, 6.0, 7.0, 6.0, 2.0, 5.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9609375, -5.7364501953125, -5.511962890625, -5.2874755859375, -5.06298828125, -4.8385009765625, -4.614013671875, -4.3895263671875, -4.1650390625, -3.9405517578125, -3.716064453125, -3.4915771484375, -3.26708984375, -3.0426025390625, -2.818115234375, -2.5936279296875, -2.369140625, -2.1446533203125, -1.920166015625, -1.6956787109375, -1.47119140625, -1.2467041015625, -1.022216796875, -0.7977294921875, -0.5732421875, -0.3487548828125, -0.124267578125, 0.1002197265625, 0.32470703125, 0.5491943359375, 0.773681640625, 0.9981689453125, 1.22265625, 1.4471435546875, 1.671630859375, 1.8961181640625, 2.12060546875, 2.3450927734375, 2.569580078125, 2.7940673828125, 3.0185546875, 3.2430419921875, 3.467529296875, 3.6920166015625, 3.91650390625, 4.1409912109375, 4.365478515625, 4.5899658203125, 4.814453125, 5.0389404296875, 5.263427734375, 5.4879150390625, 5.71240234375, 5.9368896484375, 6.161376953125, 6.3858642578125, 6.6103515625, 6.8348388671875, 7.059326171875, 7.2838134765625, 7.50830078125, 7.7327880859375, 7.957275390625, 8.1817626953125, 8.40625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 3.0, 8.0, 12.0, 19.0, 29.0, 30.0, 58.0, 67.0, 110.0, 195.0, 292.0, 454.0, 776.0, 1408.0, 2377.0, 4473.0, 8099.0, 14801.0, 26562.0, 46181.0, 76825.0, 115277.0, 151923.0, 166184.0, 149072.0, 110850.0, 72899.0, 43564.0, 24630.0, 13964.0, 7556.0, 4163.0, 2417.0, 1336.0, 779.0, 438.0, 276.0, 143.0, 118.0, 69.0, 42.0, 32.0, 18.0, 11.0, 4.0, 12.0, 4.0, 1.0, 1.0, 5.0], "bins": [-7.72265625, -7.51641845703125, -7.3101806640625, -7.10394287109375, -6.897705078125, -6.69146728515625, -6.4852294921875, -6.27899169921875, -6.07275390625, -5.86651611328125, -5.6602783203125, -5.45404052734375, -5.247802734375, -5.04156494140625, -4.8353271484375, -4.62908935546875, -4.4228515625, -4.21661376953125, -4.0103759765625, -3.80413818359375, -3.597900390625, -3.39166259765625, -3.1854248046875, -2.97918701171875, -2.77294921875, -2.56671142578125, -2.3604736328125, -2.15423583984375, -1.947998046875, -1.74176025390625, -1.5355224609375, -1.32928466796875, -1.123046875, -0.91680908203125, -0.7105712890625, -0.50433349609375, -0.298095703125, -0.09185791015625, 0.1143798828125, 0.32061767578125, 0.52685546875, 0.73309326171875, 0.9393310546875, 1.14556884765625, 1.351806640625, 1.55804443359375, 1.7642822265625, 1.97052001953125, 2.1767578125, 2.38299560546875, 2.5892333984375, 2.79547119140625, 3.001708984375, 3.20794677734375, 3.4141845703125, 3.62042236328125, 3.82666015625, 4.03289794921875, 4.2391357421875, 4.44537353515625, 4.651611328125, 4.85784912109375, 5.0640869140625, 5.27032470703125, 5.4765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 0.0, 0.0, 8.0, 5.0, 7.0, 6.0, 16.0, 14.0, 21.0, 30.0, 30.0, 36.0, 33.0, 34.0, 41.0, 36.0, 48.0, 51.0, 55.0, 56.0, 68.0, 63.0, 52.0, 54.0, 38.0, 44.0, 30.0, 23.0, 27.0, 25.0, 13.0, 7.0, 8.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007047653198242188, -0.0006809532642364502, -0.0006571412086486816, -0.0006333291530609131, -0.0006095170974731445, -0.000585705041885376, -0.0005618929862976074, -0.0005380809307098389, -0.0005142688751220703, -0.0004904568195343018, -0.0004666447639465332, -0.00044283270835876465, -0.0004190206527709961, -0.00039520859718322754, -0.000371396541595459, -0.00034758448600769043, -0.0003237724304199219, -0.0002999603748321533, -0.00027614831924438477, -0.0002523362636566162, -0.00022852420806884766, -0.0002047121524810791, -0.00018090009689331055, -0.000157088041305542, -0.00013327598571777344, -0.00010946393013000488, -8.565187454223633e-05, -6.183981895446777e-05, -3.802776336669922e-05, -1.4215707778930664e-05, 9.59634780883789e-06, 3.3408403396606445e-05, 5.7220458984375e-05, 8.103251457214355e-05, 0.00010484457015991211, 0.00012865662574768066, 0.00015246868133544922, 0.00017628073692321777, 0.00020009279251098633, 0.00022390484809875488, 0.00024771690368652344, 0.000271528959274292, 0.00029534101486206055, 0.0003191530704498291, 0.00034296512603759766, 0.0003667771816253662, 0.00039058923721313477, 0.0004144012928009033, 0.0004382133483886719, 0.00046202540397644043, 0.000485837459564209, 0.0005096495151519775, 0.0005334615707397461, 0.0005572736263275146, 0.0005810856819152832, 0.0006048977375030518, 0.0006287097930908203, 0.0006525218486785889, 0.0006763339042663574, 0.000700145959854126, 0.0007239580154418945, 0.0007477700710296631, 0.0007715821266174316, 0.0007953941822052002, 0.0008192062377929688]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 8.0, 8.0, 11.0, 20.0, 25.0, 28.0, 48.0, 92.0, 106.0, 177.0, 300.0, 375.0, 618.0, 944.0, 1455.0, 2319.0, 3597.0, 5533.0, 8714.0, 13892.0, 22127.0, 34432.0, 52479.0, 75988.0, 103239.0, 126217.0, 135748.0, 126598.0, 104909.0, 77845.0, 53495.0, 35235.0, 22720.0, 14353.0, 8972.0, 5753.0, 3573.0, 2267.0, 1495.0, 998.0, 616.0, 419.0, 264.0, 198.0, 110.0, 73.0, 64.0, 42.0, 20.0, 18.0, 12.0, 5.0, 4.0, 2.0, 3.0, 1.0], "bins": [-6.19140625, -6.0120849609375, -5.832763671875, -5.6534423828125, -5.47412109375, -5.2947998046875, -5.115478515625, -4.9361572265625, -4.7568359375, -4.5775146484375, -4.398193359375, -4.2188720703125, -4.03955078125, -3.8602294921875, -3.680908203125, -3.5015869140625, -3.322265625, -3.1429443359375, -2.963623046875, -2.7843017578125, -2.60498046875, -2.4256591796875, -2.246337890625, -2.0670166015625, -1.8876953125, -1.7083740234375, -1.529052734375, -1.3497314453125, -1.17041015625, -0.9910888671875, -0.811767578125, -0.6324462890625, -0.453125, -0.2738037109375, -0.094482421875, 0.0848388671875, 0.26416015625, 0.4434814453125, 0.622802734375, 0.8021240234375, 0.9814453125, 1.1607666015625, 1.340087890625, 1.5194091796875, 1.69873046875, 1.8780517578125, 2.057373046875, 2.2366943359375, 2.416015625, 2.5953369140625, 2.774658203125, 2.9539794921875, 3.13330078125, 3.3126220703125, 3.491943359375, 3.6712646484375, 3.8505859375, 4.0299072265625, 4.209228515625, 4.3885498046875, 4.56787109375, 4.7471923828125, 4.926513671875, 5.1058349609375, 5.28515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 7.0, 3.0, 1.0, 9.0, 2.0, 11.0, 15.0, 11.0, 13.0, 15.0, 19.0, 27.0, 23.0, 37.0, 36.0, 53.0, 48.0, 62.0, 59.0, 69.0, 69.0, 62.0, 48.0, 36.0, 43.0, 33.0, 29.0, 30.0, 24.0, 21.0, 19.0, 16.0, 12.0, 8.0, 5.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.6953125, -2.61627197265625, -2.5372314453125, -2.45819091796875, -2.379150390625, -2.30010986328125, -2.2210693359375, -2.14202880859375, -2.06298828125, -1.98394775390625, -1.9049072265625, -1.82586669921875, -1.746826171875, -1.66778564453125, -1.5887451171875, -1.50970458984375, -1.4306640625, -1.35162353515625, -1.2725830078125, -1.19354248046875, -1.114501953125, -1.03546142578125, -0.9564208984375, -0.87738037109375, -0.79833984375, -0.71929931640625, -0.6402587890625, -0.56121826171875, -0.482177734375, -0.40313720703125, -0.3240966796875, -0.24505615234375, -0.166015625, -0.08697509765625, -0.0079345703125, 0.07110595703125, 0.150146484375, 0.22918701171875, 0.3082275390625, 0.38726806640625, 0.46630859375, 0.54534912109375, 0.6243896484375, 0.70343017578125, 0.782470703125, 0.86151123046875, 0.9405517578125, 1.01959228515625, 1.0986328125, 1.17767333984375, 1.2567138671875, 1.33575439453125, 1.414794921875, 1.49383544921875, 1.5728759765625, 1.65191650390625, 1.73095703125, 1.80999755859375, 1.8890380859375, 1.96807861328125, 2.047119140625, 2.12615966796875, 2.2052001953125, 2.28424072265625, 2.36328125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 10.0, 11.0, 19.0, 17.0, 18.0, 24.0, 23.0, 28.0, 38.0, 42.0, 44.0, 40.0, 47.0, 41.0, 37.0, 39.0, 42.0, 56.0, 42.0, 42.0, 28.0, 37.0, 38.0, 25.0, 26.0, 38.0, 18.0, 11.0, 18.0, 11.0, 12.0, 11.0, 9.0, 12.0, 3.0, 6.0, 4.0, 2.0, 5.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.75565242767334, -11.380942344665527, -11.006231307983398, -10.631521224975586, -10.256810188293457, -9.882100105285645, -9.507389068603516, -9.132678985595703, -8.75796890258789, -8.383258819580078, -8.00854778289795, -7.633837699890137, -7.259126663208008, -6.884416580200195, -6.509706020355225, -6.134995460510254, -5.760284423828125, -5.385573863983154, -5.010863304138184, -4.636153221130371, -4.261442184448242, -3.8867318630218506, -3.512021541595459, -3.1373109817504883, -2.7626004219055176, -2.387889862060547, -2.013179302215576, -1.6384689807891846, -1.2637584209442139, -0.8890478610992432, -0.5143375396728516, -0.13962697982788086, 0.23508453369140625, 0.6097950339317322, 0.9845055341720581, 1.3592159748077393, 1.73392653465271, 2.1086370944976807, 2.4833474159240723, 2.858057975769043, 3.2327685356140137, 3.6074790954589844, 3.982189655303955, 4.356900215148926, 4.731610298156738, 5.106321334838867, 5.48103141784668, 5.85574197769165, 6.230452537536621, 6.605163097381592, 6.9798736572265625, 7.354583740234375, 7.729294776916504, 8.104004859924316, 8.478715896606445, 8.853425979614258, 9.22813606262207, 9.602846145629883, 9.977557182312012, 10.352267265319824, 10.726978302001953, 11.101688385009766, 11.476398468017578, 11.851109504699707, 12.225820541381836]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 1.0, 2.0, 3.0, 10.0, 7.0, 8.0, 8.0, 11.0, 4.0, 19.0, 15.0, 25.0, 15.0, 29.0, 25.0, 37.0, 28.0, 25.0, 43.0, 41.0, 34.0, 35.0, 37.0, 38.0, 41.0, 36.0, 35.0, 29.0, 34.0, 30.0, 36.0, 39.0, 30.0, 22.0, 23.0, 20.0, 19.0, 24.0, 20.0, 10.0, 16.0, 9.0, 8.0, 9.0, 5.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.271442413330078, -10.927652359008789, -10.5838623046875, -10.240072250366211, -9.896282196044922, -9.552492141723633, -9.208702087402344, -8.864912033081055, -8.521121978759766, -8.177331924438477, -7.8335418701171875, -7.489751815795898, -7.145961761474609, -6.80217170715332, -6.458381652832031, -6.114591598510742, -5.770801544189453, -5.427011489868164, -5.083221435546875, -4.739431381225586, -4.395641326904297, -4.051851272583008, -3.7080612182617188, -3.3642711639404297, -3.0204811096191406, -2.6766910552978516, -2.3329010009765625, -1.9891109466552734, -1.6453208923339844, -1.3015308380126953, -0.9577407836914062, -0.6139507293701172, -0.27016162872314453, 0.07362842559814453, 0.4174184799194336, 0.7612085342407227, 1.1049985885620117, 1.4487886428833008, 1.7925786972045898, 2.136368751525879, 2.480158805847168, 2.823948860168457, 3.167738914489746, 3.511528968811035, 3.855319023132324, 4.199109077453613, 4.542899131774902, 4.886689186096191, 5.2304792404174805, 5.5742692947387695, 5.918059349060059, 6.261849403381348, 6.605639457702637, 6.949429512023926, 7.293219566345215, 7.637009620666504, 7.980799674987793, 8.324589729309082, 8.668379783630371, 9.01216983795166, 9.35595989227295, 9.699749946594238, 10.043540000915527, 10.387330055236816, 10.731120109558105]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 6.0, 7.0, 16.0, 23.0, 38.0, 57.0, 117.0, 178.0, 341.0, 518.0, 824.0, 1407.0, 2215.0, 3520.0, 5686.0, 8976.0, 14222.0, 21990.0, 34111.0, 50951.0, 77572.0, 112649.0, 159089.0, 216686.0, 283796.0, 349883.0, 402281.0, 429691.0, 423645.0, 385270.0, 325106.0, 259014.0, 194413.0, 141038.0, 97741.0, 66448.0, 44517.0, 29021.0, 18476.0, 12214.0, 7477.0, 4918.0, 3004.0, 1999.0, 1186.0, 738.0, 441.0, 308.0, 191.0, 107.0, 68.0, 40.0, 27.0, 13.0, 5.0, 10.0, 7.0, 3.0, 0.0, 2.0, 2.0], "bins": [-8.0390625, -7.7781982421875, -7.517333984375, -7.2564697265625, -6.99560546875, -6.7347412109375, -6.473876953125, -6.2130126953125, -5.9521484375, -5.6912841796875, -5.430419921875, -5.1695556640625, -4.90869140625, -4.6478271484375, -4.386962890625, -4.1260986328125, -3.865234375, -3.6043701171875, -3.343505859375, -3.0826416015625, -2.82177734375, -2.5609130859375, -2.300048828125, -2.0391845703125, -1.7783203125, -1.5174560546875, -1.256591796875, -0.9957275390625, -0.73486328125, -0.4739990234375, -0.213134765625, 0.0477294921875, 0.30859375, 0.5694580078125, 0.830322265625, 1.0911865234375, 1.35205078125, 1.6129150390625, 1.873779296875, 2.1346435546875, 2.3955078125, 2.6563720703125, 2.917236328125, 3.1781005859375, 3.43896484375, 3.6998291015625, 3.960693359375, 4.2215576171875, 4.482421875, 4.7432861328125, 5.004150390625, 5.2650146484375, 5.52587890625, 5.7867431640625, 6.047607421875, 6.3084716796875, 6.5693359375, 6.8302001953125, 7.091064453125, 7.3519287109375, 7.61279296875, 7.8736572265625, 8.134521484375, 8.3953857421875, 8.65625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 6.0, 6.0, 9.0, 9.0, 9.0, 8.0, 16.0, 12.0, 17.0, 23.0, 23.0, 33.0, 34.0, 28.0, 28.0, 36.0, 44.0, 37.0, 34.0, 38.0, 41.0, 29.0, 47.0, 34.0, 35.0, 27.0, 35.0, 35.0, 40.0, 26.0, 24.0, 30.0, 15.0, 26.0, 22.0, 15.0, 13.0, 13.0, 9.0, 6.0, 11.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.59375, -9.2940673828125, -8.994384765625, -8.6947021484375, -8.39501953125, -8.0953369140625, -7.795654296875, -7.4959716796875, -7.1962890625, -6.8966064453125, -6.596923828125, -6.2972412109375, -5.99755859375, -5.6978759765625, -5.398193359375, -5.0985107421875, -4.798828125, -4.4991455078125, -4.199462890625, -3.8997802734375, -3.60009765625, -3.3004150390625, -3.000732421875, -2.7010498046875, -2.4013671875, -2.1016845703125, -1.802001953125, -1.5023193359375, -1.20263671875, -0.9029541015625, -0.603271484375, -0.3035888671875, -0.00390625, 0.2957763671875, 0.595458984375, 0.8951416015625, 1.19482421875, 1.4945068359375, 1.794189453125, 2.0938720703125, 2.3935546875, 2.6932373046875, 2.992919921875, 3.2926025390625, 3.59228515625, 3.8919677734375, 4.191650390625, 4.4913330078125, 4.791015625, 5.0906982421875, 5.390380859375, 5.6900634765625, 5.98974609375, 6.2894287109375, 6.589111328125, 6.8887939453125, 7.1884765625, 7.4881591796875, 7.787841796875, 8.0875244140625, 8.38720703125, 8.6868896484375, 8.986572265625, 9.2862548828125, 9.5859375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 4.0, 8.0, 7.0, 18.0, 34.0, 50.0, 95.0, 169.0, 302.0, 524.0, 814.0, 1572.0, 2503.0, 4215.0, 6793.0, 11221.0, 17746.0, 28461.0, 43962.0, 65571.0, 96943.0, 137298.0, 187169.0, 245832.0, 305945.0, 359379.0, 396531.0, 408785.0, 393248.0, 355215.0, 298827.0, 239920.0, 182346.0, 132295.0, 93486.0, 63602.0, 42353.0, 27202.0, 17025.0, 10692.0, 6538.0, 3920.0, 2306.0, 1373.0, 844.0, 469.0, 285.0, 151.0, 99.0, 76.0, 32.0, 19.0, 13.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.7265625, -8.4490966796875, -8.171630859375, -7.8941650390625, -7.61669921875, -7.3392333984375, -7.061767578125, -6.7843017578125, -6.5068359375, -6.2293701171875, -5.951904296875, -5.6744384765625, -5.39697265625, -5.1195068359375, -4.842041015625, -4.5645751953125, -4.287109375, -4.0096435546875, -3.732177734375, -3.4547119140625, -3.17724609375, -2.8997802734375, -2.622314453125, -2.3448486328125, -2.0673828125, -1.7899169921875, -1.512451171875, -1.2349853515625, -0.95751953125, -0.6800537109375, -0.402587890625, -0.1251220703125, 0.15234375, 0.4298095703125, 0.707275390625, 0.9847412109375, 1.26220703125, 1.5396728515625, 1.817138671875, 2.0946044921875, 2.3720703125, 2.6495361328125, 2.927001953125, 3.2044677734375, 3.48193359375, 3.7593994140625, 4.036865234375, 4.3143310546875, 4.591796875, 4.8692626953125, 5.146728515625, 5.4241943359375, 5.70166015625, 5.9791259765625, 6.256591796875, 6.5340576171875, 6.8115234375, 7.0889892578125, 7.366455078125, 7.6439208984375, 7.92138671875, 8.1988525390625, 8.476318359375, 8.7537841796875, 9.03125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 7.0, 9.0, 15.0, 16.0, 12.0, 17.0, 29.0, 33.0, 54.0, 60.0, 64.0, 98.0, 101.0, 117.0, 114.0, 153.0, 149.0, 169.0, 183.0, 189.0, 181.0, 222.0, 220.0, 196.0, 175.0, 187.0, 159.0, 145.0, 158.0, 154.0, 127.0, 81.0, 83.0, 86.0, 69.0, 58.0, 29.0, 23.0, 30.0, 20.0, 20.0, 15.0, 16.0, 10.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0], "bins": [-4.765625, -4.62213134765625, -4.4786376953125, -4.33514404296875, -4.191650390625, -4.04815673828125, -3.9046630859375, -3.76116943359375, -3.61767578125, -3.47418212890625, -3.3306884765625, -3.18719482421875, -3.043701171875, -2.90020751953125, -2.7567138671875, -2.61322021484375, -2.4697265625, -2.32623291015625, -2.1827392578125, -2.03924560546875, -1.895751953125, -1.75225830078125, -1.6087646484375, -1.46527099609375, -1.32177734375, -1.17828369140625, -1.0347900390625, -0.89129638671875, -0.747802734375, -0.60430908203125, -0.4608154296875, -0.31732177734375, -0.173828125, -0.03033447265625, 0.1131591796875, 0.25665283203125, 0.400146484375, 0.54364013671875, 0.6871337890625, 0.83062744140625, 0.97412109375, 1.11761474609375, 1.2611083984375, 1.40460205078125, 1.548095703125, 1.69158935546875, 1.8350830078125, 1.97857666015625, 2.1220703125, 2.26556396484375, 2.4090576171875, 2.55255126953125, 2.696044921875, 2.83953857421875, 2.9830322265625, 3.12652587890625, 3.27001953125, 3.41351318359375, 3.5570068359375, 3.70050048828125, 3.843994140625, 3.98748779296875, 4.1309814453125, 4.27447509765625, 4.41796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 10.0, 7.0, 11.0, 15.0, 25.0, 21.0, 21.0, 25.0, 33.0, 33.0, 44.0, 45.0, 46.0, 42.0, 52.0, 50.0, 55.0, 58.0, 46.0, 48.0, 38.0, 35.0, 32.0, 31.0, 30.0, 27.0, 15.0, 19.0, 14.0, 18.0, 14.0, 8.0, 4.0, 5.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.280447006225586, -14.832430839538574, -14.384414672851562, -13.936399459838867, -13.488383293151855, -13.040367126464844, -12.592350959777832, -12.14433479309082, -11.696318626403809, -11.248302459716797, -10.800286293029785, -10.352270126342773, -9.904254913330078, -9.456238746643066, -9.008222579956055, -8.560206413269043, -8.112190246582031, -7.6641740798950195, -7.216158390045166, -6.768142223358154, -6.320126056671143, -5.872110366821289, -5.424094200134277, -4.976078033447266, -4.52806282043457, -4.080046653747559, -3.632030725479126, -3.1840147972106934, -2.7359986305236816, -2.287982702255249, -1.8399667739868164, -1.3919506072998047, -0.943934440612793, -0.4959184229373932, -0.04790240526199341, 0.400113582611084, 0.8481296300888062, 1.2961456775665283, 1.744161605834961, 2.1921777725219727, 2.6401937007904053, 3.088209629058838, 3.5362257957458496, 3.9842417240142822, 4.432257652282715, 4.880273818969727, 5.328289985656738, 5.77630615234375, 6.2243218421936035, 6.672338008880615, 7.120353698730469, 7.5683698654174805, 8.016386032104492, 8.464402198791504, 8.912418365478516, 9.360433578491211, 9.808449745178223, 10.256465911865234, 10.704482078552246, 11.152498245239258, 11.600513458251953, 12.048529624938965, 12.496545791625977, 12.944561958312988, 13.392578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 8.0, 11.0, 5.0, 11.0, 12.0, 11.0, 12.0, 15.0, 16.0, 22.0, 20.0, 28.0, 29.0, 39.0, 25.0, 29.0, 32.0, 33.0, 34.0, 25.0, 34.0, 37.0, 27.0, 43.0, 36.0, 30.0, 34.0, 31.0, 42.0, 29.0, 33.0, 35.0, 20.0, 28.0, 13.0, 10.0, 13.0, 15.0, 12.0, 11.0, 6.0, 8.0, 7.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0], "bins": [-11.690108299255371, -11.369203567504883, -11.048298835754395, -10.727394104003906, -10.406488418579102, -10.085583686828613, -9.764678955078125, -9.443774223327637, -9.122869491577148, -8.80196475982666, -8.481060028076172, -8.160155296325684, -7.839250087738037, -7.518345355987549, -7.197440147399902, -6.876535415649414, -6.555630683898926, -6.2347259521484375, -5.913821220397949, -5.592916011810303, -5.2720112800598145, -4.951106548309326, -4.63020133972168, -4.309296607971191, -3.988391876220703, -3.667487144470215, -3.3465821743011475, -3.02567720413208, -2.704772472381592, -2.3838677406311035, -2.062962770462036, -1.7420578002929688, -1.421152114868164, -1.1002472639083862, -0.7793424129486084, -0.45843756198883057, -0.13753271102905273, 0.1833721399307251, 0.5042769908905029, 0.8251819610595703, 1.1460866928100586, 1.4669915437698364, 1.7878963947296143, 2.1088013648986816, 2.42970609664917, 2.750610828399658, 3.0715157985687256, 3.392420768737793, 3.7133255004882812, 4.0342302322387695, 4.355134963989258, 4.676040172576904, 4.996944904327393, 5.317849636077881, 5.638754844665527, 5.959659576416016, 6.280564308166504, 6.601469039916992, 6.9223737716674805, 7.243278980255127, 7.564183712005615, 7.8850884437561035, 8.20599365234375, 8.526898384094238, 8.847803115844727]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 11.0, 6.0, 9.0, 23.0, 28.0, 50.0, 50.0, 76.0, 105.0, 174.0, 222.0, 372.0, 530.0, 798.0, 1312.0, 2044.0, 3258.0, 5196.0, 8333.0, 13325.0, 22034.0, 35516.0, 58495.0, 94247.0, 143054.0, 178797.0, 165225.0, 119475.0, 75721.0, 45879.0, 28177.0, 17335.0, 10574.0, 6613.0, 4127.0, 2605.0, 1639.0, 1097.0, 656.0, 430.0, 304.0, 199.0, 132.0, 76.0, 53.0, 58.0, 38.0, 23.0, 14.0, 16.0, 10.0, 8.0, 5.0, 5.0, 2.0, 3.0], "bins": [-4.0625, -3.942169189453125, -3.82183837890625, -3.701507568359375, -3.5811767578125, -3.460845947265625, -3.34051513671875, -3.220184326171875, -3.099853515625, -2.979522705078125, -2.85919189453125, -2.738861083984375, -2.6185302734375, -2.498199462890625, -2.37786865234375, -2.257537841796875, -2.13720703125, -2.016876220703125, -1.89654541015625, -1.776214599609375, -1.6558837890625, -1.535552978515625, -1.41522216796875, -1.294891357421875, -1.174560546875, -1.054229736328125, -0.93389892578125, -0.813568115234375, -0.6932373046875, -0.572906494140625, -0.45257568359375, -0.332244873046875, -0.2119140625, -0.091583251953125, 0.02874755859375, 0.149078369140625, 0.2694091796875, 0.389739990234375, 0.51007080078125, 0.630401611328125, 0.750732421875, 0.871063232421875, 0.99139404296875, 1.111724853515625, 1.2320556640625, 1.352386474609375, 1.47271728515625, 1.593048095703125, 1.71337890625, 1.833709716796875, 1.95404052734375, 2.074371337890625, 2.1947021484375, 2.315032958984375, 2.43536376953125, 2.555694580078125, 2.676025390625, 2.796356201171875, 2.91668701171875, 3.037017822265625, 3.1573486328125, 3.277679443359375, 3.39801025390625, 3.518341064453125, 3.638671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 7.0, 12.0, 3.0, 14.0, 10.0, 11.0, 14.0, 15.0, 14.0, 21.0, 22.0, 29.0, 29.0, 40.0, 26.0, 24.0, 35.0, 33.0, 34.0, 24.0, 34.0, 39.0, 31.0, 40.0, 34.0, 32.0, 37.0, 26.0, 45.0, 26.0, 36.0, 33.0, 25.0, 23.0, 11.0, 11.0, 13.0, 14.0, 14.0, 8.0, 6.0, 9.0, 7.0, 5.0, 8.0, 3.0, 4.0, 2.0, 2.0], "bins": [-11.6953125, -11.37451171875, -11.0537109375, -10.73291015625, -10.412109375, -10.09130859375, -9.7705078125, -9.44970703125, -9.12890625, -8.80810546875, -8.4873046875, -8.16650390625, -7.845703125, -7.52490234375, -7.2041015625, -6.88330078125, -6.5625, -6.24169921875, -5.9208984375, -5.60009765625, -5.279296875, -4.95849609375, -4.6376953125, -4.31689453125, -3.99609375, -3.67529296875, -3.3544921875, -3.03369140625, -2.712890625, -2.39208984375, -2.0712890625, -1.75048828125, -1.4296875, -1.10888671875, -0.7880859375, -0.46728515625, -0.146484375, 0.17431640625, 0.4951171875, 0.81591796875, 1.13671875, 1.45751953125, 1.7783203125, 2.09912109375, 2.419921875, 2.74072265625, 3.0615234375, 3.38232421875, 3.703125, 4.02392578125, 4.3447265625, 4.66552734375, 4.986328125, 5.30712890625, 5.6279296875, 5.94873046875, 6.26953125, 6.59033203125, 6.9111328125, 7.23193359375, 7.552734375, 7.87353515625, 8.1943359375, 8.51513671875, 8.8359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 7.0, 7.0, 18.0, 20.0, 26.0, 43.0, 57.0, 76.0, 92.0, 132.0, 188.0, 248.0, 346.0, 517.0, 739.0, 1016.0, 1612.0, 2494.0, 3705.0, 5958.0, 10004.0, 17169.0, 31081.0, 59297.0, 116529.0, 213080.0, 248031.0, 157518.0, 80559.0, 41597.0, 22604.0, 12604.0, 7533.0, 4612.0, 2995.0, 1950.0, 1245.0, 838.0, 575.0, 404.0, 302.0, 191.0, 129.0, 104.0, 79.0, 52.0, 60.0, 42.0, 29.0, 14.0, 11.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-3.552734375, -3.4425048828125, -3.332275390625, -3.2220458984375, -3.11181640625, -3.0015869140625, -2.891357421875, -2.7811279296875, -2.6708984375, -2.5606689453125, -2.450439453125, -2.3402099609375, -2.22998046875, -2.1197509765625, -2.009521484375, -1.8992919921875, -1.7890625, -1.6788330078125, -1.568603515625, -1.4583740234375, -1.34814453125, -1.2379150390625, -1.127685546875, -1.0174560546875, -0.9072265625, -0.7969970703125, -0.686767578125, -0.5765380859375, -0.46630859375, -0.3560791015625, -0.245849609375, -0.1356201171875, -0.025390625, 0.0848388671875, 0.195068359375, 0.3052978515625, 0.41552734375, 0.5257568359375, 0.635986328125, 0.7462158203125, 0.8564453125, 0.9666748046875, 1.076904296875, 1.1871337890625, 1.29736328125, 1.4075927734375, 1.517822265625, 1.6280517578125, 1.73828125, 1.8485107421875, 1.958740234375, 2.0689697265625, 2.17919921875, 2.2894287109375, 2.399658203125, 2.5098876953125, 2.6201171875, 2.7303466796875, 2.840576171875, 2.9508056640625, 3.06103515625, 3.1712646484375, 3.281494140625, 3.3917236328125, 3.501953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 6.0, 6.0, 4.0, 4.0, 8.0, 12.0, 11.0, 20.0, 21.0, 15.0, 18.0, 31.0, 31.0, 18.0, 46.0, 31.0, 36.0, 39.0, 32.0, 37.0, 45.0, 39.0, 38.0, 53.0, 47.0, 34.0, 41.0, 39.0, 30.0, 37.0, 28.0, 26.0, 23.0, 12.0, 22.0, 10.0, 13.0, 12.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.5625, -7.32177734375, -7.0810546875, -6.84033203125, -6.599609375, -6.35888671875, -6.1181640625, -5.87744140625, -5.63671875, -5.39599609375, -5.1552734375, -4.91455078125, -4.673828125, -4.43310546875, -4.1923828125, -3.95166015625, -3.7109375, -3.47021484375, -3.2294921875, -2.98876953125, -2.748046875, -2.50732421875, -2.2666015625, -2.02587890625, -1.78515625, -1.54443359375, -1.3037109375, -1.06298828125, -0.822265625, -0.58154296875, -0.3408203125, -0.10009765625, 0.140625, 0.38134765625, 0.6220703125, 0.86279296875, 1.103515625, 1.34423828125, 1.5849609375, 1.82568359375, 2.06640625, 2.30712890625, 2.5478515625, 2.78857421875, 3.029296875, 3.27001953125, 3.5107421875, 3.75146484375, 3.9921875, 4.23291015625, 4.4736328125, 4.71435546875, 4.955078125, 5.19580078125, 5.4365234375, 5.67724609375, 5.91796875, 6.15869140625, 6.3994140625, 6.64013671875, 6.880859375, 7.12158203125, 7.3623046875, 7.60302734375, 7.84375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 5.0, 11.0, 14.0, 20.0, 34.0, 36.0, 49.0, 73.0, 117.0, 180.0, 232.0, 407.0, 555.0, 880.0, 1455.0, 2362.0, 4212.0, 7926.0, 15507.0, 37222.0, 113548.0, 422341.0, 305092.0, 79444.0, 28051.0, 12844.0, 6480.0, 3614.0, 2116.0, 1250.0, 852.0, 566.0, 350.0, 198.0, 149.0, 86.0, 84.0, 51.0, 46.0, 21.0, 17.0, 19.0, 10.0, 12.0, 3.0, 5.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-2.40234375, -2.3292236328125, -2.256103515625, -2.1829833984375, -2.10986328125, -2.0367431640625, -1.963623046875, -1.8905029296875, -1.8173828125, -1.7442626953125, -1.671142578125, -1.5980224609375, -1.52490234375, -1.4517822265625, -1.378662109375, -1.3055419921875, -1.232421875, -1.1593017578125, -1.086181640625, -1.0130615234375, -0.93994140625, -0.8668212890625, -0.793701171875, -0.7205810546875, -0.6474609375, -0.5743408203125, -0.501220703125, -0.4281005859375, -0.35498046875, -0.2818603515625, -0.208740234375, -0.1356201171875, -0.0625, 0.0106201171875, 0.083740234375, 0.1568603515625, 0.22998046875, 0.3031005859375, 0.376220703125, 0.4493408203125, 0.5224609375, 0.5955810546875, 0.668701171875, 0.7418212890625, 0.81494140625, 0.8880615234375, 0.961181640625, 1.0343017578125, 1.107421875, 1.1805419921875, 1.253662109375, 1.3267822265625, 1.39990234375, 1.4730224609375, 1.546142578125, 1.6192626953125, 1.6923828125, 1.7655029296875, 1.838623046875, 1.9117431640625, 1.98486328125, 2.0579833984375, 2.131103515625, 2.2042236328125, 2.27734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 8.0, 8.0, 15.0, 13.0, 23.0, 37.0, 40.0, 30.0, 65.0, 54.0, 71.0, 69.0, 77.0, 87.0, 61.0, 54.0, 55.0, 45.0, 34.0, 31.0, 23.0, 22.0, 13.0, 14.0, 14.0, 8.0, 5.0, 7.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002162456512451172, -0.00020839646458625793, -0.00020054727792739868, -0.00019269809126853943, -0.00018484890460968018, -0.00017699971795082092, -0.00016915053129196167, -0.00016130134463310242, -0.00015345215797424316, -0.0001456029713153839, -0.00013775378465652466, -0.0001299045979976654, -0.00012205541133880615, -0.0001142062246799469, -0.00010635703802108765, -9.85078513622284e-05, -9.065866470336914e-05, -8.280947804450989e-05, -7.496029138565063e-05, -6.711110472679138e-05, -5.926191806793213e-05, -5.1412731409072876e-05, -4.356354475021362e-05, -3.571435809135437e-05, -2.7865171432495117e-05, -2.0015984773635864e-05, -1.2166798114776611e-05, -4.317611455917358e-06, 3.5315752029418945e-06, 1.1380761861801147e-05, 1.92299485206604e-05, 2.7079135179519653e-05, 3.4928321838378906e-05, 4.277750849723816e-05, 5.062669515609741e-05, 5.8475881814956665e-05, 6.632506847381592e-05, 7.417425513267517e-05, 8.202344179153442e-05, 8.987262845039368e-05, 9.772181510925293e-05, 0.00010557100176811218, 0.00011342018842697144, 0.00012126937508583069, 0.00012911856174468994, 0.0001369677484035492, 0.00014481693506240845, 0.0001526661217212677, 0.00016051530838012695, 0.0001683644950389862, 0.00017621368169784546, 0.0001840628683567047, 0.00019191205501556396, 0.00019976124167442322, 0.00020761042833328247, 0.00021545961499214172, 0.00022330880165100098, 0.00023115798830986023, 0.00023900717496871948, 0.00024685636162757874, 0.000254705548286438, 0.00026255473494529724, 0.0002704039216041565, 0.00027825310826301575, 0.000286102294921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 4.0, 3.0, 5.0, 15.0, 15.0, 30.0, 32.0, 39.0, 65.0, 90.0, 155.0, 204.0, 299.0, 405.0, 635.0, 875.0, 1148.0, 1856.0, 2664.0, 3960.0, 5755.0, 8466.0, 12807.0, 19184.0, 29778.0, 45329.0, 69338.0, 103702.0, 148486.0, 171850.0, 139421.0, 95676.0, 63282.0, 41390.0, 27062.0, 17938.0, 11767.0, 7801.0, 5385.0, 3650.0, 2524.0, 1689.0, 1166.0, 837.0, 544.0, 394.0, 265.0, 178.0, 135.0, 85.0, 58.0, 39.0, 28.0, 14.0, 11.0, 13.0, 5.0, 5.0, 4.0, 3.0, 6.0], "bins": [-1.708984375, -1.6562347412109375, -1.603485107421875, -1.5507354736328125, -1.49798583984375, -1.4452362060546875, -1.392486572265625, -1.3397369384765625, -1.2869873046875, -1.2342376708984375, -1.181488037109375, -1.1287384033203125, -1.07598876953125, -1.0232391357421875, -0.970489501953125, -0.9177398681640625, -0.864990234375, -0.8122406005859375, -0.759490966796875, -0.7067413330078125, -0.65399169921875, -0.6012420654296875, -0.548492431640625, -0.4957427978515625, -0.4429931640625, -0.3902435302734375, -0.337493896484375, -0.2847442626953125, -0.23199462890625, -0.1792449951171875, -0.126495361328125, -0.0737457275390625, -0.02099609375, 0.0317535400390625, 0.084503173828125, 0.1372528076171875, 0.19000244140625, 0.2427520751953125, 0.295501708984375, 0.3482513427734375, 0.4010009765625, 0.4537506103515625, 0.506500244140625, 0.5592498779296875, 0.61199951171875, 0.6647491455078125, 0.717498779296875, 0.7702484130859375, 0.822998046875, 0.8757476806640625, 0.928497314453125, 0.9812469482421875, 1.03399658203125, 1.0867462158203125, 1.139495849609375, 1.1922454833984375, 1.2449951171875, 1.2977447509765625, 1.350494384765625, 1.4032440185546875, 1.45599365234375, 1.5087432861328125, 1.561492919921875, 1.6142425537109375, 1.6669921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 1.0, 4.0, 12.0, 17.0, 13.0, 12.0, 14.0, 20.0, 17.0, 18.0, 34.0, 26.0, 50.0, 33.0, 31.0, 44.0, 47.0, 54.0, 66.0, 69.0, 53.0, 43.0, 51.0, 37.0, 30.0, 33.0, 28.0, 17.0, 11.0, 13.0, 16.0, 10.0, 9.0, 14.0, 12.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.7548828125, -0.7310409545898438, -0.7071990966796875, -0.6833572387695312, -0.659515380859375, -0.6356735229492188, -0.6118316650390625, -0.5879898071289062, -0.56414794921875, -0.5403060913085938, -0.5164642333984375, -0.49262237548828125, -0.468780517578125, -0.44493865966796875, -0.4210968017578125, -0.39725494384765625, -0.3734130859375, -0.34957122802734375, -0.3257293701171875, -0.30188751220703125, -0.278045654296875, -0.25420379638671875, -0.2303619384765625, -0.20652008056640625, -0.18267822265625, -0.15883636474609375, -0.1349945068359375, -0.11115264892578125, -0.087310791015625, -0.06346893310546875, -0.0396270751953125, -0.01578521728515625, 0.008056640625, 0.03189849853515625, 0.0557403564453125, 0.07958221435546875, 0.103424072265625, 0.12726593017578125, 0.1511077880859375, 0.17494964599609375, 0.19879150390625, 0.22263336181640625, 0.2464752197265625, 0.27031707763671875, 0.294158935546875, 0.31800079345703125, 0.3418426513671875, 0.36568450927734375, 0.3895263671875, 0.41336822509765625, 0.4372100830078125, 0.46105194091796875, 0.484893798828125, 0.5087356567382812, 0.5325775146484375, 0.5564193725585938, 0.58026123046875, 0.6041030883789062, 0.6279449462890625, 0.6517868041992188, 0.675628662109375, 0.6994705200195312, 0.7233123779296875, 0.7471542358398438, 0.77099609375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 5.0, 3.0, 7.0, 8.0, 8.0, 3.0, 17.0, 25.0, 22.0, 17.0, 22.0, 26.0, 39.0, 31.0, 47.0, 46.0, 49.0, 42.0, 49.0, 52.0, 59.0, 44.0, 49.0, 51.0, 30.0, 40.0, 36.0, 31.0, 28.0, 17.0, 21.0, 16.0, 14.0, 15.0, 11.0, 4.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.547548294067383, -15.099172592163086, -14.650796890258789, -14.202422142028809, -13.754046440124512, -13.305670738220215, -12.857295989990234, -12.408920288085938, -11.96054458618164, -11.512168884277344, -11.063793182373047, -10.615418434143066, -10.16704273223877, -9.718667030334473, -9.270292282104492, -8.821916580200195, -8.373540878295898, -7.925165176391602, -7.476789951324463, -7.028414726257324, -6.580039024353027, -6.1316633224487305, -5.683288097381592, -5.234912872314453, -4.786537170410156, -4.338161468505859, -3.8897862434387207, -3.441410779953003, -2.993035316467285, -2.5446598529815674, -2.0962843894958496, -1.6479089260101318, -1.199533462524414, -0.7511579990386963, -0.3027825355529785, 0.14559292793273926, 0.593968391418457, 1.0423438549041748, 1.4907193183898926, 1.9390947818756104, 2.387470245361328, 2.835845708847046, 3.2842211723327637, 3.7325966358184814, 4.180972099304199, 4.629347801208496, 5.077723026275635, 5.526098251342773, 5.97447395324707, 6.422849655151367, 6.871224880218506, 7.3196001052856445, 7.767975807189941, 8.216351509094238, 8.664726257324219, 9.113101959228516, 9.561477661132812, 10.00985336303711, 10.458229064941406, 10.906603813171387, 11.354979515075684, 11.80335521697998, 12.251729965209961, 12.700105667114258, 13.148481369018555]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 7.0, 10.0, 6.0, 9.0, 9.0, 15.0, 8.0, 13.0, 23.0, 17.0, 14.0, 24.0, 30.0, 42.0, 27.0, 28.0, 24.0, 33.0, 40.0, 24.0, 31.0, 37.0, 33.0, 40.0, 42.0, 20.0, 33.0, 36.0, 32.0, 34.0, 33.0, 35.0, 31.0, 27.0, 20.0, 14.0, 10.0, 14.0, 13.0, 6.0, 14.0, 4.0, 9.0, 9.0, 4.0, 6.0, 4.0, 1.0, 3.0, 2.0], "bins": [-11.63754940032959, -11.315777778625488, -10.994006156921387, -10.672233581542969, -10.350461959838867, -10.028690338134766, -9.706918716430664, -9.385147094726562, -9.063375473022461, -8.74160385131836, -8.419832229614258, -8.09805965423584, -7.776288032531738, -7.454516410827637, -7.132744789123535, -6.810973167419434, -6.489200592041016, -6.167428970336914, -5.845656871795654, -5.523885250091553, -5.202113151550293, -4.880341529846191, -4.55856990814209, -4.236798286437988, -3.9150261878967285, -3.593254327774048, -3.271482467651367, -2.9497108459472656, -2.627938985824585, -2.3061671257019043, -1.9843953847885132, -1.662623643875122, -1.340850830078125, -1.0190789699554443, -0.6973072290420532, -0.37553542852401733, -0.053763628005981445, 0.2680082321166992, 0.5897799730300903, 0.9115517139434814, 1.233323574066162, 1.5550954341888428, 1.8768671751022339, 2.198638916015625, 2.5204107761383057, 2.8421826362609863, 3.163954257965088, 3.4857261180877686, 3.807497978210449, 4.129269599914551, 4.4510416984558105, 4.772813320159912, 5.094585418701172, 5.416357040405273, 5.738128662109375, 6.059900283813477, 6.381672382354736, 6.703444004058838, 7.025216102600098, 7.346987724304199, 7.668759346008301, 7.9905314445495605, 8.31230354309082, 8.634075164794922, 8.955846786499023]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 5.0, 12.0, 16.0, 14.0, 34.0, 50.0, 79.0, 109.0, 164.0, 276.0, 474.0, 636.0, 970.0, 1432.0, 2189.0, 3241.0, 4881.0, 7091.0, 10283.0, 14449.0, 20225.0, 27292.0, 36390.0, 46029.0, 57780.0, 67315.0, 77341.0, 84110.0, 87169.0, 85750.0, 80476.0, 71862.0, 61787.0, 50600.0, 39861.0, 30838.0, 22800.0, 16854.0, 11941.0, 8357.0, 5745.0, 3904.0, 2587.0, 1750.0, 1206.0, 766.0, 482.0, 307.0, 217.0, 156.0, 113.0, 68.0, 28.0, 27.0, 9.0, 6.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.66796875, -7.40985107421875, -7.1517333984375, -6.89361572265625, -6.635498046875, -6.37738037109375, -6.1192626953125, -5.86114501953125, -5.60302734375, -5.34490966796875, -5.0867919921875, -4.82867431640625, -4.570556640625, -4.31243896484375, -4.0543212890625, -3.79620361328125, -3.5380859375, -3.27996826171875, -3.0218505859375, -2.76373291015625, -2.505615234375, -2.24749755859375, -1.9893798828125, -1.73126220703125, -1.47314453125, -1.21502685546875, -0.9569091796875, -0.69879150390625, -0.440673828125, -0.18255615234375, 0.0755615234375, 0.33367919921875, 0.591796875, 0.84991455078125, 1.1080322265625, 1.36614990234375, 1.624267578125, 1.88238525390625, 2.1405029296875, 2.39862060546875, 2.65673828125, 2.91485595703125, 3.1729736328125, 3.43109130859375, 3.689208984375, 3.94732666015625, 4.2054443359375, 4.46356201171875, 4.7216796875, 4.97979736328125, 5.2379150390625, 5.49603271484375, 5.754150390625, 6.01226806640625, 6.2703857421875, 6.52850341796875, 6.78662109375, 7.04473876953125, 7.3028564453125, 7.56097412109375, 7.819091796875, 8.07720947265625, 8.3353271484375, 8.59344482421875, 8.8515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 6.0, 8.0, 5.0, 9.0, 8.0, 15.0, 11.0, 12.0, 22.0, 15.0, 16.0, 27.0, 26.0, 37.0, 37.0, 23.0, 28.0, 26.0, 40.0, 25.0, 33.0, 41.0, 31.0, 31.0, 42.0, 25.0, 31.0, 40.0, 31.0, 33.0, 32.0, 41.0, 28.0, 24.0, 23.0, 14.0, 12.0, 14.0, 11.0, 9.0, 13.0, 5.0, 7.0, 9.0, 5.0, 7.0, 4.0, 1.0, 2.0, 3.0], "bins": [-11.21875, -10.9093017578125, -10.599853515625, -10.2904052734375, -9.98095703125, -9.6715087890625, -9.362060546875, -9.0526123046875, -8.7431640625, -8.4337158203125, -8.124267578125, -7.8148193359375, -7.50537109375, -7.1959228515625, -6.886474609375, -6.5770263671875, -6.267578125, -5.9581298828125, -5.648681640625, -5.3392333984375, -5.02978515625, -4.7203369140625, -4.410888671875, -4.1014404296875, -3.7919921875, -3.4825439453125, -3.173095703125, -2.8636474609375, -2.55419921875, -2.2447509765625, -1.935302734375, -1.6258544921875, -1.31640625, -1.0069580078125, -0.697509765625, -0.3880615234375, -0.07861328125, 0.2308349609375, 0.540283203125, 0.8497314453125, 1.1591796875, 1.4686279296875, 1.778076171875, 2.0875244140625, 2.39697265625, 2.7064208984375, 3.015869140625, 3.3253173828125, 3.634765625, 3.9442138671875, 4.253662109375, 4.5631103515625, 4.87255859375, 5.1820068359375, 5.491455078125, 5.8009033203125, 6.1103515625, 6.4197998046875, 6.729248046875, 7.0386962890625, 7.34814453125, 7.6575927734375, 7.967041015625, 8.2764892578125, 8.5859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 9.0, 13.0, 13.0, 24.0, 32.0, 65.0, 93.0, 143.0, 298.0, 461.0, 850.0, 1426.0, 2416.0, 4321.0, 7309.0, 12113.0, 20103.0, 31601.0, 47641.0, 68043.0, 90507.0, 110100.0, 122295.0, 122337.0, 111567.0, 91858.0, 69161.0, 49258.0, 32783.0, 20855.0, 12680.0, 7653.0, 4394.0, 2552.0, 1463.0, 848.0, 496.0, 304.0, 169.0, 114.0, 53.0, 54.0, 32.0, 14.0, 11.0, 9.0, 5.0, 2.0, 6.0], "bins": [-13.609375, -13.2515869140625, -12.893798828125, -12.5360107421875, -12.17822265625, -11.8204345703125, -11.462646484375, -11.1048583984375, -10.7470703125, -10.3892822265625, -10.031494140625, -9.6737060546875, -9.31591796875, -8.9581298828125, -8.600341796875, -8.2425537109375, -7.884765625, -7.5269775390625, -7.169189453125, -6.8114013671875, -6.45361328125, -6.0958251953125, -5.738037109375, -5.3802490234375, -5.0224609375, -4.6646728515625, -4.306884765625, -3.9490966796875, -3.59130859375, -3.2335205078125, -2.875732421875, -2.5179443359375, -2.16015625, -1.8023681640625, -1.444580078125, -1.0867919921875, -0.72900390625, -0.3712158203125, -0.013427734375, 0.3443603515625, 0.7021484375, 1.0599365234375, 1.417724609375, 1.7755126953125, 2.13330078125, 2.4910888671875, 2.848876953125, 3.2066650390625, 3.564453125, 3.9222412109375, 4.280029296875, 4.6378173828125, 4.99560546875, 5.3533935546875, 5.711181640625, 6.0689697265625, 6.4267578125, 6.7845458984375, 7.142333984375, 7.5001220703125, 7.85791015625, 8.2156982421875, 8.573486328125, 8.9312744140625, 9.2890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 3.0, 8.0, 4.0, 6.0, 10.0, 15.0, 9.0, 17.0, 20.0, 17.0, 29.0, 25.0, 18.0, 41.0, 42.0, 34.0, 35.0, 29.0, 43.0, 43.0, 51.0, 28.0, 46.0, 41.0, 38.0, 34.0, 42.0, 32.0, 34.0, 31.0, 32.0, 19.0, 29.0, 20.0, 14.0, 12.0, 14.0, 4.0, 8.0, 9.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0], "bins": [-8.3125, -8.0875244140625, -7.862548828125, -7.6375732421875, -7.41259765625, -7.1876220703125, -6.962646484375, -6.7376708984375, -6.5126953125, -6.2877197265625, -6.062744140625, -5.8377685546875, -5.61279296875, -5.3878173828125, -5.162841796875, -4.9378662109375, -4.712890625, -4.4879150390625, -4.262939453125, -4.0379638671875, -3.81298828125, -3.5880126953125, -3.363037109375, -3.1380615234375, -2.9130859375, -2.6881103515625, -2.463134765625, -2.2381591796875, -2.01318359375, -1.7882080078125, -1.563232421875, -1.3382568359375, -1.11328125, -0.8883056640625, -0.663330078125, -0.4383544921875, -0.21337890625, 0.0115966796875, 0.236572265625, 0.4615478515625, 0.6865234375, 0.9114990234375, 1.136474609375, 1.3614501953125, 1.58642578125, 1.8114013671875, 2.036376953125, 2.2613525390625, 2.486328125, 2.7113037109375, 2.936279296875, 3.1612548828125, 3.38623046875, 3.6112060546875, 3.836181640625, 4.0611572265625, 4.2861328125, 4.5111083984375, 4.736083984375, 4.9610595703125, 5.18603515625, 5.4110107421875, 5.635986328125, 5.8609619140625, 6.0859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 12.0, 13.0, 21.0, 27.0, 43.0, 54.0, 94.0, 115.0, 176.0, 309.0, 532.0, 864.0, 1565.0, 2766.0, 5309.0, 10258.0, 20421.0, 39023.0, 71453.0, 117972.0, 165025.0, 184389.0, 163132.0, 115609.0, 69645.0, 37982.0, 19562.0, 10376.0, 5253.0, 2778.0, 1437.0, 874.0, 551.0, 326.0, 199.0, 146.0, 93.0, 56.0, 27.0, 16.0, 22.0, 13.0, 8.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.80859375, -7.59454345703125, -7.3804931640625, -7.16644287109375, -6.952392578125, -6.73834228515625, -6.5242919921875, -6.31024169921875, -6.09619140625, -5.88214111328125, -5.6680908203125, -5.45404052734375, -5.239990234375, -5.02593994140625, -4.8118896484375, -4.59783935546875, -4.3837890625, -4.16973876953125, -3.9556884765625, -3.74163818359375, -3.527587890625, -3.31353759765625, -3.0994873046875, -2.88543701171875, -2.67138671875, -2.45733642578125, -2.2432861328125, -2.02923583984375, -1.815185546875, -1.60113525390625, -1.3870849609375, -1.17303466796875, -0.958984375, -0.74493408203125, -0.5308837890625, -0.31683349609375, -0.102783203125, 0.11126708984375, 0.3253173828125, 0.53936767578125, 0.75341796875, 0.96746826171875, 1.1815185546875, 1.39556884765625, 1.609619140625, 1.82366943359375, 2.0377197265625, 2.25177001953125, 2.4658203125, 2.67987060546875, 2.8939208984375, 3.10797119140625, 3.322021484375, 3.53607177734375, 3.7501220703125, 3.96417236328125, 4.17822265625, 4.39227294921875, 4.6063232421875, 4.82037353515625, 5.034423828125, 5.24847412109375, 5.4625244140625, 5.67657470703125, 5.890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 5.0, 7.0, 7.0, 16.0, 24.0, 12.0, 19.0, 27.0, 32.0, 46.0, 45.0, 38.0, 49.0, 62.0, 64.0, 60.0, 59.0, 70.0, 61.0, 60.0, 41.0, 37.0, 35.0, 24.0, 22.0, 17.0, 10.0, 9.0, 8.0, 4.0, 5.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006856918334960938, -0.0006635934114456177, -0.0006414949893951416, -0.0006193965673446655, -0.0005972981452941895, -0.0005751997232437134, -0.0005531013011932373, -0.0005310028791427612, -0.0005089044570922852, -0.0004868060350418091, -0.000464707612991333, -0.00044260919094085693, -0.00042051076889038086, -0.0003984123468399048, -0.0003763139247894287, -0.00035421550273895264, -0.00033211708068847656, -0.0003100186586380005, -0.0002879202365875244, -0.00026582181453704834, -0.00024372339248657227, -0.0002216249704360962, -0.00019952654838562012, -0.00017742812633514404, -0.00015532970428466797, -0.0001332312822341919, -0.00011113286018371582, -8.903443813323975e-05, -6.693601608276367e-05, -4.48375940322876e-05, -2.2739171981811523e-05, -6.407499313354492e-07, 2.1457672119140625e-05, 4.35560941696167e-05, 6.565451622009277e-05, 8.775293827056885e-05, 0.00010985136032104492, 0.000131949782371521, 0.00015404820442199707, 0.00017614662647247314, 0.00019824504852294922, 0.0002203434705734253, 0.00024244189262390137, 0.00026454031467437744, 0.0002866387367248535, 0.0003087371587753296, 0.00033083558082580566, 0.00035293400287628174, 0.0003750324249267578, 0.0003971308469772339, 0.00041922926902770996, 0.00044132769107818604, 0.0004634261131286621, 0.0004855245351791382, 0.0005076229572296143, 0.0005297213792800903, 0.0005518198013305664, 0.0005739182233810425, 0.0005960166454315186, 0.0006181150674819946, 0.0006402134895324707, 0.0006623119115829468, 0.0006844103336334229, 0.0007065087556838989, 0.000728607177734375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 8.0, 5.0, 7.0, 10.0, 11.0, 23.0, 28.0, 59.0, 61.0, 98.0, 138.0, 223.0, 363.0, 509.0, 742.0, 1129.0, 1762.0, 2819.0, 4458.0, 6702.0, 10791.0, 16812.0, 26482.0, 40100.0, 59050.0, 83024.0, 106454.0, 124956.0, 129607.0, 118818.0, 97089.0, 72197.0, 49910.0, 33797.0, 21615.0, 13901.0, 8762.0, 5801.0, 3581.0, 2274.0, 1482.0, 1022.0, 629.0, 389.0, 309.0, 176.0, 126.0, 88.0, 47.0, 49.0, 23.0, 20.0, 11.0, 8.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0], "bins": [-5.53125, -5.35992431640625, -5.1885986328125, -5.01727294921875, -4.845947265625, -4.67462158203125, -4.5032958984375, -4.33197021484375, -4.16064453125, -3.98931884765625, -3.8179931640625, -3.64666748046875, -3.475341796875, -3.30401611328125, -3.1326904296875, -2.96136474609375, -2.7900390625, -2.61871337890625, -2.4473876953125, -2.27606201171875, -2.104736328125, -1.93341064453125, -1.7620849609375, -1.59075927734375, -1.41943359375, -1.24810791015625, -1.0767822265625, -0.90545654296875, -0.734130859375, -0.56280517578125, -0.3914794921875, -0.22015380859375, -0.048828125, 0.12249755859375, 0.2938232421875, 0.46514892578125, 0.636474609375, 0.80780029296875, 0.9791259765625, 1.15045166015625, 1.32177734375, 1.49310302734375, 1.6644287109375, 1.83575439453125, 2.007080078125, 2.17840576171875, 2.3497314453125, 2.52105712890625, 2.6923828125, 2.86370849609375, 3.0350341796875, 3.20635986328125, 3.377685546875, 3.54901123046875, 3.7203369140625, 3.89166259765625, 4.06298828125, 4.23431396484375, 4.4056396484375, 4.57696533203125, 4.748291015625, 4.91961669921875, 5.0909423828125, 5.26226806640625, 5.43359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 7.0, 2.0, 6.0, 10.0, 7.0, 8.0, 10.0, 12.0, 16.0, 15.0, 21.0, 26.0, 20.0, 29.0, 36.0, 34.0, 43.0, 35.0, 39.0, 51.0, 33.0, 61.0, 39.0, 36.0, 47.0, 51.0, 27.0, 31.0, 32.0, 31.0, 21.0, 21.0, 16.0, 20.0, 19.0, 20.0, 17.0, 10.0, 4.0, 7.0, 5.0, 5.0, 4.0, 7.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0], "bins": [-1.9287109375, -1.8708648681640625, -1.813018798828125, -1.7551727294921875, -1.69732666015625, -1.6394805908203125, -1.581634521484375, -1.5237884521484375, -1.4659423828125, -1.4080963134765625, -1.350250244140625, -1.2924041748046875, -1.23455810546875, -1.1767120361328125, -1.118865966796875, -1.0610198974609375, -1.003173828125, -0.9453277587890625, -0.887481689453125, -0.8296356201171875, -0.77178955078125, -0.7139434814453125, -0.656097412109375, -0.5982513427734375, -0.5404052734375, -0.4825592041015625, -0.424713134765625, -0.3668670654296875, -0.30902099609375, -0.2511749267578125, -0.193328857421875, -0.1354827880859375, -0.07763671875, -0.0197906494140625, 0.038055419921875, 0.0959014892578125, 0.15374755859375, 0.2115936279296875, 0.269439697265625, 0.3272857666015625, 0.3851318359375, 0.4429779052734375, 0.500823974609375, 0.5586700439453125, 0.61651611328125, 0.6743621826171875, 0.732208251953125, 0.7900543212890625, 0.847900390625, 0.9057464599609375, 0.963592529296875, 1.0214385986328125, 1.07928466796875, 1.1371307373046875, 1.194976806640625, 1.2528228759765625, 1.3106689453125, 1.3685150146484375, 1.426361083984375, 1.4842071533203125, 1.54205322265625, 1.5998992919921875, 1.657745361328125, 1.7155914306640625, 1.7734375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 2.0, 8.0, 9.0, 9.0, 5.0, 10.0, 10.0, 15.0, 9.0, 27.0, 24.0, 22.0, 18.0, 29.0, 32.0, 42.0, 51.0, 45.0, 52.0, 46.0, 43.0, 47.0, 46.0, 34.0, 40.0, 26.0, 48.0, 31.0, 39.0, 26.0, 29.0, 15.0, 27.0, 18.0, 11.0, 13.0, 6.0, 8.0, 7.0, 6.0, 7.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.942811965942383, -13.54409122467041, -13.145371437072754, -12.746650695800781, -12.347929954528809, -11.949209213256836, -11.55048942565918, -11.151768684387207, -10.753047943115234, -10.354327201843262, -9.955607414245605, -9.556886672973633, -9.15816593170166, -8.759445190429688, -8.360725402832031, -7.962004661560059, -7.563284873962402, -7.164564609527588, -6.765843868255615, -6.367123603820801, -5.968402862548828, -5.569682598114014, -5.170962333679199, -4.772241592407227, -4.373521327972412, -3.9748008251190186, -3.576080322265625, -3.1773600578308105, -2.778639554977417, -2.3799190521240234, -1.981198787689209, -1.5824782848358154, -1.1837568283081055, -0.7850363850593567, -0.3863159418106079, 0.012404441833496094, 0.41112494468688965, 0.8098454475402832, 1.2085657119750977, 1.6072862148284912, 2.0060067176818848, 2.4047272205352783, 2.803447723388672, 3.2021679878234863, 3.60088849067688, 3.9996089935302734, 4.398329257965088, 4.797049522399902, 5.195770263671875, 5.5944905281066895, 5.993211269378662, 6.391931533813477, 6.790652275085449, 7.189372539520264, 7.588092803955078, 7.986813545227051, 8.385534286499023, 8.784255027770996, 9.182974815368652, 9.581695556640625, 9.980416297912598, 10.37913703918457, 10.777856826782227, 11.1765775680542, 11.575297355651855]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 8.0, 10.0, 3.0, 7.0, 12.0, 11.0, 6.0, 12.0, 17.0, 17.0, 17.0, 17.0, 25.0, 20.0, 24.0, 28.0, 16.0, 28.0, 46.0, 24.0, 29.0, 30.0, 39.0, 40.0, 44.0, 33.0, 31.0, 24.0, 26.0, 25.0, 20.0, 38.0, 31.0, 30.0, 35.0, 20.0, 31.0, 18.0, 22.0, 10.0, 12.0, 8.0, 6.0, 11.0, 11.0, 7.0, 7.0, 7.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-10.214995384216309, -9.906293869018555, -9.597591400146484, -9.28888988494873, -8.98018741607666, -8.671485900878906, -8.362783432006836, -8.054081916809082, -7.74537992477417, -7.436677932739258, -7.127975940704346, -6.819273948669434, -6.51057243347168, -6.201869964599609, -5.8931684494018555, -5.584466457366943, -5.275764465332031, -4.967062473297119, -4.658360481262207, -4.349658489227295, -4.040956497192383, -3.73225474357605, -3.423552989959717, -3.1148509979248047, -2.8061490058898926, -2.4974470138549805, -2.1887450218200684, -1.8800432682037354, -1.5713412761688232, -1.2626392841339111, -0.9539374113082886, -0.645235538482666, -0.3365345001220703, -0.02783256769180298, 0.28086936473846436, 0.5895712971687317, 0.898273229598999, 1.2069752216339111, 1.5156770944595337, 1.8243789672851562, 2.1330809593200684, 2.4417829513549805, 2.7504849433898926, 3.0591866970062256, 3.3678886890411377, 3.67659068107605, 3.985292434692383, 4.293994426727295, 4.602696418762207, 4.911398410797119, 5.220100402832031, 5.528802394866943, 5.8375043869018555, 6.146205902099609, 6.4549078941345215, 6.763609886169434, 7.072311878204346, 7.381013870239258, 7.68971586227417, 7.998417854309082, 8.307119369506836, 8.615821838378906, 8.92452335357666, 9.233224868774414, 9.541927337646484]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 9.0, 21.0, 28.0, 49.0, 59.0, 154.0, 254.0, 427.0, 778.0, 1246.0, 2187.0, 3845.0, 6276.0, 10738.0, 17717.0, 28195.0, 45138.0, 70142.0, 105760.0, 154829.0, 217493.0, 291598.0, 366549.0, 426273.0, 457295.0, 446686.0, 399882.0, 330822.0, 255842.0, 186985.0, 129987.0, 86884.0, 56944.0, 36095.0, 22446.0, 13849.0, 8414.0, 5093.0, 3006.0, 1731.0, 1082.0, 667.0, 354.0, 203.0, 115.0, 57.0, 31.0, 29.0, 14.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.3984375, -9.111572265625, -8.82470703125, -8.537841796875, -8.2509765625, -7.964111328125, -7.67724609375, -7.390380859375, -7.103515625, -6.816650390625, -6.52978515625, -6.242919921875, -5.9560546875, -5.669189453125, -5.38232421875, -5.095458984375, -4.80859375, -4.521728515625, -4.23486328125, -3.947998046875, -3.6611328125, -3.374267578125, -3.08740234375, -2.800537109375, -2.513671875, -2.226806640625, -1.93994140625, -1.653076171875, -1.3662109375, -1.079345703125, -0.79248046875, -0.505615234375, -0.21875, 0.068115234375, 0.35498046875, 0.641845703125, 0.9287109375, 1.215576171875, 1.50244140625, 1.789306640625, 2.076171875, 2.363037109375, 2.64990234375, 2.936767578125, 3.2236328125, 3.510498046875, 3.79736328125, 4.084228515625, 4.37109375, 4.657958984375, 4.94482421875, 5.231689453125, 5.5185546875, 5.805419921875, 6.09228515625, 6.379150390625, 6.666015625, 6.952880859375, 7.23974609375, 7.526611328125, 7.8134765625, 8.100341796875, 8.38720703125, 8.674072265625, 8.9609375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 5.0, 6.0, 10.0, 8.0, 8.0, 10.0, 10.0, 13.0, 18.0, 18.0, 14.0, 23.0, 26.0, 22.0, 21.0, 27.0, 31.0, 33.0, 23.0, 32.0, 38.0, 30.0, 40.0, 33.0, 45.0, 28.0, 34.0, 29.0, 25.0, 16.0, 32.0, 29.0, 36.0, 33.0, 26.0, 29.0, 26.0, 13.0, 15.0, 14.0, 8.0, 7.0, 13.0, 7.0, 8.0, 6.0, 7.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.8046875, -8.53564453125, -8.2666015625, -7.99755859375, -7.728515625, -7.45947265625, -7.1904296875, -6.92138671875, -6.65234375, -6.38330078125, -6.1142578125, -5.84521484375, -5.576171875, -5.30712890625, -5.0380859375, -4.76904296875, -4.5, -4.23095703125, -3.9619140625, -3.69287109375, -3.423828125, -3.15478515625, -2.8857421875, -2.61669921875, -2.34765625, -2.07861328125, -1.8095703125, -1.54052734375, -1.271484375, -1.00244140625, -0.7333984375, -0.46435546875, -0.1953125, 0.07373046875, 0.3427734375, 0.61181640625, 0.880859375, 1.14990234375, 1.4189453125, 1.68798828125, 1.95703125, 2.22607421875, 2.4951171875, 2.76416015625, 3.033203125, 3.30224609375, 3.5712890625, 3.84033203125, 4.109375, 4.37841796875, 4.6474609375, 4.91650390625, 5.185546875, 5.45458984375, 5.7236328125, 5.99267578125, 6.26171875, 6.53076171875, 6.7998046875, 7.06884765625, 7.337890625, 7.60693359375, 7.8759765625, 8.14501953125, 8.4140625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 4.0, 6.0, 7.0, 16.0, 30.0, 42.0, 74.0, 115.0, 235.0, 374.0, 641.0, 1128.0, 1837.0, 3228.0, 5130.0, 8262.0, 13733.0, 21282.0, 32540.0, 48994.0, 72767.0, 104514.0, 143638.0, 192250.0, 244760.0, 298619.0, 344450.0, 376524.0, 386966.0, 375167.0, 343233.0, 295511.0, 241415.0, 188709.0, 140264.0, 101830.0, 71260.0, 48502.0, 31634.0, 20505.0, 12949.0, 8391.0, 5121.0, 3014.0, 1863.0, 1177.0, 663.0, 395.0, 226.0, 120.0, 77.0, 44.0, 23.0, 15.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.578125, -8.3055419921875, -8.032958984375, -7.7603759765625, -7.48779296875, -7.2152099609375, -6.942626953125, -6.6700439453125, -6.3974609375, -6.1248779296875, -5.852294921875, -5.5797119140625, -5.30712890625, -5.0345458984375, -4.761962890625, -4.4893798828125, -4.216796875, -3.9442138671875, -3.671630859375, -3.3990478515625, -3.12646484375, -2.8538818359375, -2.581298828125, -2.3087158203125, -2.0361328125, -1.7635498046875, -1.490966796875, -1.2183837890625, -0.94580078125, -0.6732177734375, -0.400634765625, -0.1280517578125, 0.14453125, 0.4171142578125, 0.689697265625, 0.9622802734375, 1.23486328125, 1.5074462890625, 1.780029296875, 2.0526123046875, 2.3251953125, 2.5977783203125, 2.870361328125, 3.1429443359375, 3.41552734375, 3.6881103515625, 3.960693359375, 4.2332763671875, 4.505859375, 4.7784423828125, 5.051025390625, 5.3236083984375, 5.59619140625, 5.8687744140625, 6.141357421875, 6.4139404296875, 6.6865234375, 6.9591064453125, 7.231689453125, 7.5042724609375, 7.77685546875, 8.0494384765625, 8.322021484375, 8.5946044921875, 8.8671875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 9.0, 8.0, 14.0, 8.0, 17.0, 20.0, 30.0, 44.0, 53.0, 48.0, 68.0, 71.0, 98.0, 98.0, 125.0, 148.0, 181.0, 180.0, 197.0, 194.0, 230.0, 214.0, 189.0, 215.0, 188.0, 183.0, 196.0, 156.0, 160.0, 141.0, 130.0, 90.0, 73.0, 63.0, 46.0, 45.0, 41.0, 34.0, 24.0, 11.0, 12.0, 11.0, 3.0, 0.0, 2.0, 7.0, 1.0, 3.0, 1.0], "bins": [-5.765625, -5.6092529296875, -5.452880859375, -5.2965087890625, -5.14013671875, -4.9837646484375, -4.827392578125, -4.6710205078125, -4.5146484375, -4.3582763671875, -4.201904296875, -4.0455322265625, -3.88916015625, -3.7327880859375, -3.576416015625, -3.4200439453125, -3.263671875, -3.1072998046875, -2.950927734375, -2.7945556640625, -2.63818359375, -2.4818115234375, -2.325439453125, -2.1690673828125, -2.0126953125, -1.8563232421875, -1.699951171875, -1.5435791015625, -1.38720703125, -1.2308349609375, -1.074462890625, -0.9180908203125, -0.76171875, -0.6053466796875, -0.448974609375, -0.2926025390625, -0.13623046875, 0.0201416015625, 0.176513671875, 0.3328857421875, 0.4892578125, 0.6456298828125, 0.802001953125, 0.9583740234375, 1.11474609375, 1.2711181640625, 1.427490234375, 1.5838623046875, 1.740234375, 1.8966064453125, 2.052978515625, 2.2093505859375, 2.36572265625, 2.5220947265625, 2.678466796875, 2.8348388671875, 2.9912109375, 3.1475830078125, 3.303955078125, 3.4603271484375, 3.61669921875, 3.7730712890625, 3.929443359375, 4.0858154296875, 4.2421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 8.0, 4.0, 7.0, 3.0, 12.0, 14.0, 19.0, 16.0, 16.0, 22.0, 22.0, 24.0, 26.0, 33.0, 27.0, 34.0, 30.0, 36.0, 40.0, 40.0, 36.0, 49.0, 30.0, 41.0, 38.0, 38.0, 45.0, 31.0, 32.0, 32.0, 34.0, 16.0, 32.0, 24.0, 14.0, 9.0, 11.0, 12.0, 7.0, 9.0, 8.0, 7.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.58362865447998, -10.225683212280273, -9.86773681640625, -9.509790420532227, -9.15184497833252, -8.793899536132812, -8.435953140258789, -8.078006744384766, -7.720061302185059, -7.362115383148193, -7.004169464111328, -6.646223545074463, -6.288277626037598, -5.930331707000732, -5.572385787963867, -5.214439868927002, -4.856493949890137, -4.4985480308532715, -4.140602111816406, -3.782656192779541, -3.424710273742676, -3.0667643547058105, -2.7088184356689453, -2.35087251663208, -1.9929265975952148, -1.6349806785583496, -1.2770347595214844, -0.9190888404846191, -0.5611429214477539, -0.20319700241088867, 0.15474891662597656, 0.5126948356628418, 0.8706417083740234, 1.2285876274108887, 1.586533546447754, 1.9444794654846191, 2.3024253845214844, 2.6603713035583496, 3.018317222595215, 3.37626314163208, 3.7342090606689453, 4.0921549797058105, 4.450100898742676, 4.808046817779541, 5.165992736816406, 5.5239386558532715, 5.881884574890137, 6.239830493927002, 6.597776412963867, 6.955722332000732, 7.313668251037598, 7.671614170074463, 8.029560089111328, 8.387506484985352, 8.745451927185059, 9.103397369384766, 9.461343765258789, 9.819290161132812, 10.17723560333252, 10.535181045532227, 10.89312744140625, 11.251073837280273, 11.60901927947998, 11.966964721679688, 12.324911117553711]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 5.0, 6.0, 9.0, 13.0, 13.0, 17.0, 16.0, 20.0, 19.0, 23.0, 29.0, 34.0, 33.0, 31.0, 29.0, 41.0, 30.0, 37.0, 37.0, 33.0, 41.0, 39.0, 41.0, 45.0, 30.0, 32.0, 36.0, 24.0, 27.0, 34.0, 31.0, 21.0, 18.0, 16.0, 15.0, 14.0, 9.0, 15.0, 5.0, 13.0, 1.0, 3.0, 5.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.981307029724121, -10.63040542602539, -10.279504776000977, -9.928603172302246, -9.577701568603516, -9.226799964904785, -8.875899314880371, -8.52499771118164, -8.17409610748291, -7.823194980621338, -7.472293376922607, -7.121392250061035, -6.770490646362305, -6.419589519500732, -6.06868839263916, -5.71778678894043, -5.366885662078857, -5.015984535217285, -4.665082931518555, -4.314181804656982, -3.963280200958252, -3.6123790740966797, -3.2614777088165283, -2.910576343536377, -2.5596749782562256, -2.208773612976074, -1.8578722476959229, -1.506971001625061, -1.1560696363449097, -0.8051682710647583, -0.4542670249938965, -0.10336565971374512, 0.24753570556640625, 0.5984370708465576, 0.9493383765220642, 1.3002396821975708, 1.6511410474777222, 2.002042293548584, 2.3529436588287354, 2.7038450241088867, 3.054746389389038, 3.4056477546691895, 3.756549119949341, 4.107450485229492, 4.4583516120910645, 4.809253215789795, 5.160154342651367, 5.511055946350098, 5.86195707321167, 6.212858200073242, 6.563759803771973, 6.914660930633545, 7.265562534332275, 7.616463661193848, 7.967365264892578, 8.318265914916992, 8.669167518615723, 9.020069122314453, 9.370969772338867, 9.721871376037598, 10.072772979736328, 10.423674583435059, 10.774575233459473, 11.125476837158203, 11.476378440856934]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 6.0, 19.0, 21.0, 27.0, 44.0, 53.0, 64.0, 137.0, 171.0, 264.0, 355.0, 557.0, 889.0, 1318.0, 1949.0, 3053.0, 4923.0, 8397.0, 14561.0, 26529.0, 49329.0, 93077.0, 165142.0, 224868.0, 193920.0, 117207.0, 63333.0, 33050.0, 18348.0, 10242.0, 6008.0, 3723.0, 2347.0, 1494.0, 1050.0, 667.0, 445.0, 305.0, 227.0, 139.0, 75.0, 69.0, 44.0, 29.0, 27.0, 17.0, 12.0, 13.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.90625, -3.782989501953125, -3.65972900390625, -3.536468505859375, -3.4132080078125, -3.289947509765625, -3.16668701171875, -3.043426513671875, -2.920166015625, -2.796905517578125, -2.67364501953125, -2.550384521484375, -2.4271240234375, -2.303863525390625, -2.18060302734375, -2.057342529296875, -1.93408203125, -1.810821533203125, -1.68756103515625, -1.564300537109375, -1.4410400390625, -1.317779541015625, -1.19451904296875, -1.071258544921875, -0.947998046875, -0.824737548828125, -0.70147705078125, -0.578216552734375, -0.4549560546875, -0.331695556640625, -0.20843505859375, -0.085174560546875, 0.0380859375, 0.161346435546875, 0.28460693359375, 0.407867431640625, 0.5311279296875, 0.654388427734375, 0.77764892578125, 0.900909423828125, 1.024169921875, 1.147430419921875, 1.27069091796875, 1.393951416015625, 1.5172119140625, 1.640472412109375, 1.76373291015625, 1.886993408203125, 2.01025390625, 2.133514404296875, 2.25677490234375, 2.380035400390625, 2.5032958984375, 2.626556396484375, 2.74981689453125, 2.873077392578125, 2.996337890625, 3.119598388671875, 3.24285888671875, 3.366119384765625, 3.4893798828125, 3.612640380859375, 3.73590087890625, 3.859161376953125, 3.982421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 2.0, 8.0, 6.0, 9.0, 12.0, 13.0, 19.0, 17.0, 16.0, 21.0, 23.0, 27.0, 36.0, 31.0, 33.0, 28.0, 37.0, 32.0, 36.0, 41.0, 32.0, 40.0, 39.0, 41.0, 45.0, 32.0, 30.0, 35.0, 24.0, 31.0, 31.0, 32.0, 20.0, 19.0, 16.0, 16.0, 11.0, 12.0, 15.0, 5.0, 11.0, 3.0, 2.0, 5.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.921875, -10.572265625, -10.22265625, -9.873046875, -9.5234375, -9.173828125, -8.82421875, -8.474609375, -8.125, -7.775390625, -7.42578125, -7.076171875, -6.7265625, -6.376953125, -6.02734375, -5.677734375, -5.328125, -4.978515625, -4.62890625, -4.279296875, -3.9296875, -3.580078125, -3.23046875, -2.880859375, -2.53125, -2.181640625, -1.83203125, -1.482421875, -1.1328125, -0.783203125, -0.43359375, -0.083984375, 0.265625, 0.615234375, 0.96484375, 1.314453125, 1.6640625, 2.013671875, 2.36328125, 2.712890625, 3.0625, 3.412109375, 3.76171875, 4.111328125, 4.4609375, 4.810546875, 5.16015625, 5.509765625, 5.859375, 6.208984375, 6.55859375, 6.908203125, 7.2578125, 7.607421875, 7.95703125, 8.306640625, 8.65625, 9.005859375, 9.35546875, 9.705078125, 10.0546875, 10.404296875, 10.75390625, 11.103515625, 11.453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 10.0, 11.0, 11.0, 11.0, 18.0, 23.0, 37.0, 43.0, 67.0, 79.0, 117.0, 178.0, 220.0, 338.0, 499.0, 677.0, 1050.0, 1558.0, 2502.0, 4113.0, 6883.0, 12469.0, 24580.0, 52048.0, 119780.0, 256585.0, 287728.0, 147877.0, 63917.0, 29592.0, 14790.0, 7997.0, 4501.0, 2812.0, 1692.0, 1203.0, 788.0, 514.0, 360.0, 262.0, 165.0, 129.0, 89.0, 67.0, 55.0, 35.0, 23.0, 14.0, 14.0, 9.0, 6.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.888671875, -3.771270751953125, -3.65386962890625, -3.536468505859375, -3.4190673828125, -3.301666259765625, -3.18426513671875, -3.066864013671875, -2.949462890625, -2.832061767578125, -2.71466064453125, -2.597259521484375, -2.4798583984375, -2.362457275390625, -2.24505615234375, -2.127655029296875, -2.01025390625, -1.892852783203125, -1.77545166015625, -1.658050537109375, -1.5406494140625, -1.423248291015625, -1.30584716796875, -1.188446044921875, -1.071044921875, -0.953643798828125, -0.83624267578125, -0.718841552734375, -0.6014404296875, -0.484039306640625, -0.36663818359375, -0.249237060546875, -0.1318359375, -0.014434814453125, 0.10296630859375, 0.220367431640625, 0.3377685546875, 0.455169677734375, 0.57257080078125, 0.689971923828125, 0.807373046875, 0.924774169921875, 1.04217529296875, 1.159576416015625, 1.2769775390625, 1.394378662109375, 1.51177978515625, 1.629180908203125, 1.74658203125, 1.863983154296875, 1.98138427734375, 2.098785400390625, 2.2161865234375, 2.333587646484375, 2.45098876953125, 2.568389892578125, 2.685791015625, 2.803192138671875, 2.92059326171875, 3.037994384765625, 3.1553955078125, 3.272796630859375, 3.39019775390625, 3.507598876953125, 3.625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 9.0, 7.0, 8.0, 13.0, 9.0, 14.0, 16.0, 19.0, 10.0, 27.0, 23.0, 32.0, 21.0, 24.0, 35.0, 41.0, 41.0, 40.0, 38.0, 41.0, 47.0, 46.0, 40.0, 47.0, 37.0, 38.0, 43.0, 34.0, 31.0, 28.0, 17.0, 22.0, 12.0, 17.0, 19.0, 11.0, 7.0, 5.0, 8.0, 6.0, 8.0, 2.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.0234375, -7.77685546875, -7.5302734375, -7.28369140625, -7.037109375, -6.79052734375, -6.5439453125, -6.29736328125, -6.05078125, -5.80419921875, -5.5576171875, -5.31103515625, -5.064453125, -4.81787109375, -4.5712890625, -4.32470703125, -4.078125, -3.83154296875, -3.5849609375, -3.33837890625, -3.091796875, -2.84521484375, -2.5986328125, -2.35205078125, -2.10546875, -1.85888671875, -1.6123046875, -1.36572265625, -1.119140625, -0.87255859375, -0.6259765625, -0.37939453125, -0.1328125, 0.11376953125, 0.3603515625, 0.60693359375, 0.853515625, 1.10009765625, 1.3466796875, 1.59326171875, 1.83984375, 2.08642578125, 2.3330078125, 2.57958984375, 2.826171875, 3.07275390625, 3.3193359375, 3.56591796875, 3.8125, 4.05908203125, 4.3056640625, 4.55224609375, 4.798828125, 5.04541015625, 5.2919921875, 5.53857421875, 5.78515625, 6.03173828125, 6.2783203125, 6.52490234375, 6.771484375, 7.01806640625, 7.2646484375, 7.51123046875, 7.7578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 1.0, 10.0, 3.0, 14.0, 24.0, 23.0, 34.0, 50.0, 74.0, 101.0, 143.0, 182.0, 285.0, 385.0, 552.0, 898.0, 1345.0, 2198.0, 3944.0, 7437.0, 15760.0, 40280.0, 139732.0, 485871.0, 244723.0, 61099.0, 21699.0, 9515.0, 4929.0, 2708.0, 1540.0, 951.0, 631.0, 411.0, 302.0, 207.0, 129.0, 103.0, 71.0, 54.0, 40.0, 35.0, 16.0, 15.0, 11.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8232421875, -1.763824462890625, -1.70440673828125, -1.644989013671875, -1.5855712890625, -1.526153564453125, -1.46673583984375, -1.407318115234375, -1.347900390625, -1.288482666015625, -1.22906494140625, -1.169647216796875, -1.1102294921875, -1.050811767578125, -0.99139404296875, -0.931976318359375, -0.87255859375, -0.813140869140625, -0.75372314453125, -0.694305419921875, -0.6348876953125, -0.575469970703125, -0.51605224609375, -0.456634521484375, -0.397216796875, -0.337799072265625, -0.27838134765625, -0.218963623046875, -0.1595458984375, -0.100128173828125, -0.04071044921875, 0.018707275390625, 0.078125, 0.137542724609375, 0.19696044921875, 0.256378173828125, 0.3157958984375, 0.375213623046875, 0.43463134765625, 0.494049072265625, 0.553466796875, 0.612884521484375, 0.67230224609375, 0.731719970703125, 0.7911376953125, 0.850555419921875, 0.90997314453125, 0.969390869140625, 1.02880859375, 1.088226318359375, 1.14764404296875, 1.207061767578125, 1.2664794921875, 1.325897216796875, 1.38531494140625, 1.444732666015625, 1.504150390625, 1.563568115234375, 1.62298583984375, 1.682403564453125, 1.7418212890625, 1.801239013671875, 1.86065673828125, 1.920074462890625, 1.9794921875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 5.0, 10.0, 7.0, 11.0, 14.0, 15.0, 19.0, 13.0, 35.0, 35.0, 36.0, 44.0, 61.0, 57.0, 62.0, 69.0, 70.0, 62.0, 59.0, 45.0, 37.0, 36.0, 39.0, 27.0, 24.0, 29.0, 13.0, 21.0, 5.0, 9.0, 8.0, 6.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00014734268188476562, -0.00014256685972213745, -0.00013779103755950928, -0.0001330152153968811, -0.00012823939323425293, -0.00012346357107162476, -0.00011868774890899658, -0.00011391192674636841, -0.00010913610458374023, -0.00010436028242111206, -9.958446025848389e-05, -9.480863809585571e-05, -9.003281593322754e-05, -8.525699377059937e-05, -8.048117160797119e-05, -7.570534944534302e-05, -7.092952728271484e-05, -6.615370512008667e-05, -6.13778829574585e-05, -5.660206079483032e-05, -5.182623863220215e-05, -4.7050416469573975e-05, -4.22745943069458e-05, -3.749877214431763e-05, -3.272294998168945e-05, -2.794712781906128e-05, -2.3171305656433105e-05, -1.839548349380493e-05, -1.3619661331176758e-05, -8.843839168548584e-06, -4.06801700592041e-06, 7.078051567077637e-07, 5.4836273193359375e-06, 1.0259449481964111e-05, 1.5035271644592285e-05, 1.981109380722046e-05, 2.4586915969848633e-05, 2.9362738132476807e-05, 3.413856029510498e-05, 3.8914382457733154e-05, 4.369020462036133e-05, 4.84660267829895e-05, 5.3241848945617676e-05, 5.801767110824585e-05, 6.279349327087402e-05, 6.75693154335022e-05, 7.234513759613037e-05, 7.712095975875854e-05, 8.189678192138672e-05, 8.667260408401489e-05, 9.144842624664307e-05, 9.622424840927124e-05, 0.00010100007057189941, 0.00010577589273452759, 0.00011055171489715576, 0.00011532753705978394, 0.00012010335922241211, 0.00012487918138504028, 0.00012965500354766846, 0.00013443082571029663, 0.0001392066478729248, 0.00014398247003555298, 0.00014875829219818115, 0.00015353411436080933, 0.0001583099365234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 4.0, 2.0, 14.0, 14.0, 27.0, 33.0, 64.0, 98.0, 155.0, 240.0, 417.0, 651.0, 1200.0, 2249.0, 4140.0, 7853.0, 15778.0, 35109.0, 83564.0, 205331.0, 329987.0, 207490.0, 85199.0, 35273.0, 16383.0, 7944.0, 4147.0, 2219.0, 1238.0, 712.0, 376.0, 244.0, 147.0, 91.0, 62.0, 27.0, 17.0, 14.0, 12.0, 14.0, 5.0, 11.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.90234375, -2.8182373046875, -2.734130859375, -2.6500244140625, -2.56591796875, -2.4818115234375, -2.397705078125, -2.3135986328125, -2.2294921875, -2.1453857421875, -2.061279296875, -1.9771728515625, -1.89306640625, -1.8089599609375, -1.724853515625, -1.6407470703125, -1.556640625, -1.4725341796875, -1.388427734375, -1.3043212890625, -1.22021484375, -1.1361083984375, -1.052001953125, -0.9678955078125, -0.8837890625, -0.7996826171875, -0.715576171875, -0.6314697265625, -0.54736328125, -0.4632568359375, -0.379150390625, -0.2950439453125, -0.2109375, -0.1268310546875, -0.042724609375, 0.0413818359375, 0.12548828125, 0.2095947265625, 0.293701171875, 0.3778076171875, 0.4619140625, 0.5460205078125, 0.630126953125, 0.7142333984375, 0.79833984375, 0.8824462890625, 0.966552734375, 1.0506591796875, 1.134765625, 1.2188720703125, 1.302978515625, 1.3870849609375, 1.47119140625, 1.5552978515625, 1.639404296875, 1.7235107421875, 1.8076171875, 1.8917236328125, 1.975830078125, 2.0599365234375, 2.14404296875, 2.2281494140625, 2.312255859375, 2.3963623046875, 2.48046875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 10.0, 5.0, 14.0, 17.0, 25.0, 44.0, 41.0, 56.0, 63.0, 90.0, 103.0, 112.0, 109.0, 93.0, 56.0, 33.0, 36.0, 19.0, 20.0, 13.0, 12.0, 14.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1787109375, -1.1479949951171875, -1.117279052734375, -1.0865631103515625, -1.05584716796875, -1.0251312255859375, -0.994415283203125, -0.9636993408203125, -0.9329833984375, -0.9022674560546875, -0.871551513671875, -0.8408355712890625, -0.81011962890625, -0.7794036865234375, -0.748687744140625, -0.7179718017578125, -0.687255859375, -0.6565399169921875, -0.625823974609375, -0.5951080322265625, -0.56439208984375, -0.5336761474609375, -0.502960205078125, -0.4722442626953125, -0.4415283203125, -0.4108123779296875, -0.380096435546875, -0.3493804931640625, -0.31866455078125, -0.2879486083984375, -0.257232666015625, -0.2265167236328125, -0.19580078125, -0.1650848388671875, -0.134368896484375, -0.1036529541015625, -0.07293701171875, -0.0422210693359375, -0.011505126953125, 0.0192108154296875, 0.0499267578125, 0.0806427001953125, 0.111358642578125, 0.1420745849609375, 0.17279052734375, 0.2035064697265625, 0.234222412109375, 0.2649383544921875, 0.295654296875, 0.3263702392578125, 0.357086181640625, 0.3878021240234375, 0.41851806640625, 0.4492340087890625, 0.479949951171875, 0.5106658935546875, 0.5413818359375, 0.5720977783203125, 0.602813720703125, 0.6335296630859375, 0.66424560546875, 0.6949615478515625, 0.725677490234375, 0.7563934326171875, 0.787109375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 4.0, 7.0, 9.0, 8.0, 15.0, 12.0, 17.0, 22.0, 19.0, 19.0, 21.0, 27.0, 23.0, 37.0, 31.0, 28.0, 36.0, 50.0, 27.0, 39.0, 41.0, 39.0, 39.0, 34.0, 40.0, 38.0, 37.0, 34.0, 37.0, 27.0, 33.0, 13.0, 27.0, 20.0, 14.0, 12.0, 8.0, 7.0, 13.0, 5.0, 7.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.514762878417969, -10.161996841430664, -9.80923080444336, -9.456463813781738, -9.103697776794434, -8.750931739807129, -8.398164749145508, -8.045398712158203, -7.692632675170898, -7.339866638183594, -6.987100124359131, -6.634333610534668, -6.281567573547363, -5.928801536560059, -5.576035022735596, -5.223268508911133, -4.870502471923828, -4.517736434936523, -4.1649699211120605, -3.8122036457061768, -3.459437370300293, -3.106671094894409, -2.7539048194885254, -2.4011385440826416, -2.048372268676758, -1.695605993270874, -1.3428397178649902, -0.9900734424591064, -0.6373071670532227, -0.28454089164733887, 0.06822538375854492, 0.4209916591644287, 0.7737579345703125, 1.1265242099761963, 1.47929048538208, 1.8320567607879639, 2.1848230361938477, 2.5375893115997314, 2.8903555870056152, 3.243121862411499, 3.595888137817383, 3.9486544132232666, 4.30142068862915, 4.654187202453613, 5.006953239440918, 5.359719276428223, 5.7124857902526855, 6.065252304077148, 6.418018341064453, 6.770784378051758, 7.123550891876221, 7.476317405700684, 7.829083442687988, 8.181849479675293, 8.534616470336914, 8.887382507324219, 9.240148544311523, 9.592914581298828, 9.945680618286133, 10.298447608947754, 10.651213645935059, 11.003979682922363, 11.356746673583984, 11.709512710571289, 12.062278747558594]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 5.0, 3.0, 7.0, 13.0, 10.0, 17.0, 18.0, 18.0, 23.0, 14.0, 30.0, 27.0, 35.0, 30.0, 28.0, 33.0, 34.0, 37.0, 41.0, 25.0, 36.0, 45.0, 38.0, 51.0, 36.0, 32.0, 34.0, 26.0, 28.0, 34.0, 31.0, 24.0, 20.0, 18.0, 18.0, 11.0, 15.0, 8.0, 13.0, 10.0, 7.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.804856300354004, -10.4555082321167, -10.106159210205078, -9.756811141967773, -9.407462120056152, -9.058114051818848, -8.708765029907227, -8.359416961669922, -8.0100679397583, -7.660719394683838, -7.311370849609375, -6.962022304534912, -6.612673759460449, -6.263325214385986, -5.913976669311523, -5.564628601074219, -5.215280055999756, -4.865931510925293, -4.51658296585083, -4.167234420776367, -3.8178858757019043, -3.4685373306274414, -3.1191890239715576, -2.7698404788970947, -2.420491933822632, -2.071143388748169, -1.721794843673706, -1.3724464178085327, -1.0230978727340698, -0.6737493276596069, -0.3244009017944336, 0.024947643280029297, 0.3742961883544922, 0.7236447334289551, 1.072993278503418, 1.4223417043685913, 1.7716902494430542, 2.1210389137268066, 2.4703872203826904, 2.8197357654571533, 3.169084310531616, 3.518432855606079, 3.867781400680542, 4.217129707336426, 4.566478252410889, 4.915826797485352, 5.2651753425598145, 5.614523887634277, 5.96387243270874, 6.313220977783203, 6.662569522857666, 7.011918067932129, 7.361266613006592, 7.710615158081055, 8.05996322631836, 8.40931224822998, 8.758660316467285, 9.10800838470459, 9.457357406616211, 9.806705474853516, 10.156054496765137, 10.505402565002441, 10.854751586914062, 11.204099655151367, 11.553448677062988]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 14.0, 16.0, 26.0, 43.0, 89.0, 150.0, 242.0, 420.0, 694.0, 1147.0, 1877.0, 2964.0, 4906.0, 7567.0, 11830.0, 17842.0, 25957.0, 36653.0, 50227.0, 65330.0, 79486.0, 93150.0, 101037.0, 101978.0, 97260.0, 86087.0, 71956.0, 56433.0, 42567.0, 30443.0, 20930.0, 14411.0, 9243.0, 5979.0, 3783.0, 2236.0, 1376.0, 902.0, 498.0, 336.0, 192.0, 133.0, 52.0, 38.0, 21.0, 14.0, 9.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.7890625, -8.48828125, -8.1875, -7.88671875, -7.5859375, -7.28515625, -6.984375, -6.68359375, -6.3828125, -6.08203125, -5.78125, -5.48046875, -5.1796875, -4.87890625, -4.578125, -4.27734375, -3.9765625, -3.67578125, -3.375, -3.07421875, -2.7734375, -2.47265625, -2.171875, -1.87109375, -1.5703125, -1.26953125, -0.96875, -0.66796875, -0.3671875, -0.06640625, 0.234375, 0.53515625, 0.8359375, 1.13671875, 1.4375, 1.73828125, 2.0390625, 2.33984375, 2.640625, 2.94140625, 3.2421875, 3.54296875, 3.84375, 4.14453125, 4.4453125, 4.74609375, 5.046875, 5.34765625, 5.6484375, 5.94921875, 6.25, 6.55078125, 6.8515625, 7.15234375, 7.453125, 7.75390625, 8.0546875, 8.35546875, 8.65625, 8.95703125, 9.2578125, 9.55859375, 9.859375, 10.16015625, 10.4609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 4.0, 6.0, 14.0, 9.0, 17.0, 18.0, 16.0, 25.0, 17.0, 23.0, 32.0, 37.0, 25.0, 31.0, 37.0, 28.0, 38.0, 37.0, 31.0, 35.0, 44.0, 39.0, 53.0, 30.0, 34.0, 34.0, 29.0, 20.0, 41.0, 29.0, 26.0, 21.0, 15.0, 19.0, 13.0, 13.0, 9.0, 13.0, 9.0, 8.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.453125, -10.1156005859375, -9.778076171875, -9.4405517578125, -9.10302734375, -8.7655029296875, -8.427978515625, -8.0904541015625, -7.7529296875, -7.4154052734375, -7.077880859375, -6.7403564453125, -6.40283203125, -6.0653076171875, -5.727783203125, -5.3902587890625, -5.052734375, -4.7152099609375, -4.377685546875, -4.0401611328125, -3.70263671875, -3.3651123046875, -3.027587890625, -2.6900634765625, -2.3525390625, -2.0150146484375, -1.677490234375, -1.3399658203125, -1.00244140625, -0.6649169921875, -0.327392578125, 0.0101318359375, 0.34765625, 0.6851806640625, 1.022705078125, 1.3602294921875, 1.69775390625, 2.0352783203125, 2.372802734375, 2.7103271484375, 3.0478515625, 3.3853759765625, 3.722900390625, 4.0604248046875, 4.39794921875, 4.7354736328125, 5.072998046875, 5.4105224609375, 5.748046875, 6.0855712890625, 6.423095703125, 6.7606201171875, 7.09814453125, 7.4356689453125, 7.773193359375, 8.1107177734375, 8.4482421875, 8.7857666015625, 9.123291015625, 9.4608154296875, 9.79833984375, 10.1358642578125, 10.473388671875, 10.8109130859375, 11.1484375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 14.0, 25.0, 36.0, 62.0, 77.0, 133.0, 218.0, 352.0, 492.0, 771.0, 1253.0, 1820.0, 3014.0, 4718.0, 7217.0, 10831.0, 16167.0, 23579.0, 33465.0, 45805.0, 59657.0, 74116.0, 87787.0, 97082.0, 101062.0, 97658.0, 88495.0, 75738.0, 61387.0, 47044.0, 34628.0, 24526.0, 16942.0, 11452.0, 7439.0, 4934.0, 3044.0, 1955.0, 1274.0, 816.0, 538.0, 330.0, 221.0, 150.0, 82.0, 45.0, 39.0, 19.0, 16.0, 11.0, 9.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.9765625, -8.6827392578125, -8.388916015625, -8.0950927734375, -7.80126953125, -7.5074462890625, -7.213623046875, -6.9197998046875, -6.6259765625, -6.3321533203125, -6.038330078125, -5.7445068359375, -5.45068359375, -5.1568603515625, -4.863037109375, -4.5692138671875, -4.275390625, -3.9815673828125, -3.687744140625, -3.3939208984375, -3.10009765625, -2.8062744140625, -2.512451171875, -2.2186279296875, -1.9248046875, -1.6309814453125, -1.337158203125, -1.0433349609375, -0.74951171875, -0.4556884765625, -0.161865234375, 0.1319580078125, 0.42578125, 0.7196044921875, 1.013427734375, 1.3072509765625, 1.60107421875, 1.8948974609375, 2.188720703125, 2.4825439453125, 2.7763671875, 3.0701904296875, 3.364013671875, 3.6578369140625, 3.95166015625, 4.2454833984375, 4.539306640625, 4.8331298828125, 5.126953125, 5.4207763671875, 5.714599609375, 6.0084228515625, 6.30224609375, 6.5960693359375, 6.889892578125, 7.1837158203125, 7.4775390625, 7.7713623046875, 8.065185546875, 8.3590087890625, 8.65283203125, 8.9466552734375, 9.240478515625, 9.5343017578125, 9.828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 2.0, 5.0, 5.0, 3.0, 10.0, 8.0, 13.0, 17.0, 24.0, 11.0, 11.0, 24.0, 19.0, 30.0, 29.0, 26.0, 37.0, 39.0, 36.0, 52.0, 49.0, 28.0, 31.0, 37.0, 45.0, 48.0, 40.0, 36.0, 39.0, 38.0, 27.0, 23.0, 25.0, 22.0, 20.0, 24.0, 15.0, 12.0, 10.0, 4.0, 6.0, 7.0, 5.0, 7.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.2578125, -7.0216064453125, -6.785400390625, -6.5491943359375, -6.31298828125, -6.0767822265625, -5.840576171875, -5.6043701171875, -5.3681640625, -5.1319580078125, -4.895751953125, -4.6595458984375, -4.42333984375, -4.1871337890625, -3.950927734375, -3.7147216796875, -3.478515625, -3.2423095703125, -3.006103515625, -2.7698974609375, -2.53369140625, -2.2974853515625, -2.061279296875, -1.8250732421875, -1.5888671875, -1.3526611328125, -1.116455078125, -0.8802490234375, -0.64404296875, -0.4078369140625, -0.171630859375, 0.0645751953125, 0.30078125, 0.5369873046875, 0.773193359375, 1.0093994140625, 1.24560546875, 1.4818115234375, 1.718017578125, 1.9542236328125, 2.1904296875, 2.4266357421875, 2.662841796875, 2.8990478515625, 3.13525390625, 3.3714599609375, 3.607666015625, 3.8438720703125, 4.080078125, 4.3162841796875, 4.552490234375, 4.7886962890625, 5.02490234375, 5.2611083984375, 5.497314453125, 5.7335205078125, 5.9697265625, 6.2059326171875, 6.442138671875, 6.6783447265625, 6.91455078125, 7.1507568359375, 7.386962890625, 7.6231689453125, 7.859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 14.0, 6.0, 20.0, 23.0, 31.0, 52.0, 61.0, 110.0, 149.0, 230.0, 306.0, 513.0, 722.0, 1241.0, 2108.0, 3525.0, 6263.0, 10745.0, 18454.0, 30984.0, 49766.0, 75907.0, 106376.0, 132618.0, 143685.0, 135653.0, 111648.0, 80526.0, 53859.0, 33868.0, 20480.0, 11721.0, 6868.0, 3983.0, 2344.0, 1380.0, 804.0, 504.0, 327.0, 222.0, 147.0, 100.0, 67.0, 42.0, 38.0, 23.0, 15.0, 14.0, 4.0, 7.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.53515625, -5.35418701171875, -5.1732177734375, -4.99224853515625, -4.811279296875, -4.63031005859375, -4.4493408203125, -4.26837158203125, -4.08740234375, -3.90643310546875, -3.7254638671875, -3.54449462890625, -3.363525390625, -3.18255615234375, -3.0015869140625, -2.82061767578125, -2.6396484375, -2.45867919921875, -2.2777099609375, -2.09674072265625, -1.915771484375, -1.73480224609375, -1.5538330078125, -1.37286376953125, -1.19189453125, -1.01092529296875, -0.8299560546875, -0.64898681640625, -0.468017578125, -0.28704833984375, -0.1060791015625, 0.07489013671875, 0.255859375, 0.43682861328125, 0.6177978515625, 0.79876708984375, 0.979736328125, 1.16070556640625, 1.3416748046875, 1.52264404296875, 1.70361328125, 1.88458251953125, 2.0655517578125, 2.24652099609375, 2.427490234375, 2.60845947265625, 2.7894287109375, 2.97039794921875, 3.1513671875, 3.33233642578125, 3.5133056640625, 3.69427490234375, 3.875244140625, 4.05621337890625, 4.2371826171875, 4.41815185546875, 4.59912109375, 4.78009033203125, 4.9610595703125, 5.14202880859375, 5.322998046875, 5.50396728515625, 5.6849365234375, 5.86590576171875, 6.046875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 6.0, 9.0, 8.0, 12.0, 19.0, 13.0, 20.0, 26.0, 28.0, 34.0, 23.0, 34.0, 44.0, 27.0, 46.0, 60.0, 56.0, 47.0, 55.0, 54.0, 43.0, 59.0, 42.0, 46.0, 33.0, 22.0, 31.0, 16.0, 17.0, 13.0, 13.0, 9.0, 8.0, 6.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.0007762908935546875, -0.0007555261254310608, -0.0007347613573074341, -0.0007139965891838074, -0.0006932318210601807, -0.000672467052936554, -0.0006517022848129272, -0.0006309375166893005, -0.0006101727485656738, -0.0005894079804420471, -0.0005686432123184204, -0.0005478784441947937, -0.000527113676071167, -0.0005063489079475403, -0.0004855841398239136, -0.00046481937170028687, -0.00044405460357666016, -0.00042328983545303345, -0.00040252506732940674, -0.00038176029920578003, -0.0003609955310821533, -0.0003402307629585266, -0.0003194659948348999, -0.0002987012267112732, -0.0002779364585876465, -0.0002571716904640198, -0.00023640692234039307, -0.00021564215421676636, -0.00019487738609313965, -0.00017411261796951294, -0.00015334784984588623, -0.00013258308172225952, -0.00011181831359863281, -9.10535454750061e-05, -7.02887773513794e-05, -4.9524009227752686e-05, -2.8759241104125977e-05, -7.994472980499268e-06, 1.2770295143127441e-05, 3.353506326675415e-05, 5.429983139038086e-05, 7.506459951400757e-05, 9.582936763763428e-05, 0.00011659413576126099, 0.0001373589038848877, 0.0001581236720085144, 0.0001788884401321411, 0.00019965320825576782, 0.00022041797637939453, 0.00024118274450302124, 0.00026194751262664795, 0.00028271228075027466, 0.00030347704887390137, 0.0003242418169975281, 0.0003450065851211548, 0.0003657713532447815, 0.0003865361213684082, 0.0004073008894920349, 0.0004280656576156616, 0.00044883042573928833, 0.00046959519386291504, 0.0004903599619865417, 0.0005111247301101685, 0.0005318894982337952, 0.0005526542663574219]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 9.0, 9.0, 7.0, 12.0, 26.0, 33.0, 70.0, 140.0, 223.0, 313.0, 559.0, 982.0, 1682.0, 3060.0, 5492.0, 10246.0, 18484.0, 33366.0, 57483.0, 92055.0, 131103.0, 160577.0, 162238.0, 135478.0, 95763.0, 60516.0, 35026.0, 19546.0, 10700.0, 5756.0, 3138.0, 1898.0, 1022.0, 619.0, 384.0, 226.0, 133.0, 71.0, 58.0, 18.0, 15.0, 10.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.515625, -7.2735595703125, -7.031494140625, -6.7894287109375, -6.54736328125, -6.3052978515625, -6.063232421875, -5.8211669921875, -5.5791015625, -5.3370361328125, -5.094970703125, -4.8529052734375, -4.61083984375, -4.3687744140625, -4.126708984375, -3.8846435546875, -3.642578125, -3.4005126953125, -3.158447265625, -2.9163818359375, -2.67431640625, -2.4322509765625, -2.190185546875, -1.9481201171875, -1.7060546875, -1.4639892578125, -1.221923828125, -0.9798583984375, -0.73779296875, -0.4957275390625, -0.253662109375, -0.0115966796875, 0.23046875, 0.4725341796875, 0.714599609375, 0.9566650390625, 1.19873046875, 1.4407958984375, 1.682861328125, 1.9249267578125, 2.1669921875, 2.4090576171875, 2.651123046875, 2.8931884765625, 3.13525390625, 3.3773193359375, 3.619384765625, 3.8614501953125, 4.103515625, 4.3455810546875, 4.587646484375, 4.8297119140625, 5.07177734375, 5.3138427734375, 5.555908203125, 5.7979736328125, 6.0400390625, 6.2821044921875, 6.524169921875, 6.7662353515625, 7.00830078125, 7.2503662109375, 7.492431640625, 7.7344970703125, 7.9765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 5.0, 7.0, 12.0, 14.0, 10.0, 29.0, 30.0, 30.0, 39.0, 51.0, 51.0, 55.0, 76.0, 70.0, 82.0, 67.0, 68.0, 47.0, 37.0, 45.0, 40.0, 31.0, 27.0, 19.0, 11.0, 10.0, 10.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.076171875, -2.97259521484375, -2.8690185546875, -2.76544189453125, -2.661865234375, -2.55828857421875, -2.4547119140625, -2.35113525390625, -2.24755859375, -2.14398193359375, -2.0404052734375, -1.93682861328125, -1.833251953125, -1.72967529296875, -1.6260986328125, -1.52252197265625, -1.4189453125, -1.31536865234375, -1.2117919921875, -1.10821533203125, -1.004638671875, -0.90106201171875, -0.7974853515625, -0.69390869140625, -0.59033203125, -0.48675537109375, -0.3831787109375, -0.27960205078125, -0.176025390625, -0.07244873046875, 0.0311279296875, 0.13470458984375, 0.23828125, 0.34185791015625, 0.4454345703125, 0.54901123046875, 0.652587890625, 0.75616455078125, 0.8597412109375, 0.96331787109375, 1.06689453125, 1.17047119140625, 1.2740478515625, 1.37762451171875, 1.481201171875, 1.58477783203125, 1.6883544921875, 1.79193115234375, 1.8955078125, 1.99908447265625, 2.1026611328125, 2.20623779296875, 2.309814453125, 2.41339111328125, 2.5169677734375, 2.62054443359375, 2.72412109375, 2.82769775390625, 2.9312744140625, 3.03485107421875, 3.138427734375, 3.24200439453125, 3.3455810546875, 3.44915771484375, 3.552734375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 9.0, 5.0, 8.0, 13.0, 13.0, 13.0, 25.0, 19.0, 15.0, 22.0, 30.0, 33.0, 26.0, 39.0, 23.0, 35.0, 36.0, 40.0, 47.0, 33.0, 44.0, 43.0, 41.0, 45.0, 53.0, 41.0, 44.0, 29.0, 31.0, 24.0, 20.0, 17.0, 19.0, 14.0, 10.0, 7.0, 5.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.578670501708984, -11.192037582397461, -10.805404663085938, -10.418771743774414, -10.032139778137207, -9.645506858825684, -9.25887393951416, -8.872241020202637, -8.48560905456543, -8.098976135253906, -7.712343692779541, -7.325710773468018, -6.939078330993652, -6.552445411682129, -6.1658124923706055, -5.779179573059082, -5.392546653747559, -5.005913734436035, -4.61928129196167, -4.2326483726501465, -3.846015691757202, -3.459383010864258, -3.0727500915527344, -2.68611741065979, -2.2994847297668457, -1.9128520488739014, -1.5262192487716675, -1.1395864486694336, -0.7529537677764893, -0.3663210868835449, 0.020311832427978516, 0.40694451332092285, 0.7935762405395508, 1.1802089214324951, 1.566841721534729, 1.953474521636963, 2.3401072025299072, 2.7267398834228516, 3.113372802734375, 3.5000054836273193, 3.8866381645202637, 4.273271083831787, 4.659903526306152, 5.046536445617676, 5.433169364929199, 5.8198018074035645, 6.206434726715088, 6.593067169189453, 6.979700088500977, 7.3663330078125, 7.752965450286865, 8.139598846435547, 8.526230812072754, 8.912863731384277, 9.2994966506958, 9.686129570007324, 10.072761535644531, 10.459394454956055, 10.846027374267578, 11.232660293579102, 11.619292259216309, 12.005925178527832, 12.392558097839355, 12.779191017150879, 13.165823936462402]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 8.0, 9.0, 10.0, 23.0, 20.0, 15.0, 19.0, 26.0, 22.0, 26.0, 25.0, 32.0, 28.0, 41.0, 50.0, 31.0, 52.0, 31.0, 37.0, 34.0, 33.0, 41.0, 35.0, 45.0, 37.0, 37.0, 26.0, 28.0, 28.0, 17.0, 22.0, 20.0, 18.0, 17.0, 12.0, 8.0, 4.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.380697250366211, -11.008035659790039, -10.635375022888184, -10.262714385986328, -9.890052795410156, -9.517391204833984, -9.144730567932129, -8.772069931030273, -8.399408340454102, -8.02674674987793, -7.654086112976074, -7.2814249992370605, -6.908763885498047, -6.536102771759033, -6.1634416580200195, -5.790780544281006, -5.418119430541992, -5.0454583168029785, -4.672797203063965, -4.300136089324951, -3.9274749755859375, -3.554813861846924, -3.18215274810791, -2.8094916343688965, -2.436830520629883, -2.064169406890869, -1.6915082931518555, -1.3188471794128418, -0.9461860656738281, -0.5735249519348145, -0.20086383819580078, 0.1717972755432129, 0.544459342956543, 0.9171204566955566, 1.2897815704345703, 1.662442684173584, 2.0351037979125977, 2.4077649116516113, 2.780426025390625, 3.1530871391296387, 3.5257482528686523, 3.898409366607666, 4.27107048034668, 4.643731594085693, 5.016392707824707, 5.389053821563721, 5.761714935302734, 6.134376049041748, 6.507037162780762, 6.879698276519775, 7.252359390258789, 7.625020503997803, 7.997681617736816, 8.370342254638672, 8.743003845214844, 9.115665435791016, 9.488326072692871, 9.860986709594727, 10.233648300170898, 10.60630989074707, 10.978970527648926, 11.351631164550781, 11.724292755126953, 12.096954345703125, 12.46961498260498]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 22.0, 20.0, 49.0, 53.0, 111.0, 216.0, 416.0, 615.0, 1101.0, 1733.0, 3060.0, 4900.0, 7845.0, 12793.0, 20259.0, 32113.0, 48900.0, 74258.0, 108393.0, 153381.0, 208827.0, 275501.0, 338902.0, 392371.0, 423160.0, 422425.0, 390641.0, 336118.0, 270581.0, 206546.0, 149774.0, 105660.0, 71551.0, 48018.0, 31387.0, 19782.0, 12573.0, 7723.0, 4872.0, 2988.0, 1725.0, 1154.0, 666.0, 442.0, 248.0, 176.0, 95.0, 51.0, 41.0, 21.0, 12.0, 10.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-8.8515625, -8.57470703125, -8.2978515625, -8.02099609375, -7.744140625, -7.46728515625, -7.1904296875, -6.91357421875, -6.63671875, -6.35986328125, -6.0830078125, -5.80615234375, -5.529296875, -5.25244140625, -4.9755859375, -4.69873046875, -4.421875, -4.14501953125, -3.8681640625, -3.59130859375, -3.314453125, -3.03759765625, -2.7607421875, -2.48388671875, -2.20703125, -1.93017578125, -1.6533203125, -1.37646484375, -1.099609375, -0.82275390625, -0.5458984375, -0.26904296875, 0.0078125, 0.28466796875, 0.5615234375, 0.83837890625, 1.115234375, 1.39208984375, 1.6689453125, 1.94580078125, 2.22265625, 2.49951171875, 2.7763671875, 3.05322265625, 3.330078125, 3.60693359375, 3.8837890625, 4.16064453125, 4.4375, 4.71435546875, 4.9912109375, 5.26806640625, 5.544921875, 5.82177734375, 6.0986328125, 6.37548828125, 6.65234375, 6.92919921875, 7.2060546875, 7.48291015625, 7.759765625, 8.03662109375, 8.3134765625, 8.59033203125, 8.8671875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 8.0, 3.0, 8.0, 19.0, 19.0, 22.0, 22.0, 17.0, 24.0, 23.0, 29.0, 27.0, 29.0, 38.0, 39.0, 39.0, 38.0, 49.0, 43.0, 25.0, 30.0, 37.0, 35.0, 42.0, 41.0, 35.0, 29.0, 33.0, 26.0, 23.0, 23.0, 11.0, 27.0, 16.0, 17.0, 9.0, 6.0, 6.0, 4.0, 6.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.609375, -9.2900390625, -8.970703125, -8.6513671875, -8.33203125, -8.0126953125, -7.693359375, -7.3740234375, -7.0546875, -6.7353515625, -6.416015625, -6.0966796875, -5.77734375, -5.4580078125, -5.138671875, -4.8193359375, -4.5, -4.1806640625, -3.861328125, -3.5419921875, -3.22265625, -2.9033203125, -2.583984375, -2.2646484375, -1.9453125, -1.6259765625, -1.306640625, -0.9873046875, -0.66796875, -0.3486328125, -0.029296875, 0.2900390625, 0.609375, 0.9287109375, 1.248046875, 1.5673828125, 1.88671875, 2.2060546875, 2.525390625, 2.8447265625, 3.1640625, 3.4833984375, 3.802734375, 4.1220703125, 4.44140625, 4.7607421875, 5.080078125, 5.3994140625, 5.71875, 6.0380859375, 6.357421875, 6.6767578125, 6.99609375, 7.3154296875, 7.634765625, 7.9541015625, 8.2734375, 8.5927734375, 8.912109375, 9.2314453125, 9.55078125, 9.8701171875, 10.189453125, 10.5087890625, 10.828125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 8.0, 21.0, 13.0, 47.0, 86.0, 121.0, 310.0, 527.0, 929.0, 1740.0, 3124.0, 5521.0, 9433.0, 16046.0, 26932.0, 43783.0, 68772.0, 105239.0, 152669.0, 213773.0, 283335.0, 349839.0, 405741.0, 436985.0, 434927.0, 400247.0, 341703.0, 272725.0, 206600.0, 146296.0, 99543.0, 64936.0, 41310.0, 25371.0, 15152.0, 8963.0, 5138.0, 2829.0, 1566.0, 923.0, 480.0, 289.0, 157.0, 66.0, 34.0, 31.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.4453125, -11.1268310546875, -10.808349609375, -10.4898681640625, -10.17138671875, -9.8529052734375, -9.534423828125, -9.2159423828125, -8.8974609375, -8.5789794921875, -8.260498046875, -7.9420166015625, -7.62353515625, -7.3050537109375, -6.986572265625, -6.6680908203125, -6.349609375, -6.0311279296875, -5.712646484375, -5.3941650390625, -5.07568359375, -4.7572021484375, -4.438720703125, -4.1202392578125, -3.8017578125, -3.4832763671875, -3.164794921875, -2.8463134765625, -2.52783203125, -2.2093505859375, -1.890869140625, -1.5723876953125, -1.25390625, -0.9354248046875, -0.616943359375, -0.2984619140625, 0.02001953125, 0.3385009765625, 0.656982421875, 0.9754638671875, 1.2939453125, 1.6124267578125, 1.930908203125, 2.2493896484375, 2.56787109375, 2.8863525390625, 3.204833984375, 3.5233154296875, 3.841796875, 4.1602783203125, 4.478759765625, 4.7972412109375, 5.11572265625, 5.4342041015625, 5.752685546875, 6.0711669921875, 6.3896484375, 6.7081298828125, 7.026611328125, 7.3450927734375, 7.66357421875, 7.9820556640625, 8.300537109375, 8.6190185546875, 8.9375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 7.0, 4.0, 5.0, 4.0, 11.0, 14.0, 23.0, 16.0, 23.0, 34.0, 36.0, 39.0, 52.0, 58.0, 85.0, 92.0, 127.0, 111.0, 135.0, 147.0, 165.0, 190.0, 167.0, 170.0, 196.0, 193.0, 219.0, 182.0, 184.0, 184.0, 175.0, 144.0, 147.0, 105.0, 107.0, 86.0, 62.0, 65.0, 52.0, 66.0, 43.0, 28.0, 31.0, 21.0, 18.0, 12.0, 13.0, 5.0, 5.0, 11.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-4.6171875, -4.47027587890625, -4.3233642578125, -4.17645263671875, -4.029541015625, -3.88262939453125, -3.7357177734375, -3.58880615234375, -3.44189453125, -3.29498291015625, -3.1480712890625, -3.00115966796875, -2.854248046875, -2.70733642578125, -2.5604248046875, -2.41351318359375, -2.2666015625, -2.11968994140625, -1.9727783203125, -1.82586669921875, -1.678955078125, -1.53204345703125, -1.3851318359375, -1.23822021484375, -1.09130859375, -0.94439697265625, -0.7974853515625, -0.65057373046875, -0.503662109375, -0.35675048828125, -0.2098388671875, -0.06292724609375, 0.083984375, 0.23089599609375, 0.3778076171875, 0.52471923828125, 0.671630859375, 0.81854248046875, 0.9654541015625, 1.11236572265625, 1.25927734375, 1.40618896484375, 1.5531005859375, 1.70001220703125, 1.846923828125, 1.99383544921875, 2.1407470703125, 2.28765869140625, 2.4345703125, 2.58148193359375, 2.7283935546875, 2.87530517578125, 3.022216796875, 3.16912841796875, 3.3160400390625, 3.46295166015625, 3.60986328125, 3.75677490234375, 3.9036865234375, 4.05059814453125, 4.197509765625, 4.34442138671875, 4.4913330078125, 4.63824462890625, 4.78515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 9.0, 9.0, 10.0, 9.0, 23.0, 13.0, 25.0, 26.0, 29.0, 33.0, 52.0, 36.0, 49.0, 48.0, 58.0, 50.0, 39.0, 54.0, 44.0, 54.0, 54.0, 44.0, 33.0, 33.0, 35.0, 27.0, 21.0, 19.0, 10.0, 12.0, 9.0, 4.0, 7.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.173664093017578, -15.68911361694336, -15.204562187194824, -14.720011711120605, -14.235461235046387, -13.750909805297852, -13.266359329223633, -12.781808853149414, -12.297258377075195, -11.812707901000977, -11.328156471252441, -10.843605995178223, -10.359055519104004, -9.874504089355469, -9.38995361328125, -8.905403137207031, -8.420851707458496, -7.936300754547119, -7.4517502784729, -6.967199325561523, -6.482648849487305, -5.998097896575928, -5.513546943664551, -5.028996467590332, -4.544445514678955, -4.059894561767578, -3.5753440856933594, -3.0907931327819824, -2.6062424182891846, -2.1216917037963867, -1.6371407508850098, -1.152590036392212, -0.6680393218994141, -0.18348854780197144, 0.3010622262954712, 0.7856130599975586, 1.2701637744903564, 1.7547144889831543, 2.2392654418945312, 2.723816156387329, 3.208366870880127, 3.692917585372925, 4.177468299865723, 4.6620192527771, 5.146570205688477, 5.631120681762695, 6.115671634674072, 6.600222587585449, 7.084773063659668, 7.569324016571045, 8.053874969482422, 8.53842544555664, 9.02297592163086, 9.507526397705078, 9.992077827453613, 10.476628303527832, 10.961179733276367, 11.445730209350586, 11.930281639099121, 12.41483211517334, 12.899382591247559, 13.383934020996094, 13.868484497070312, 14.353034973144531, 14.83758544921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 9.0, 6.0, 10.0, 7.0, 7.0, 11.0, 15.0, 16.0, 22.0, 28.0, 18.0, 36.0, 36.0, 28.0, 50.0, 42.0, 37.0, 44.0, 37.0, 37.0, 36.0, 34.0, 42.0, 42.0, 37.0, 31.0, 32.0, 37.0, 32.0, 27.0, 22.0, 25.0, 20.0, 15.0, 20.0, 15.0, 10.0, 5.0, 7.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.958240509033203, -10.571837425231934, -10.185434341430664, -9.799031257629395, -9.412628173828125, -9.026226043701172, -8.639822959899902, -8.253419876098633, -7.867016792297363, -7.480613708496094, -7.094210624694824, -6.707808017730713, -6.321404933929443, -5.935001850128174, -5.5485992431640625, -5.162196159362793, -4.775793075561523, -4.389389991760254, -4.002986907958984, -3.616584300994873, -3.2301812171936035, -2.843778133392334, -2.4573752880096436, -2.070972442626953, -1.6845693588256836, -1.2981663942337036, -0.9117634296417236, -0.5253604650497437, -0.13895750045776367, 0.2474454641342163, 0.6338484287261963, 1.0202512741088867, 1.4066543579101562, 1.7930573225021362, 2.179460287094116, 2.5658631324768066, 2.952266216278076, 3.3386693000793457, 3.725072145462036, 4.111474990844727, 4.497878074645996, 4.884281158447266, 5.270684242248535, 5.6570868492126465, 6.043489933013916, 6.4298930168151855, 6.816295623779297, 7.202698707580566, 7.589101791381836, 7.9755048751831055, 8.361907958984375, 8.748311042785645, 9.134714126586914, 9.521116256713867, 9.907519340515137, 10.293922424316406, 10.680325508117676, 11.066728591918945, 11.453131675720215, 11.839534759521484, 12.225936889648438, 12.612339973449707, 12.998743057250977, 13.385146141052246, 13.771549224853516]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 7.0, 12.0, 11.0, 30.0, 37.0, 60.0, 86.0, 122.0, 179.0, 267.0, 400.0, 578.0, 905.0, 1221.0, 2050.0, 3296.0, 5267.0, 8770.0, 14803.0, 25072.0, 43849.0, 76516.0, 126358.0, 179913.0, 190683.0, 147476.0, 91192.0, 53346.0, 30664.0, 17731.0, 10498.0, 6307.0, 3874.0, 2372.0, 1519.0, 989.0, 647.0, 448.0, 319.0, 209.0, 150.0, 109.0, 70.0, 44.0, 28.0, 26.0, 18.0, 7.0, 11.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-3.060546875, -2.968292236328125, -2.87603759765625, -2.783782958984375, -2.6915283203125, -2.599273681640625, -2.50701904296875, -2.414764404296875, -2.322509765625, -2.230255126953125, -2.13800048828125, -2.045745849609375, -1.9534912109375, -1.861236572265625, -1.76898193359375, -1.676727294921875, -1.58447265625, -1.492218017578125, -1.39996337890625, -1.307708740234375, -1.2154541015625, -1.123199462890625, -1.03094482421875, -0.938690185546875, -0.846435546875, -0.754180908203125, -0.66192626953125, -0.569671630859375, -0.4774169921875, -0.385162353515625, -0.29290771484375, -0.200653076171875, -0.1083984375, -0.016143798828125, 0.07611083984375, 0.168365478515625, 0.2606201171875, 0.352874755859375, 0.44512939453125, 0.537384033203125, 0.629638671875, 0.721893310546875, 0.81414794921875, 0.906402587890625, 0.9986572265625, 1.090911865234375, 1.18316650390625, 1.275421142578125, 1.36767578125, 1.459930419921875, 1.55218505859375, 1.644439697265625, 1.7366943359375, 1.828948974609375, 1.92120361328125, 2.013458251953125, 2.105712890625, 2.197967529296875, 2.29022216796875, 2.382476806640625, 2.4747314453125, 2.566986083984375, 2.65924072265625, 2.751495361328125, 2.84375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 6.0, 8.0, 9.0, 8.0, 8.0, 8.0, 15.0, 18.0, 21.0, 29.0, 17.0, 35.0, 36.0, 29.0, 49.0, 42.0, 37.0, 43.0, 40.0, 34.0, 38.0, 32.0, 42.0, 41.0, 39.0, 30.0, 31.0, 36.0, 37.0, 26.0, 20.0, 25.0, 23.0, 13.0, 20.0, 17.0, 9.0, 6.0, 7.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.9765625, -10.5906982421875, -10.204833984375, -9.8189697265625, -9.43310546875, -9.0472412109375, -8.661376953125, -8.2755126953125, -7.8896484375, -7.5037841796875, -7.117919921875, -6.7320556640625, -6.34619140625, -5.9603271484375, -5.574462890625, -5.1885986328125, -4.802734375, -4.4168701171875, -4.031005859375, -3.6451416015625, -3.25927734375, -2.8734130859375, -2.487548828125, -2.1016845703125, -1.7158203125, -1.3299560546875, -0.944091796875, -0.5582275390625, -0.17236328125, 0.2135009765625, 0.599365234375, 0.9852294921875, 1.37109375, 1.7569580078125, 2.142822265625, 2.5286865234375, 2.91455078125, 3.3004150390625, 3.686279296875, 4.0721435546875, 4.4580078125, 4.8438720703125, 5.229736328125, 5.6156005859375, 6.00146484375, 6.3873291015625, 6.773193359375, 7.1590576171875, 7.544921875, 7.9307861328125, 8.316650390625, 8.7025146484375, 9.08837890625, 9.4742431640625, 9.860107421875, 10.2459716796875, 10.6318359375, 11.0177001953125, 11.403564453125, 11.7894287109375, 12.17529296875, 12.5611572265625, 12.947021484375, 13.3328857421875, 13.71875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 5.0, 13.0, 6.0, 16.0, 23.0, 34.0, 43.0, 63.0, 99.0, 133.0, 214.0, 300.0, 407.0, 654.0, 1032.0, 1726.0, 2850.0, 4814.0, 8537.0, 15712.0, 29385.0, 57411.0, 118969.0, 227277.0, 263381.0, 156014.0, 75839.0, 37890.0, 19384.0, 10592.0, 6239.0, 3495.0, 2138.0, 1275.0, 859.0, 534.0, 393.0, 253.0, 153.0, 106.0, 89.0, 59.0, 45.0, 25.0, 26.0, 17.0, 11.0, 5.0, 2.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.31640625, -3.21337890625, -3.1103515625, -3.00732421875, -2.904296875, -2.80126953125, -2.6982421875, -2.59521484375, -2.4921875, -2.38916015625, -2.2861328125, -2.18310546875, -2.080078125, -1.97705078125, -1.8740234375, -1.77099609375, -1.66796875, -1.56494140625, -1.4619140625, -1.35888671875, -1.255859375, -1.15283203125, -1.0498046875, -0.94677734375, -0.84375, -0.74072265625, -0.6376953125, -0.53466796875, -0.431640625, -0.32861328125, -0.2255859375, -0.12255859375, -0.01953125, 0.08349609375, 0.1865234375, 0.28955078125, 0.392578125, 0.49560546875, 0.5986328125, 0.70166015625, 0.8046875, 0.90771484375, 1.0107421875, 1.11376953125, 1.216796875, 1.31982421875, 1.4228515625, 1.52587890625, 1.62890625, 1.73193359375, 1.8349609375, 1.93798828125, 2.041015625, 2.14404296875, 2.2470703125, 2.35009765625, 2.453125, 2.55615234375, 2.6591796875, 2.76220703125, 2.865234375, 2.96826171875, 3.0712890625, 3.17431640625, 3.27734375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 6.0, 11.0, 11.0, 13.0, 13.0, 14.0, 17.0, 28.0, 23.0, 23.0, 28.0, 28.0, 27.0, 33.0, 29.0, 51.0, 31.0, 25.0, 42.0, 28.0, 42.0, 43.0, 50.0, 37.0, 40.0, 39.0, 41.0, 34.0, 21.0, 19.0, 24.0, 19.0, 16.0, 17.0, 11.0, 7.0, 12.0, 9.0, 8.0, 10.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-7.734375, -7.4979248046875, -7.261474609375, -7.0250244140625, -6.78857421875, -6.5521240234375, -6.315673828125, -6.0792236328125, -5.8427734375, -5.6063232421875, -5.369873046875, -5.1334228515625, -4.89697265625, -4.6605224609375, -4.424072265625, -4.1876220703125, -3.951171875, -3.7147216796875, -3.478271484375, -3.2418212890625, -3.00537109375, -2.7689208984375, -2.532470703125, -2.2960205078125, -2.0595703125, -1.8231201171875, -1.586669921875, -1.3502197265625, -1.11376953125, -0.8773193359375, -0.640869140625, -0.4044189453125, -0.16796875, 0.0684814453125, 0.304931640625, 0.5413818359375, 0.77783203125, 1.0142822265625, 1.250732421875, 1.4871826171875, 1.7236328125, 1.9600830078125, 2.196533203125, 2.4329833984375, 2.66943359375, 2.9058837890625, 3.142333984375, 3.3787841796875, 3.615234375, 3.8516845703125, 4.088134765625, 4.3245849609375, 4.56103515625, 4.7974853515625, 5.033935546875, 5.2703857421875, 5.5068359375, 5.7432861328125, 5.979736328125, 6.2161865234375, 6.45263671875, 6.6890869140625, 6.925537109375, 7.1619873046875, 7.3984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 3.0, 4.0, 4.0, 4.0, 13.0, 8.0, 23.0, 33.0, 30.0, 46.0, 82.0, 108.0, 170.0, 187.0, 293.0, 390.0, 610.0, 873.0, 1274.0, 1805.0, 3038.0, 4956.0, 8120.0, 14484.0, 26956.0, 54380.0, 123813.0, 265163.0, 279482.0, 135597.0, 59144.0, 28562.0, 15208.0, 8728.0, 5355.0, 3104.0, 2112.0, 1390.0, 875.0, 614.0, 425.0, 279.0, 230.0, 156.0, 134.0, 87.0, 51.0, 46.0, 33.0, 23.0, 17.0, 16.0, 6.0, 6.0, 6.0, 1.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0], "bins": [-0.90771484375, -0.8775100708007812, -0.8473052978515625, -0.8171005249023438, -0.786895751953125, -0.7566909790039062, -0.7264862060546875, -0.6962814331054688, -0.66607666015625, -0.6358718872070312, -0.6056671142578125, -0.5754623413085938, -0.545257568359375, -0.5150527954101562, -0.4848480224609375, -0.45464324951171875, -0.4244384765625, -0.39423370361328125, -0.3640289306640625, -0.33382415771484375, -0.303619384765625, -0.27341461181640625, -0.2432098388671875, -0.21300506591796875, -0.18280029296875, -0.15259552001953125, -0.1223907470703125, -0.09218597412109375, -0.061981201171875, -0.03177642822265625, -0.0015716552734375, 0.02863311767578125, 0.058837890625, 0.08904266357421875, 0.1192474365234375, 0.14945220947265625, 0.179656982421875, 0.20986175537109375, 0.2400665283203125, 0.27027130126953125, 0.30047607421875, 0.33068084716796875, 0.3608856201171875, 0.39109039306640625, 0.421295166015625, 0.45149993896484375, 0.4817047119140625, 0.5119094848632812, 0.5421142578125, 0.5723190307617188, 0.6025238037109375, 0.6327285766601562, 0.662933349609375, 0.6931381225585938, 0.7233428955078125, 0.7535476684570312, 0.78375244140625, 0.8139572143554688, 0.8441619873046875, 0.8743667602539062, 0.904571533203125, 0.9347763061523438, 0.9649810791015625, 0.9951858520507812, 1.025390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 10.0, 12.0, 20.0, 19.0, 29.0, 29.0, 38.0, 58.0, 54.0, 64.0, 68.0, 71.0, 61.0, 94.0, 61.0, 49.0, 48.0, 43.0, 37.0, 31.0, 29.0, 10.0, 13.0, 14.0, 11.0, 3.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.959936141967773e-05, -9.492877870798111e-05, -9.025819599628448e-05, -8.558761328458786e-05, -8.091703057289124e-05, -7.624644786119461e-05, -7.157586514949799e-05, -6.690528243780136e-05, -6.223469972610474e-05, -5.756411701440811e-05, -5.289353430271149e-05, -4.822295159101486e-05, -4.355236887931824e-05, -3.888178616762161e-05, -3.421120345592499e-05, -2.9540620744228363e-05, -2.4870038032531738e-05, -2.0199455320835114e-05, -1.552887260913849e-05, -1.0858289897441864e-05, -6.187707185745239e-06, -1.5171244740486145e-06, 3.1534582376480103e-06, 7.824040949344635e-06, 1.249462366104126e-05, 1.7165206372737885e-05, 2.183578908443451e-05, 2.6506371796131134e-05, 3.117695450782776e-05, 3.5847537219524384e-05, 4.051811993122101e-05, 4.518870264291763e-05, 4.985928535461426e-05, 5.452986806631088e-05, 5.920045077800751e-05, 6.387103348970413e-05, 6.854161620140076e-05, 7.321219891309738e-05, 7.7882781624794e-05, 8.255336433649063e-05, 8.722394704818726e-05, 9.189452975988388e-05, 9.65651124715805e-05, 0.00010123569518327713, 0.00010590627789497375, 0.00011057686060667038, 0.000115247443318367, 0.00011991802603006363, 0.00012458860874176025, 0.00012925919145345688, 0.0001339297741651535, 0.00013860035687685013, 0.00014327093958854675, 0.00014794152230024338, 0.00015261210501194, 0.00015728268772363663, 0.00016195327043533325, 0.00016662385314702988, 0.0001712944358587265, 0.00017596501857042313, 0.00018063560128211975, 0.00018530618399381638, 0.000189976766705513, 0.00019464734941720963, 0.00019931793212890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 1.0, 10.0, 12.0, 13.0, 27.0, 41.0, 60.0, 88.0, 129.0, 217.0, 287.0, 422.0, 667.0, 1075.0, 1652.0, 2470.0, 3977.0, 6149.0, 9712.0, 15748.0, 25573.0, 42546.0, 69971.0, 113460.0, 165525.0, 183976.0, 149682.0, 98763.0, 60665.0, 36499.0, 22133.0, 13477.0, 8644.0, 5268.0, 3379.0, 2171.0, 1376.0, 876.0, 627.0, 416.0, 260.0, 164.0, 133.0, 81.0, 49.0, 27.0, 31.0, 13.0, 7.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3154296875, -1.2747650146484375, -1.234100341796875, -1.1934356689453125, -1.15277099609375, -1.1121063232421875, -1.071441650390625, -1.0307769775390625, -0.9901123046875, -0.9494476318359375, -0.908782958984375, -0.8681182861328125, -0.82745361328125, -0.7867889404296875, -0.746124267578125, -0.7054595947265625, -0.664794921875, -0.6241302490234375, -0.583465576171875, -0.5428009033203125, -0.50213623046875, -0.4614715576171875, -0.420806884765625, -0.3801422119140625, -0.3394775390625, -0.2988128662109375, -0.258148193359375, -0.2174835205078125, -0.17681884765625, -0.1361541748046875, -0.095489501953125, -0.0548248291015625, -0.01416015625, 0.0265045166015625, 0.067169189453125, 0.1078338623046875, 0.14849853515625, 0.1891632080078125, 0.229827880859375, 0.2704925537109375, 0.3111572265625, 0.3518218994140625, 0.392486572265625, 0.4331512451171875, 0.47381591796875, 0.5144805908203125, 0.555145263671875, 0.5958099365234375, 0.636474609375, 0.6771392822265625, 0.717803955078125, 0.7584686279296875, 0.79913330078125, 0.8397979736328125, 0.880462646484375, 0.9211273193359375, 0.9617919921875, 1.0024566650390625, 1.043121337890625, 1.0837860107421875, 1.12445068359375, 1.1651153564453125, 1.205780029296875, 1.2464447021484375, 1.287109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 0.0, 7.0, 2.0, 5.0, 7.0, 8.0, 9.0, 16.0, 14.0, 15.0, 31.0, 33.0, 43.0, 46.0, 43.0, 42.0, 46.0, 57.0, 74.0, 58.0, 59.0, 66.0, 58.0, 50.0, 37.0, 30.0, 23.0, 14.0, 12.0, 17.0, 12.0, 11.0, 6.0, 8.0, 7.0, 6.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0], "bins": [-0.5029296875, -0.4884834289550781, -0.47403717041015625, -0.4595909118652344, -0.4451446533203125, -0.4306983947753906, -0.41625213623046875, -0.4018058776855469, -0.387359619140625, -0.3729133605957031, -0.35846710205078125, -0.3440208435058594, -0.3295745849609375, -0.3151283264160156, -0.30068206787109375, -0.2862358093261719, -0.27178955078125, -0.2573432922363281, -0.24289703369140625, -0.22845077514648438, -0.2140045166015625, -0.19955825805664062, -0.18511199951171875, -0.17066574096679688, -0.156219482421875, -0.14177322387695312, -0.12732696533203125, -0.11288070678710938, -0.0984344482421875, -0.08398818969726562, -0.06954193115234375, -0.055095672607421875, -0.0406494140625, -0.026203155517578125, -0.01175689697265625, 0.002689361572265625, 0.0171356201171875, 0.031581878662109375, 0.04602813720703125, 0.060474395751953125, 0.074920654296875, 0.08936691284179688, 0.10381317138671875, 0.11825942993164062, 0.1327056884765625, 0.14715194702148438, 0.16159820556640625, 0.17604446411132812, 0.19049072265625, 0.20493698120117188, 0.21938323974609375, 0.23382949829101562, 0.2482757568359375, 0.2627220153808594, 0.27716827392578125, 0.2916145324707031, 0.306060791015625, 0.3205070495605469, 0.33495330810546875, 0.3493995666503906, 0.3638458251953125, 0.3782920837402344, 0.39273834228515625, 0.4071846008300781, 0.421630859375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 3.0, 7.0, 9.0, 14.0, 6.0, 16.0, 17.0, 17.0, 25.0, 28.0, 27.0, 43.0, 38.0, 41.0, 46.0, 48.0, 56.0, 39.0, 54.0, 47.0, 44.0, 46.0, 45.0, 41.0, 33.0, 33.0, 41.0, 29.0, 19.0, 16.0, 13.0, 16.0, 7.0, 9.0, 4.0, 3.0, 7.0, 6.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.841849327087402, -14.381918907165527, -13.921988487243652, -13.462057113647461, -13.002126693725586, -12.542196273803711, -12.082265853881836, -11.622335433959961, -11.16240406036377, -10.702473640441895, -10.24254322052002, -9.782611846923828, -9.322681427001953, -8.862751007080078, -8.402820587158203, -7.94288969039917, -7.482959270477295, -7.02302885055542, -6.563097953796387, -6.103167533874512, -5.6432366371154785, -5.1833062171936035, -4.72337532043457, -4.263444900512695, -3.803514242172241, -3.343583583831787, -2.883652925491333, -2.423722267150879, -1.9637917280197144, -1.5038611888885498, -1.0439305305480957, -0.5839998722076416, -0.1240692138671875, 0.3358614146709442, 0.7957920432090759, 1.2557226419448853, 1.7156533002853394, 2.175583839416504, 2.635514497756958, 3.095445156097412, 3.555375814437866, 4.01530647277832, 4.475236892700195, 4.9351677894592285, 5.3950982093811035, 5.855029106140137, 6.314959526062012, 6.774889945983887, 7.23482084274292, 7.694751262664795, 8.154682159423828, 8.614612579345703, 9.074542999267578, 9.534473419189453, 9.994404792785645, 10.45433521270752, 10.914265632629395, 11.37419605255127, 11.834126472473145, 12.294057846069336, 12.753988265991211, 13.213918685913086, 13.673849105834961, 14.133779525756836, 14.593710899353027]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 11.0, 5.0, 10.0, 7.0, 8.0, 13.0, 14.0, 24.0, 27.0, 19.0, 22.0, 46.0, 28.0, 40.0, 39.0, 48.0, 39.0, 36.0, 41.0, 44.0, 29.0, 40.0, 47.0, 35.0, 33.0, 34.0, 39.0, 30.0, 31.0, 22.0, 24.0, 24.0, 14.0, 18.0, 18.0, 10.0, 5.0, 8.0, 8.0, 6.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.263108253479004, -10.871716499328613, -10.480323791503906, -10.088932037353516, -9.697539329528809, -9.306147575378418, -8.914754867553711, -8.52336311340332, -8.13197135925293, -7.740579128265381, -7.349186897277832, -6.957795143127441, -6.566402435302734, -6.175010681152344, -5.783618450164795, -5.392226219177246, -5.000833511352539, -4.60944128036499, -4.218049049377441, -3.8266570568084717, -3.435264825820923, -3.043872594833374, -2.6524806022644043, -2.2610883712768555, -1.8696961402893066, -1.4783039093017578, -1.0869117975234985, -0.6955196857452393, -0.30412745475769043, 0.0872647762298584, 0.4786567687988281, 0.870048999786377, 1.2614412307739258, 1.6528334617614746, 2.0442256927490234, 2.435617685317993, 2.827009916305542, 3.218402147293091, 3.6097941398620605, 4.001186370849609, 4.392578601837158, 4.783970832824707, 5.175363063812256, 5.566755294799805, 5.958147048950195, 6.349539756774902, 6.740931510925293, 7.132323741912842, 7.523715972900391, 7.9151082038879395, 8.306500434875488, 8.697892189025879, 9.089284896850586, 9.480676651000977, 9.872068405151367, 10.263461112976074, 10.654853820800781, 11.046245574951172, 11.437638282775879, 11.82903003692627, 12.220422744750977, 12.611814498901367, 13.003206253051758, 13.394598960876465, 13.785990715026855]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 5.0, 5.0, 12.0, 12.0, 25.0, 52.0, 81.0, 145.0, 272.0, 451.0, 831.0, 1380.0, 2506.0, 4278.0, 7119.0, 11879.0, 18761.0, 28800.0, 42124.0, 58587.0, 77341.0, 94282.0, 107946.0, 112810.0, 109416.0, 97582.0, 80341.0, 62238.0, 45097.0, 31602.0, 20509.0, 12793.0, 7924.0, 4775.0, 2716.0, 1624.0, 961.0, 555.0, 327.0, 171.0, 92.0, 59.0, 38.0, 13.0, 9.0, 10.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.078125, -9.748779296875, -9.41943359375, -9.090087890625, -8.7607421875, -8.431396484375, -8.10205078125, -7.772705078125, -7.443359375, -7.114013671875, -6.78466796875, -6.455322265625, -6.1259765625, -5.796630859375, -5.46728515625, -5.137939453125, -4.80859375, -4.479248046875, -4.14990234375, -3.820556640625, -3.4912109375, -3.161865234375, -2.83251953125, -2.503173828125, -2.173828125, -1.844482421875, -1.51513671875, -1.185791015625, -0.8564453125, -0.527099609375, -0.19775390625, 0.131591796875, 0.4609375, 0.790283203125, 1.11962890625, 1.448974609375, 1.7783203125, 2.107666015625, 2.43701171875, 2.766357421875, 3.095703125, 3.425048828125, 3.75439453125, 4.083740234375, 4.4130859375, 4.742431640625, 5.07177734375, 5.401123046875, 5.73046875, 6.059814453125, 6.38916015625, 6.718505859375, 7.0478515625, 7.377197265625, 7.70654296875, 8.035888671875, 8.365234375, 8.694580078125, 9.02392578125, 9.353271484375, 9.6826171875, 10.011962890625, 10.34130859375, 10.670654296875, 11.0]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 7.0, 9.0, 11.0, 8.0, 7.0, 9.0, 16.0, 21.0, 19.0, 31.0, 16.0, 49.0, 23.0, 40.0, 42.0, 49.0, 34.0, 44.0, 35.0, 45.0, 32.0, 37.0, 48.0, 40.0, 36.0, 28.0, 42.0, 30.0, 30.0, 21.0, 24.0, 25.0, 19.0, 11.0, 23.0, 8.0, 8.0, 9.0, 7.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.015625, -10.63525390625, -10.2548828125, -9.87451171875, -9.494140625, -9.11376953125, -8.7333984375, -8.35302734375, -7.97265625, -7.59228515625, -7.2119140625, -6.83154296875, -6.451171875, -6.07080078125, -5.6904296875, -5.31005859375, -4.9296875, -4.54931640625, -4.1689453125, -3.78857421875, -3.408203125, -3.02783203125, -2.6474609375, -2.26708984375, -1.88671875, -1.50634765625, -1.1259765625, -0.74560546875, -0.365234375, 0.01513671875, 0.3955078125, 0.77587890625, 1.15625, 1.53662109375, 1.9169921875, 2.29736328125, 2.677734375, 3.05810546875, 3.4384765625, 3.81884765625, 4.19921875, 4.57958984375, 4.9599609375, 5.34033203125, 5.720703125, 6.10107421875, 6.4814453125, 6.86181640625, 7.2421875, 7.62255859375, 8.0029296875, 8.38330078125, 8.763671875, 9.14404296875, 9.5244140625, 9.90478515625, 10.28515625, 10.66552734375, 11.0458984375, 11.42626953125, 11.806640625, 12.18701171875, 12.5673828125, 12.94775390625, 13.328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 6.0, 7.0, 18.0, 27.0, 29.0, 44.0, 83.0, 96.0, 149.0, 305.0, 407.0, 645.0, 1053.0, 1612.0, 2404.0, 3716.0, 5683.0, 8655.0, 12672.0, 18233.0, 26036.0, 35331.0, 46824.0, 59270.0, 72213.0, 83358.0, 91090.0, 94543.0, 92528.0, 84804.0, 73751.0, 61094.0, 48748.0, 36954.0, 26961.0, 19092.0, 13592.0, 9118.0, 6101.0, 4043.0, 2617.0, 1665.0, 1091.0, 644.0, 450.0, 318.0, 153.0, 119.0, 84.0, 46.0, 30.0, 26.0, 9.0, 5.0, 8.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.640625, -8.366943359375, -8.09326171875, -7.819580078125, -7.5458984375, -7.272216796875, -6.99853515625, -6.724853515625, -6.451171875, -6.177490234375, -5.90380859375, -5.630126953125, -5.3564453125, -5.082763671875, -4.80908203125, -4.535400390625, -4.26171875, -3.988037109375, -3.71435546875, -3.440673828125, -3.1669921875, -2.893310546875, -2.61962890625, -2.345947265625, -2.072265625, -1.798583984375, -1.52490234375, -1.251220703125, -0.9775390625, -0.703857421875, -0.43017578125, -0.156494140625, 0.1171875, 0.390869140625, 0.66455078125, 0.938232421875, 1.2119140625, 1.485595703125, 1.75927734375, 2.032958984375, 2.306640625, 2.580322265625, 2.85400390625, 3.127685546875, 3.4013671875, 3.675048828125, 3.94873046875, 4.222412109375, 4.49609375, 4.769775390625, 5.04345703125, 5.317138671875, 5.5908203125, 5.864501953125, 6.13818359375, 6.411865234375, 6.685546875, 6.959228515625, 7.23291015625, 7.506591796875, 7.7802734375, 8.053955078125, 8.32763671875, 8.601318359375, 8.875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 6.0, 4.0, 11.0, 9.0, 10.0, 12.0, 13.0, 15.0, 15.0, 22.0, 23.0, 22.0, 30.0, 27.0, 28.0, 39.0, 29.0, 23.0, 29.0, 44.0, 35.0, 38.0, 25.0, 26.0, 43.0, 39.0, 33.0, 37.0, 28.0, 31.0, 24.0, 28.0, 23.0, 22.0, 23.0, 25.0, 11.0, 16.0, 10.0, 12.0, 15.0, 7.0, 6.0, 1.0, 4.0, 3.0, 7.0, 2.0, 3.0, 1.0, 3.0, 3.0], "bins": [-7.20703125, -6.9986572265625, -6.790283203125, -6.5819091796875, -6.37353515625, -6.1651611328125, -5.956787109375, -5.7484130859375, -5.5400390625, -5.3316650390625, -5.123291015625, -4.9149169921875, -4.70654296875, -4.4981689453125, -4.289794921875, -4.0814208984375, -3.873046875, -3.6646728515625, -3.456298828125, -3.2479248046875, -3.03955078125, -2.8311767578125, -2.622802734375, -2.4144287109375, -2.2060546875, -1.9976806640625, -1.789306640625, -1.5809326171875, -1.37255859375, -1.1641845703125, -0.955810546875, -0.7474365234375, -0.5390625, -0.3306884765625, -0.122314453125, 0.0860595703125, 0.29443359375, 0.5028076171875, 0.711181640625, 0.9195556640625, 1.1279296875, 1.3363037109375, 1.544677734375, 1.7530517578125, 1.96142578125, 2.1697998046875, 2.378173828125, 2.5865478515625, 2.794921875, 3.0032958984375, 3.211669921875, 3.4200439453125, 3.62841796875, 3.8367919921875, 4.045166015625, 4.2535400390625, 4.4619140625, 4.6702880859375, 4.878662109375, 5.0870361328125, 5.29541015625, 5.5037841796875, 5.712158203125, 5.9205322265625, 6.12890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 10.0, 22.0, 30.0, 55.0, 77.0, 106.0, 181.0, 279.0, 439.0, 642.0, 1066.0, 1691.0, 2790.0, 4339.0, 6916.0, 11103.0, 17903.0, 28122.0, 42957.0, 62653.0, 85729.0, 107381.0, 121930.0, 126182.0, 114944.0, 95152.0, 72082.0, 51278.0, 33974.0, 21996.0, 13790.0, 8593.0, 5399.0, 3202.0, 1942.0, 1259.0, 875.0, 524.0, 314.0, 205.0, 145.0, 95.0, 64.0, 39.0, 26.0, 14.0, 14.0, 8.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-5.12109375, -4.9669189453125, -4.812744140625, -4.6585693359375, -4.50439453125, -4.3502197265625, -4.196044921875, -4.0418701171875, -3.8876953125, -3.7335205078125, -3.579345703125, -3.4251708984375, -3.27099609375, -3.1168212890625, -2.962646484375, -2.8084716796875, -2.654296875, -2.5001220703125, -2.345947265625, -2.1917724609375, -2.03759765625, -1.8834228515625, -1.729248046875, -1.5750732421875, -1.4208984375, -1.2667236328125, -1.112548828125, -0.9583740234375, -0.80419921875, -0.6500244140625, -0.495849609375, -0.3416748046875, -0.1875, -0.0333251953125, 0.120849609375, 0.2750244140625, 0.42919921875, 0.5833740234375, 0.737548828125, 0.8917236328125, 1.0458984375, 1.2000732421875, 1.354248046875, 1.5084228515625, 1.66259765625, 1.8167724609375, 1.970947265625, 2.1251220703125, 2.279296875, 2.4334716796875, 2.587646484375, 2.7418212890625, 2.89599609375, 3.0501708984375, 3.204345703125, 3.3585205078125, 3.5126953125, 3.6668701171875, 3.821044921875, 3.9752197265625, 4.12939453125, 4.2835693359375, 4.437744140625, 4.5919189453125, 4.74609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 7.0, 7.0, 14.0, 19.0, 13.0, 28.0, 23.0, 37.0, 20.0, 42.0, 29.0, 34.0, 55.0, 42.0, 40.0, 54.0, 52.0, 56.0, 46.0, 49.0, 40.0, 51.0, 32.0, 31.0, 28.0, 22.0, 29.0, 23.0, 16.0, 14.0, 4.0, 6.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0007028579711914062, -0.0006838962435722351, -0.000664934515953064, -0.0006459727883338928, -0.0006270110607147217, -0.0006080493330955505, -0.0005890876054763794, -0.0005701258778572083, -0.0005511641502380371, -0.000532202422618866, -0.0005132406949996948, -0.0004942789673805237, -0.00047531723976135254, -0.0004563555121421814, -0.00043739378452301025, -0.0004184320569038391, -0.00039947032928466797, -0.0003805086016654968, -0.0003615468740463257, -0.00034258514642715454, -0.0003236234188079834, -0.00030466169118881226, -0.0002856999635696411, -0.00026673823595046997, -0.00024777650833129883, -0.00022881478071212769, -0.00020985305309295654, -0.0001908913254737854, -0.00017192959785461426, -0.00015296787023544312, -0.00013400614261627197, -0.00011504441499710083, -9.608268737792969e-05, -7.712095975875854e-05, -5.81592321395874e-05, -3.919750452041626e-05, -2.0235776901245117e-05, -1.2740492820739746e-06, 1.7687678337097168e-05, 3.664940595626831e-05, 5.561113357543945e-05, 7.45728611946106e-05, 9.353458881378174e-05, 0.00011249631643295288, 0.00013145804405212402, 0.00015041977167129517, 0.0001693814992904663, 0.00018834322690963745, 0.0002073049545288086, 0.00022626668214797974, 0.0002452284097671509, 0.000264190137386322, 0.00028315186500549316, 0.0003021135926246643, 0.00032107532024383545, 0.0003400370478630066, 0.00035899877548217773, 0.0003779605031013489, 0.00039692223072052, 0.00041588395833969116, 0.0004348456859588623, 0.00045380741357803345, 0.0004727691411972046, 0.0004917308688163757, 0.0005106925964355469]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 8.0, 9.0, 12.0, 25.0, 27.0, 71.0, 86.0, 136.0, 250.0, 395.0, 710.0, 1101.0, 1989.0, 3292.0, 5903.0, 10365.0, 18562.0, 32547.0, 54926.0, 86720.0, 123533.0, 152690.0, 158119.0, 136638.0, 100564.0, 66495.0, 40056.0, 23115.0, 13056.0, 7382.0, 4109.0, 2255.0, 1320.0, 782.0, 491.0, 317.0, 189.0, 120.0, 67.0, 38.0, 36.0, 21.0, 14.0, 7.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3203125, -7.08563232421875, -6.8509521484375, -6.61627197265625, -6.381591796875, -6.14691162109375, -5.9122314453125, -5.67755126953125, -5.44287109375, -5.20819091796875, -4.9735107421875, -4.73883056640625, -4.504150390625, -4.26947021484375, -4.0347900390625, -3.80010986328125, -3.5654296875, -3.33074951171875, -3.0960693359375, -2.86138916015625, -2.626708984375, -2.39202880859375, -2.1573486328125, -1.92266845703125, -1.68798828125, -1.45330810546875, -1.2186279296875, -0.98394775390625, -0.749267578125, -0.51458740234375, -0.2799072265625, -0.04522705078125, 0.189453125, 0.42413330078125, 0.6588134765625, 0.89349365234375, 1.128173828125, 1.36285400390625, 1.5975341796875, 1.83221435546875, 2.06689453125, 2.30157470703125, 2.5362548828125, 2.77093505859375, 3.005615234375, 3.24029541015625, 3.4749755859375, 3.70965576171875, 3.9443359375, 4.17901611328125, 4.4136962890625, 4.64837646484375, 4.883056640625, 5.11773681640625, 5.3524169921875, 5.58709716796875, 5.82177734375, 6.05645751953125, 6.2911376953125, 6.52581787109375, 6.760498046875, 6.99517822265625, 7.2298583984375, 7.46453857421875, 7.69921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 10.0, 11.0, 21.0, 18.0, 24.0, 28.0, 35.0, 50.0, 47.0, 81.0, 85.0, 68.0, 78.0, 66.0, 65.0, 67.0, 55.0, 48.0, 48.0, 20.0, 25.0, 15.0, 17.0, 5.0, 7.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.720703125, -3.6092529296875, -3.497802734375, -3.3863525390625, -3.27490234375, -3.1634521484375, -3.052001953125, -2.9405517578125, -2.8291015625, -2.7176513671875, -2.606201171875, -2.4947509765625, -2.38330078125, -2.2718505859375, -2.160400390625, -2.0489501953125, -1.9375, -1.8260498046875, -1.714599609375, -1.6031494140625, -1.49169921875, -1.3802490234375, -1.268798828125, -1.1573486328125, -1.0458984375, -0.9344482421875, -0.822998046875, -0.7115478515625, -0.60009765625, -0.4886474609375, -0.377197265625, -0.2657470703125, -0.154296875, -0.0428466796875, 0.068603515625, 0.1800537109375, 0.29150390625, 0.4029541015625, 0.514404296875, 0.6258544921875, 0.7373046875, 0.8487548828125, 0.960205078125, 1.0716552734375, 1.18310546875, 1.2945556640625, 1.406005859375, 1.5174560546875, 1.62890625, 1.7403564453125, 1.851806640625, 1.9632568359375, 2.07470703125, 2.1861572265625, 2.297607421875, 2.4090576171875, 2.5205078125, 2.6319580078125, 2.743408203125, 2.8548583984375, 2.96630859375, 3.0777587890625, 3.189208984375, 3.3006591796875, 3.412109375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 8.0, 7.0, 8.0, 9.0, 9.0, 15.0, 26.0, 11.0, 22.0, 22.0, 22.0, 37.0, 26.0, 31.0, 35.0, 38.0, 43.0, 37.0, 54.0, 40.0, 48.0, 40.0, 54.0, 35.0, 43.0, 32.0, 30.0, 22.0, 31.0, 22.0, 19.0, 25.0, 16.0, 6.0, 7.0, 8.0, 7.0, 12.0, 6.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.578065872192383, -11.183698654174805, -10.789332389831543, -10.394965171813965, -10.000597953796387, -9.606231689453125, -9.211864471435547, -8.817497253417969, -8.42313003540039, -8.028762817382812, -7.634396076202393, -7.240029335021973, -6.8456621170043945, -6.451295375823975, -6.056928634643555, -5.662561416625977, -5.268195152282715, -4.873828411102295, -4.479461193084717, -4.085094451904297, -3.690727472305298, -3.296360492706299, -2.901993751525879, -2.50762677192688, -2.113259792327881, -1.7188928127288818, -1.3245259523391724, -0.9301590919494629, -0.5357921123504639, -0.14142513275146484, 0.2529416084289551, 0.6473085880279541, 1.0416755676269531, 1.4360425472259521, 1.8304094076156616, 2.224776268005371, 2.61914324760437, 3.013510227203369, 3.407876968383789, 3.802243947982788, 4.196610927581787, 4.590977668762207, 4.985344886779785, 5.379711627960205, 5.774078369140625, 6.168445587158203, 6.562812328338623, 6.957179069519043, 7.351546287536621, 7.745913028717041, 8.140279769897461, 8.534646987915039, 8.929014205932617, 9.323381423950195, 9.717747688293457, 10.112114906311035, 10.506481170654297, 10.900848388671875, 11.295214653015137, 11.689581871032715, 12.083949089050293, 12.478315353393555, 12.872682571411133, 13.267049789428711, 13.661417007446289]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 10.0, 11.0, 9.0, 8.0, 8.0, 11.0, 15.0, 22.0, 16.0, 23.0, 21.0, 28.0, 22.0, 35.0, 37.0, 41.0, 38.0, 37.0, 29.0, 52.0, 42.0, 31.0, 33.0, 29.0, 34.0, 25.0, 32.0, 40.0, 31.0, 41.0, 33.0, 25.0, 15.0, 18.0, 12.0, 13.0, 17.0, 15.0, 9.0, 4.0, 7.0, 9.0, 7.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.059592247009277, -10.678985595703125, -10.298379898071289, -9.917774200439453, -9.5371675491333, -9.156560897827148, -8.775955200195312, -8.395349502563477, -8.014742851257324, -7.63413667678833, -7.253530502319336, -6.872924327850342, -6.492318153381348, -6.1117119789123535, -5.731105804443359, -5.350499629974365, -4.969893455505371, -4.589287281036377, -4.208681106567383, -3.8280749320983887, -3.4474687576293945, -3.0668625831604004, -2.6862564086914062, -2.305650234222412, -1.925044059753418, -1.5444378852844238, -1.1638317108154297, -0.7832255363464355, -0.4026193618774414, -0.022013187408447266, 0.3585929870605469, 0.739199161529541, 1.1198053359985352, 1.5004115104675293, 1.8810176849365234, 2.2616238594055176, 2.6422300338745117, 3.022836208343506, 3.4034423828125, 3.784048557281494, 4.164654731750488, 4.545260906219482, 4.925867080688477, 5.306473255157471, 5.687079429626465, 6.067685604095459, 6.448291778564453, 6.828897953033447, 7.209504127502441, 7.5901103019714355, 7.97071647644043, 8.351322174072266, 8.731928825378418, 9.11253547668457, 9.493141174316406, 9.873746871948242, 10.254353523254395, 10.634960174560547, 11.015565872192383, 11.396171569824219, 11.776778221130371, 12.157384872436523, 12.53799057006836, 12.918596267700195, 13.299202919006348]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 14.0, 31.0, 33.0, 58.0, 119.0, 176.0, 325.0, 548.0, 924.0, 1543.0, 2538.0, 4142.0, 6849.0, 11088.0, 17722.0, 27710.0, 42817.0, 65007.0, 96655.0, 137396.0, 190933.0, 252039.0, 316092.0, 373063.0, 410780.0, 421996.0, 402189.0, 355578.0, 293255.0, 229475.0, 171099.0, 122116.0, 83953.0, 56058.0, 37009.0, 23959.0, 15037.0, 9382.0, 5916.0, 3438.0, 2092.0, 1241.0, 761.0, 459.0, 279.0, 172.0, 82.0, 50.0, 38.0, 21.0, 11.0, 16.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.4375, -9.154296875, -8.87109375, -8.587890625, -8.3046875, -8.021484375, -7.73828125, -7.455078125, -7.171875, -6.888671875, -6.60546875, -6.322265625, -6.0390625, -5.755859375, -5.47265625, -5.189453125, -4.90625, -4.623046875, -4.33984375, -4.056640625, -3.7734375, -3.490234375, -3.20703125, -2.923828125, -2.640625, -2.357421875, -2.07421875, -1.791015625, -1.5078125, -1.224609375, -0.94140625, -0.658203125, -0.375, -0.091796875, 0.19140625, 0.474609375, 0.7578125, 1.041015625, 1.32421875, 1.607421875, 1.890625, 2.173828125, 2.45703125, 2.740234375, 3.0234375, 3.306640625, 3.58984375, 3.873046875, 4.15625, 4.439453125, 4.72265625, 5.005859375, 5.2890625, 5.572265625, 5.85546875, 6.138671875, 6.421875, 6.705078125, 6.98828125, 7.271484375, 7.5546875, 7.837890625, 8.12109375, 8.404296875, 8.6875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 8.0, 10.0, 11.0, 12.0, 7.0, 9.0, 18.0, 14.0, 18.0, 21.0, 19.0, 31.0, 25.0, 23.0, 39.0, 41.0, 44.0, 33.0, 25.0, 54.0, 40.0, 39.0, 29.0, 21.0, 42.0, 23.0, 32.0, 37.0, 39.0, 34.0, 35.0, 24.0, 25.0, 15.0, 11.0, 20.0, 15.0, 14.0, 6.0, 10.0, 5.0, 9.0, 7.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.359375, -9.02978515625, -8.7001953125, -8.37060546875, -8.041015625, -7.71142578125, -7.3818359375, -7.05224609375, -6.72265625, -6.39306640625, -6.0634765625, -5.73388671875, -5.404296875, -5.07470703125, -4.7451171875, -4.41552734375, -4.0859375, -3.75634765625, -3.4267578125, -3.09716796875, -2.767578125, -2.43798828125, -2.1083984375, -1.77880859375, -1.44921875, -1.11962890625, -0.7900390625, -0.46044921875, -0.130859375, 0.19873046875, 0.5283203125, 0.85791015625, 1.1875, 1.51708984375, 1.8466796875, 2.17626953125, 2.505859375, 2.83544921875, 3.1650390625, 3.49462890625, 3.82421875, 4.15380859375, 4.4833984375, 4.81298828125, 5.142578125, 5.47216796875, 5.8017578125, 6.13134765625, 6.4609375, 6.79052734375, 7.1201171875, 7.44970703125, 7.779296875, 8.10888671875, 8.4384765625, 8.76806640625, 9.09765625, 9.42724609375, 9.7568359375, 10.08642578125, 10.416015625, 10.74560546875, 11.0751953125, 11.40478515625, 11.734375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 5.0, 5.0, 13.0, 13.0, 30.0, 50.0, 107.0, 181.0, 314.0, 552.0, 925.0, 1542.0, 2677.0, 4332.0, 7220.0, 11993.0, 19265.0, 30219.0, 45747.0, 69248.0, 100234.0, 141294.0, 190550.0, 245153.0, 301054.0, 350777.0, 384525.0, 395377.0, 382747.0, 349688.0, 299251.0, 242908.0, 187448.0, 139779.0, 99026.0, 67641.0, 45262.0, 29426.0, 18274.0, 11726.0, 7211.0, 4345.0, 2527.0, 1512.0, 895.0, 498.0, 301.0, 183.0, 101.0, 55.0, 33.0, 29.0, 14.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9921875, -8.6971435546875, -8.402099609375, -8.1070556640625, -7.81201171875, -7.5169677734375, -7.221923828125, -6.9268798828125, -6.6318359375, -6.3367919921875, -6.041748046875, -5.7467041015625, -5.45166015625, -5.1566162109375, -4.861572265625, -4.5665283203125, -4.271484375, -3.9764404296875, -3.681396484375, -3.3863525390625, -3.09130859375, -2.7962646484375, -2.501220703125, -2.2061767578125, -1.9111328125, -1.6160888671875, -1.321044921875, -1.0260009765625, -0.73095703125, -0.4359130859375, -0.140869140625, 0.1541748046875, 0.44921875, 0.7442626953125, 1.039306640625, 1.3343505859375, 1.62939453125, 1.9244384765625, 2.219482421875, 2.5145263671875, 2.8095703125, 3.1046142578125, 3.399658203125, 3.6947021484375, 3.98974609375, 4.2847900390625, 4.579833984375, 4.8748779296875, 5.169921875, 5.4649658203125, 5.760009765625, 6.0550537109375, 6.35009765625, 6.6451416015625, 6.940185546875, 7.2352294921875, 7.5302734375, 7.8253173828125, 8.120361328125, 8.4154052734375, 8.71044921875, 9.0054931640625, 9.300537109375, 9.5955810546875, 9.890625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 9.0, 4.0, 9.0, 14.0, 17.0, 18.0, 30.0, 40.0, 48.0, 56.0, 72.0, 80.0, 91.0, 105.0, 127.0, 119.0, 110.0, 149.0, 160.0, 200.0, 168.0, 184.0, 211.0, 177.0, 200.0, 185.0, 177.0, 168.0, 155.0, 145.0, 140.0, 114.0, 95.0, 93.0, 72.0, 71.0, 56.0, 53.0, 35.0, 28.0, 27.0, 21.0, 12.0, 18.0, 4.0, 3.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.0234375, -4.86700439453125, -4.7105712890625, -4.55413818359375, -4.397705078125, -4.24127197265625, -4.0848388671875, -3.92840576171875, -3.77197265625, -3.61553955078125, -3.4591064453125, -3.30267333984375, -3.146240234375, -2.98980712890625, -2.8333740234375, -2.67694091796875, -2.5205078125, -2.36407470703125, -2.2076416015625, -2.05120849609375, -1.894775390625, -1.73834228515625, -1.5819091796875, -1.42547607421875, -1.26904296875, -1.11260986328125, -0.9561767578125, -0.79974365234375, -0.643310546875, -0.48687744140625, -0.3304443359375, -0.17401123046875, -0.017578125, 0.13885498046875, 0.2952880859375, 0.45172119140625, 0.608154296875, 0.76458740234375, 0.9210205078125, 1.07745361328125, 1.23388671875, 1.39031982421875, 1.5467529296875, 1.70318603515625, 1.859619140625, 2.01605224609375, 2.1724853515625, 2.32891845703125, 2.4853515625, 2.64178466796875, 2.7982177734375, 2.95465087890625, 3.111083984375, 3.26751708984375, 3.4239501953125, 3.58038330078125, 3.73681640625, 3.89324951171875, 4.0496826171875, 4.20611572265625, 4.362548828125, 4.51898193359375, 4.6754150390625, 4.83184814453125, 4.98828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 5.0, 3.0, 5.0, 4.0, 3.0, 11.0, 9.0, 13.0, 10.0, 24.0, 25.0, 18.0, 26.0, 20.0, 26.0, 38.0, 29.0, 47.0, 47.0, 39.0, 51.0, 45.0, 39.0, 46.0, 37.0, 45.0, 36.0, 32.0, 35.0, 31.0, 24.0, 29.0, 35.0, 17.0, 21.0, 11.0, 10.0, 11.0, 8.0, 13.0, 8.0, 4.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-15.261646270751953, -14.843293190002441, -14.42494010925293, -14.006586074829102, -13.58823299407959, -13.169879913330078, -12.751526832580566, -12.333173751831055, -11.914820671081543, -11.496467590332031, -11.07811450958252, -10.659761428833008, -10.24140739440918, -9.823054313659668, -9.404701232910156, -8.986348152160645, -8.567995071411133, -8.149641990661621, -7.731288433074951, -7.3129353523254395, -6.894582271575928, -6.476228713989258, -6.057875633239746, -5.639522552490234, -5.221168518066406, -4.8028154373168945, -4.384461879730225, -3.966108798980713, -3.547755718231201, -3.1294023990631104, -2.7110490798950195, -2.292695999145508, -1.874342918395996, -1.4559897184371948, -1.0376365184783936, -0.6192831993103027, -0.20092999935150146, 0.2174232006072998, 0.6357765197753906, 1.0541296005249023, 1.4724829196929932, 1.8908361196517944, 2.3091893196105957, 2.7275426387786865, 3.1458959579467773, 3.564249038696289, 3.98260235786438, 4.4009552001953125, 4.819308757781982, 5.237661838531494, 5.656015396118164, 6.074368476867676, 6.4927215576171875, 6.911074638366699, 7.329428195953369, 7.747781276702881, 8.16613483428955, 8.584487915039062, 9.002840995788574, 9.421194076538086, 9.839548110961914, 10.257901191711426, 10.676254272460938, 11.09460735321045, 11.512960433959961]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 7.0, 4.0, 12.0, 10.0, 5.0, 12.0, 8.0, 10.0, 20.0, 24.0, 26.0, 23.0, 26.0, 37.0, 35.0, 36.0, 19.0, 32.0, 56.0, 40.0, 27.0, 46.0, 26.0, 29.0, 36.0, 25.0, 44.0, 29.0, 27.0, 33.0, 32.0, 29.0, 28.0, 18.0, 16.0, 14.0, 18.0, 11.0, 21.0, 8.0, 7.0, 8.0, 7.0, 3.0, 6.0, 2.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.496857643127441, -11.12658405303955, -10.75631046295166, -10.38603687286377, -10.015763282775879, -9.645489692687988, -9.275216102600098, -8.904942512512207, -8.534668922424316, -8.164395332336426, -7.794121742248535, -7.4238481521606445, -7.053574562072754, -6.683300971984863, -6.313027381896973, -5.942753791809082, -5.572480201721191, -5.202206611633301, -4.83193302154541, -4.4616594314575195, -4.091385841369629, -3.7211122512817383, -3.3508386611938477, -2.980565071105957, -2.6102914810180664, -2.240017890930176, -1.8697443008422852, -1.4994707107543945, -1.129197120666504, -0.7589235305786133, -0.38864994049072266, -0.01837635040283203, 0.3518962860107422, 0.7221698760986328, 1.0924434661865234, 1.462717056274414, 1.8329906463623047, 2.2032642364501953, 2.573537826538086, 2.9438114166259766, 3.314085006713867, 3.684358596801758, 4.054632186889648, 4.424905776977539, 4.79517936706543, 5.16545295715332, 5.535726547241211, 5.906000137329102, 6.276273727416992, 6.646547317504883, 7.016820907592773, 7.387094497680664, 7.757368087768555, 8.127641677856445, 8.497915267944336, 8.868188858032227, 9.238462448120117, 9.608736038208008, 9.979009628295898, 10.349283218383789, 10.71955680847168, 11.08983039855957, 11.460103988647461, 11.830377578735352, 12.200651168823242]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 8.0, 7.0, 17.0, 22.0, 28.0, 35.0, 50.0, 79.0, 97.0, 180.0, 216.0, 347.0, 463.0, 708.0, 1122.0, 1575.0, 2484.0, 3980.0, 6312.0, 10062.0, 16443.0, 27984.0, 47033.0, 79884.0, 128989.0, 177279.0, 182685.0, 139492.0, 88198.0, 52704.0, 31261.0, 18491.0, 10985.0, 6847.0, 4276.0, 2858.0, 1753.0, 1136.0, 801.0, 540.0, 361.0, 256.0, 159.0, 105.0, 83.0, 49.0, 31.0, 33.0, 17.0, 20.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.818359375, -2.73321533203125, -2.6480712890625, -2.56292724609375, -2.477783203125, -2.39263916015625, -2.3074951171875, -2.22235107421875, -2.13720703125, -2.05206298828125, -1.9669189453125, -1.88177490234375, -1.796630859375, -1.71148681640625, -1.6263427734375, -1.54119873046875, -1.4560546875, -1.37091064453125, -1.2857666015625, -1.20062255859375, -1.115478515625, -1.03033447265625, -0.9451904296875, -0.86004638671875, -0.77490234375, -0.68975830078125, -0.6046142578125, -0.51947021484375, -0.434326171875, -0.34918212890625, -0.2640380859375, -0.17889404296875, -0.09375, -0.00860595703125, 0.0765380859375, 0.16168212890625, 0.246826171875, 0.33197021484375, 0.4171142578125, 0.50225830078125, 0.58740234375, 0.67254638671875, 0.7576904296875, 0.84283447265625, 0.927978515625, 1.01312255859375, 1.0982666015625, 1.18341064453125, 1.2685546875, 1.35369873046875, 1.4388427734375, 1.52398681640625, 1.609130859375, 1.69427490234375, 1.7794189453125, 1.86456298828125, 1.94970703125, 2.03485107421875, 2.1199951171875, 2.20513916015625, 2.290283203125, 2.37542724609375, 2.4605712890625, 2.54571533203125, 2.630859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 8.0, 4.0, 12.0, 9.0, 6.0, 11.0, 9.0, 10.0, 20.0, 24.0, 28.0, 19.0, 29.0, 34.0, 36.0, 37.0, 18.0, 30.0, 58.0, 39.0, 29.0, 42.0, 30.0, 30.0, 32.0, 28.0, 42.0, 30.0, 26.0, 30.0, 37.0, 27.0, 29.0, 19.0, 15.0, 14.0, 18.0, 12.0, 18.0, 10.0, 8.0, 8.0, 7.0, 3.0, 5.0, 3.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.4609375, -11.091064453125, -10.72119140625, -10.351318359375, -9.9814453125, -9.611572265625, -9.24169921875, -8.871826171875, -8.501953125, -8.132080078125, -7.76220703125, -7.392333984375, -7.0224609375, -6.652587890625, -6.28271484375, -5.912841796875, -5.54296875, -5.173095703125, -4.80322265625, -4.433349609375, -4.0634765625, -3.693603515625, -3.32373046875, -2.953857421875, -2.583984375, -2.214111328125, -1.84423828125, -1.474365234375, -1.1044921875, -0.734619140625, -0.36474609375, 0.005126953125, 0.375, 0.744873046875, 1.11474609375, 1.484619140625, 1.8544921875, 2.224365234375, 2.59423828125, 2.964111328125, 3.333984375, 3.703857421875, 4.07373046875, 4.443603515625, 4.8134765625, 5.183349609375, 5.55322265625, 5.923095703125, 6.29296875, 6.662841796875, 7.03271484375, 7.402587890625, 7.7724609375, 8.142333984375, 8.51220703125, 8.882080078125, 9.251953125, 9.621826171875, 9.99169921875, 10.361572265625, 10.7314453125, 11.101318359375, 11.47119140625, 11.841064453125, 12.2109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 9.0, 8.0, 8.0, 13.0, 16.0, 25.0, 34.0, 59.0, 75.0, 92.0, 148.0, 234.0, 341.0, 497.0, 737.0, 1112.0, 1883.0, 2939.0, 4805.0, 8528.0, 15334.0, 28822.0, 55584.0, 112475.0, 215458.0, 263207.0, 163633.0, 81807.0, 40888.0, 21320.0, 11459.0, 6610.0, 3860.0, 2378.0, 1430.0, 926.0, 600.0, 399.0, 252.0, 187.0, 113.0, 72.0, 53.0, 43.0, 26.0, 19.0, 8.0, 7.0, 10.0, 2.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.23046875, -3.13037109375, -3.0302734375, -2.93017578125, -2.830078125, -2.72998046875, -2.6298828125, -2.52978515625, -2.4296875, -2.32958984375, -2.2294921875, -2.12939453125, -2.029296875, -1.92919921875, -1.8291015625, -1.72900390625, -1.62890625, -1.52880859375, -1.4287109375, -1.32861328125, -1.228515625, -1.12841796875, -1.0283203125, -0.92822265625, -0.828125, -0.72802734375, -0.6279296875, -0.52783203125, -0.427734375, -0.32763671875, -0.2275390625, -0.12744140625, -0.02734375, 0.07275390625, 0.1728515625, 0.27294921875, 0.373046875, 0.47314453125, 0.5732421875, 0.67333984375, 0.7734375, 0.87353515625, 0.9736328125, 1.07373046875, 1.173828125, 1.27392578125, 1.3740234375, 1.47412109375, 1.57421875, 1.67431640625, 1.7744140625, 1.87451171875, 1.974609375, 2.07470703125, 2.1748046875, 2.27490234375, 2.375, 2.47509765625, 2.5751953125, 2.67529296875, 2.775390625, 2.87548828125, 2.9755859375, 3.07568359375, 3.17578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 10.0, 7.0, 6.0, 6.0, 13.0, 8.0, 9.0, 16.0, 13.0, 21.0, 30.0, 23.0, 30.0, 31.0, 46.0, 34.0, 36.0, 35.0, 27.0, 42.0, 44.0, 36.0, 38.0, 36.0, 43.0, 42.0, 45.0, 31.0, 26.0, 27.0, 26.0, 25.0, 22.0, 24.0, 21.0, 12.0, 11.0, 12.0, 4.0, 7.0, 1.0, 2.0, 7.0, 7.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.3515625, -8.094970703125, -7.83837890625, -7.581787109375, -7.3251953125, -7.068603515625, -6.81201171875, -6.555419921875, -6.298828125, -6.042236328125, -5.78564453125, -5.529052734375, -5.2724609375, -5.015869140625, -4.75927734375, -4.502685546875, -4.24609375, -3.989501953125, -3.73291015625, -3.476318359375, -3.2197265625, -2.963134765625, -2.70654296875, -2.449951171875, -2.193359375, -1.936767578125, -1.68017578125, -1.423583984375, -1.1669921875, -0.910400390625, -0.65380859375, -0.397216796875, -0.140625, 0.115966796875, 0.37255859375, 0.629150390625, 0.8857421875, 1.142333984375, 1.39892578125, 1.655517578125, 1.912109375, 2.168701171875, 2.42529296875, 2.681884765625, 2.9384765625, 3.195068359375, 3.45166015625, 3.708251953125, 3.96484375, 4.221435546875, 4.47802734375, 4.734619140625, 4.9912109375, 5.247802734375, 5.50439453125, 5.760986328125, 6.017578125, 6.274169921875, 6.53076171875, 6.787353515625, 7.0439453125, 7.300537109375, 7.55712890625, 7.813720703125, 8.0703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 6.0, 4.0, 11.0, 13.0, 14.0, 28.0, 29.0, 44.0, 61.0, 81.0, 110.0, 179.0, 219.0, 341.0, 462.0, 623.0, 1039.0, 1723.0, 2552.0, 4434.0, 8251.0, 17004.0, 41182.0, 128947.0, 427006.0, 281739.0, 75953.0, 27790.0, 12353.0, 6414.0, 3589.0, 2147.0, 1347.0, 896.0, 571.0, 394.0, 296.0, 192.0, 144.0, 96.0, 79.0, 59.0, 31.0, 32.0, 25.0, 16.0, 11.0, 9.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4619140625, -1.417327880859375, -1.37274169921875, -1.328155517578125, -1.2835693359375, -1.238983154296875, -1.19439697265625, -1.149810791015625, -1.105224609375, -1.060638427734375, -1.01605224609375, -0.971466064453125, -0.9268798828125, -0.882293701171875, -0.83770751953125, -0.793121337890625, -0.74853515625, -0.703948974609375, -0.65936279296875, -0.614776611328125, -0.5701904296875, -0.525604248046875, -0.48101806640625, -0.436431884765625, -0.391845703125, -0.347259521484375, -0.30267333984375, -0.258087158203125, -0.2135009765625, -0.168914794921875, -0.12432861328125, -0.079742431640625, -0.03515625, 0.009429931640625, 0.05401611328125, 0.098602294921875, 0.1431884765625, 0.187774658203125, 0.23236083984375, 0.276947021484375, 0.321533203125, 0.366119384765625, 0.41070556640625, 0.455291748046875, 0.4998779296875, 0.544464111328125, 0.58905029296875, 0.633636474609375, 0.67822265625, 0.722808837890625, 0.76739501953125, 0.811981201171875, 0.8565673828125, 0.901153564453125, 0.94573974609375, 0.990325927734375, 1.034912109375, 1.079498291015625, 1.12408447265625, 1.168670654296875, 1.2132568359375, 1.257843017578125, 1.30242919921875, 1.347015380859375, 1.3916015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 9.0, 7.0, 16.0, 15.0, 23.0, 26.0, 29.0, 33.0, 47.0, 56.0, 46.0, 57.0, 66.0, 59.0, 61.0, 54.0, 44.0, 58.0, 52.0, 31.0, 39.0, 34.0, 20.0, 17.0, 29.0, 8.0, 11.0, 10.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.000125885009765625, -0.00012216903269290924, -0.00011845305562019348, -0.00011473707854747772, -0.00011102110147476196, -0.0001073051244020462, -0.00010358914732933044, -9.987317025661469e-05, -9.615719318389893e-05, -9.244121611118317e-05, -8.872523903846741e-05, -8.500926196575165e-05, -8.129328489303589e-05, -7.757730782032013e-05, -7.386133074760437e-05, -7.014535367488861e-05, -6.642937660217285e-05, -6.271339952945709e-05, -5.899742245674133e-05, -5.5281445384025574e-05, -5.1565468311309814e-05, -4.7849491238594055e-05, -4.4133514165878296e-05, -4.041753709316254e-05, -3.670156002044678e-05, -3.298558294773102e-05, -2.926960587501526e-05, -2.55536288022995e-05, -2.183765172958374e-05, -1.812167465686798e-05, -1.4405697584152222e-05, -1.0689720511436462e-05, -6.973743438720703e-06, -3.257766366004944e-06, 4.5821070671081543e-07, 4.174187779426575e-06, 7.890164852142334e-06, 1.1606141924858093e-05, 1.5322118997573853e-05, 1.9038096070289612e-05, 2.275407314300537e-05, 2.647005021572113e-05, 3.018602728843689e-05, 3.390200436115265e-05, 3.761798143386841e-05, 4.133395850658417e-05, 4.504993557929993e-05, 4.8765912652015686e-05, 5.2481889724731445e-05, 5.6197866797447205e-05, 5.9913843870162964e-05, 6.362982094287872e-05, 6.734579801559448e-05, 7.106177508831024e-05, 7.4777752161026e-05, 7.849372923374176e-05, 8.220970630645752e-05, 8.592568337917328e-05, 8.964166045188904e-05, 9.33576375246048e-05, 9.707361459732056e-05, 0.00010078959167003632, 0.00010450556874275208, 0.00010822154581546783, 0.0001119375228881836]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 15.0, 9.0, 18.0, 15.0, 25.0, 40.0, 62.0, 83.0, 108.0, 161.0, 231.0, 343.0, 528.0, 814.0, 1208.0, 1945.0, 3054.0, 4997.0, 8792.0, 15719.0, 29900.0, 62294.0, 137752.0, 262309.0, 257545.0, 133690.0, 60901.0, 29154.0, 14901.0, 8460.0, 4920.0, 2979.0, 1908.0, 1230.0, 775.0, 542.0, 370.0, 249.0, 162.0, 112.0, 75.0, 48.0, 36.0, 29.0, 14.0, 12.0, 9.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.92578125, -1.863616943359375, -1.80145263671875, -1.739288330078125, -1.6771240234375, -1.614959716796875, -1.55279541015625, -1.490631103515625, -1.428466796875, -1.366302490234375, -1.30413818359375, -1.241973876953125, -1.1798095703125, -1.117645263671875, -1.05548095703125, -0.993316650390625, -0.93115234375, -0.868988037109375, -0.80682373046875, -0.744659423828125, -0.6824951171875, -0.620330810546875, -0.55816650390625, -0.496002197265625, -0.433837890625, -0.371673583984375, -0.30950927734375, -0.247344970703125, -0.1851806640625, -0.123016357421875, -0.06085205078125, 0.001312255859375, 0.0634765625, 0.125640869140625, 0.18780517578125, 0.249969482421875, 0.3121337890625, 0.374298095703125, 0.43646240234375, 0.498626708984375, 0.560791015625, 0.622955322265625, 0.68511962890625, 0.747283935546875, 0.8094482421875, 0.871612548828125, 0.93377685546875, 0.995941162109375, 1.05810546875, 1.120269775390625, 1.18243408203125, 1.244598388671875, 1.3067626953125, 1.368927001953125, 1.43109130859375, 1.493255615234375, 1.555419921875, 1.617584228515625, 1.67974853515625, 1.741912841796875, 1.8040771484375, 1.866241455078125, 1.92840576171875, 1.990570068359375, 2.052734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 9.0, 6.0, 8.0, 7.0, 12.0, 19.0, 50.0, 31.0, 67.0, 74.0, 87.0, 93.0, 80.0, 98.0, 83.0, 74.0, 54.0, 41.0, 25.0, 23.0, 15.0, 16.0, 13.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6962890625, -0.669952392578125, -0.64361572265625, -0.617279052734375, -0.5909423828125, -0.564605712890625, -0.53826904296875, -0.511932373046875, -0.485595703125, -0.459259033203125, -0.43292236328125, -0.406585693359375, -0.3802490234375, -0.353912353515625, -0.32757568359375, -0.301239013671875, -0.27490234375, -0.248565673828125, -0.22222900390625, -0.195892333984375, -0.1695556640625, -0.143218994140625, -0.11688232421875, -0.090545654296875, -0.064208984375, -0.037872314453125, -0.01153564453125, 0.014801025390625, 0.0411376953125, 0.067474365234375, 0.09381103515625, 0.120147705078125, 0.146484375, 0.172821044921875, 0.19915771484375, 0.225494384765625, 0.2518310546875, 0.278167724609375, 0.30450439453125, 0.330841064453125, 0.357177734375, 0.383514404296875, 0.40985107421875, 0.436187744140625, 0.4625244140625, 0.488861083984375, 0.51519775390625, 0.541534423828125, 0.56787109375, 0.594207763671875, 0.62054443359375, 0.646881103515625, 0.6732177734375, 0.699554443359375, 0.72589111328125, 0.752227783203125, 0.778564453125, 0.804901123046875, 0.83123779296875, 0.857574462890625, 0.8839111328125, 0.910247802734375, 0.93658447265625, 0.962921142578125, 0.9892578125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 2.0, 7.0, 2.0, 4.0, 10.0, 11.0, 8.0, 14.0, 28.0, 22.0, 15.0, 26.0, 31.0, 26.0, 35.0, 25.0, 41.0, 48.0, 45.0, 40.0, 55.0, 42.0, 38.0, 52.0, 34.0, 38.0, 34.0, 31.0, 27.0, 26.0, 35.0, 27.0, 19.0, 22.0, 13.0, 11.0, 8.0, 11.0, 11.0, 8.0, 2.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-15.242074012756348, -14.822809219360352, -14.403544425964355, -13.98427963256836, -13.565014839172363, -13.145750045776367, -12.726485252380371, -12.307220458984375, -11.887955665588379, -11.468690872192383, -11.049426078796387, -10.63016128540039, -10.210896492004395, -9.791631698608398, -9.372366905212402, -8.953102111816406, -8.53383731842041, -8.114572525024414, -7.695307731628418, -7.276042938232422, -6.856778144836426, -6.43751335144043, -6.018248558044434, -5.5989837646484375, -5.179718971252441, -4.760454177856445, -4.341189384460449, -3.921924591064453, -3.502659797668457, -3.083395004272461, -2.664130210876465, -2.2448654174804688, -1.8255996704101562, -1.4063348770141602, -0.9870700836181641, -0.567805290222168, -0.14854049682617188, 0.2707242965698242, 0.6899890899658203, 1.1092538833618164, 1.5285186767578125, 1.9477834701538086, 2.3670482635498047, 2.786313056945801, 3.205577850341797, 3.624842643737793, 4.044107437133789, 4.463372230529785, 4.882637023925781, 5.301901817321777, 5.721166610717773, 6.1404314041137695, 6.559696197509766, 6.978960990905762, 7.398225784301758, 7.817490577697754, 8.23675537109375, 8.656020164489746, 9.075284957885742, 9.494549751281738, 9.913814544677734, 10.33307933807373, 10.752344131469727, 11.171608924865723, 11.590873718261719]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 8.0, 5.0, 12.0, 6.0, 7.0, 10.0, 6.0, 14.0, 16.0, 22.0, 23.0, 30.0, 29.0, 27.0, 35.0, 36.0, 24.0, 26.0, 42.0, 48.0, 39.0, 28.0, 43.0, 26.0, 34.0, 29.0, 28.0, 45.0, 28.0, 26.0, 33.0, 31.0, 27.0, 20.0, 18.0, 16.0, 18.0, 14.0, 11.0, 16.0, 7.0, 7.0, 8.0, 5.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.507094383239746, -11.1393404006958, -10.771587371826172, -10.403833389282227, -10.036079406738281, -9.668325424194336, -9.30057144165039, -8.932818412780762, -8.565064430236816, -8.197310447692871, -7.829556941986084, -7.461803436279297, -7.094049453735352, -6.726295471191406, -6.358541965484619, -5.990788459777832, -5.623034477233887, -5.255280494689941, -4.887526988983154, -4.519773483276367, -4.152019500732422, -3.7842657566070557, -3.4165120124816895, -3.0487582683563232, -2.681004524230957, -2.313250780105591, -1.9454970359802246, -1.5777432918548584, -1.2099895477294922, -0.842235803604126, -0.47448205947875977, -0.10672831535339355, 0.26102638244628906, 0.6287801265716553, 0.9965338706970215, 1.3642876148223877, 1.732041358947754, 2.09979510307312, 2.4675488471984863, 2.8353025913238525, 3.2030563354492188, 3.570810079574585, 3.938563823699951, 4.306317329406738, 4.674071311950684, 5.041825294494629, 5.409578800201416, 5.777332305908203, 6.145086288452148, 6.512840270996094, 6.880593776702881, 7.248347282409668, 7.616101264953613, 7.983855247497559, 8.351608276367188, 8.719362258911133, 9.087116241455078, 9.454870223999023, 9.822624206542969, 10.190377235412598, 10.558131217956543, 10.925885200500488, 11.293638229370117, 11.661392211914062, 12.029146194458008]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 9.0, 13.0, 28.0, 27.0, 58.0, 100.0, 156.0, 268.0, 406.0, 631.0, 945.0, 1571.0, 2275.0, 3581.0, 5324.0, 7779.0, 11507.0, 16048.0, 22226.0, 29894.0, 39013.0, 49918.0, 59967.0, 70940.0, 78748.0, 84703.0, 86244.0, 84071.0, 78211.0, 69371.0, 59378.0, 48181.0, 37713.0, 28865.0, 21294.0, 15657.0, 11033.0, 7572.0, 5116.0, 3449.0, 2263.0, 1440.0, 931.0, 621.0, 387.0, 255.0, 134.0, 93.0, 58.0, 45.0, 20.0, 12.0, 2.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.3359375, -7.0867919921875, -6.837646484375, -6.5885009765625, -6.33935546875, -6.0902099609375, -5.841064453125, -5.5919189453125, -5.3427734375, -5.0936279296875, -4.844482421875, -4.5953369140625, -4.34619140625, -4.0970458984375, -3.847900390625, -3.5987548828125, -3.349609375, -3.1004638671875, -2.851318359375, -2.6021728515625, -2.35302734375, -2.1038818359375, -1.854736328125, -1.6055908203125, -1.3564453125, -1.1072998046875, -0.858154296875, -0.6090087890625, -0.35986328125, -0.1107177734375, 0.138427734375, 0.3875732421875, 0.63671875, 0.8858642578125, 1.135009765625, 1.3841552734375, 1.63330078125, 1.8824462890625, 2.131591796875, 2.3807373046875, 2.6298828125, 2.8790283203125, 3.128173828125, 3.3773193359375, 3.62646484375, 3.8756103515625, 4.124755859375, 4.3739013671875, 4.623046875, 4.8721923828125, 5.121337890625, 5.3704833984375, 5.61962890625, 5.8687744140625, 6.117919921875, 6.3670654296875, 6.6162109375, 6.8653564453125, 7.114501953125, 7.3636474609375, 7.61279296875, 7.8619384765625, 8.111083984375, 8.3602294921875, 8.609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 7.0, 6.0, 9.0, 6.0, 10.0, 11.0, 5.0, 15.0, 12.0, 21.0, 24.0, 28.0, 28.0, 29.0, 39.0, 31.0, 27.0, 25.0, 41.0, 48.0, 42.0, 28.0, 40.0, 28.0, 34.0, 29.0, 29.0, 44.0, 28.0, 26.0, 34.0, 35.0, 28.0, 15.0, 21.0, 15.0, 18.0, 15.0, 11.0, 16.0, 9.0, 4.0, 9.0, 5.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.25, -10.8917236328125, -10.533447265625, -10.1751708984375, -9.81689453125, -9.4586181640625, -9.100341796875, -8.7420654296875, -8.3837890625, -8.0255126953125, -7.667236328125, -7.3089599609375, -6.95068359375, -6.5924072265625, -6.234130859375, -5.8758544921875, -5.517578125, -5.1593017578125, -4.801025390625, -4.4427490234375, -4.08447265625, -3.7261962890625, -3.367919921875, -3.0096435546875, -2.6513671875, -2.2930908203125, -1.934814453125, -1.5765380859375, -1.21826171875, -0.8599853515625, -0.501708984375, -0.1434326171875, 0.21484375, 0.5731201171875, 0.931396484375, 1.2896728515625, 1.64794921875, 2.0062255859375, 2.364501953125, 2.7227783203125, 3.0810546875, 3.4393310546875, 3.797607421875, 4.1558837890625, 4.51416015625, 4.8724365234375, 5.230712890625, 5.5889892578125, 5.947265625, 6.3055419921875, 6.663818359375, 7.0220947265625, 7.38037109375, 7.7386474609375, 8.096923828125, 8.4552001953125, 8.8134765625, 9.1717529296875, 9.530029296875, 9.8883056640625, 10.24658203125, 10.6048583984375, 10.963134765625, 11.3214111328125, 11.6796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 6.0, 15.0, 16.0, 26.0, 64.0, 97.0, 163.0, 290.0, 508.0, 948.0, 1652.0, 2719.0, 4480.0, 7779.0, 12509.0, 19758.0, 29983.0, 43417.0, 59825.0, 77869.0, 94813.0, 107560.0, 112182.0, 107883.0, 96229.0, 79089.0, 60940.0, 44552.0, 30545.0, 20243.0, 12996.0, 7991.0, 4747.0, 2749.0, 1682.0, 970.0, 576.0, 280.0, 173.0, 93.0, 61.0, 29.0, 25.0, 14.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5078125, -10.184814453125, -9.86181640625, -9.538818359375, -9.2158203125, -8.892822265625, -8.56982421875, -8.246826171875, -7.923828125, -7.600830078125, -7.27783203125, -6.954833984375, -6.6318359375, -6.308837890625, -5.98583984375, -5.662841796875, -5.33984375, -5.016845703125, -4.69384765625, -4.370849609375, -4.0478515625, -3.724853515625, -3.40185546875, -3.078857421875, -2.755859375, -2.432861328125, -2.10986328125, -1.786865234375, -1.4638671875, -1.140869140625, -0.81787109375, -0.494873046875, -0.171875, 0.151123046875, 0.47412109375, 0.797119140625, 1.1201171875, 1.443115234375, 1.76611328125, 2.089111328125, 2.412109375, 2.735107421875, 3.05810546875, 3.381103515625, 3.7041015625, 4.027099609375, 4.35009765625, 4.673095703125, 4.99609375, 5.319091796875, 5.64208984375, 5.965087890625, 6.2880859375, 6.611083984375, 6.93408203125, 7.257080078125, 7.580078125, 7.903076171875, 8.22607421875, 8.549072265625, 8.8720703125, 9.195068359375, 9.51806640625, 9.841064453125, 10.1640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 7.0, 2.0, 4.0, 6.0, 3.0, 5.0, 15.0, 12.0, 15.0, 21.0, 17.0, 23.0, 20.0, 24.0, 27.0, 34.0, 34.0, 35.0, 37.0, 38.0, 43.0, 44.0, 43.0, 37.0, 34.0, 38.0, 39.0, 33.0, 36.0, 46.0, 40.0, 27.0, 23.0, 27.0, 28.0, 17.0, 11.0, 10.0, 9.0, 13.0, 9.0, 10.0, 4.0, 3.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.7734375, -8.5064697265625, -8.239501953125, -7.9725341796875, -7.70556640625, -7.4385986328125, -7.171630859375, -6.9046630859375, -6.6376953125, -6.3707275390625, -6.103759765625, -5.8367919921875, -5.56982421875, -5.3028564453125, -5.035888671875, -4.7689208984375, -4.501953125, -4.2349853515625, -3.968017578125, -3.7010498046875, -3.43408203125, -3.1671142578125, -2.900146484375, -2.6331787109375, -2.3662109375, -2.0992431640625, -1.832275390625, -1.5653076171875, -1.29833984375, -1.0313720703125, -0.764404296875, -0.4974365234375, -0.23046875, 0.0364990234375, 0.303466796875, 0.5704345703125, 0.83740234375, 1.1043701171875, 1.371337890625, 1.6383056640625, 1.9052734375, 2.1722412109375, 2.439208984375, 2.7061767578125, 2.97314453125, 3.2401123046875, 3.507080078125, 3.7740478515625, 4.041015625, 4.3079833984375, 4.574951171875, 4.8419189453125, 5.10888671875, 5.3758544921875, 5.642822265625, 5.9097900390625, 6.1767578125, 6.4437255859375, 6.710693359375, 6.9776611328125, 7.24462890625, 7.5115966796875, 7.778564453125, 8.0455322265625, 8.3125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 9.0, 11.0, 18.0, 20.0, 31.0, 55.0, 68.0, 100.0, 195.0, 300.0, 568.0, 943.0, 1552.0, 2775.0, 4965.0, 8565.0, 15193.0, 25897.0, 43124.0, 66733.0, 95877.0, 124777.0, 142162.0, 139836.0, 121377.0, 92934.0, 63035.0, 40417.0, 24182.0, 14078.0, 8026.0, 4633.0, 2544.0, 1505.0, 812.0, 492.0, 275.0, 169.0, 101.0, 73.0, 37.0, 29.0, 13.0, 17.0, 6.0, 3.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.6796875, -5.5018310546875, -5.323974609375, -5.1461181640625, -4.96826171875, -4.7904052734375, -4.612548828125, -4.4346923828125, -4.2568359375, -4.0789794921875, -3.901123046875, -3.7232666015625, -3.54541015625, -3.3675537109375, -3.189697265625, -3.0118408203125, -2.833984375, -2.6561279296875, -2.478271484375, -2.3004150390625, -2.12255859375, -1.9447021484375, -1.766845703125, -1.5889892578125, -1.4111328125, -1.2332763671875, -1.055419921875, -0.8775634765625, -0.69970703125, -0.5218505859375, -0.343994140625, -0.1661376953125, 0.01171875, 0.1895751953125, 0.367431640625, 0.5452880859375, 0.72314453125, 0.9010009765625, 1.078857421875, 1.2567138671875, 1.4345703125, 1.6124267578125, 1.790283203125, 1.9681396484375, 2.14599609375, 2.3238525390625, 2.501708984375, 2.6795654296875, 2.857421875, 3.0352783203125, 3.213134765625, 3.3909912109375, 3.56884765625, 3.7467041015625, 3.924560546875, 4.1024169921875, 4.2802734375, 4.4581298828125, 4.635986328125, 4.8138427734375, 4.99169921875, 5.1695556640625, 5.347412109375, 5.5252685546875, 5.703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 5.0, 16.0, 21.0, 16.0, 19.0, 16.0, 12.0, 21.0, 33.0, 28.0, 48.0, 34.0, 47.0, 39.0, 44.0, 48.0, 52.0, 44.0, 46.0, 41.0, 29.0, 42.0, 27.0, 34.0, 35.0, 30.0, 29.0, 20.0, 17.0, 15.0, 8.0, 13.0, 14.0, 9.0, 12.0, 5.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.000606536865234375, -0.0005899891257286072, -0.0005734413862228394, -0.0005568936467170715, -0.0005403459072113037, -0.0005237981677055359, -0.0005072504281997681, -0.0004907026886940002, -0.0004741549491882324, -0.0004576072096824646, -0.0004410594701766968, -0.00042451173067092896, -0.00040796399116516113, -0.0003914162516593933, -0.0003748685121536255, -0.00035832077264785767, -0.00034177303314208984, -0.000325225293636322, -0.0003086775541305542, -0.0002921298146247864, -0.00027558207511901855, -0.00025903433561325073, -0.0002424865961074829, -0.0002259388566017151, -0.00020939111709594727, -0.00019284337759017944, -0.00017629563808441162, -0.0001597478985786438, -0.00014320015907287598, -0.00012665241956710815, -0.00011010468006134033, -9.355694055557251e-05, -7.700920104980469e-05, -6.0461461544036865e-05, -4.391372203826904e-05, -2.736598253250122e-05, -1.0818243026733398e-05, 5.729496479034424e-06, 2.2277235984802246e-05, 3.882497549057007e-05, 5.537271499633789e-05, 7.192045450210571e-05, 8.846819400787354e-05, 0.00010501593351364136, 0.00012156367301940918, 0.000138111412525177, 0.00015465915203094482, 0.00017120689153671265, 0.00018775463104248047, 0.0002043023705482483, 0.0002208501100540161, 0.00023739784955978394, 0.00025394558906555176, 0.0002704933285713196, 0.0002870410680770874, 0.0003035888075828552, 0.00032013654708862305, 0.00033668428659439087, 0.0003532320261001587, 0.0003697797656059265, 0.00038632750511169434, 0.00040287524461746216, 0.00041942298412323, 0.0004359707236289978, 0.0004525184631347656]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 2.0, 4.0, 9.0, 10.0, 10.0, 21.0, 30.0, 63.0, 74.0, 118.0, 173.0, 288.0, 467.0, 775.0, 1245.0, 2103.0, 3413.0, 5686.0, 9694.0, 16325.0, 27727.0, 44665.0, 69633.0, 98776.0, 127312.0, 142706.0, 139227.0, 117153.0, 87486.0, 59265.0, 37616.0, 22883.0, 13579.0, 8012.0, 4842.0, 2750.0, 1682.0, 1040.0, 611.0, 406.0, 237.0, 141.0, 100.0, 59.0, 49.0, 33.0, 23.0, 11.0, 10.0, 5.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.00390625, -5.7955322265625, -5.587158203125, -5.3787841796875, -5.17041015625, -4.9620361328125, -4.753662109375, -4.5452880859375, -4.3369140625, -4.1285400390625, -3.920166015625, -3.7117919921875, -3.50341796875, -3.2950439453125, -3.086669921875, -2.8782958984375, -2.669921875, -2.4615478515625, -2.253173828125, -2.0447998046875, -1.83642578125, -1.6280517578125, -1.419677734375, -1.2113037109375, -1.0029296875, -0.7945556640625, -0.586181640625, -0.3778076171875, -0.16943359375, 0.0389404296875, 0.247314453125, 0.4556884765625, 0.6640625, 0.8724365234375, 1.080810546875, 1.2891845703125, 1.49755859375, 1.7059326171875, 1.914306640625, 2.1226806640625, 2.3310546875, 2.5394287109375, 2.747802734375, 2.9561767578125, 3.16455078125, 3.3729248046875, 3.581298828125, 3.7896728515625, 3.998046875, 4.2064208984375, 4.414794921875, 4.6231689453125, 4.83154296875, 5.0399169921875, 5.248291015625, 5.4566650390625, 5.6650390625, 5.8734130859375, 6.081787109375, 6.2901611328125, 6.49853515625, 6.7069091796875, 6.915283203125, 7.1236572265625, 7.33203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 8.0, 10.0, 16.0, 21.0, 36.0, 38.0, 51.0, 72.0, 90.0, 96.0, 81.0, 93.0, 89.0, 84.0, 62.0, 42.0, 34.0, 15.0, 14.0, 10.0, 8.0, 7.0, 7.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.234375, -4.08099365234375, -3.9276123046875, -3.77423095703125, -3.620849609375, -3.46746826171875, -3.3140869140625, -3.16070556640625, -3.00732421875, -2.85394287109375, -2.7005615234375, -2.54718017578125, -2.393798828125, -2.24041748046875, -2.0870361328125, -1.93365478515625, -1.7802734375, -1.62689208984375, -1.4735107421875, -1.32012939453125, -1.166748046875, -1.01336669921875, -0.8599853515625, -0.70660400390625, -0.55322265625, -0.39984130859375, -0.2464599609375, -0.09307861328125, 0.060302734375, 0.21368408203125, 0.3670654296875, 0.52044677734375, 0.673828125, 0.82720947265625, 0.9805908203125, 1.13397216796875, 1.287353515625, 1.44073486328125, 1.5941162109375, 1.74749755859375, 1.90087890625, 2.05426025390625, 2.2076416015625, 2.36102294921875, 2.514404296875, 2.66778564453125, 2.8211669921875, 2.97454833984375, 3.1279296875, 3.28131103515625, 3.4346923828125, 3.58807373046875, 3.741455078125, 3.89483642578125, 4.0482177734375, 4.20159912109375, 4.35498046875, 4.50836181640625, 4.6617431640625, 4.81512451171875, 4.968505859375, 5.12188720703125, 5.2752685546875, 5.42864990234375, 5.58203125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 7.0, 5.0, 8.0, 5.0, 7.0, 12.0, 19.0, 17.0, 28.0, 21.0, 23.0, 23.0, 33.0, 27.0, 33.0, 39.0, 53.0, 39.0, 43.0, 39.0, 39.0, 55.0, 43.0, 42.0, 36.0, 30.0, 26.0, 38.0, 27.0, 25.0, 33.0, 20.0, 21.0, 13.0, 13.0, 13.0, 5.0, 16.0, 9.0, 6.0, 3.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.781293869018555, -12.363321304321289, -11.945348739624023, -11.527376174926758, -11.109403610229492, -10.691431045532227, -10.273458480834961, -9.855485916137695, -9.43751335144043, -9.019540786743164, -8.601568222045898, -8.183595657348633, -7.765623092651367, -7.347650527954102, -6.929677963256836, -6.51170539855957, -6.093733310699463, -5.675760746002197, -5.257788181304932, -4.839815616607666, -4.4218430519104, -4.003870964050293, -3.5858981609344482, -3.1679255962371826, -2.749953031539917, -2.3319804668426514, -1.9140079021453857, -1.4960354566574097, -1.078062891960144, -0.660090446472168, -0.24211788177490234, 0.17585468292236328, 0.5938272476196289, 1.0117998123168945, 1.4297723770141602, 1.8477448225021362, 2.2657175064086914, 2.683689832687378, 3.1016623973846436, 3.519634962081909, 3.937607526779175, 4.355579853057861, 4.773552417755127, 5.191524982452393, 5.609497547149658, 6.027470111846924, 6.4454426765441895, 6.863415241241455, 7.281387805938721, 7.699360370635986, 8.117332458496094, 8.53530502319336, 8.953277587890625, 9.37125015258789, 9.789222717285156, 10.207195281982422, 10.625167846679688, 11.043140411376953, 11.461112976074219, 11.879085540771484, 12.29705810546875, 12.715030670166016, 13.133003234863281, 13.550975799560547, 13.968948364257812]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 6.0, 2.0, 6.0, 2.0, 6.0, 14.0, 4.0, 14.0, 16.0, 19.0, 14.0, 25.0, 30.0, 28.0, 30.0, 22.0, 35.0, 43.0, 38.0, 41.0, 42.0, 46.0, 40.0, 37.0, 41.0, 28.0, 38.0, 29.0, 27.0, 32.0, 28.0, 29.0, 40.0, 21.0, 25.0, 16.0, 18.0, 11.0, 11.0, 12.0, 11.0, 2.0, 7.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.830852508544922, -14.405828475952148, -13.980804443359375, -13.555780410766602, -13.130756378173828, -12.705732345581055, -12.280708312988281, -11.855684280395508, -11.430660247802734, -11.005636215209961, -10.580612182617188, -10.155588150024414, -9.73056411743164, -9.305540084838867, -8.880516052246094, -8.45549201965332, -8.03046703338623, -7.605443000793457, -7.180418968200684, -6.75539493560791, -6.330370903015137, -5.905346870422363, -5.480322360992432, -5.055298328399658, -4.630274295806885, -4.205250263214111, -3.780226230621338, -3.3552019596099854, -2.930177927017212, -2.5051538944244385, -2.080129623413086, -1.6551055908203125, -1.2300825119018555, -0.8050584197044373, -0.38003432750701904, 0.044989824295043945, 0.4700138568878174, 0.8950378894805908, 1.3200621604919434, 1.7450861930847168, 2.1701102256774902, 2.5951342582702637, 3.020158290863037, 3.4451825618743896, 3.870206594467163, 4.295230865478516, 4.720254898071289, 5.1452789306640625, 5.570302963256836, 5.995326995849609, 6.420351028442383, 6.845375061035156, 7.27039909362793, 7.695423126220703, 8.120447158813477, 8.54547119140625, 8.970495223999023, 9.395519256591797, 9.82054328918457, 10.245567321777344, 10.670591354370117, 11.09561538696289, 11.520639419555664, 11.945663452148438, 12.370688438415527]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 8.0, 4.0, 18.0, 23.0, 33.0, 61.0, 97.0, 168.0, 238.0, 445.0, 706.0, 1123.0, 1869.0, 3000.0, 4892.0, 7628.0, 12094.0, 19039.0, 28843.0, 43753.0, 65179.0, 92833.0, 131839.0, 177493.0, 231719.0, 287783.0, 340084.0, 379328.0, 395537.0, 387341.0, 356157.0, 307703.0, 252288.0, 195875.0, 145952.0, 105075.0, 73836.0, 49960.0, 33886.0, 22237.0, 14190.0, 9086.0, 5666.0, 3623.0, 2193.0, 1417.0, 772.0, 466.0, 308.0, 185.0, 114.0, 41.0, 42.0, 25.0, 11.0, 8.0, 4.0, 1.0, 0.0, 2.0], "bins": [-9.0859375, -8.807861328125, -8.52978515625, -8.251708984375, -7.9736328125, -7.695556640625, -7.41748046875, -7.139404296875, -6.861328125, -6.583251953125, -6.30517578125, -6.027099609375, -5.7490234375, -5.470947265625, -5.19287109375, -4.914794921875, -4.63671875, -4.358642578125, -4.08056640625, -3.802490234375, -3.5244140625, -3.246337890625, -2.96826171875, -2.690185546875, -2.412109375, -2.134033203125, -1.85595703125, -1.577880859375, -1.2998046875, -1.021728515625, -0.74365234375, -0.465576171875, -0.1875, 0.090576171875, 0.36865234375, 0.646728515625, 0.9248046875, 1.202880859375, 1.48095703125, 1.759033203125, 2.037109375, 2.315185546875, 2.59326171875, 2.871337890625, 3.1494140625, 3.427490234375, 3.70556640625, 3.983642578125, 4.26171875, 4.539794921875, 4.81787109375, 5.095947265625, 5.3740234375, 5.652099609375, 5.93017578125, 6.208251953125, 6.486328125, 6.764404296875, 7.04248046875, 7.320556640625, 7.5986328125, 7.876708984375, 8.15478515625, 8.432861328125, 8.7109375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 2.0, 5.0, 7.0, 9.0, 10.0, 7.0, 16.0, 17.0, 15.0, 22.0, 24.0, 39.0, 25.0, 31.0, 26.0, 38.0, 39.0, 43.0, 34.0, 44.0, 53.0, 36.0, 40.0, 31.0, 34.0, 25.0, 34.0, 34.0, 31.0, 21.0, 44.0, 24.0, 24.0, 15.0, 16.0, 16.0, 11.0, 11.0, 9.0, 6.0, 7.0, 6.0, 4.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.8203125, -12.4451904296875, -12.070068359375, -11.6949462890625, -11.31982421875, -10.9447021484375, -10.569580078125, -10.1944580078125, -9.8193359375, -9.4442138671875, -9.069091796875, -8.6939697265625, -8.31884765625, -7.9437255859375, -7.568603515625, -7.1934814453125, -6.818359375, -6.4432373046875, -6.068115234375, -5.6929931640625, -5.31787109375, -4.9427490234375, -4.567626953125, -4.1925048828125, -3.8173828125, -3.4422607421875, -3.067138671875, -2.6920166015625, -2.31689453125, -1.9417724609375, -1.566650390625, -1.1915283203125, -0.81640625, -0.4412841796875, -0.066162109375, 0.3089599609375, 0.68408203125, 1.0592041015625, 1.434326171875, 1.8094482421875, 2.1845703125, 2.5596923828125, 2.934814453125, 3.3099365234375, 3.68505859375, 4.0601806640625, 4.435302734375, 4.8104248046875, 5.185546875, 5.5606689453125, 5.935791015625, 6.3109130859375, 6.68603515625, 7.0611572265625, 7.436279296875, 7.8114013671875, 8.1865234375, 8.5616455078125, 8.936767578125, 9.3118896484375, 9.68701171875, 10.0621337890625, 10.437255859375, 10.8123779296875, 11.1875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 8.0, 13.0, 24.0, 58.0, 85.0, 120.0, 259.0, 462.0, 773.0, 1326.0, 2248.0, 3978.0, 6403.0, 10794.0, 17424.0, 27852.0, 43248.0, 66161.0, 95829.0, 136080.0, 184670.0, 239919.0, 295793.0, 345790.0, 380985.0, 395161.0, 384950.0, 354823.0, 305503.0, 250648.0, 195396.0, 145423.0, 103545.0, 71462.0, 47592.0, 30703.0, 19192.0, 12077.0, 7202.0, 4233.0, 2604.0, 1464.0, 870.0, 513.0, 285.0, 120.0, 100.0, 56.0, 25.0, 23.0, 8.0, 6.0, 4.0, 1.0, 2.0], "bins": [-10.546875, -10.2420654296875, -9.937255859375, -9.6324462890625, -9.32763671875, -9.0228271484375, -8.718017578125, -8.4132080078125, -8.1083984375, -7.8035888671875, -7.498779296875, -7.1939697265625, -6.88916015625, -6.5843505859375, -6.279541015625, -5.9747314453125, -5.669921875, -5.3651123046875, -5.060302734375, -4.7554931640625, -4.45068359375, -4.1458740234375, -3.841064453125, -3.5362548828125, -3.2314453125, -2.9266357421875, -2.621826171875, -2.3170166015625, -2.01220703125, -1.7073974609375, -1.402587890625, -1.0977783203125, -0.79296875, -0.4881591796875, -0.183349609375, 0.1214599609375, 0.42626953125, 0.7310791015625, 1.035888671875, 1.3406982421875, 1.6455078125, 1.9503173828125, 2.255126953125, 2.5599365234375, 2.86474609375, 3.1695556640625, 3.474365234375, 3.7791748046875, 4.083984375, 4.3887939453125, 4.693603515625, 4.9984130859375, 5.30322265625, 5.6080322265625, 5.912841796875, 6.2176513671875, 6.5224609375, 6.8272705078125, 7.132080078125, 7.4368896484375, 7.74169921875, 8.0465087890625, 8.351318359375, 8.6561279296875, 8.9609375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 5.0, 8.0, 6.0, 9.0, 12.0, 14.0, 29.0, 31.0, 28.0, 38.0, 45.0, 60.0, 60.0, 87.0, 93.0, 118.0, 118.0, 156.0, 146.0, 153.0, 153.0, 178.0, 189.0, 189.0, 167.0, 191.0, 175.0, 190.0, 182.0, 170.0, 153.0, 151.0, 130.0, 112.0, 89.0, 96.0, 63.0, 56.0, 43.0, 40.0, 29.0, 29.0, 26.0, 14.0, 9.0, 13.0, 10.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-5.84765625, -5.683349609375, -5.51904296875, -5.354736328125, -5.1904296875, -5.026123046875, -4.86181640625, -4.697509765625, -4.533203125, -4.368896484375, -4.20458984375, -4.040283203125, -3.8759765625, -3.711669921875, -3.54736328125, -3.383056640625, -3.21875, -3.054443359375, -2.89013671875, -2.725830078125, -2.5615234375, -2.397216796875, -2.23291015625, -2.068603515625, -1.904296875, -1.739990234375, -1.57568359375, -1.411376953125, -1.2470703125, -1.082763671875, -0.91845703125, -0.754150390625, -0.58984375, -0.425537109375, -0.26123046875, -0.096923828125, 0.0673828125, 0.231689453125, 0.39599609375, 0.560302734375, 0.724609375, 0.888916015625, 1.05322265625, 1.217529296875, 1.3818359375, 1.546142578125, 1.71044921875, 1.874755859375, 2.0390625, 2.203369140625, 2.36767578125, 2.531982421875, 2.6962890625, 2.860595703125, 3.02490234375, 3.189208984375, 3.353515625, 3.517822265625, 3.68212890625, 3.846435546875, 4.0107421875, 4.175048828125, 4.33935546875, 4.503662109375, 4.66796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 2.0, 7.0, 5.0, 6.0, 8.0, 11.0, 15.0, 14.0, 12.0, 7.0, 19.0, 24.0, 23.0, 38.0, 37.0, 33.0, 29.0, 41.0, 43.0, 31.0, 34.0, 42.0, 39.0, 47.0, 48.0, 38.0, 45.0, 33.0, 30.0, 29.0, 25.0, 31.0, 26.0, 20.0, 18.0, 11.0, 14.0, 11.0, 14.0, 14.0, 8.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-13.379307746887207, -12.9785737991333, -12.577839851379395, -12.177105903625488, -11.776371955871582, -11.375638008117676, -10.974905014038086, -10.57417106628418, -10.173437118530273, -9.772703170776367, -9.371969223022461, -8.971235275268555, -8.570501327514648, -8.169767379760742, -7.769033908843994, -7.368299961090088, -6.967565536499023, -6.566831588745117, -6.166097640991211, -5.765363693237305, -5.364629745483398, -4.963895797729492, -4.563162326812744, -4.162428379058838, -3.7616944313049316, -3.3609604835510254, -2.960226535797119, -2.559492826461792, -2.1587588787078857, -1.7580249309539795, -1.3572912216186523, -0.9565572738647461, -0.5558242797851562, -0.15509039163589478, 0.2456434965133667, 0.6463773250579834, 1.0471112728118896, 1.447845220565796, 1.848578929901123, 2.2493128776550293, 2.6500468254089355, 3.050780773162842, 3.451514720916748, 3.852248430252075, 4.252982139587402, 4.653716087341309, 5.054450035095215, 5.455183982849121, 5.855917930603027, 6.256651878356934, 6.65738582611084, 7.058119773864746, 7.458853721618652, 7.859587669372559, 8.260320663452148, 8.661054611206055, 9.061788558959961, 9.462522506713867, 9.863256454467773, 10.26399040222168, 10.664724349975586, 11.065458297729492, 11.466192245483398, 11.866926193237305, 12.267660140991211]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 6.0, 4.0, 8.0, 3.0, 11.0, 16.0, 10.0, 21.0, 15.0, 19.0, 21.0, 25.0, 28.0, 23.0, 27.0, 31.0, 39.0, 39.0, 39.0, 31.0, 38.0, 37.0, 31.0, 33.0, 36.0, 41.0, 27.0, 35.0, 32.0, 32.0, 28.0, 22.0, 18.0, 33.0, 17.0, 13.0, 16.0, 17.0, 14.0, 15.0, 10.0, 10.0, 6.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.455949783325195, -12.056567192077637, -11.657184600830078, -11.257801055908203, -10.858418464660645, -10.459035873413086, -10.059653282165527, -9.660270690917969, -9.260887145996094, -8.861504554748535, -8.462121963500977, -8.062738418579102, -7.663355827331543, -7.263973236083984, -6.864590644836426, -6.465208053588867, -6.065825462341309, -5.66644287109375, -5.267059803009033, -4.867677211761475, -4.468294143676758, -4.068911552429199, -3.6695289611816406, -3.270146131515503, -2.8707633018493652, -2.4713804721832275, -2.07199764251709, -1.6726150512695312, -1.2732322216033936, -0.8738493919372559, -0.47446680068969727, -0.07508397102355957, 0.3242979049682617, 0.7236806750297546, 1.1230634450912476, 1.5224461555480957, 1.9218289852142334, 2.321211814880371, 2.7205944061279297, 3.1199772357940674, 3.519360065460205, 3.9187428951263428, 4.3181257247924805, 4.717508316040039, 5.116890907287598, 5.5162739753723145, 5.915656566619873, 6.31503963470459, 6.714422225952148, 7.113804817199707, 7.513187885284424, 7.912570476531982, 8.3119535446167, 8.711336135864258, 9.110718727111816, 9.510101318359375, 9.90948486328125, 10.308867454528809, 10.708250045776367, 11.107633590698242, 11.5070161819458, 11.90639877319336, 12.305781364440918, 12.705163955688477, 13.104546546936035]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 9.0, 7.0, 10.0, 29.0, 37.0, 46.0, 61.0, 118.0, 151.0, 256.0, 412.0, 681.0, 1169.0, 2097.0, 3524.0, 6372.0, 11724.0, 21869.0, 40659.0, 74010.0, 126408.0, 186727.0, 202765.0, 155428.0, 95695.0, 53725.0, 29228.0, 15674.0, 8461.0, 4782.0, 2610.0, 1533.0, 876.0, 508.0, 319.0, 203.0, 129.0, 72.0, 61.0, 41.0, 25.0, 18.0, 7.0, 9.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.515625, -2.4295654296875, -2.343505859375, -2.2574462890625, -2.17138671875, -2.0853271484375, -1.999267578125, -1.9132080078125, -1.8271484375, -1.7410888671875, -1.655029296875, -1.5689697265625, -1.48291015625, -1.3968505859375, -1.310791015625, -1.2247314453125, -1.138671875, -1.0526123046875, -0.966552734375, -0.8804931640625, -0.79443359375, -0.7083740234375, -0.622314453125, -0.5362548828125, -0.4501953125, -0.3641357421875, -0.278076171875, -0.1920166015625, -0.10595703125, -0.0198974609375, 0.066162109375, 0.1522216796875, 0.23828125, 0.3243408203125, 0.410400390625, 0.4964599609375, 0.58251953125, 0.6685791015625, 0.754638671875, 0.8406982421875, 0.9267578125, 1.0128173828125, 1.098876953125, 1.1849365234375, 1.27099609375, 1.3570556640625, 1.443115234375, 1.5291748046875, 1.615234375, 1.7012939453125, 1.787353515625, 1.8734130859375, 1.95947265625, 2.0455322265625, 2.131591796875, 2.2176513671875, 2.3037109375, 2.3897705078125, 2.475830078125, 2.5618896484375, 2.64794921875, 2.7340087890625, 2.820068359375, 2.9061279296875, 2.9921875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 6.0, 6.0, 4.0, 8.0, 4.0, 10.0, 16.0, 12.0, 19.0, 14.0, 23.0, 18.0, 27.0, 25.0, 27.0, 24.0, 30.0, 40.0, 40.0, 39.0, 30.0, 38.0, 39.0, 30.0, 31.0, 37.0, 42.0, 27.0, 36.0, 30.0, 32.0, 31.0, 20.0, 19.0, 31.0, 17.0, 14.0, 15.0, 17.0, 14.0, 16.0, 9.0, 10.0, 7.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.4921875, -12.092529296875, -11.69287109375, -11.293212890625, -10.8935546875, -10.493896484375, -10.09423828125, -9.694580078125, -9.294921875, -8.895263671875, -8.49560546875, -8.095947265625, -7.6962890625, -7.296630859375, -6.89697265625, -6.497314453125, -6.09765625, -5.697998046875, -5.29833984375, -4.898681640625, -4.4990234375, -4.099365234375, -3.69970703125, -3.300048828125, -2.900390625, -2.500732421875, -2.10107421875, -1.701416015625, -1.3017578125, -0.902099609375, -0.50244140625, -0.102783203125, 0.296875, 0.696533203125, 1.09619140625, 1.495849609375, 1.8955078125, 2.295166015625, 2.69482421875, 3.094482421875, 3.494140625, 3.893798828125, 4.29345703125, 4.693115234375, 5.0927734375, 5.492431640625, 5.89208984375, 6.291748046875, 6.69140625, 7.091064453125, 7.49072265625, 7.890380859375, 8.2900390625, 8.689697265625, 9.08935546875, 9.489013671875, 9.888671875, 10.288330078125, 10.68798828125, 11.087646484375, 11.4873046875, 11.886962890625, 12.28662109375, 12.686279296875, 13.0859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 6.0, 11.0, 11.0, 14.0, 22.0, 28.0, 48.0, 62.0, 73.0, 130.0, 155.0, 211.0, 315.0, 454.0, 624.0, 923.0, 1381.0, 2184.0, 3399.0, 5455.0, 8926.0, 15236.0, 26015.0, 47743.0, 90749.0, 169281.0, 244131.0, 191861.0, 106638.0, 56224.0, 30693.0, 17570.0, 10475.0, 6258.0, 3825.0, 2419.0, 1626.0, 1020.0, 682.0, 494.0, 357.0, 229.0, 191.0, 109.0, 86.0, 63.0, 45.0, 27.0, 33.0, 22.0, 7.0, 8.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.701171875, -2.6099853515625, -2.518798828125, -2.4276123046875, -2.33642578125, -2.2452392578125, -2.154052734375, -2.0628662109375, -1.9716796875, -1.8804931640625, -1.789306640625, -1.6981201171875, -1.60693359375, -1.5157470703125, -1.424560546875, -1.3333740234375, -1.2421875, -1.1510009765625, -1.059814453125, -0.9686279296875, -0.87744140625, -0.7862548828125, -0.695068359375, -0.6038818359375, -0.5126953125, -0.4215087890625, -0.330322265625, -0.2391357421875, -0.14794921875, -0.0567626953125, 0.034423828125, 0.1256103515625, 0.216796875, 0.3079833984375, 0.399169921875, 0.4903564453125, 0.58154296875, 0.6727294921875, 0.763916015625, 0.8551025390625, 0.9462890625, 1.0374755859375, 1.128662109375, 1.2198486328125, 1.31103515625, 1.4022216796875, 1.493408203125, 1.5845947265625, 1.67578125, 1.7669677734375, 1.858154296875, 1.9493408203125, 2.04052734375, 2.1317138671875, 2.222900390625, 2.3140869140625, 2.4052734375, 2.4964599609375, 2.587646484375, 2.6788330078125, 2.77001953125, 2.8612060546875, 2.952392578125, 3.0435791015625, 3.134765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 4.0, 7.0, 10.0, 11.0, 15.0, 11.0, 15.0, 26.0, 16.0, 17.0, 31.0, 35.0, 25.0, 29.0, 51.0, 29.0, 45.0, 33.0, 38.0, 41.0, 38.0, 45.0, 40.0, 40.0, 36.0, 35.0, 36.0, 30.0, 37.0, 26.0, 24.0, 15.0, 22.0, 12.0, 12.0, 6.0, 12.0, 12.0, 10.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.479248046875, -8.20849609375, -7.937744140625, -7.6669921875, -7.396240234375, -7.12548828125, -6.854736328125, -6.583984375, -6.313232421875, -6.04248046875, -5.771728515625, -5.5009765625, -5.230224609375, -4.95947265625, -4.688720703125, -4.41796875, -4.147216796875, -3.87646484375, -3.605712890625, -3.3349609375, -3.064208984375, -2.79345703125, -2.522705078125, -2.251953125, -1.981201171875, -1.71044921875, -1.439697265625, -1.1689453125, -0.898193359375, -0.62744140625, -0.356689453125, -0.0859375, 0.184814453125, 0.45556640625, 0.726318359375, 0.9970703125, 1.267822265625, 1.53857421875, 1.809326171875, 2.080078125, 2.350830078125, 2.62158203125, 2.892333984375, 3.1630859375, 3.433837890625, 3.70458984375, 3.975341796875, 4.24609375, 4.516845703125, 4.78759765625, 5.058349609375, 5.3291015625, 5.599853515625, 5.87060546875, 6.141357421875, 6.412109375, 6.682861328125, 6.95361328125, 7.224365234375, 7.4951171875, 7.765869140625, 8.03662109375, 8.307373046875, 8.578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 13.0, 18.0, 20.0, 27.0, 38.0, 51.0, 76.0, 120.0, 152.0, 229.0, 358.0, 555.0, 886.0, 1406.0, 2480.0, 4668.0, 9283.0, 21455.0, 62338.0, 271543.0, 483627.0, 125075.0, 35301.0, 14134.0, 6437.0, 3328.0, 1901.0, 1086.0, 680.0, 388.0, 259.0, 213.0, 118.0, 92.0, 49.0, 33.0, 23.0, 27.0, 12.0, 25.0, 9.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5615234375, -1.5131072998046875, -1.464691162109375, -1.4162750244140625, -1.36785888671875, -1.3194427490234375, -1.271026611328125, -1.2226104736328125, -1.1741943359375, -1.1257781982421875, -1.077362060546875, -1.0289459228515625, -0.98052978515625, -0.9321136474609375, -0.883697509765625, -0.8352813720703125, -0.786865234375, -0.7384490966796875, -0.690032958984375, -0.6416168212890625, -0.59320068359375, -0.5447845458984375, -0.496368408203125, -0.4479522705078125, -0.3995361328125, -0.3511199951171875, -0.302703857421875, -0.2542877197265625, -0.20587158203125, -0.1574554443359375, -0.109039306640625, -0.0606231689453125, -0.01220703125, 0.0362091064453125, 0.084625244140625, 0.1330413818359375, 0.18145751953125, 0.2298736572265625, 0.278289794921875, 0.3267059326171875, 0.3751220703125, 0.4235382080078125, 0.471954345703125, 0.5203704833984375, 0.56878662109375, 0.6172027587890625, 0.665618896484375, 0.7140350341796875, 0.762451171875, 0.8108673095703125, 0.859283447265625, 0.9076995849609375, 0.95611572265625, 1.0045318603515625, 1.052947998046875, 1.1013641357421875, 1.1497802734375, 1.1981964111328125, 1.246612548828125, 1.2950286865234375, 1.34344482421875, 1.3918609619140625, 1.440277099609375, 1.4886932373046875, 1.537109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 6.0, 4.0, 13.0, 15.0, 10.0, 8.0, 15.0, 22.0, 22.0, 34.0, 36.0, 29.0, 46.0, 38.0, 51.0, 53.0, 59.0, 55.0, 51.0, 60.0, 48.0, 44.0, 44.0, 39.0, 33.0, 27.0, 24.0, 28.0, 18.0, 17.0, 9.0, 9.0, 5.0, 2.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.930133819580078e-05, -9.651482105255127e-05, -9.372830390930176e-05, -9.094178676605225e-05, -8.815526962280273e-05, -8.536875247955322e-05, -8.258223533630371e-05, -7.97957181930542e-05, -7.700920104980469e-05, -7.422268390655518e-05, -7.143616676330566e-05, -6.864964962005615e-05, -6.586313247680664e-05, -6.307661533355713e-05, -6.029009819030762e-05, -5.7503581047058105e-05, -5.4717063903808594e-05, -5.193054676055908e-05, -4.914402961730957e-05, -4.635751247406006e-05, -4.357099533081055e-05, -4.0784478187561035e-05, -3.7997961044311523e-05, -3.521144390106201e-05, -3.24249267578125e-05, -2.9638409614562988e-05, -2.6851892471313477e-05, -2.4065375328063965e-05, -2.1278858184814453e-05, -1.849234104156494e-05, -1.570582389831543e-05, -1.2919306755065918e-05, -1.0132789611816406e-05, -7.3462724685668945e-06, -4.559755325317383e-06, -1.773238182067871e-06, 1.0132789611816406e-06, 3.7997961044311523e-06, 6.586313247680664e-06, 9.372830390930176e-06, 1.2159347534179688e-05, 1.49458646774292e-05, 1.773238182067871e-05, 2.0518898963928223e-05, 2.3305416107177734e-05, 2.6091933250427246e-05, 2.8878450393676758e-05, 3.166496753692627e-05, 3.445148468017578e-05, 3.723800182342529e-05, 4.0024518966674805e-05, 4.2811036109924316e-05, 4.559755325317383e-05, 4.838407039642334e-05, 5.117058753967285e-05, 5.395710468292236e-05, 5.6743621826171875e-05, 5.953013896942139e-05, 6.23166561126709e-05, 6.510317325592041e-05, 6.788969039916992e-05, 7.067620754241943e-05, 7.346272468566895e-05, 7.624924182891846e-05, 7.903575897216797e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 6.0, 15.0, 13.0, 20.0, 22.0, 34.0, 42.0, 75.0, 107.0, 145.0, 183.0, 275.0, 343.0, 541.0, 862.0, 1168.0, 1784.0, 2796.0, 4240.0, 7085.0, 11900.0, 21198.0, 40182.0, 80397.0, 159179.0, 247106.0, 216694.0, 120299.0, 59472.0, 30394.0, 16211.0, 9313.0, 5621.0, 3675.0, 2327.0, 1490.0, 998.0, 666.0, 484.0, 404.0, 231.0, 167.0, 111.0, 85.0, 50.0, 48.0, 30.0, 25.0, 19.0, 9.0, 8.0, 3.0, 1.0, 3.0, 3.0, 3.0], "bins": [-1.6533203125, -1.6043853759765625, -1.555450439453125, -1.5065155029296875, -1.45758056640625, -1.4086456298828125, -1.359710693359375, -1.3107757568359375, -1.2618408203125, -1.2129058837890625, -1.163970947265625, -1.1150360107421875, -1.06610107421875, -1.0171661376953125, -0.968231201171875, -0.9192962646484375, -0.870361328125, -0.8214263916015625, -0.772491455078125, -0.7235565185546875, -0.67462158203125, -0.6256866455078125, -0.576751708984375, -0.5278167724609375, -0.4788818359375, -0.4299468994140625, -0.381011962890625, -0.3320770263671875, -0.28314208984375, -0.2342071533203125, -0.185272216796875, -0.1363372802734375, -0.08740234375, -0.0384674072265625, 0.010467529296875, 0.0594024658203125, 0.10833740234375, 0.1572723388671875, 0.206207275390625, 0.2551422119140625, 0.3040771484375, 0.3530120849609375, 0.401947021484375, 0.4508819580078125, 0.49981689453125, 0.5487518310546875, 0.597686767578125, 0.6466217041015625, 0.695556640625, 0.7444915771484375, 0.793426513671875, 0.8423614501953125, 0.89129638671875, 0.9402313232421875, 0.989166259765625, 1.0381011962890625, 1.0870361328125, 1.1359710693359375, 1.184906005859375, 1.2338409423828125, 1.28277587890625, 1.3317108154296875, 1.380645751953125, 1.4295806884765625, 1.478515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 10.0, 3.0, 8.0, 6.0, 13.0, 15.0, 12.0, 7.0, 12.0, 18.0, 30.0, 38.0, 51.0, 73.0, 86.0, 102.0, 95.0, 80.0, 64.0, 49.0, 52.0, 27.0, 22.0, 18.0, 12.0, 16.0, 9.0, 11.0, 7.0, 9.0, 2.0, 9.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62939453125, -0.607879638671875, -0.58636474609375, -0.564849853515625, -0.5433349609375, -0.521820068359375, -0.50030517578125, -0.478790283203125, -0.457275390625, -0.435760498046875, -0.41424560546875, -0.392730712890625, -0.3712158203125, -0.349700927734375, -0.32818603515625, -0.306671142578125, -0.28515625, -0.263641357421875, -0.24212646484375, -0.220611572265625, -0.1990966796875, -0.177581787109375, -0.15606689453125, -0.134552001953125, -0.113037109375, -0.091522216796875, -0.07000732421875, -0.048492431640625, -0.0269775390625, -0.005462646484375, 0.01605224609375, 0.037567138671875, 0.05908203125, 0.080596923828125, 0.10211181640625, 0.123626708984375, 0.1451416015625, 0.166656494140625, 0.18817138671875, 0.209686279296875, 0.231201171875, 0.252716064453125, 0.27423095703125, 0.295745849609375, 0.3172607421875, 0.338775634765625, 0.36029052734375, 0.381805419921875, 0.4033203125, 0.424835205078125, 0.44635009765625, 0.467864990234375, 0.4893798828125, 0.510894775390625, 0.53240966796875, 0.553924560546875, 0.575439453125, 0.596954345703125, 0.61846923828125, 0.639984130859375, 0.6614990234375, 0.683013916015625, 0.70452880859375, 0.726043701171875, 0.74755859375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 6.0, 5.0, 6.0, 9.0, 6.0, 18.0, 15.0, 11.0, 14.0, 12.0, 19.0, 27.0, 33.0, 27.0, 42.0, 32.0, 37.0, 39.0, 38.0, 37.0, 35.0, 46.0, 43.0, 50.0, 43.0, 35.0, 39.0, 31.0, 35.0, 18.0, 27.0, 28.0, 30.0, 17.0, 8.0, 16.0, 14.0, 15.0, 9.0, 7.0, 8.0, 8.0, 0.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-13.17137336730957, -12.766740798950195, -12.36210823059082, -11.957475662231445, -11.55284309387207, -11.148210525512695, -10.74357795715332, -10.338946342468262, -9.934313774108887, -9.529681205749512, -9.125048637390137, -8.720416069030762, -8.315783500671387, -7.91115140914917, -7.506518840789795, -7.101886749267578, -6.697253704071045, -6.29262113571167, -5.887988567352295, -5.483356475830078, -5.078723907470703, -4.674091339111328, -4.269458770751953, -3.8648264408111572, -3.4601938724517822, -3.0555613040924072, -2.6509289741516113, -2.2462964057922363, -1.8416639566421509, -1.4370315074920654, -1.0323989391326904, -0.6277666091918945, -0.22313404083251953, 0.1814984381198883, 0.5861309170722961, 0.9907634258270264, 1.3953958749771118, 1.8000283241271973, 2.2046608924865723, 2.609293222427368, 3.013925790786743, 3.418558359146118, 3.823190689086914, 4.227823257446289, 4.632455825805664, 5.037088394165039, 5.441720962524414, 5.846353054046631, 6.250985622406006, 6.655618190765381, 7.060250759124756, 7.464882850646973, 7.869515419006348, 8.274147987365723, 8.678780555725098, 9.083413124084473, 9.488045692443848, 9.892678260803223, 10.297310829162598, 10.701943397521973, 11.106575965881348, 11.511207580566406, 11.915840148925781, 12.320472717285156, 12.725105285644531]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 8.0, 5.0, 9.0, 13.0, 15.0, 18.0, 17.0, 19.0, 25.0, 24.0, 23.0, 26.0, 27.0, 31.0, 49.0, 35.0, 33.0, 36.0, 37.0, 36.0, 32.0, 35.0, 46.0, 31.0, 27.0, 35.0, 33.0, 33.0, 26.0, 24.0, 23.0, 26.0, 11.0, 19.0, 19.0, 14.0, 14.0, 15.0, 10.0, 5.0, 11.0, 3.0, 1.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.595891952514648, -12.190874099731445, -11.785857200622559, -11.380839347839355, -10.975821495056152, -10.570804595947266, -10.165786743164062, -9.76076889038086, -9.355751037597656, -8.950733184814453, -8.545716285705566, -8.140698432922363, -7.73568058013916, -7.330663204193115, -6.92564582824707, -6.520627975463867, -6.1156110763549805, -5.7105937004089355, -5.305575847625732, -4.9005584716796875, -4.495540618896484, -4.0905232429504395, -3.6855058670043945, -3.2804882526397705, -2.8754706382751465, -2.4704530239105225, -2.0654354095458984, -1.6604180335998535, -1.2554004192352295, -0.8503828048706055, -0.44536542892456055, -0.04034781455993652, 0.3646688461303711, 0.7696864008903503, 1.1747039556503296, 1.579721450805664, 1.984739065170288, 2.389756679534912, 2.794774055480957, 3.199791669845581, 3.604809284210205, 4.00982666015625, 4.414844512939453, 4.819861888885498, 5.224879264831543, 5.629897117614746, 6.034914493560791, 6.439931869506836, 6.844949722290039, 7.249967098236084, 7.654984951019287, 8.060002326965332, 8.465020179748535, 8.870037078857422, 9.275054931640625, 9.680072784423828, 10.085090637207031, 10.490108489990234, 10.895125389099121, 11.300143241882324, 11.705161094665527, 12.110177993774414, 12.515195846557617, 12.92021369934082, 13.325230598449707]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 11.0, 15.0, 24.0, 41.0, 92.0, 151.0, 229.0, 397.0, 655.0, 888.0, 1549.0, 2266.0, 3573.0, 5487.0, 8058.0, 11825.0, 16806.0, 23099.0, 31165.0, 40658.0, 51360.0, 62040.0, 72326.0, 80875.0, 85377.0, 86894.0, 84367.0, 77451.0, 68331.0, 57449.0, 46822.0, 36353.0, 27701.0, 20141.0, 14579.0, 9997.0, 6772.0, 4575.0, 2985.0, 1924.0, 1269.0, 744.0, 494.0, 299.0, 186.0, 96.0, 61.0, 47.0, 25.0, 6.0, 12.0, 10.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.2109375, -7.948486328125, -7.68603515625, -7.423583984375, -7.1611328125, -6.898681640625, -6.63623046875, -6.373779296875, -6.111328125, -5.848876953125, -5.58642578125, -5.323974609375, -5.0615234375, -4.799072265625, -4.53662109375, -4.274169921875, -4.01171875, -3.749267578125, -3.48681640625, -3.224365234375, -2.9619140625, -2.699462890625, -2.43701171875, -2.174560546875, -1.912109375, -1.649658203125, -1.38720703125, -1.124755859375, -0.8623046875, -0.599853515625, -0.33740234375, -0.074951171875, 0.1875, 0.449951171875, 0.71240234375, 0.974853515625, 1.2373046875, 1.499755859375, 1.76220703125, 2.024658203125, 2.287109375, 2.549560546875, 2.81201171875, 3.074462890625, 3.3369140625, 3.599365234375, 3.86181640625, 4.124267578125, 4.38671875, 4.649169921875, 4.91162109375, 5.174072265625, 5.4365234375, 5.698974609375, 5.96142578125, 6.223876953125, 6.486328125, 6.748779296875, 7.01123046875, 7.273681640625, 7.5361328125, 7.798583984375, 8.06103515625, 8.323486328125, 8.5859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 7.0, 3.0, 7.0, 7.0, 5.0, 18.0, 14.0, 17.0, 16.0, 16.0, 25.0, 25.0, 25.0, 25.0, 27.0, 30.0, 40.0, 44.0, 36.0, 26.0, 44.0, 39.0, 27.0, 38.0, 38.0, 40.0, 24.0, 34.0, 31.0, 39.0, 25.0, 24.0, 20.0, 30.0, 14.0, 14.0, 21.0, 12.0, 18.0, 12.0, 12.0, 6.0, 8.0, 7.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.265625, -11.8736572265625, -11.481689453125, -11.0897216796875, -10.69775390625, -10.3057861328125, -9.913818359375, -9.5218505859375, -9.1298828125, -8.7379150390625, -8.345947265625, -7.9539794921875, -7.56201171875, -7.1700439453125, -6.778076171875, -6.3861083984375, -5.994140625, -5.6021728515625, -5.210205078125, -4.8182373046875, -4.42626953125, -4.0343017578125, -3.642333984375, -3.2503662109375, -2.8583984375, -2.4664306640625, -2.074462890625, -1.6824951171875, -1.29052734375, -0.8985595703125, -0.506591796875, -0.1146240234375, 0.27734375, 0.6693115234375, 1.061279296875, 1.4532470703125, 1.84521484375, 2.2371826171875, 2.629150390625, 3.0211181640625, 3.4130859375, 3.8050537109375, 4.197021484375, 4.5889892578125, 4.98095703125, 5.3729248046875, 5.764892578125, 6.1568603515625, 6.548828125, 6.9407958984375, 7.332763671875, 7.7247314453125, 8.11669921875, 8.5086669921875, 8.900634765625, 9.2926025390625, 9.6845703125, 10.0765380859375, 10.468505859375, 10.8604736328125, 11.25244140625, 11.6444091796875, 12.036376953125, 12.4283447265625, 12.8203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 0.0, 4.0, 23.0, 19.0, 29.0, 42.0, 91.0, 118.0, 207.0, 355.0, 562.0, 905.0, 1443.0, 2262.0, 3312.0, 5159.0, 7841.0, 11457.0, 16282.0, 23081.0, 31517.0, 41594.0, 53295.0, 65025.0, 76127.0, 85084.0, 90213.0, 90553.0, 86065.0, 78305.0, 66813.0, 55558.0, 43882.0, 33112.0, 24478.0, 17549.0, 12175.0, 8326.0, 5567.0, 3617.0, 2406.0, 1525.0, 976.0, 636.0, 391.0, 218.0, 136.0, 73.0, 56.0, 39.0, 26.0, 19.0, 6.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1875, -7.9154052734375, -7.643310546875, -7.3712158203125, -7.09912109375, -6.8270263671875, -6.554931640625, -6.2828369140625, -6.0107421875, -5.7386474609375, -5.466552734375, -5.1944580078125, -4.92236328125, -4.6502685546875, -4.378173828125, -4.1060791015625, -3.833984375, -3.5618896484375, -3.289794921875, -3.0177001953125, -2.74560546875, -2.4735107421875, -2.201416015625, -1.9293212890625, -1.6572265625, -1.3851318359375, -1.113037109375, -0.8409423828125, -0.56884765625, -0.2967529296875, -0.024658203125, 0.2474365234375, 0.51953125, 0.7916259765625, 1.063720703125, 1.3358154296875, 1.60791015625, 1.8800048828125, 2.152099609375, 2.4241943359375, 2.6962890625, 2.9683837890625, 3.240478515625, 3.5125732421875, 3.78466796875, 4.0567626953125, 4.328857421875, 4.6009521484375, 4.873046875, 5.1451416015625, 5.417236328125, 5.6893310546875, 5.96142578125, 6.2335205078125, 6.505615234375, 6.7777099609375, 7.0498046875, 7.3218994140625, 7.593994140625, 7.8660888671875, 8.13818359375, 8.4102783203125, 8.682373046875, 8.9544677734375, 9.2265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 2.0, 3.0, 7.0, 12.0, 13.0, 14.0, 15.0, 29.0, 16.0, 20.0, 28.0, 31.0, 14.0, 36.0, 34.0, 38.0, 37.0, 43.0, 35.0, 28.0, 36.0, 23.0, 37.0, 48.0, 40.0, 35.0, 27.0, 38.0, 39.0, 32.0, 25.0, 22.0, 26.0, 15.0, 16.0, 11.0, 10.0, 7.0, 9.0, 13.0, 9.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.2890625, -8.0181884765625, -7.747314453125, -7.4764404296875, -7.20556640625, -6.9346923828125, -6.663818359375, -6.3929443359375, -6.1220703125, -5.8511962890625, -5.580322265625, -5.3094482421875, -5.03857421875, -4.7677001953125, -4.496826171875, -4.2259521484375, -3.955078125, -3.6842041015625, -3.413330078125, -3.1424560546875, -2.87158203125, -2.6007080078125, -2.329833984375, -2.0589599609375, -1.7880859375, -1.5172119140625, -1.246337890625, -0.9754638671875, -0.70458984375, -0.4337158203125, -0.162841796875, 0.1080322265625, 0.37890625, 0.6497802734375, 0.920654296875, 1.1915283203125, 1.46240234375, 1.7332763671875, 2.004150390625, 2.2750244140625, 2.5458984375, 2.8167724609375, 3.087646484375, 3.3585205078125, 3.62939453125, 3.9002685546875, 4.171142578125, 4.4420166015625, 4.712890625, 4.9837646484375, 5.254638671875, 5.5255126953125, 5.79638671875, 6.0672607421875, 6.338134765625, 6.6090087890625, 6.8798828125, 7.1507568359375, 7.421630859375, 7.6925048828125, 7.96337890625, 8.2342529296875, 8.505126953125, 8.7760009765625, 9.046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 6.0, 9.0, 12.0, 9.0, 21.0, 38.0, 50.0, 73.0, 111.0, 202.0, 304.0, 434.0, 666.0, 1063.0, 1544.0, 2458.0, 3735.0, 5754.0, 8673.0, 13370.0, 19719.0, 28707.0, 40113.0, 54434.0, 69987.0, 85386.0, 98179.0, 104143.0, 103062.0, 94886.0, 81527.0, 65492.0, 50294.0, 36769.0, 25571.0, 17544.0, 11709.0, 7841.0, 5172.0, 3315.0, 2099.0, 1379.0, 971.0, 567.0, 410.0, 246.0, 153.0, 110.0, 89.0, 52.0, 46.0, 26.0, 11.0, 11.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -4.03289794921875, -3.8978271484375, -3.76275634765625, -3.627685546875, -3.49261474609375, -3.3575439453125, -3.22247314453125, -3.08740234375, -2.95233154296875, -2.8172607421875, -2.68218994140625, -2.547119140625, -2.41204833984375, -2.2769775390625, -2.14190673828125, -2.0068359375, -1.87176513671875, -1.7366943359375, -1.60162353515625, -1.466552734375, -1.33148193359375, -1.1964111328125, -1.06134033203125, -0.92626953125, -0.79119873046875, -0.6561279296875, -0.52105712890625, -0.385986328125, -0.25091552734375, -0.1158447265625, 0.01922607421875, 0.154296875, 0.28936767578125, 0.4244384765625, 0.55950927734375, 0.694580078125, 0.82965087890625, 0.9647216796875, 1.09979248046875, 1.23486328125, 1.36993408203125, 1.5050048828125, 1.64007568359375, 1.775146484375, 1.91021728515625, 2.0452880859375, 2.18035888671875, 2.3154296875, 2.45050048828125, 2.5855712890625, 2.72064208984375, 2.855712890625, 2.99078369140625, 3.1258544921875, 3.26092529296875, 3.39599609375, 3.53106689453125, 3.6661376953125, 3.80120849609375, 3.936279296875, 4.07135009765625, 4.2064208984375, 4.34149169921875, 4.4765625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 7.0, 9.0, 7.0, 11.0, 10.0, 18.0, 17.0, 17.0, 18.0, 33.0, 24.0, 23.0, 40.0, 48.0, 32.0, 30.0, 46.0, 43.0, 49.0, 48.0, 43.0, 53.0, 38.0, 41.0, 34.0, 31.0, 37.0, 26.0, 26.0, 24.0, 23.0, 24.0, 18.0, 12.0, 6.0, 7.0, 4.0, 6.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005769729614257812, -0.0005591660737991333, -0.0005413591861724854, -0.0005235522985458374, -0.0005057454109191895, -0.0004879385232925415, -0.00047013163566589355, -0.0004523247480392456, -0.00043451786041259766, -0.0004167109727859497, -0.00039890408515930176, -0.0003810971975326538, -0.00036329030990600586, -0.0003454834222793579, -0.00032767653465270996, -0.000309869647026062, -0.00029206275939941406, -0.0002742558717727661, -0.00025644898414611816, -0.00023864209651947021, -0.00022083520889282227, -0.00020302832126617432, -0.00018522143363952637, -0.00016741454601287842, -0.00014960765838623047, -0.00013180077075958252, -0.00011399388313293457, -9.618699550628662e-05, -7.838010787963867e-05, -6.057322025299072e-05, -4.2766332626342773e-05, -2.4959444999694824e-05, -7.152557373046875e-06, 1.0654330253601074e-05, 2.8461217880249023e-05, 4.626810550689697e-05, 6.407499313354492e-05, 8.188188076019287e-05, 9.968876838684082e-05, 0.00011749565601348877, 0.00013530254364013672, 0.00015310943126678467, 0.00017091631889343262, 0.00018872320652008057, 0.00020653009414672852, 0.00022433698177337646, 0.00024214386940002441, 0.00025995075702667236, 0.0002777576446533203, 0.00029556453227996826, 0.0003133714199066162, 0.00033117830753326416, 0.0003489851951599121, 0.00036679208278656006, 0.000384598970413208, 0.00040240585803985596, 0.0004202127456665039, 0.00043801963329315186, 0.0004558265209197998, 0.00047363340854644775, 0.0004914402961730957, 0.0005092471837997437, 0.0005270540714263916, 0.0005448609590530396, 0.0005626678466796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 11.0, 16.0, 21.0, 36.0, 65.0, 103.0, 149.0, 245.0, 373.0, 603.0, 963.0, 1581.0, 2614.0, 4212.0, 7069.0, 11242.0, 18101.0, 27959.0, 42861.0, 61657.0, 83941.0, 104521.0, 119798.0, 123334.0, 114953.0, 96448.0, 74097.0, 53311.0, 36085.0, 23522.0, 14811.0, 9171.0, 5649.0, 3426.0, 2186.0, 1287.0, 799.0, 509.0, 289.0, 197.0, 131.0, 75.0, 42.0, 37.0, 14.0, 15.0, 16.0, 9.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.1484375, -5.9637451171875, -5.779052734375, -5.5943603515625, -5.40966796875, -5.2249755859375, -5.040283203125, -4.8555908203125, -4.6708984375, -4.4862060546875, -4.301513671875, -4.1168212890625, -3.93212890625, -3.7474365234375, -3.562744140625, -3.3780517578125, -3.193359375, -3.0086669921875, -2.823974609375, -2.6392822265625, -2.45458984375, -2.2698974609375, -2.085205078125, -1.9005126953125, -1.7158203125, -1.5311279296875, -1.346435546875, -1.1617431640625, -0.97705078125, -0.7923583984375, -0.607666015625, -0.4229736328125, -0.23828125, -0.0535888671875, 0.131103515625, 0.3157958984375, 0.50048828125, 0.6851806640625, 0.869873046875, 1.0545654296875, 1.2392578125, 1.4239501953125, 1.608642578125, 1.7933349609375, 1.97802734375, 2.1627197265625, 2.347412109375, 2.5321044921875, 2.716796875, 2.9014892578125, 3.086181640625, 3.2708740234375, 3.45556640625, 3.6402587890625, 3.824951171875, 4.0096435546875, 4.1943359375, 4.3790283203125, 4.563720703125, 4.7484130859375, 4.93310546875, 5.1177978515625, 5.302490234375, 5.4871826171875, 5.671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 8.0, 7.0, 8.0, 16.0, 9.0, 12.0, 25.0, 12.0, 18.0, 25.0, 44.0, 40.0, 35.0, 48.0, 44.0, 39.0, 52.0, 44.0, 52.0, 45.0, 47.0, 43.0, 54.0, 43.0, 42.0, 31.0, 35.0, 20.0, 21.0, 23.0, 8.0, 12.0, 10.0, 10.0, 7.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.365234375, -2.2862548828125, -2.207275390625, -2.1282958984375, -2.04931640625, -1.9703369140625, -1.891357421875, -1.8123779296875, -1.7333984375, -1.6544189453125, -1.575439453125, -1.4964599609375, -1.41748046875, -1.3385009765625, -1.259521484375, -1.1805419921875, -1.1015625, -1.0225830078125, -0.943603515625, -0.8646240234375, -0.78564453125, -0.7066650390625, -0.627685546875, -0.5487060546875, -0.4697265625, -0.3907470703125, -0.311767578125, -0.2327880859375, -0.15380859375, -0.0748291015625, 0.004150390625, 0.0831298828125, 0.162109375, 0.2410888671875, 0.320068359375, 0.3990478515625, 0.47802734375, 0.5570068359375, 0.635986328125, 0.7149658203125, 0.7939453125, 0.8729248046875, 0.951904296875, 1.0308837890625, 1.10986328125, 1.1888427734375, 1.267822265625, 1.3468017578125, 1.42578125, 1.5047607421875, 1.583740234375, 1.6627197265625, 1.74169921875, 1.8206787109375, 1.899658203125, 1.9786376953125, 2.0576171875, 2.1365966796875, 2.215576171875, 2.2945556640625, 2.37353515625, 2.4525146484375, 2.531494140625, 2.6104736328125, 2.689453125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 7.0, 12.0, 5.0, 12.0, 6.0, 24.0, 27.0, 23.0, 25.0, 23.0, 31.0, 34.0, 40.0, 33.0, 47.0, 42.0, 53.0, 45.0, 33.0, 41.0, 37.0, 44.0, 34.0, 39.0, 35.0, 37.0, 26.0, 25.0, 30.0, 21.0, 13.0, 8.0, 13.0, 20.0, 13.0, 5.0, 9.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.258975982666016, -11.840922355651855, -11.422869682312012, -11.004816055297852, -10.586762428283691, -10.168708801269531, -9.750656127929688, -9.332602500915527, -8.914548873901367, -8.496495246887207, -8.078442573547363, -7.660388946533203, -7.242335319519043, -6.824282169342041, -6.406229019165039, -5.988175392150879, -5.570122718811035, -5.152069568634033, -4.734015941619873, -4.315962791442871, -3.89790940284729, -3.479856014251709, -3.061802864074707, -2.643749475479126, -2.225696086883545, -1.8076426982879639, -1.3895894289016724, -0.9715361595153809, -0.5534827709197998, -0.13542938232421875, 0.2826237678527832, 0.7006771564483643, 1.1187314987182617, 1.5367848873138428, 1.9548381567001343, 2.372891426086426, 2.790944814682007, 3.208998203277588, 3.62705135345459, 4.04510498046875, 4.463158130645752, 4.881211280822754, 5.299264907836914, 5.717318058013916, 6.135371208190918, 6.553424835205078, 6.97147798538208, 7.389531135559082, 7.807584762573242, 8.225638389587402, 8.643691062927246, 9.061744689941406, 9.479798316955566, 9.897851943969727, 10.31590461730957, 10.73395824432373, 11.15201187133789, 11.57006549835205, 11.988118171691895, 12.406171798706055, 12.824225425720215, 13.242279052734375, 13.660331726074219, 14.078385353088379, 14.496438026428223]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 9.0, 7.0, 2.0, 4.0, 8.0, 9.0, 16.0, 13.0, 24.0, 23.0, 20.0, 26.0, 35.0, 27.0, 34.0, 30.0, 40.0, 28.0, 35.0, 23.0, 36.0, 27.0, 43.0, 30.0, 43.0, 45.0, 32.0, 33.0, 31.0, 18.0, 33.0, 30.0, 27.0, 23.0, 10.0, 20.0, 20.0, 23.0, 16.0, 11.0, 6.0, 6.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0], "bins": [-14.283504486083984, -13.853324890136719, -13.423145294189453, -12.992965698242188, -12.562786102294922, -12.132606506347656, -11.702427864074707, -11.272248268127441, -10.842068672180176, -10.41188907623291, -9.981709480285645, -9.551529884338379, -9.12135124206543, -8.691171646118164, -8.260992050170898, -7.830812454223633, -7.400632858276367, -6.970453262329102, -6.540273666381836, -6.1100945472717285, -5.679914951324463, -5.249735355377197, -4.81955623626709, -4.389376640319824, -3.9591970443725586, -3.529017448425293, -3.0988380908966064, -2.66865873336792, -2.2384791374206543, -1.8082995414733887, -1.3781201839447021, -0.9479408264160156, -0.5177621841430664, -0.08758270740509033, 0.34259676933288574, 0.7727762460708618, 1.202955722808838, 1.6331353187561035, 2.06331467628479, 2.4934940338134766, 2.923673629760742, 3.353853225708008, 3.7840325832366943, 4.214211940765381, 4.6443915367126465, 5.074571132659912, 5.5047502517700195, 5.934929847717285, 6.365109443664551, 6.795289039611816, 7.225468635559082, 7.6556477546691895, 8.085826873779297, 8.516006469726562, 8.946186065673828, 9.376365661621094, 9.80654525756836, 10.236724853515625, 10.66690444946289, 11.097084045410156, 11.527263641357422, 11.957443237304688, 12.387621879577637, 12.817801475524902, 13.247981071472168]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 13.0, 26.0, 32.0, 53.0, 95.0, 120.0, 252.0, 385.0, 601.0, 908.0, 1484.0, 2386.0, 3948.0, 6133.0, 9481.0, 14867.0, 22909.0, 34173.0, 50825.0, 74028.0, 105503.0, 144804.0, 193267.0, 246506.0, 300130.0, 346664.0, 378673.0, 386931.0, 374350.0, 338674.0, 290730.0, 237321.0, 183953.0, 137274.0, 99229.0, 69708.0, 48035.0, 31809.0, 21016.0, 13665.0, 8782.0, 5577.0, 3495.0, 2125.0, 1322.0, 791.0, 506.0, 298.0, 184.0, 96.0, 70.0, 33.0, 26.0, 7.0, 7.0, 2.0, 3.0, 3.0], "bins": [-9.7265625, -9.4354248046875, -9.144287109375, -8.8531494140625, -8.56201171875, -8.2708740234375, -7.979736328125, -7.6885986328125, -7.3974609375, -7.1063232421875, -6.815185546875, -6.5240478515625, -6.23291015625, -5.9417724609375, -5.650634765625, -5.3594970703125, -5.068359375, -4.7772216796875, -4.486083984375, -4.1949462890625, -3.90380859375, -3.6126708984375, -3.321533203125, -3.0303955078125, -2.7392578125, -2.4481201171875, -2.156982421875, -1.8658447265625, -1.57470703125, -1.2835693359375, -0.992431640625, -0.7012939453125, -0.41015625, -0.1190185546875, 0.172119140625, 0.4632568359375, 0.75439453125, 1.0455322265625, 1.336669921875, 1.6278076171875, 1.9189453125, 2.2100830078125, 2.501220703125, 2.7923583984375, 3.08349609375, 3.3746337890625, 3.665771484375, 3.9569091796875, 4.248046875, 4.5391845703125, 4.830322265625, 5.1214599609375, 5.41259765625, 5.7037353515625, 5.994873046875, 6.2860107421875, 6.5771484375, 6.8682861328125, 7.159423828125, 7.4505615234375, 7.74169921875, 8.0328369140625, 8.323974609375, 8.6151123046875, 8.90625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 5.0, 8.0, 10.0, 4.0, 5.0, 3.0, 9.0, 9.0, 11.0, 14.0, 27.0, 20.0, 18.0, 30.0, 35.0, 25.0, 32.0, 27.0, 37.0, 35.0, 39.0, 21.0, 30.0, 25.0, 44.0, 37.0, 32.0, 49.0, 31.0, 38.0, 26.0, 23.0, 25.0, 26.0, 35.0, 24.0, 13.0, 17.0, 19.0, 25.0, 18.0, 9.0, 10.0, 7.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0], "bins": [-12.6875, -12.3055419921875, -11.923583984375, -11.5416259765625, -11.15966796875, -10.7777099609375, -10.395751953125, -10.0137939453125, -9.6318359375, -9.2498779296875, -8.867919921875, -8.4859619140625, -8.10400390625, -7.7220458984375, -7.340087890625, -6.9581298828125, -6.576171875, -6.1942138671875, -5.812255859375, -5.4302978515625, -5.04833984375, -4.6663818359375, -4.284423828125, -3.9024658203125, -3.5205078125, -3.1385498046875, -2.756591796875, -2.3746337890625, -1.99267578125, -1.6107177734375, -1.228759765625, -0.8468017578125, -0.46484375, -0.0828857421875, 0.299072265625, 0.6810302734375, 1.06298828125, 1.4449462890625, 1.826904296875, 2.2088623046875, 2.5908203125, 2.9727783203125, 3.354736328125, 3.7366943359375, 4.11865234375, 4.5006103515625, 4.882568359375, 5.2645263671875, 5.646484375, 6.0284423828125, 6.410400390625, 6.7923583984375, 7.17431640625, 7.5562744140625, 7.938232421875, 8.3201904296875, 8.7021484375, 9.0841064453125, 9.466064453125, 9.8480224609375, 10.22998046875, 10.6119384765625, 10.993896484375, 11.3758544921875, 11.7578125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 5.0, 9.0, 17.0, 24.0, 48.0, 70.0, 142.0, 207.0, 356.0, 571.0, 962.0, 1731.0, 2516.0, 4228.0, 6857.0, 10594.0, 16272.0, 25056.0, 37239.0, 54156.0, 77201.0, 106267.0, 142176.0, 183903.0, 228781.0, 273577.0, 312054.0, 339258.0, 352237.0, 349502.0, 329485.0, 293829.0, 252922.0, 209530.0, 165111.0, 124887.0, 92048.0, 66349.0, 45716.0, 31092.0, 20828.0, 13616.0, 8652.0, 5477.0, 3462.0, 2051.0, 1289.0, 766.0, 495.0, 281.0, 160.0, 113.0, 44.0, 27.0, 22.0, 13.0, 7.0, 4.0, 2.0, 3.0], "bins": [-9.421875, -9.1343994140625, -8.846923828125, -8.5594482421875, -8.27197265625, -7.9844970703125, -7.697021484375, -7.4095458984375, -7.1220703125, -6.8345947265625, -6.547119140625, -6.2596435546875, -5.97216796875, -5.6846923828125, -5.397216796875, -5.1097412109375, -4.822265625, -4.5347900390625, -4.247314453125, -3.9598388671875, -3.67236328125, -3.3848876953125, -3.097412109375, -2.8099365234375, -2.5224609375, -2.2349853515625, -1.947509765625, -1.6600341796875, -1.37255859375, -1.0850830078125, -0.797607421875, -0.5101318359375, -0.22265625, 0.0648193359375, 0.352294921875, 0.6397705078125, 0.92724609375, 1.2147216796875, 1.502197265625, 1.7896728515625, 2.0771484375, 2.3646240234375, 2.652099609375, 2.9395751953125, 3.22705078125, 3.5145263671875, 3.802001953125, 4.0894775390625, 4.376953125, 4.6644287109375, 4.951904296875, 5.2393798828125, 5.52685546875, 5.8143310546875, 6.101806640625, 6.3892822265625, 6.6767578125, 6.9642333984375, 7.251708984375, 7.5391845703125, 7.82666015625, 8.1141357421875, 8.401611328125, 8.6890869140625, 8.9765625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 10.0, 9.0, 8.0, 7.0, 8.0, 24.0, 20.0, 25.0, 25.0, 34.0, 59.0, 74.0, 79.0, 90.0, 110.0, 109.0, 148.0, 144.0, 149.0, 171.0, 171.0, 198.0, 193.0, 183.0, 170.0, 196.0, 195.0, 184.0, 169.0, 162.0, 151.0, 108.0, 102.0, 111.0, 99.0, 69.0, 76.0, 45.0, 42.0, 35.0, 38.0, 25.0, 15.0, 10.0, 12.0, 4.0, 3.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.582275390625, -5.39501953125, -5.207763671875, -5.0205078125, -4.833251953125, -4.64599609375, -4.458740234375, -4.271484375, -4.084228515625, -3.89697265625, -3.709716796875, -3.5224609375, -3.335205078125, -3.14794921875, -2.960693359375, -2.7734375, -2.586181640625, -2.39892578125, -2.211669921875, -2.0244140625, -1.837158203125, -1.64990234375, -1.462646484375, -1.275390625, -1.088134765625, -0.90087890625, -0.713623046875, -0.5263671875, -0.339111328125, -0.15185546875, 0.035400390625, 0.22265625, 0.409912109375, 0.59716796875, 0.784423828125, 0.9716796875, 1.158935546875, 1.34619140625, 1.533447265625, 1.720703125, 1.907958984375, 2.09521484375, 2.282470703125, 2.4697265625, 2.656982421875, 2.84423828125, 3.031494140625, 3.21875, 3.406005859375, 3.59326171875, 3.780517578125, 3.9677734375, 4.155029296875, 4.34228515625, 4.529541015625, 4.716796875, 4.904052734375, 5.09130859375, 5.278564453125, 5.4658203125, 5.653076171875, 5.84033203125, 6.027587890625, 6.21484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 9.0, 5.0, 10.0, 9.0, 13.0, 21.0, 28.0, 25.0, 19.0, 36.0, 19.0, 33.0, 22.0, 36.0, 46.0, 34.0, 53.0, 36.0, 46.0, 47.0, 44.0, 43.0, 48.0, 45.0, 27.0, 35.0, 25.0, 31.0, 28.0, 26.0, 18.0, 13.0, 15.0, 8.0, 10.0, 8.0, 11.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.842455863952637, -14.399292945861816, -13.95612907409668, -13.51296615600586, -13.069803237915039, -12.626640319824219, -12.183477401733398, -11.740313529968262, -11.297150611877441, -10.853987693786621, -10.410823822021484, -9.967660903930664, -9.524497985839844, -9.081335067749023, -8.638172149658203, -8.195008277893066, -7.751845359802246, -7.308682441711426, -6.865519046783447, -6.422355651855469, -5.979192733764648, -5.536029815673828, -5.09286642074585, -4.649703025817871, -4.206540107727051, -3.7633769512176514, -3.320213794708252, -2.8770506381988525, -2.433887481689453, -1.9907243251800537, -1.5475611686706543, -1.1043980121612549, -0.6612358093261719, -0.21807265281677246, 0.22509050369262695, 0.6682536602020264, 1.1114168167114258, 1.5545799732208252, 1.9977431297302246, 2.440906286239624, 2.8840694427490234, 3.327232599258423, 3.7703957557678223, 4.213559150695801, 4.656722068786621, 5.099884986877441, 5.54304838180542, 5.986211776733398, 6.429374694824219, 6.872537612915039, 7.315701007843018, 7.758864402770996, 8.202027320861816, 8.645190238952637, 9.088354110717773, 9.531517028808594, 9.974679946899414, 10.417842864990234, 10.861005783081055, 11.304169654846191, 11.747332572937012, 12.190495491027832, 12.633659362792969, 13.076822280883789, 13.51998519897461]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 7.0, 4.0, 11.0, 7.0, 16.0, 15.0, 15.0, 15.0, 10.0, 26.0, 21.0, 24.0, 28.0, 28.0, 37.0, 34.0, 45.0, 28.0, 38.0, 46.0, 34.0, 37.0, 33.0, 41.0, 27.0, 38.0, 33.0, 42.0, 28.0, 29.0, 26.0, 33.0, 15.0, 15.0, 23.0, 16.0, 13.0, 7.0, 13.0, 4.0, 7.0, 7.0, 3.0, 5.0, 2.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-15.027436256408691, -14.58669662475586, -14.145956993103027, -13.705217361450195, -13.264477729797363, -12.823738098144531, -12.3829984664917, -11.942258834838867, -11.501519203186035, -11.060779571533203, -10.620039939880371, -10.179300308227539, -9.738560676574707, -9.297821044921875, -8.857081413269043, -8.416341781616211, -7.975601673126221, -7.534862041473389, -7.094122409820557, -6.653382778167725, -6.212643146514893, -5.771903038024902, -5.33116340637207, -4.890423774719238, -4.449684143066406, -4.008944511413574, -3.568204879760742, -3.12746524810791, -2.686725616455078, -2.245985746383667, -1.805246114730835, -1.364506483078003, -0.92376708984375, -0.4830274283885956, -0.04228776693344116, 0.39845192432403564, 0.8391915559768677, 1.2799313068389893, 1.7206709384918213, 2.1614105701446533, 2.6021502017974854, 3.0428898334503174, 3.4836294651031494, 3.9243693351745605, 4.365108966827393, 4.805848598480225, 5.246588230133057, 5.687327861785889, 6.128067493438721, 6.568807125091553, 7.009546756744385, 7.450286388397217, 7.891026020050049, 8.331766128540039, 8.772505760192871, 9.213245391845703, 9.653985023498535, 10.094724655151367, 10.5354642868042, 10.976203918457031, 11.416943550109863, 11.857683181762695, 12.298422813415527, 12.73916244506836, 13.179902076721191]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 11.0, 5.0, 10.0, 10.0, 17.0, 27.0, 38.0, 43.0, 95.0, 98.0, 137.0, 218.0, 366.0, 528.0, 737.0, 1191.0, 1856.0, 2993.0, 4917.0, 7931.0, 13384.0, 22555.0, 37947.0, 63435.0, 98655.0, 141623.0, 169179.0, 159199.0, 120014.0, 78917.0, 48678.0, 29293.0, 17628.0, 10205.0, 6206.0, 3776.0, 2303.0, 1488.0, 984.0, 560.0, 406.0, 292.0, 180.0, 121.0, 87.0, 71.0, 44.0, 30.0, 21.0, 15.0, 14.0, 8.0, 10.0, 2.0, 5.0, 3.0], "bins": [-2.62109375, -2.545654296875, -2.47021484375, -2.394775390625, -2.3193359375, -2.243896484375, -2.16845703125, -2.093017578125, -2.017578125, -1.942138671875, -1.86669921875, -1.791259765625, -1.7158203125, -1.640380859375, -1.56494140625, -1.489501953125, -1.4140625, -1.338623046875, -1.26318359375, -1.187744140625, -1.1123046875, -1.036865234375, -0.96142578125, -0.885986328125, -0.810546875, -0.735107421875, -0.65966796875, -0.584228515625, -0.5087890625, -0.433349609375, -0.35791015625, -0.282470703125, -0.20703125, -0.131591796875, -0.05615234375, 0.019287109375, 0.0947265625, 0.170166015625, 0.24560546875, 0.321044921875, 0.396484375, 0.471923828125, 0.54736328125, 0.622802734375, 0.6982421875, 0.773681640625, 0.84912109375, 0.924560546875, 1.0, 1.075439453125, 1.15087890625, 1.226318359375, 1.3017578125, 1.377197265625, 1.45263671875, 1.528076171875, 1.603515625, 1.678955078125, 1.75439453125, 1.829833984375, 1.9052734375, 1.980712890625, 2.05615234375, 2.131591796875, 2.20703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 4.0, 11.0, 7.0, 16.0, 16.0, 14.0, 14.0, 11.0, 28.0, 18.0, 25.0, 29.0, 27.0, 37.0, 35.0, 44.0, 28.0, 39.0, 44.0, 35.0, 38.0, 33.0, 41.0, 26.0, 38.0, 33.0, 40.0, 29.0, 30.0, 26.0, 33.0, 13.0, 17.0, 23.0, 16.0, 13.0, 6.0, 14.0, 4.0, 7.0, 8.0, 2.0, 5.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0], "bins": [-14.96875, -14.5284423828125, -14.088134765625, -13.6478271484375, -13.20751953125, -12.7672119140625, -12.326904296875, -11.8865966796875, -11.4462890625, -11.0059814453125, -10.565673828125, -10.1253662109375, -9.68505859375, -9.2447509765625, -8.804443359375, -8.3641357421875, -7.923828125, -7.4835205078125, -7.043212890625, -6.6029052734375, -6.16259765625, -5.7222900390625, -5.281982421875, -4.8416748046875, -4.4013671875, -3.9610595703125, -3.520751953125, -3.0804443359375, -2.64013671875, -2.1998291015625, -1.759521484375, -1.3192138671875, -0.87890625, -0.4385986328125, 0.001708984375, 0.4420166015625, 0.88232421875, 1.3226318359375, 1.762939453125, 2.2032470703125, 2.6435546875, 3.0838623046875, 3.524169921875, 3.9644775390625, 4.40478515625, 4.8450927734375, 5.285400390625, 5.7257080078125, 6.166015625, 6.6063232421875, 7.046630859375, 7.4869384765625, 7.92724609375, 8.3675537109375, 8.807861328125, 9.2481689453125, 9.6884765625, 10.1287841796875, 10.569091796875, 11.0093994140625, 11.44970703125, 11.8900146484375, 12.330322265625, 12.7706298828125, 13.2109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 14.0, 11.0, 14.0, 25.0, 31.0, 48.0, 60.0, 97.0, 147.0, 195.0, 266.0, 444.0, 626.0, 980.0, 1645.0, 2580.0, 4127.0, 7111.0, 12328.0, 22252.0, 42919.0, 84027.0, 165514.0, 254747.0, 211072.0, 113449.0, 56713.0, 29325.0, 15905.0, 8613.0, 5041.0, 2981.0, 1819.0, 1143.0, 761.0, 499.0, 307.0, 196.0, 146.0, 116.0, 73.0, 47.0, 35.0, 40.0, 16.0, 17.0, 10.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.3515625, -3.245880126953125, -3.14019775390625, -3.034515380859375, -2.9288330078125, -2.823150634765625, -2.71746826171875, -2.611785888671875, -2.506103515625, -2.400421142578125, -2.29473876953125, -2.189056396484375, -2.0833740234375, -1.977691650390625, -1.87200927734375, -1.766326904296875, -1.66064453125, -1.554962158203125, -1.44927978515625, -1.343597412109375, -1.2379150390625, -1.132232666015625, -1.02655029296875, -0.920867919921875, -0.815185546875, -0.709503173828125, -0.60382080078125, -0.498138427734375, -0.3924560546875, -0.286773681640625, -0.18109130859375, -0.075408935546875, 0.0302734375, 0.135955810546875, 0.24163818359375, 0.347320556640625, 0.4530029296875, 0.558685302734375, 0.66436767578125, 0.770050048828125, 0.875732421875, 0.981414794921875, 1.08709716796875, 1.192779541015625, 1.2984619140625, 1.404144287109375, 1.50982666015625, 1.615509033203125, 1.72119140625, 1.826873779296875, 1.93255615234375, 2.038238525390625, 2.1439208984375, 2.249603271484375, 2.35528564453125, 2.460968017578125, 2.566650390625, 2.672332763671875, 2.77801513671875, 2.883697509765625, 2.9893798828125, 3.095062255859375, 3.20074462890625, 3.306427001953125, 3.412109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 2.0, 6.0, 8.0, 8.0, 8.0, 15.0, 15.0, 14.0, 28.0, 26.0, 25.0, 29.0, 32.0, 30.0, 31.0, 33.0, 37.0, 37.0, 36.0, 45.0, 50.0, 43.0, 37.0, 40.0, 38.0, 36.0, 34.0, 35.0, 35.0, 30.0, 26.0, 18.0, 10.0, 24.0, 12.0, 16.0, 2.0, 8.0, 17.0, 2.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.234375, -9.93505859375, -9.6357421875, -9.33642578125, -9.037109375, -8.73779296875, -8.4384765625, -8.13916015625, -7.83984375, -7.54052734375, -7.2412109375, -6.94189453125, -6.642578125, -6.34326171875, -6.0439453125, -5.74462890625, -5.4453125, -5.14599609375, -4.8466796875, -4.54736328125, -4.248046875, -3.94873046875, -3.6494140625, -3.35009765625, -3.05078125, -2.75146484375, -2.4521484375, -2.15283203125, -1.853515625, -1.55419921875, -1.2548828125, -0.95556640625, -0.65625, -0.35693359375, -0.0576171875, 0.24169921875, 0.541015625, 0.84033203125, 1.1396484375, 1.43896484375, 1.73828125, 2.03759765625, 2.3369140625, 2.63623046875, 2.935546875, 3.23486328125, 3.5341796875, 3.83349609375, 4.1328125, 4.43212890625, 4.7314453125, 5.03076171875, 5.330078125, 5.62939453125, 5.9287109375, 6.22802734375, 6.52734375, 6.82666015625, 7.1259765625, 7.42529296875, 7.724609375, 8.02392578125, 8.3232421875, 8.62255859375, 8.921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 10.0, 8.0, 20.0, 13.0, 35.0, 46.0, 60.0, 65.0, 120.0, 129.0, 217.0, 315.0, 451.0, 619.0, 1023.0, 1494.0, 2313.0, 3596.0, 5945.0, 10615.0, 19656.0, 41520.0, 103582.0, 284524.0, 335601.0, 132458.0, 50523.0, 23210.0, 12108.0, 6884.0, 4010.0, 2491.0, 1584.0, 1062.0, 699.0, 459.0, 312.0, 236.0, 166.0, 102.0, 85.0, 52.0, 43.0, 26.0, 30.0, 16.0, 8.0, 8.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.05078125, -1.0170135498046875, -0.983245849609375, -0.9494781494140625, -0.91571044921875, -0.8819427490234375, -0.848175048828125, -0.8144073486328125, -0.7806396484375, -0.7468719482421875, -0.713104248046875, -0.6793365478515625, -0.64556884765625, -0.6118011474609375, -0.578033447265625, -0.5442657470703125, -0.510498046875, -0.4767303466796875, -0.442962646484375, -0.4091949462890625, -0.37542724609375, -0.3416595458984375, -0.307891845703125, -0.2741241455078125, -0.2403564453125, -0.2065887451171875, -0.172821044921875, -0.1390533447265625, -0.10528564453125, -0.0715179443359375, -0.037750244140625, -0.0039825439453125, 0.02978515625, 0.0635528564453125, 0.097320556640625, 0.1310882568359375, 0.16485595703125, 0.1986236572265625, 0.232391357421875, 0.2661590576171875, 0.2999267578125, 0.3336944580078125, 0.367462158203125, 0.4012298583984375, 0.43499755859375, 0.4687652587890625, 0.502532958984375, 0.5363006591796875, 0.570068359375, 0.6038360595703125, 0.637603759765625, 0.6713714599609375, 0.70513916015625, 0.7389068603515625, 0.772674560546875, 0.8064422607421875, 0.8402099609375, 0.8739776611328125, 0.907745361328125, 0.9415130615234375, 0.97528076171875, 1.0090484619140625, 1.042816162109375, 1.0765838623046875, 1.1103515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 3.0, 6.0, 11.0, 15.0, 16.0, 12.0, 19.0, 21.0, 28.0, 33.0, 30.0, 33.0, 38.0, 29.0, 43.0, 38.0, 37.0, 39.0, 47.0, 55.0, 53.0, 50.0, 50.0, 39.0, 45.0, 32.0, 28.0, 22.0, 20.0, 18.0, 17.0, 16.0, 12.0, 12.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.43865966796875e-05, -7.17993825674057e-05, -6.92121684551239e-05, -6.66249543428421e-05, -6.40377402305603e-05, -6.14505261182785e-05, -5.8863312005996704e-05, -5.6276097893714905e-05, -5.3688883781433105e-05, -5.1101669669151306e-05, -4.851445555686951e-05, -4.592724144458771e-05, -4.334002733230591e-05, -4.075281322002411e-05, -3.816559910774231e-05, -3.557838499546051e-05, -3.299117088317871e-05, -3.040395677089691e-05, -2.7816742658615112e-05, -2.5229528546333313e-05, -2.2642314434051514e-05, -2.0055100321769714e-05, -1.7467886209487915e-05, -1.4880672097206116e-05, -1.2293457984924316e-05, -9.706243872642517e-06, -7.119029760360718e-06, -4.5318156480789185e-06, -1.944601535797119e-06, 6.426125764846802e-07, 3.2298266887664795e-06, 5.817040801048279e-06, 8.404254913330078e-06, 1.0991469025611877e-05, 1.3578683137893677e-05, 1.6165897250175476e-05, 1.8753111362457275e-05, 2.1340325474739075e-05, 2.3927539587020874e-05, 2.6514753699302673e-05, 2.9101967811584473e-05, 3.168918192386627e-05, 3.427639603614807e-05, 3.686361014842987e-05, 3.945082426071167e-05, 4.203803837299347e-05, 4.462525248527527e-05, 4.721246659755707e-05, 4.979968070983887e-05, 5.2386894822120667e-05, 5.4974108934402466e-05, 5.7561323046684265e-05, 6.0148537158966064e-05, 6.273575127124786e-05, 6.532296538352966e-05, 6.791017949581146e-05, 7.049739360809326e-05, 7.308460772037506e-05, 7.567182183265686e-05, 7.825903594493866e-05, 8.084625005722046e-05, 8.343346416950226e-05, 8.602067828178406e-05, 8.860789239406586e-05, 9.119510650634766e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 11.0, 9.0, 18.0, 17.0, 29.0, 37.0, 56.0, 81.0, 100.0, 181.0, 273.0, 402.0, 655.0, 982.0, 1503.0, 2274.0, 3771.0, 5974.0, 9914.0, 16708.0, 29238.0, 51951.0, 93278.0, 159641.0, 217307.0, 186318.0, 115471.0, 64415.0, 35859.0, 20406.0, 12121.0, 7350.0, 4518.0, 2726.0, 1702.0, 1130.0, 711.0, 470.0, 303.0, 213.0, 128.0, 82.0, 65.0, 49.0, 42.0, 14.0, 11.0, 14.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.3212890625, -1.278228759765625, -1.23516845703125, -1.192108154296875, -1.1490478515625, -1.105987548828125, -1.06292724609375, -1.019866943359375, -0.976806640625, -0.933746337890625, -0.89068603515625, -0.847625732421875, -0.8045654296875, -0.761505126953125, -0.71844482421875, -0.675384521484375, -0.63232421875, -0.589263916015625, -0.54620361328125, -0.503143310546875, -0.4600830078125, -0.417022705078125, -0.37396240234375, -0.330902099609375, -0.287841796875, -0.244781494140625, -0.20172119140625, -0.158660888671875, -0.1156005859375, -0.072540283203125, -0.02947998046875, 0.013580322265625, 0.056640625, 0.099700927734375, 0.14276123046875, 0.185821533203125, 0.2288818359375, 0.271942138671875, 0.31500244140625, 0.358062744140625, 0.401123046875, 0.444183349609375, 0.48724365234375, 0.530303955078125, 0.5733642578125, 0.616424560546875, 0.65948486328125, 0.702545166015625, 0.74560546875, 0.788665771484375, 0.83172607421875, 0.874786376953125, 0.9178466796875, 0.960906982421875, 1.00396728515625, 1.047027587890625, 1.090087890625, 1.133148193359375, 1.17620849609375, 1.219268798828125, 1.2623291015625, 1.305389404296875, 1.34844970703125, 1.391510009765625, 1.4345703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 4.0, 6.0, 5.0, 5.0, 9.0, 15.0, 10.0, 10.0, 23.0, 23.0, 29.0, 31.0, 31.0, 39.0, 46.0, 52.0, 44.0, 66.0, 49.0, 53.0, 41.0, 44.0, 59.0, 35.0, 42.0, 28.0, 27.0, 27.0, 17.0, 20.0, 14.0, 25.0, 12.0, 6.0, 11.0, 9.0, 5.0, 9.0, 7.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.4609375, -0.4478912353515625, -0.434844970703125, -0.4217987060546875, -0.40875244140625, -0.3957061767578125, -0.382659912109375, -0.3696136474609375, -0.3565673828125, -0.3435211181640625, -0.330474853515625, -0.3174285888671875, -0.30438232421875, -0.2913360595703125, -0.278289794921875, -0.2652435302734375, -0.252197265625, -0.2391510009765625, -0.226104736328125, -0.2130584716796875, -0.20001220703125, -0.1869659423828125, -0.173919677734375, -0.1608734130859375, -0.1478271484375, -0.1347808837890625, -0.121734619140625, -0.1086883544921875, -0.09564208984375, -0.0825958251953125, -0.069549560546875, -0.0565032958984375, -0.04345703125, -0.0304107666015625, -0.017364501953125, -0.0043182373046875, 0.00872802734375, 0.0217742919921875, 0.034820556640625, 0.0478668212890625, 0.0609130859375, 0.0739593505859375, 0.087005615234375, 0.1000518798828125, 0.11309814453125, 0.1261444091796875, 0.139190673828125, 0.1522369384765625, 0.165283203125, 0.1783294677734375, 0.191375732421875, 0.2044219970703125, 0.21746826171875, 0.2305145263671875, 0.243560791015625, 0.2566070556640625, 0.2696533203125, 0.2826995849609375, 0.295745849609375, 0.3087921142578125, 0.32183837890625, 0.3348846435546875, 0.347930908203125, 0.3609771728515625, 0.3740234375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 10.0, 6.0, 5.0, 10.0, 14.0, 13.0, 32.0, 24.0, 13.0, 35.0, 32.0, 22.0, 26.0, 27.0, 45.0, 41.0, 53.0, 32.0, 43.0, 55.0, 43.0, 40.0, 49.0, 43.0, 34.0, 29.0, 36.0, 27.0, 23.0, 25.0, 25.0, 16.0, 17.0, 9.0, 8.0, 13.0, 7.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.107321739196777, -14.661651611328125, -14.215982437133789, -13.770312309265137, -13.324642181396484, -12.878972053527832, -12.43330192565918, -11.987632751464844, -11.541962623596191, -11.096292495727539, -10.650623321533203, -10.20495319366455, -9.759283065795898, -9.313612937927246, -8.867942810058594, -8.422273635864258, -7.9766035079956055, -7.530933380126953, -7.085263729095459, -6.639594078063965, -6.1939239501953125, -5.74825382232666, -5.302584171295166, -4.856914520263672, -4.4112443923950195, -3.9655745029449463, -3.519904613494873, -3.0742347240448, -2.6285648345947266, -2.1828949451446533, -1.73722505569458, -1.2915551662445068, -0.8458852767944336, -0.40021538734436035, 0.04545450210571289, 0.49112439155578613, 0.9367942810058594, 1.3824641704559326, 1.8281340599060059, 2.273803949356079, 2.7194738388061523, 3.1651437282562256, 3.610813617706299, 4.056483268737793, 4.502153396606445, 4.947823524475098, 5.393493175506592, 5.839162826538086, 6.284832954406738, 6.730503082275391, 7.176172733306885, 7.621842384338379, 8.067512512207031, 8.513182640075684, 8.958852767944336, 9.404521942138672, 9.850192070007324, 10.295862197875977, 10.741531372070312, 11.187201499938965, 11.632871627807617, 12.07854175567627, 12.524211883544922, 12.969881057739258, 13.41555118560791]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 6.0, 6.0, 7.0, 6.0, 11.0, 18.0, 15.0, 15.0, 10.0, 16.0, 27.0, 20.0, 21.0, 32.0, 23.0, 41.0, 36.0, 42.0, 28.0, 39.0, 48.0, 32.0, 36.0, 37.0, 39.0, 24.0, 37.0, 34.0, 41.0, 28.0, 31.0, 21.0, 32.0, 17.0, 16.0, 18.0, 19.0, 12.0, 8.0, 10.0, 6.0, 5.0, 9.0, 2.0, 5.0, 2.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0], "bins": [-14.735434532165527, -14.299111366271973, -13.862788200378418, -13.426465034484863, -12.990141868591309, -12.553818702697754, -12.1174955368042, -11.681172370910645, -11.24484920501709, -10.808526039123535, -10.37220287322998, -9.935879707336426, -9.499556541442871, -9.063233375549316, -8.626910209655762, -8.190587043762207, -7.754263877868652, -7.317940711975098, -6.881617546081543, -6.445294380187988, -6.008971214294434, -5.572648048400879, -5.136324882507324, -4.7000017166137695, -4.263678550720215, -3.82735538482666, -3.3910322189331055, -2.954709053039551, -2.518385887145996, -2.0820627212524414, -1.6457395553588867, -1.209416389465332, -0.7730932235717773, -0.33677005767822266, 0.09955310821533203, 0.5358762741088867, 0.9721994400024414, 1.408522605895996, 1.8448457717895508, 2.2811689376831055, 2.71749210357666, 3.153815269470215, 3.5901384353637695, 4.026461601257324, 4.462784767150879, 4.899107933044434, 5.335431098937988, 5.771754264831543, 6.208077430725098, 6.644400596618652, 7.080723762512207, 7.517046928405762, 7.953370094299316, 8.389693260192871, 8.826016426086426, 9.26233959197998, 9.698662757873535, 10.13498592376709, 10.571309089660645, 11.0076322555542, 11.443955421447754, 11.880278587341309, 12.316601753234863, 12.752924919128418, 13.189248085021973]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 8.0, 19.0, 29.0, 37.0, 61.0, 117.0, 167.0, 258.0, 407.0, 617.0, 1092.0, 1642.0, 2493.0, 3833.0, 5758.0, 8343.0, 11899.0, 16830.0, 22943.0, 30347.0, 39371.0, 49002.0, 58827.0, 68143.0, 75995.0, 80996.0, 82823.0, 81408.0, 76320.0, 69221.0, 59819.0, 49689.0, 40177.0, 31087.0, 23533.0, 16906.0, 12465.0, 8593.0, 5859.0, 4034.0, 2647.0, 1677.0, 1103.0, 769.0, 440.0, 276.0, 200.0, 112.0, 65.0, 44.0, 24.0, 18.0, 13.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.0234375, -7.7607421875, -7.498046875, -7.2353515625, -6.97265625, -6.7099609375, -6.447265625, -6.1845703125, -5.921875, -5.6591796875, -5.396484375, -5.1337890625, -4.87109375, -4.6083984375, -4.345703125, -4.0830078125, -3.8203125, -3.5576171875, -3.294921875, -3.0322265625, -2.76953125, -2.5068359375, -2.244140625, -1.9814453125, -1.71875, -1.4560546875, -1.193359375, -0.9306640625, -0.66796875, -0.4052734375, -0.142578125, 0.1201171875, 0.3828125, 0.6455078125, 0.908203125, 1.1708984375, 1.43359375, 1.6962890625, 1.958984375, 2.2216796875, 2.484375, 2.7470703125, 3.009765625, 3.2724609375, 3.53515625, 3.7978515625, 4.060546875, 4.3232421875, 4.5859375, 4.8486328125, 5.111328125, 5.3740234375, 5.63671875, 5.8994140625, 6.162109375, 6.4248046875, 6.6875, 6.9501953125, 7.212890625, 7.4755859375, 7.73828125, 8.0009765625, 8.263671875, 8.5263671875, 8.7890625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 5.0, 6.0, 9.0, 5.0, 13.0, 15.0, 16.0, 16.0, 8.0, 19.0, 26.0, 23.0, 19.0, 31.0, 24.0, 40.0, 41.0, 39.0, 27.0, 44.0, 41.0, 35.0, 31.0, 40.0, 36.0, 28.0, 39.0, 34.0, 36.0, 28.0, 31.0, 24.0, 30.0, 17.0, 17.0, 21.0, 13.0, 14.0, 8.0, 9.0, 4.0, 6.0, 10.0, 1.0, 6.0, 2.0, 2.0, 5.0, 1.0, 4.0, 0.0, 1.0], "bins": [-14.2265625, -13.8043212890625, -13.382080078125, -12.9598388671875, -12.53759765625, -12.1153564453125, -11.693115234375, -11.2708740234375, -10.8486328125, -10.4263916015625, -10.004150390625, -9.5819091796875, -9.15966796875, -8.7374267578125, -8.315185546875, -7.8929443359375, -7.470703125, -7.0484619140625, -6.626220703125, -6.2039794921875, -5.78173828125, -5.3594970703125, -4.937255859375, -4.5150146484375, -4.0927734375, -3.6705322265625, -3.248291015625, -2.8260498046875, -2.40380859375, -1.9815673828125, -1.559326171875, -1.1370849609375, -0.71484375, -0.2926025390625, 0.129638671875, 0.5518798828125, 0.97412109375, 1.3963623046875, 1.818603515625, 2.2408447265625, 2.6630859375, 3.0853271484375, 3.507568359375, 3.9298095703125, 4.35205078125, 4.7742919921875, 5.196533203125, 5.6187744140625, 6.041015625, 6.4632568359375, 6.885498046875, 7.3077392578125, 7.72998046875, 8.1522216796875, 8.574462890625, 8.9967041015625, 9.4189453125, 9.8411865234375, 10.263427734375, 10.6856689453125, 11.10791015625, 11.5301513671875, 11.952392578125, 12.3746337890625, 12.796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 14.0, 16.0, 19.0, 53.0, 74.0, 107.0, 173.0, 276.0, 447.0, 685.0, 1120.0, 1717.0, 2591.0, 4050.0, 5881.0, 8862.0, 12879.0, 17502.0, 24331.0, 32832.0, 42320.0, 52565.0, 63238.0, 73118.0, 80722.0, 85583.0, 85495.0, 82584.0, 75799.0, 66525.0, 56174.0, 45300.0, 35871.0, 26397.0, 19757.0, 14161.0, 9851.0, 6666.0, 4552.0, 2850.0, 1940.0, 1259.0, 840.0, 506.0, 300.0, 229.0, 139.0, 73.0, 38.0, 30.0, 18.0, 15.0, 10.0, 4.0, 2.0, 2.0], "bins": [-9.421875, -9.14599609375, -8.8701171875, -8.59423828125, -8.318359375, -8.04248046875, -7.7666015625, -7.49072265625, -7.21484375, -6.93896484375, -6.6630859375, -6.38720703125, -6.111328125, -5.83544921875, -5.5595703125, -5.28369140625, -5.0078125, -4.73193359375, -4.4560546875, -4.18017578125, -3.904296875, -3.62841796875, -3.3525390625, -3.07666015625, -2.80078125, -2.52490234375, -2.2490234375, -1.97314453125, -1.697265625, -1.42138671875, -1.1455078125, -0.86962890625, -0.59375, -0.31787109375, -0.0419921875, 0.23388671875, 0.509765625, 0.78564453125, 1.0615234375, 1.33740234375, 1.61328125, 1.88916015625, 2.1650390625, 2.44091796875, 2.716796875, 2.99267578125, 3.2685546875, 3.54443359375, 3.8203125, 4.09619140625, 4.3720703125, 4.64794921875, 4.923828125, 5.19970703125, 5.4755859375, 5.75146484375, 6.02734375, 6.30322265625, 6.5791015625, 6.85498046875, 7.130859375, 7.40673828125, 7.6826171875, 7.95849609375, 8.234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 2.0, 6.0, 8.0, 3.0, 5.0, 8.0, 10.0, 12.0, 13.0, 22.0, 18.0, 13.0, 19.0, 16.0, 19.0, 26.0, 30.0, 37.0, 32.0, 40.0, 37.0, 40.0, 32.0, 45.0, 41.0, 38.0, 30.0, 27.0, 38.0, 41.0, 28.0, 21.0, 28.0, 26.0, 31.0, 29.0, 18.0, 16.0, 13.0, 8.0, 15.0, 10.0, 10.0, 10.0, 4.0, 5.0, 5.0, 9.0, 3.0, 3.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0], "bins": [-8.78125, -8.5059814453125, -8.230712890625, -7.9554443359375, -7.68017578125, -7.4049072265625, -7.129638671875, -6.8543701171875, -6.5791015625, -6.3038330078125, -6.028564453125, -5.7532958984375, -5.47802734375, -5.2027587890625, -4.927490234375, -4.6522216796875, -4.376953125, -4.1016845703125, -3.826416015625, -3.5511474609375, -3.27587890625, -3.0006103515625, -2.725341796875, -2.4500732421875, -2.1748046875, -1.8995361328125, -1.624267578125, -1.3489990234375, -1.07373046875, -0.7984619140625, -0.523193359375, -0.2479248046875, 0.02734375, 0.3026123046875, 0.577880859375, 0.8531494140625, 1.12841796875, 1.4036865234375, 1.678955078125, 1.9542236328125, 2.2294921875, 2.5047607421875, 2.780029296875, 3.0552978515625, 3.33056640625, 3.6058349609375, 3.881103515625, 4.1563720703125, 4.431640625, 4.7069091796875, 4.982177734375, 5.2574462890625, 5.53271484375, 5.8079833984375, 6.083251953125, 6.3585205078125, 6.6337890625, 6.9090576171875, 7.184326171875, 7.4595947265625, 7.73486328125, 8.0101318359375, 8.285400390625, 8.5606689453125, 8.8359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 7.0, 4.0, 8.0, 15.0, 22.0, 26.0, 36.0, 78.0, 118.0, 194.0, 357.0, 590.0, 947.0, 1530.0, 2666.0, 4620.0, 7813.0, 13266.0, 21062.0, 33146.0, 50152.0, 71311.0, 94147.0, 113610.0, 124790.0, 122699.0, 109077.0, 88364.0, 65476.0, 45633.0, 29822.0, 18851.0, 11402.0, 6815.0, 4098.0, 2435.0, 1373.0, 817.0, 438.0, 292.0, 165.0, 102.0, 80.0, 33.0, 22.0, 17.0, 7.0, 7.0, 11.0, 4.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-5.86328125, -5.6793212890625, -5.495361328125, -5.3114013671875, -5.12744140625, -4.9434814453125, -4.759521484375, -4.5755615234375, -4.3916015625, -4.2076416015625, -4.023681640625, -3.8397216796875, -3.65576171875, -3.4718017578125, -3.287841796875, -3.1038818359375, -2.919921875, -2.7359619140625, -2.552001953125, -2.3680419921875, -2.18408203125, -2.0001220703125, -1.816162109375, -1.6322021484375, -1.4482421875, -1.2642822265625, -1.080322265625, -0.8963623046875, -0.71240234375, -0.5284423828125, -0.344482421875, -0.1605224609375, 0.0234375, 0.2073974609375, 0.391357421875, 0.5753173828125, 0.75927734375, 0.9432373046875, 1.127197265625, 1.3111572265625, 1.4951171875, 1.6790771484375, 1.863037109375, 2.0469970703125, 2.23095703125, 2.4149169921875, 2.598876953125, 2.7828369140625, 2.966796875, 3.1507568359375, 3.334716796875, 3.5186767578125, 3.70263671875, 3.8865966796875, 4.070556640625, 4.2545166015625, 4.4384765625, 4.6224365234375, 4.806396484375, 4.9903564453125, 5.17431640625, 5.3582763671875, 5.542236328125, 5.7261962890625, 5.91015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 5.0, 6.0, 7.0, 12.0, 16.0, 34.0, 24.0, 23.0, 30.0, 35.0, 29.0, 25.0, 36.0, 47.0, 42.0, 35.0, 52.0, 49.0, 44.0, 46.0, 43.0, 51.0, 50.0, 35.0, 28.0, 24.0, 29.0, 18.0, 16.0, 17.0, 12.0, 12.0, 7.0, 6.0, 5.0, 4.0, 12.0, 5.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0007319450378417969, -0.0007120594382286072, -0.0006921738386154175, -0.0006722882390022278, -0.0006524026393890381, -0.0006325170397758484, -0.0006126314401626587, -0.000592745840549469, -0.0005728602409362793, -0.0005529746413230896, -0.0005330890417098999, -0.0005132034420967102, -0.0004933178424835205, -0.0004734322428703308, -0.0004535466432571411, -0.0004336610436439514, -0.0004137754440307617, -0.000393889844417572, -0.0003740042448043823, -0.0003541186451911926, -0.00033423304557800293, -0.00031434744596481323, -0.00029446184635162354, -0.00027457624673843384, -0.00025469064712524414, -0.00023480504751205444, -0.00021491944789886475, -0.00019503384828567505, -0.00017514824867248535, -0.00015526264905929565, -0.00013537704944610596, -0.00011549144983291626, -9.560585021972656e-05, -7.572025060653687e-05, -5.583465099334717e-05, -3.594905138015747e-05, -1.6063451766967773e-05, 3.822147846221924e-06, 2.370774745941162e-05, 4.359334707260132e-05, 6.347894668579102e-05, 8.336454629898071e-05, 0.00010325014591217041, 0.0001231357455253601, 0.0001430213451385498, 0.0001629069447517395, 0.0001827925443649292, 0.0002026781439781189, 0.0002225637435913086, 0.0002424493432044983, 0.000262334942817688, 0.0002822205424308777, 0.0003021061420440674, 0.0003219917416572571, 0.0003418773412704468, 0.0003617629408836365, 0.00038164854049682617, 0.00040153414011001587, 0.00042141973972320557, 0.00044130533933639526, 0.00046119093894958496, 0.00048107653856277466, 0.0005009621381759644, 0.000520847737789154, 0.0005407333374023438]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 10.0, 9.0, 15.0, 36.0, 46.0, 67.0, 139.0, 190.0, 279.0, 462.0, 774.0, 1268.0, 2224.0, 3698.0, 6224.0, 10457.0, 17360.0, 28400.0, 44084.0, 66103.0, 92241.0, 116281.0, 132643.0, 132311.0, 117156.0, 92764.0, 66346.0, 45050.0, 28429.0, 17421.0, 10578.0, 6177.0, 3780.0, 2196.0, 1301.0, 788.0, 433.0, 292.0, 182.0, 114.0, 84.0, 47.0, 34.0, 24.0, 13.0, 12.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2578125, -7.03106689453125, -6.8043212890625, -6.57757568359375, -6.350830078125, -6.12408447265625, -5.8973388671875, -5.67059326171875, -5.44384765625, -5.21710205078125, -4.9903564453125, -4.76361083984375, -4.536865234375, -4.31011962890625, -4.0833740234375, -3.85662841796875, -3.6298828125, -3.40313720703125, -3.1763916015625, -2.94964599609375, -2.722900390625, -2.49615478515625, -2.2694091796875, -2.04266357421875, -1.81591796875, -1.58917236328125, -1.3624267578125, -1.13568115234375, -0.908935546875, -0.68218994140625, -0.4554443359375, -0.22869873046875, -0.001953125, 0.22479248046875, 0.4515380859375, 0.67828369140625, 0.905029296875, 1.13177490234375, 1.3585205078125, 1.58526611328125, 1.81201171875, 2.03875732421875, 2.2655029296875, 2.49224853515625, 2.718994140625, 2.94573974609375, 3.1724853515625, 3.39923095703125, 3.6259765625, 3.85272216796875, 4.0794677734375, 4.30621337890625, 4.532958984375, 4.75970458984375, 4.9864501953125, 5.21319580078125, 5.43994140625, 5.66668701171875, 5.8934326171875, 6.12017822265625, 6.346923828125, 6.57366943359375, 6.8004150390625, 7.02716064453125, 7.25390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 2.0, 7.0, 9.0, 6.0, 7.0, 14.0, 16.0, 13.0, 26.0, 31.0, 26.0, 33.0, 36.0, 22.0, 46.0, 39.0, 59.0, 39.0, 64.0, 46.0, 56.0, 48.0, 32.0, 37.0, 41.0, 33.0, 24.0, 20.0, 20.0, 30.0, 21.0, 18.0, 11.0, 15.0, 5.0, 6.0, 7.0, 7.0, 1.0, 8.0, 8.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3359375, -2.249359130859375, -2.16278076171875, -2.076202392578125, -1.9896240234375, -1.903045654296875, -1.81646728515625, -1.729888916015625, -1.643310546875, -1.556732177734375, -1.47015380859375, -1.383575439453125, -1.2969970703125, -1.210418701171875, -1.12384033203125, -1.037261962890625, -0.95068359375, -0.864105224609375, -0.77752685546875, -0.690948486328125, -0.6043701171875, -0.517791748046875, -0.43121337890625, -0.344635009765625, -0.258056640625, -0.171478271484375, -0.08489990234375, 0.001678466796875, 0.0882568359375, 0.174835205078125, 0.26141357421875, 0.347991943359375, 0.4345703125, 0.521148681640625, 0.60772705078125, 0.694305419921875, 0.7808837890625, 0.867462158203125, 0.95404052734375, 1.040618896484375, 1.127197265625, 1.213775634765625, 1.30035400390625, 1.386932373046875, 1.4735107421875, 1.560089111328125, 1.64666748046875, 1.733245849609375, 1.81982421875, 1.906402587890625, 1.99298095703125, 2.079559326171875, 2.1661376953125, 2.252716064453125, 2.33929443359375, 2.425872802734375, 2.512451171875, 2.599029541015625, 2.68560791015625, 2.772186279296875, 2.8587646484375, 2.945343017578125, 3.03192138671875, 3.118499755859375, 3.205078125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 3.0, 3.0, 4.0, 8.0, 6.0, 12.0, 11.0, 19.0, 14.0, 26.0, 19.0, 18.0, 21.0, 34.0, 27.0, 36.0, 38.0, 52.0, 28.0, 48.0, 38.0, 37.0, 42.0, 59.0, 41.0, 22.0, 30.0, 23.0, 42.0, 33.0, 33.0, 23.0, 26.0, 21.0, 17.0, 17.0, 8.0, 10.0, 4.0, 14.0, 4.0, 9.0, 3.0, 6.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-13.258090019226074, -12.842058181762695, -12.426026344299316, -12.009994506835938, -11.593961715698242, -11.17793083190918, -10.761898040771484, -10.345866203308105, -9.929834365844727, -9.513802528381348, -9.097770690917969, -8.68173885345459, -8.265707015991211, -7.849674701690674, -7.433642387390137, -7.017610549926758, -6.601578712463379, -6.185546875, -5.769515037536621, -5.353482723236084, -4.937450885772705, -4.521419048309326, -4.105386734008789, -3.68935489654541, -3.2733230590820312, -2.8572912216186523, -2.4412591457366943, -2.0252270698547363, -1.6091952323913574, -1.1931633949279785, -0.7771313190460205, -0.3610992431640625, 0.05493354797363281, 0.47096550464630127, 0.8869974613189697, 1.3030294179916382, 1.7190613746643066, 2.1350932121276855, 2.5511252880096436, 2.9671573638916016, 3.3831892013549805, 3.7992210388183594, 4.215252876281738, 4.631285190582275, 5.047317028045654, 5.463348865509033, 5.87938117980957, 6.295413017272949, 6.711444854736328, 7.127476692199707, 7.543508529663086, 7.959540843963623, 8.375572204589844, 8.791604995727539, 9.207636833190918, 9.623668670654297, 10.039700508117676, 10.455732345581055, 10.871764183044434, 11.287796020507812, 11.703828811645508, 12.11985969543457, 12.535892486572266, 12.951924324035645, 13.367956161499023]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 7.0, 14.0, 10.0, 9.0, 7.0, 16.0, 19.0, 20.0, 23.0, 32.0, 29.0, 34.0, 39.0, 34.0, 35.0, 41.0, 40.0, 48.0, 36.0, 40.0, 41.0, 42.0, 44.0, 30.0, 33.0, 32.0, 32.0, 20.0, 28.0, 34.0, 19.0, 14.0, 18.0, 14.0, 9.0, 11.0, 8.0, 12.0, 8.0, 5.0, 3.0, 2.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.291322708129883, -16.76630401611328, -16.24128532409668, -15.716267585754395, -15.19124984741211, -14.666231155395508, -14.141212463378906, -13.616193771362305, -13.09117603302002, -12.566157341003418, -12.041139602661133, -11.516120910644531, -10.99110221862793, -10.466084480285645, -9.941065788269043, -9.416048049926758, -8.891029357910156, -8.366010665893555, -7.8409929275512695, -7.315974235534668, -6.790956020355225, -6.265937805175781, -5.74091911315918, -5.215900897979736, -4.690882682800293, -4.16586446762085, -3.640846014022827, -3.1158275604248047, -2.5908093452453613, -2.065791130065918, -1.5407726764678955, -1.015754222869873, -0.4907341003417969, 0.034284234046936035, 0.559302568435669, 1.0843209028244019, 1.6093392372131348, 2.134357452392578, 2.6593759059906006, 3.184394359588623, 3.7094125747680664, 4.23443078994751, 4.759449005126953, 5.284467697143555, 5.809485912322998, 6.334504127502441, 6.859522819519043, 7.384541034698486, 7.90955924987793, 8.434577941894531, 8.959595680236816, 9.484614372253418, 10.009632110595703, 10.534650802612305, 11.059669494628906, 11.584688186645508, 12.109705924987793, 12.634724617004395, 13.15974235534668, 13.684761047363281, 14.209779739379883, 14.734797477722168, 15.25981616973877, 15.784833908081055, 16.309852600097656]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 13.0, 16.0, 31.0, 51.0, 80.0, 152.0, 276.0, 433.0, 752.0, 1155.0, 2019.0, 3200.0, 5238.0, 8559.0, 13725.0, 21975.0, 34273.0, 52779.0, 79661.0, 115385.0, 163294.0, 221825.0, 286427.0, 346657.0, 396866.0, 420381.0, 414759.0, 380040.0, 324291.0, 261537.0, 199834.0, 144823.0, 101632.0, 69022.0, 45499.0, 29265.0, 18749.0, 11620.0, 6982.0, 4385.0, 2683.0, 1605.0, 939.0, 609.0, 349.0, 193.0, 107.0, 77.0, 27.0, 13.0, 7.0, 9.0, 3.0, 2.0, 0.0, 3.0], "bins": [-11.703125, -11.3570556640625, -11.010986328125, -10.6649169921875, -10.31884765625, -9.9727783203125, -9.626708984375, -9.2806396484375, -8.9345703125, -8.5885009765625, -8.242431640625, -7.8963623046875, -7.55029296875, -7.2042236328125, -6.858154296875, -6.5120849609375, -6.166015625, -5.8199462890625, -5.473876953125, -5.1278076171875, -4.78173828125, -4.4356689453125, -4.089599609375, -3.7435302734375, -3.3974609375, -3.0513916015625, -2.705322265625, -2.3592529296875, -2.01318359375, -1.6671142578125, -1.321044921875, -0.9749755859375, -0.62890625, -0.2828369140625, 0.063232421875, 0.4093017578125, 0.75537109375, 1.1014404296875, 1.447509765625, 1.7935791015625, 2.1396484375, 2.4857177734375, 2.831787109375, 3.1778564453125, 3.52392578125, 3.8699951171875, 4.216064453125, 4.5621337890625, 4.908203125, 5.2542724609375, 5.600341796875, 5.9464111328125, 6.29248046875, 6.6385498046875, 6.984619140625, 7.3306884765625, 7.6767578125, 8.0228271484375, 8.368896484375, 8.7149658203125, 9.06103515625, 9.4071044921875, 9.753173828125, 10.0992431640625, 10.4453125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 1.0, 4.0, 5.0, 13.0, 10.0, 12.0, 9.0, 14.0, 17.0, 18.0, 26.0, 20.0, 33.0, 37.0, 36.0, 35.0, 41.0, 40.0, 36.0, 44.0, 37.0, 40.0, 40.0, 44.0, 43.0, 34.0, 29.0, 36.0, 28.0, 25.0, 29.0, 28.0, 25.0, 13.0, 21.0, 14.0, 9.0, 14.0, 9.0, 8.0, 11.0, 2.0, 6.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.640625, -16.1405029296875, -15.640380859375, -15.1402587890625, -14.64013671875, -14.1400146484375, -13.639892578125, -13.1397705078125, -12.6396484375, -12.1395263671875, -11.639404296875, -11.1392822265625, -10.63916015625, -10.1390380859375, -9.638916015625, -9.1387939453125, -8.638671875, -8.1385498046875, -7.638427734375, -7.1383056640625, -6.63818359375, -6.1380615234375, -5.637939453125, -5.1378173828125, -4.6376953125, -4.1375732421875, -3.637451171875, -3.1373291015625, -2.63720703125, -2.1370849609375, -1.636962890625, -1.1368408203125, -0.63671875, -0.1365966796875, 0.363525390625, 0.8636474609375, 1.36376953125, 1.8638916015625, 2.364013671875, 2.8641357421875, 3.3642578125, 3.8643798828125, 4.364501953125, 4.8646240234375, 5.36474609375, 5.8648681640625, 6.364990234375, 6.8651123046875, 7.365234375, 7.8653564453125, 8.365478515625, 8.8656005859375, 9.36572265625, 9.8658447265625, 10.365966796875, 10.8660888671875, 11.3662109375, 11.8663330078125, 12.366455078125, 12.8665771484375, 13.36669921875, 13.8668212890625, 14.366943359375, 14.8670654296875, 15.3671875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 7.0, 7.0, 14.0, 25.0, 34.0, 53.0, 121.0, 191.0, 353.0, 655.0, 1203.0, 2167.0, 3832.0, 6636.0, 11559.0, 19142.0, 31728.0, 49772.0, 78039.0, 114268.0, 164527.0, 224435.0, 288965.0, 350191.0, 397964.0, 423063.0, 418344.0, 383523.0, 329341.0, 268393.0, 202582.0, 146636.0, 101859.0, 66578.0, 43006.0, 26696.0, 16006.0, 9711.0, 5518.0, 3104.0, 1828.0, 976.0, 576.0, 303.0, 162.0, 93.0, 48.0, 33.0, 16.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4453125, -11.0616455078125, -10.677978515625, -10.2943115234375, -9.91064453125, -9.5269775390625, -9.143310546875, -8.7596435546875, -8.3759765625, -7.9923095703125, -7.608642578125, -7.2249755859375, -6.84130859375, -6.4576416015625, -6.073974609375, -5.6903076171875, -5.306640625, -4.9229736328125, -4.539306640625, -4.1556396484375, -3.77197265625, -3.3883056640625, -3.004638671875, -2.6209716796875, -2.2373046875, -1.8536376953125, -1.469970703125, -1.0863037109375, -0.70263671875, -0.3189697265625, 0.064697265625, 0.4483642578125, 0.83203125, 1.2156982421875, 1.599365234375, 1.9830322265625, 2.36669921875, 2.7503662109375, 3.134033203125, 3.5177001953125, 3.9013671875, 4.2850341796875, 4.668701171875, 5.0523681640625, 5.43603515625, 5.8197021484375, 6.203369140625, 6.5870361328125, 6.970703125, 7.3543701171875, 7.738037109375, 8.1217041015625, 8.50537109375, 8.8890380859375, 9.272705078125, 9.6563720703125, 10.0400390625, 10.4237060546875, 10.807373046875, 11.1910400390625, 11.57470703125, 11.9583740234375, 12.342041015625, 12.7257080078125, 13.109375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 16.0, 15.0, 22.0, 27.0, 35.0, 34.0, 43.0, 61.0, 80.0, 76.0, 90.0, 100.0, 110.0, 162.0, 156.0, 133.0, 184.0, 193.0, 195.0, 190.0, 190.0, 213.0, 191.0, 201.0, 147.0, 175.0, 152.0, 126.0, 131.0, 124.0, 89.0, 72.0, 68.0, 52.0, 53.0, 29.0, 35.0, 29.0, 20.0, 16.0, 9.0, 7.0, 6.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.625, -6.41522216796875, -6.2054443359375, -5.99566650390625, -5.785888671875, -5.57611083984375, -5.3663330078125, -5.15655517578125, -4.94677734375, -4.73699951171875, -4.5272216796875, -4.31744384765625, -4.107666015625, -3.89788818359375, -3.6881103515625, -3.47833251953125, -3.2685546875, -3.05877685546875, -2.8489990234375, -2.63922119140625, -2.429443359375, -2.21966552734375, -2.0098876953125, -1.80010986328125, -1.59033203125, -1.38055419921875, -1.1707763671875, -0.96099853515625, -0.751220703125, -0.54144287109375, -0.3316650390625, -0.12188720703125, 0.087890625, 0.29766845703125, 0.5074462890625, 0.71722412109375, 0.927001953125, 1.13677978515625, 1.3465576171875, 1.55633544921875, 1.76611328125, 1.97589111328125, 2.1856689453125, 2.39544677734375, 2.605224609375, 2.81500244140625, 3.0247802734375, 3.23455810546875, 3.4443359375, 3.65411376953125, 3.8638916015625, 4.07366943359375, 4.283447265625, 4.49322509765625, 4.7030029296875, 4.91278076171875, 5.12255859375, 5.33233642578125, 5.5421142578125, 5.75189208984375, 5.961669921875, 6.17144775390625, 6.3812255859375, 6.59100341796875, 6.80078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 8.0, 10.0, 12.0, 10.0, 13.0, 10.0, 18.0, 24.0, 35.0, 29.0, 31.0, 30.0, 32.0, 35.0, 32.0, 42.0, 47.0, 33.0, 39.0, 42.0, 49.0, 42.0, 33.0, 37.0, 36.0, 27.0, 40.0, 22.0, 21.0, 25.0, 15.0, 19.0, 15.0, 13.0, 15.0, 9.0, 7.0, 7.0, 4.0, 2.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.516847610473633, -13.0610933303833, -12.605339050292969, -12.149584770202637, -11.693830490112305, -11.238077163696289, -10.782322883605957, -10.326568603515625, -9.870814323425293, -9.415060043334961, -8.959305763244629, -8.503551483154297, -8.047798156738281, -7.592043399810791, -7.136289596557617, -6.680535316467285, -6.224781036376953, -5.769026756286621, -5.313272476196289, -4.857518672943115, -4.401764392852783, -3.946010112762451, -3.4902560710906982, -3.0345020294189453, -2.5787477493286133, -2.1229934692382812, -1.6672394275665283, -1.2114852666854858, -0.7557311058044434, -0.29997682571411133, 0.1557772159576416, 0.6115312576293945, 1.0672845840454102, 1.5230387449264526, 1.9787929058074951, 2.434546947479248, 2.89030122756958, 3.346055507659912, 3.801809549331665, 4.257563591003418, 4.71331787109375, 5.169072151184082, 5.624826431274414, 6.080580234527588, 6.53633451461792, 6.992088794708252, 7.447842597961426, 7.903596878051758, 8.35935115814209, 8.815105438232422, 9.270859718322754, 9.726613998413086, 10.182367324829102, 10.63812255859375, 11.093875885009766, 11.549630165100098, 12.00538444519043, 12.461138725280762, 12.916893005371094, 13.372647285461426, 13.828401565551758, 14.284154891967773, 14.739909172058105, 15.195663452148438, 15.65141773223877]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 3.0, 8.0, 13.0, 7.0, 13.0, 11.0, 15.0, 9.0, 17.0, 18.0, 23.0, 23.0, 32.0, 24.0, 36.0, 33.0, 28.0, 27.0, 36.0, 33.0, 45.0, 32.0, 37.0, 36.0, 33.0, 41.0, 33.0, 34.0, 39.0, 33.0, 18.0, 29.0, 25.0, 26.0, 19.0, 14.0, 17.0, 9.0, 14.0, 12.0, 8.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-16.059412002563477, -15.555341720581055, -15.051271438598633, -14.547201156616211, -14.043130874633789, -13.539060592651367, -13.034990310668945, -12.530920028686523, -12.026849746704102, -11.52277946472168, -11.018709182739258, -10.514638900756836, -10.010568618774414, -9.506498336791992, -9.00242805480957, -8.498357772827148, -7.99428653717041, -7.490216255187988, -6.986145973205566, -6.4820756912231445, -5.978005409240723, -5.473935127258301, -4.969864368438721, -4.465794086456299, -3.961723804473877, -3.457653522491455, -2.953583240509033, -2.4495127201080322, -1.9454424381256104, -1.4413721561431885, -0.9373016357421875, -0.4332313537597656, 0.07083892822265625, 0.5749092698097229, 1.0789796113967896, 1.583050012588501, 2.087120294570923, 2.5911905765533447, 3.0952610969543457, 3.5993313789367676, 4.1034016609191895, 4.607471942901611, 5.111542224884033, 5.615612983703613, 6.119683265686035, 6.623753547668457, 7.127823829650879, 7.631894111633301, 8.135964393615723, 8.640034675598145, 9.144104957580566, 9.648175239562988, 10.15224552154541, 10.656315803527832, 11.16038703918457, 11.664457321166992, 12.168527603149414, 12.672597885131836, 13.176668167114258, 13.68073844909668, 14.184808731079102, 14.688879013061523, 15.192949295043945, 15.697019577026367, 16.20108985900879]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 9.0, 8.0, 15.0, 15.0, 33.0, 37.0, 58.0, 80.0, 100.0, 154.0, 224.0, 282.0, 488.0, 748.0, 1088.0, 1733.0, 2764.0, 4532.0, 7364.0, 12160.0, 21267.0, 37250.0, 66425.0, 113794.0, 176085.0, 203993.0, 160643.0, 100624.0, 57446.0, 32476.0, 18446.0, 10736.0, 6435.0, 3870.0, 2524.0, 1560.0, 990.0, 655.0, 480.0, 294.0, 205.0, 131.0, 109.0, 72.0, 46.0, 44.0, 29.0, 13.0, 12.0, 5.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0], "bins": [-3.669921875, -3.559967041015625, -3.45001220703125, -3.340057373046875, -3.2301025390625, -3.120147705078125, -3.01019287109375, -2.900238037109375, -2.790283203125, -2.680328369140625, -2.57037353515625, -2.460418701171875, -2.3504638671875, -2.240509033203125, -2.13055419921875, -2.020599365234375, -1.91064453125, -1.800689697265625, -1.69073486328125, -1.580780029296875, -1.4708251953125, -1.360870361328125, -1.25091552734375, -1.140960693359375, -1.031005859375, -0.921051025390625, -0.81109619140625, -0.701141357421875, -0.5911865234375, -0.481231689453125, -0.37127685546875, -0.261322021484375, -0.1513671875, -0.041412353515625, 0.06854248046875, 0.178497314453125, 0.2884521484375, 0.398406982421875, 0.50836181640625, 0.618316650390625, 0.728271484375, 0.838226318359375, 0.94818115234375, 1.058135986328125, 1.1680908203125, 1.278045654296875, 1.38800048828125, 1.497955322265625, 1.60791015625, 1.717864990234375, 1.82781982421875, 1.937774658203125, 2.0477294921875, 2.157684326171875, 2.26763916015625, 2.377593994140625, 2.487548828125, 2.597503662109375, 2.70745849609375, 2.817413330078125, 2.9273681640625, 3.037322998046875, 3.14727783203125, 3.257232666015625, 3.3671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 3.0, 8.0, 13.0, 7.0, 13.0, 10.0, 16.0, 9.0, 18.0, 17.0, 22.0, 24.0, 32.0, 25.0, 38.0, 31.0, 30.0, 24.0, 36.0, 35.0, 43.0, 31.0, 37.0, 39.0, 31.0, 40.0, 38.0, 31.0, 41.0, 31.0, 18.0, 29.0, 24.0, 26.0, 19.0, 15.0, 16.0, 10.0, 13.0, 12.0, 7.0, 8.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-16.078125, -15.572509765625, -15.06689453125, -14.561279296875, -14.0556640625, -13.550048828125, -13.04443359375, -12.538818359375, -12.033203125, -11.527587890625, -11.02197265625, -10.516357421875, -10.0107421875, -9.505126953125, -8.99951171875, -8.493896484375, -7.98828125, -7.482666015625, -6.97705078125, -6.471435546875, -5.9658203125, -5.460205078125, -4.95458984375, -4.448974609375, -3.943359375, -3.437744140625, -2.93212890625, -2.426513671875, -1.9208984375, -1.415283203125, -0.90966796875, -0.404052734375, 0.1015625, 0.607177734375, 1.11279296875, 1.618408203125, 2.1240234375, 2.629638671875, 3.13525390625, 3.640869140625, 4.146484375, 4.652099609375, 5.15771484375, 5.663330078125, 6.1689453125, 6.674560546875, 7.18017578125, 7.685791015625, 8.19140625, 8.697021484375, 9.20263671875, 9.708251953125, 10.2138671875, 10.719482421875, 11.22509765625, 11.730712890625, 12.236328125, 12.741943359375, 13.24755859375, 13.753173828125, 14.2587890625, 14.764404296875, 15.27001953125, 15.775634765625, 16.28125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 6.0, 14.0, 15.0, 23.0, 25.0, 45.0, 53.0, 75.0, 124.0, 161.0, 247.0, 381.0, 687.0, 901.0, 1527.0, 2620.0, 4680.0, 8401.0, 15799.0, 33677.0, 74048.0, 169845.0, 303917.0, 232557.0, 105170.0, 46619.0, 21855.0, 10915.0, 5788.0, 3292.0, 1906.0, 1108.0, 696.0, 458.0, 260.0, 178.0, 161.0, 102.0, 66.0, 47.0, 34.0, 23.0, 15.0, 16.0, 4.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.68359375, -4.535888671875, -4.38818359375, -4.240478515625, -4.0927734375, -3.945068359375, -3.79736328125, -3.649658203125, -3.501953125, -3.354248046875, -3.20654296875, -3.058837890625, -2.9111328125, -2.763427734375, -2.61572265625, -2.468017578125, -2.3203125, -2.172607421875, -2.02490234375, -1.877197265625, -1.7294921875, -1.581787109375, -1.43408203125, -1.286376953125, -1.138671875, -0.990966796875, -0.84326171875, -0.695556640625, -0.5478515625, -0.400146484375, -0.25244140625, -0.104736328125, 0.04296875, 0.190673828125, 0.33837890625, 0.486083984375, 0.6337890625, 0.781494140625, 0.92919921875, 1.076904296875, 1.224609375, 1.372314453125, 1.52001953125, 1.667724609375, 1.8154296875, 1.963134765625, 2.11083984375, 2.258544921875, 2.40625, 2.553955078125, 2.70166015625, 2.849365234375, 2.9970703125, 3.144775390625, 3.29248046875, 3.440185546875, 3.587890625, 3.735595703125, 3.88330078125, 4.031005859375, 4.1787109375, 4.326416015625, 4.47412109375, 4.621826171875, 4.76953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 4.0, 6.0, 1.0, 5.0, 6.0, 14.0, 9.0, 14.0, 19.0, 23.0, 20.0, 25.0, 25.0, 15.0, 36.0, 32.0, 38.0, 33.0, 42.0, 43.0, 37.0, 31.0, 50.0, 46.0, 38.0, 59.0, 37.0, 38.0, 28.0, 28.0, 28.0, 19.0, 18.0, 19.0, 23.0, 21.0, 8.0, 11.0, 15.0, 12.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.8828125, -10.5333251953125, -10.183837890625, -9.8343505859375, -9.48486328125, -9.1353759765625, -8.785888671875, -8.4364013671875, -8.0869140625, -7.7374267578125, -7.387939453125, -7.0384521484375, -6.68896484375, -6.3394775390625, -5.989990234375, -5.6405029296875, -5.291015625, -4.9415283203125, -4.592041015625, -4.2425537109375, -3.89306640625, -3.5435791015625, -3.194091796875, -2.8446044921875, -2.4951171875, -2.1456298828125, -1.796142578125, -1.4466552734375, -1.09716796875, -0.7476806640625, -0.398193359375, -0.0487060546875, 0.30078125, 0.6502685546875, 0.999755859375, 1.3492431640625, 1.69873046875, 2.0482177734375, 2.397705078125, 2.7471923828125, 3.0966796875, 3.4461669921875, 3.795654296875, 4.1451416015625, 4.49462890625, 4.8441162109375, 5.193603515625, 5.5430908203125, 5.892578125, 6.2420654296875, 6.591552734375, 6.9410400390625, 7.29052734375, 7.6400146484375, 7.989501953125, 8.3389892578125, 8.6884765625, 9.0379638671875, 9.387451171875, 9.7369384765625, 10.08642578125, 10.4359130859375, 10.785400390625, 11.1348876953125, 11.484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 3.0, 5.0, 15.0, 17.0, 17.0, 31.0, 41.0, 86.0, 96.0, 154.0, 202.0, 289.0, 494.0, 665.0, 1122.0, 1645.0, 2625.0, 4492.0, 8051.0, 14747.0, 30062.0, 68083.0, 173504.0, 333660.0, 234452.0, 92744.0, 38989.0, 18578.0, 9717.0, 5375.0, 3116.0, 1929.0, 1198.0, 767.0, 497.0, 347.0, 242.0, 171.0, 109.0, 60.0, 45.0, 29.0, 32.0, 19.0, 11.0, 5.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1220703125, -1.0887451171875, -1.055419921875, -1.0220947265625, -0.98876953125, -0.9554443359375, -0.922119140625, -0.8887939453125, -0.85546875, -0.8221435546875, -0.788818359375, -0.7554931640625, -0.72216796875, -0.6888427734375, -0.655517578125, -0.6221923828125, -0.5888671875, -0.5555419921875, -0.522216796875, -0.4888916015625, -0.45556640625, -0.4222412109375, -0.388916015625, -0.3555908203125, -0.322265625, -0.2889404296875, -0.255615234375, -0.2222900390625, -0.18896484375, -0.1556396484375, -0.122314453125, -0.0889892578125, -0.0556640625, -0.0223388671875, 0.010986328125, 0.0443115234375, 0.07763671875, 0.1109619140625, 0.144287109375, 0.1776123046875, 0.2109375, 0.2442626953125, 0.277587890625, 0.3109130859375, 0.34423828125, 0.3775634765625, 0.410888671875, 0.4442138671875, 0.4775390625, 0.5108642578125, 0.544189453125, 0.5775146484375, 0.61083984375, 0.6441650390625, 0.677490234375, 0.7108154296875, 0.744140625, 0.7774658203125, 0.810791015625, 0.8441162109375, 0.87744140625, 0.9107666015625, 0.944091796875, 0.9774169921875, 1.0107421875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 0.0, 6.0, 1.0, 8.0, 4.0, 10.0, 10.0, 12.0, 14.0, 15.0, 29.0, 20.0, 24.0, 28.0, 24.0, 34.0, 48.0, 47.0, 42.0, 46.0, 59.0, 61.0, 62.0, 54.0, 51.0, 39.0, 34.0, 40.0, 26.0, 24.0, 30.0, 24.0, 15.0, 7.0, 11.0, 11.0, 7.0, 3.0, 7.0, 2.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1552734375e-05, -8.82614403963089e-05, -8.49701464176178e-05, -8.16788524389267e-05, -7.83875584602356e-05, -7.50962644815445e-05, -7.18049705028534e-05, -6.851367652416229e-05, -6.522238254547119e-05, -6.193108856678009e-05, -5.863979458808899e-05, -5.534850060939789e-05, -5.205720663070679e-05, -4.8765912652015686e-05, -4.5474618673324585e-05, -4.2183324694633484e-05, -3.889203071594238e-05, -3.560073673725128e-05, -3.230944275856018e-05, -2.901814877986908e-05, -2.572685480117798e-05, -2.2435560822486877e-05, -1.9144266843795776e-05, -1.5852972865104675e-05, -1.2561678886413574e-05, -9.270384907722473e-06, -5.979090929031372e-06, -2.687796950340271e-06, 6.034970283508301e-07, 3.894791007041931e-06, 7.186084985733032e-06, 1.0477378964424133e-05, 1.3768672943115234e-05, 1.7059966921806335e-05, 2.0351260900497437e-05, 2.3642554879188538e-05, 2.693384885787964e-05, 3.022514283657074e-05, 3.351643681526184e-05, 3.680773079395294e-05, 4.009902477264404e-05, 4.3390318751335144e-05, 4.6681612730026245e-05, 4.9972906708717346e-05, 5.326420068740845e-05, 5.655549466609955e-05, 5.984678864479065e-05, 6.313808262348175e-05, 6.642937660217285e-05, 6.972067058086395e-05, 7.301196455955505e-05, 7.630325853824615e-05, 7.959455251693726e-05, 8.288584649562836e-05, 8.617714047431946e-05, 8.946843445301056e-05, 9.275972843170166e-05, 9.605102241039276e-05, 9.934231638908386e-05, 0.00010263361036777496, 0.00010592490434646606, 0.00010921619832515717, 0.00011250749230384827, 0.00011579878628253937, 0.00011909008026123047]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 7.0, 9.0, 9.0, 23.0, 28.0, 42.0, 56.0, 77.0, 101.0, 188.0, 294.0, 407.0, 609.0, 951.0, 1442.0, 2268.0, 3806.0, 6017.0, 10064.0, 16835.0, 28640.0, 49983.0, 84118.0, 133158.0, 179578.0, 181333.0, 136376.0, 86528.0, 51275.0, 29832.0, 17479.0, 10358.0, 6057.0, 3864.0, 2360.0, 1572.0, 916.0, 629.0, 400.0, 276.0, 197.0, 152.0, 80.0, 49.0, 42.0, 31.0, 15.0, 9.0, 8.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1044921875, -1.07000732421875, -1.0355224609375, -1.00103759765625, -0.966552734375, -0.93206787109375, -0.8975830078125, -0.86309814453125, -0.82861328125, -0.79412841796875, -0.7596435546875, -0.72515869140625, -0.690673828125, -0.65618896484375, -0.6217041015625, -0.58721923828125, -0.552734375, -0.51824951171875, -0.4837646484375, -0.44927978515625, -0.414794921875, -0.38031005859375, -0.3458251953125, -0.31134033203125, -0.27685546875, -0.24237060546875, -0.2078857421875, -0.17340087890625, -0.138916015625, -0.10443115234375, -0.0699462890625, -0.03546142578125, -0.0009765625, 0.03350830078125, 0.0679931640625, 0.10247802734375, 0.136962890625, 0.17144775390625, 0.2059326171875, 0.24041748046875, 0.27490234375, 0.30938720703125, 0.3438720703125, 0.37835693359375, 0.412841796875, 0.44732666015625, 0.4818115234375, 0.51629638671875, 0.55078125, 0.58526611328125, 0.6197509765625, 0.65423583984375, 0.688720703125, 0.72320556640625, 0.7576904296875, 0.79217529296875, 0.82666015625, 0.86114501953125, 0.8956298828125, 0.93011474609375, 0.964599609375, 0.99908447265625, 1.0335693359375, 1.06805419921875, 1.1025390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 3.0, 7.0, 0.0, 3.0, 4.0, 15.0, 10.0, 7.0, 19.0, 17.0, 22.0, 25.0, 33.0, 30.0, 24.0, 40.0, 35.0, 44.0, 35.0, 46.0, 41.0, 60.0, 48.0, 56.0, 40.0, 30.0, 33.0, 34.0, 34.0, 33.0, 23.0, 25.0, 23.0, 21.0, 16.0, 10.0, 8.0, 8.0, 5.0, 5.0, 10.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 5.0], "bins": [-0.3828125, -0.3716697692871094, -0.36052703857421875, -0.3493843078613281, -0.3382415771484375, -0.3270988464355469, -0.31595611572265625, -0.3048133850097656, -0.293670654296875, -0.2825279235839844, -0.27138519287109375, -0.2602424621582031, -0.2490997314453125, -0.23795700073242188, -0.22681427001953125, -0.21567153930664062, -0.20452880859375, -0.19338607788085938, -0.18224334716796875, -0.17110061645507812, -0.1599578857421875, -0.14881515502929688, -0.13767242431640625, -0.12652969360351562, -0.115386962890625, -0.10424423217773438, -0.09310150146484375, -0.08195877075195312, -0.0708160400390625, -0.059673309326171875, -0.04853057861328125, -0.037387847900390625, -0.0262451171875, -0.015102386474609375, -0.00395965576171875, 0.007183074951171875, 0.0183258056640625, 0.029468536376953125, 0.04061126708984375, 0.051753997802734375, 0.062896728515625, 0.07403945922851562, 0.08518218994140625, 0.09632492065429688, 0.1074676513671875, 0.11861038208007812, 0.12975311279296875, 0.14089584350585938, 0.15203857421875, 0.16318130493164062, 0.17432403564453125, 0.18546676635742188, 0.1966094970703125, 0.20775222778320312, 0.21889495849609375, 0.23003768920898438, 0.241180419921875, 0.2523231506347656, 0.26346588134765625, 0.2746086120605469, 0.2857513427734375, 0.2968940734863281, 0.30803680419921875, 0.3191795349121094, 0.330322265625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 7.0, 3.0, 9.0, 9.0, 10.0, 12.0, 12.0, 13.0, 15.0, 19.0, 32.0, 38.0, 27.0, 26.0, 32.0, 34.0, 33.0, 44.0, 45.0, 33.0, 37.0, 35.0, 44.0, 47.0, 39.0, 34.0, 42.0, 30.0, 27.0, 32.0, 22.0, 26.0, 16.0, 18.0, 17.0, 11.0, 15.0, 15.0, 8.0, 7.0, 4.0, 3.0, 3.0, 4.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.597350120544434, -13.143797874450684, -12.690245628356934, -12.236693382263184, -11.783141136169434, -11.329588890075684, -10.876036643981934, -10.422484397888184, -9.968932151794434, -9.515379905700684, -9.061827659606934, -8.608275413513184, -8.154723167419434, -7.701170921325684, -7.247618675231934, -6.794066429138184, -6.340514183044434, -5.886961936950684, -5.433409690856934, -4.979857444763184, -4.526305198669434, -4.072752952575684, -3.6192007064819336, -3.1656484603881836, -2.7120962142944336, -2.2585439682006836, -1.8049917221069336, -1.3514394760131836, -0.8978872299194336, -0.4443349838256836, 0.009217262268066406, 0.4627695083618164, 0.9163227081298828, 1.3698749542236328, 1.8234272003173828, 2.276979446411133, 2.730531692504883, 3.184083938598633, 3.637636184692383, 4.091188430786133, 4.544740676879883, 4.998292922973633, 5.451845169067383, 5.905397415161133, 6.358949661254883, 6.812501907348633, 7.266054153442383, 7.719606399536133, 8.173158645629883, 8.626710891723633, 9.080263137817383, 9.533815383911133, 9.987367630004883, 10.440919876098633, 10.894472122192383, 11.348024368286133, 11.801576614379883, 12.255128860473633, 12.708681106567383, 13.162233352661133, 13.615785598754883, 14.069337844848633, 14.522890090942383, 14.976442337036133, 15.429994583129883]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 6.0, 13.0, 9.0, 9.0, 14.0, 14.0, 9.0, 18.0, 15.0, 25.0, 25.0, 28.0, 24.0, 39.0, 31.0, 29.0, 27.0, 36.0, 33.0, 44.0, 31.0, 39.0, 35.0, 39.0, 35.0, 34.0, 35.0, 40.0, 37.0, 13.0, 33.0, 20.0, 23.0, 26.0, 11.0, 16.0, 11.0, 12.0, 13.0, 7.0, 7.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-16.131114959716797, -15.624518394470215, -15.117921829223633, -14.61132526397705, -14.104728698730469, -13.598132133483887, -13.091535568237305, -12.584939002990723, -12.07834243774414, -11.571745872497559, -11.065149307250977, -10.558552742004395, -10.051956176757812, -9.54535961151123, -9.038763046264648, -8.532166481018066, -8.025569915771484, -7.518973350524902, -7.01237678527832, -6.505780220031738, -5.999183654785156, -5.492587089538574, -4.985990524291992, -4.47939395904541, -3.972797393798828, -3.466200828552246, -2.959604263305664, -2.453007698059082, -1.9464111328125, -1.439814567565918, -0.9332180023193359, -0.4266214370727539, 0.07997512817382812, 0.5865716934204102, 1.0931682586669922, 1.5997648239135742, 2.1063613891601562, 2.6129579544067383, 3.1195545196533203, 3.6261510848999023, 4.132747650146484, 4.639344215393066, 5.145940780639648, 5.6525373458862305, 6.1591339111328125, 6.6657304763793945, 7.172327041625977, 7.678923606872559, 8.18552017211914, 8.692116737365723, 9.198713302612305, 9.705309867858887, 10.211906433105469, 10.71850299835205, 11.225099563598633, 11.731696128845215, 12.238292694091797, 12.744889259338379, 13.251485824584961, 13.758082389831543, 14.264678955078125, 14.771275520324707, 15.277872085571289, 15.784468650817871, 16.291065216064453]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 5.0, 14.0, 30.0, 37.0, 69.0, 145.0, 177.0, 288.0, 517.0, 804.0, 1194.0, 1931.0, 3012.0, 4610.0, 6921.0, 10405.0, 15245.0, 21502.0, 30131.0, 40429.0, 52256.0, 64851.0, 77060.0, 86591.0, 91808.0, 92679.0, 88595.0, 80077.0, 68792.0, 56325.0, 44145.0, 32757.0, 24368.0, 16679.0, 11575.0, 7925.0, 5203.0, 3441.0, 2160.0, 1430.0, 936.0, 504.0, 327.0, 241.0, 135.0, 93.0, 63.0, 27.0, 16.0, 15.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0], "bins": [-11.015625, -10.683349609375, -10.35107421875, -10.018798828125, -9.6865234375, -9.354248046875, -9.02197265625, -8.689697265625, -8.357421875, -8.025146484375, -7.69287109375, -7.360595703125, -7.0283203125, -6.696044921875, -6.36376953125, -6.031494140625, -5.69921875, -5.366943359375, -5.03466796875, -4.702392578125, -4.3701171875, -4.037841796875, -3.70556640625, -3.373291015625, -3.041015625, -2.708740234375, -2.37646484375, -2.044189453125, -1.7119140625, -1.379638671875, -1.04736328125, -0.715087890625, -0.3828125, -0.050537109375, 0.28173828125, 0.614013671875, 0.9462890625, 1.278564453125, 1.61083984375, 1.943115234375, 2.275390625, 2.607666015625, 2.93994140625, 3.272216796875, 3.6044921875, 3.936767578125, 4.26904296875, 4.601318359375, 4.93359375, 5.265869140625, 5.59814453125, 5.930419921875, 6.2626953125, 6.594970703125, 6.92724609375, 7.259521484375, 7.591796875, 7.924072265625, 8.25634765625, 8.588623046875, 8.9208984375, 9.253173828125, 9.58544921875, 9.917724609375, 10.25]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 14.0, 9.0, 11.0, 12.0, 16.0, 7.0, 16.0, 17.0, 25.0, 23.0, 30.0, 21.0, 42.0, 34.0, 28.0, 24.0, 38.0, 34.0, 40.0, 32.0, 38.0, 35.0, 38.0, 38.0, 31.0, 37.0, 42.0, 32.0, 22.0, 31.0, 17.0, 26.0, 23.0, 9.0, 19.0, 12.0, 11.0, 11.0, 9.0, 8.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-16.296875, -15.785888671875, -15.27490234375, -14.763916015625, -14.2529296875, -13.741943359375, -13.23095703125, -12.719970703125, -12.208984375, -11.697998046875, -11.18701171875, -10.676025390625, -10.1650390625, -9.654052734375, -9.14306640625, -8.632080078125, -8.12109375, -7.610107421875, -7.09912109375, -6.588134765625, -6.0771484375, -5.566162109375, -5.05517578125, -4.544189453125, -4.033203125, -3.522216796875, -3.01123046875, -2.500244140625, -1.9892578125, -1.478271484375, -0.96728515625, -0.456298828125, 0.0546875, 0.565673828125, 1.07666015625, 1.587646484375, 2.0986328125, 2.609619140625, 3.12060546875, 3.631591796875, 4.142578125, 4.653564453125, 5.16455078125, 5.675537109375, 6.1865234375, 6.697509765625, 7.20849609375, 7.719482421875, 8.23046875, 8.741455078125, 9.25244140625, 9.763427734375, 10.2744140625, 10.785400390625, 11.29638671875, 11.807373046875, 12.318359375, 12.829345703125, 13.34033203125, 13.851318359375, 14.3623046875, 14.873291015625, 15.38427734375, 15.895263671875, 16.40625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 10.0, 2.0, 7.0, 14.0, 19.0, 31.0, 32.0, 76.0, 112.0, 179.0, 259.0, 367.0, 601.0, 1023.0, 1489.0, 2304.0, 3462.0, 5616.0, 8387.0, 12319.0, 18732.0, 27380.0, 38481.0, 52366.0, 67699.0, 84048.0, 96806.0, 103076.0, 103988.0, 96302.0, 83478.0, 67530.0, 52474.0, 38560.0, 26898.0, 18422.0, 12533.0, 8197.0, 5406.0, 3394.0, 2234.0, 1534.0, 917.0, 642.0, 411.0, 239.0, 171.0, 121.0, 71.0, 54.0, 29.0, 27.0, 14.0, 11.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.5546875, -13.1309814453125, -12.707275390625, -12.2835693359375, -11.85986328125, -11.4361572265625, -11.012451171875, -10.5887451171875, -10.1650390625, -9.7413330078125, -9.317626953125, -8.8939208984375, -8.47021484375, -8.0465087890625, -7.622802734375, -7.1990966796875, -6.775390625, -6.3516845703125, -5.927978515625, -5.5042724609375, -5.08056640625, -4.6568603515625, -4.233154296875, -3.8094482421875, -3.3857421875, -2.9620361328125, -2.538330078125, -2.1146240234375, -1.69091796875, -1.2672119140625, -0.843505859375, -0.4197998046875, 0.00390625, 0.4276123046875, 0.851318359375, 1.2750244140625, 1.69873046875, 2.1224365234375, 2.546142578125, 2.9698486328125, 3.3935546875, 3.8172607421875, 4.240966796875, 4.6646728515625, 5.08837890625, 5.5120849609375, 5.935791015625, 6.3594970703125, 6.783203125, 7.2069091796875, 7.630615234375, 8.0543212890625, 8.47802734375, 8.9017333984375, 9.325439453125, 9.7491455078125, 10.1728515625, 10.5965576171875, 11.020263671875, 11.4439697265625, 11.86767578125, 12.2913818359375, 12.715087890625, 13.1387939453125, 13.5625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 7.0, 4.0, 8.0, 11.0, 14.0, 15.0, 13.0, 20.0, 25.0, 25.0, 27.0, 39.0, 44.0, 32.0, 39.0, 49.0, 41.0, 52.0, 44.0, 51.0, 42.0, 43.0, 33.0, 55.0, 33.0, 32.0, 32.0, 26.0, 26.0, 23.0, 15.0, 10.0, 11.0, 13.0, 9.0, 8.0, 7.0, 6.0, 5.0, 6.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.4140625, -14.009033203125, -13.60400390625, -13.198974609375, -12.7939453125, -12.388916015625, -11.98388671875, -11.578857421875, -11.173828125, -10.768798828125, -10.36376953125, -9.958740234375, -9.5537109375, -9.148681640625, -8.74365234375, -8.338623046875, -7.93359375, -7.528564453125, -7.12353515625, -6.718505859375, -6.3134765625, -5.908447265625, -5.50341796875, -5.098388671875, -4.693359375, -4.288330078125, -3.88330078125, -3.478271484375, -3.0732421875, -2.668212890625, -2.26318359375, -1.858154296875, -1.453125, -1.048095703125, -0.64306640625, -0.238037109375, 0.1669921875, 0.572021484375, 0.97705078125, 1.382080078125, 1.787109375, 2.192138671875, 2.59716796875, 3.002197265625, 3.4072265625, 3.812255859375, 4.21728515625, 4.622314453125, 5.02734375, 5.432373046875, 5.83740234375, 6.242431640625, 6.6474609375, 7.052490234375, 7.45751953125, 7.862548828125, 8.267578125, 8.672607421875, 9.07763671875, 9.482666015625, 9.8876953125, 10.292724609375, 10.69775390625, 11.102783203125, 11.5078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 3.0, 10.0, 5.0, 15.0, 14.0, 36.0, 46.0, 82.0, 120.0, 195.0, 312.0, 495.0, 786.0, 1284.0, 2025.0, 3335.0, 5519.0, 8898.0, 13828.0, 21847.0, 33117.0, 48610.0, 68005.0, 88074.0, 106552.0, 117185.0, 117755.0, 107562.0, 89639.0, 68900.0, 49958.0, 33844.0, 22325.0, 14519.0, 9071.0, 5446.0, 3494.0, 2091.0, 1325.0, 821.0, 514.0, 327.0, 216.0, 128.0, 92.0, 46.0, 33.0, 23.0, 10.0, 8.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.30078125, -5.124267578125, -4.94775390625, -4.771240234375, -4.5947265625, -4.418212890625, -4.24169921875, -4.065185546875, -3.888671875, -3.712158203125, -3.53564453125, -3.359130859375, -3.1826171875, -3.006103515625, -2.82958984375, -2.653076171875, -2.4765625, -2.300048828125, -2.12353515625, -1.947021484375, -1.7705078125, -1.593994140625, -1.41748046875, -1.240966796875, -1.064453125, -0.887939453125, -0.71142578125, -0.534912109375, -0.3583984375, -0.181884765625, -0.00537109375, 0.171142578125, 0.34765625, 0.524169921875, 0.70068359375, 0.877197265625, 1.0537109375, 1.230224609375, 1.40673828125, 1.583251953125, 1.759765625, 1.936279296875, 2.11279296875, 2.289306640625, 2.4658203125, 2.642333984375, 2.81884765625, 2.995361328125, 3.171875, 3.348388671875, 3.52490234375, 3.701416015625, 3.8779296875, 4.054443359375, 4.23095703125, 4.407470703125, 4.583984375, 4.760498046875, 4.93701171875, 5.113525390625, 5.2900390625, 5.466552734375, 5.64306640625, 5.819580078125, 5.99609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 8.0, 5.0, 12.0, 8.0, 14.0, 16.0, 20.0, 31.0, 33.0, 35.0, 42.0, 52.0, 39.0, 51.0, 65.0, 61.0, 52.0, 59.0, 42.0, 44.0, 47.0, 50.0, 42.0, 23.0, 39.0, 23.0, 19.0, 16.0, 7.0, 13.0, 9.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007200241088867188, -0.0006935149431228638, -0.0006670057773590088, -0.0006404966115951538, -0.0006139874458312988, -0.0005874782800674438, -0.0005609691143035889, -0.0005344599485397339, -0.0005079507827758789, -0.0004814416170120239, -0.00045493245124816895, -0.00042842328548431396, -0.000401914119720459, -0.000375404953956604, -0.000348895788192749, -0.00032238662242889404, -0.00029587745666503906, -0.0002693682909011841, -0.0002428591251373291, -0.00021634995937347412, -0.00018984079360961914, -0.00016333162784576416, -0.00013682246208190918, -0.0001103132963180542, -8.380413055419922e-05, -5.729496479034424e-05, -3.078579902648926e-05, -4.276633262634277e-06, 2.2232532501220703e-05, 4.8741698265075684e-05, 7.525086402893066e-05, 0.00010176002979278564, 0.00012826919555664062, 0.0001547783613204956, 0.00018128752708435059, 0.00020779669284820557, 0.00023430585861206055, 0.00026081502437591553, 0.0002873241901397705, 0.0003138333559036255, 0.00034034252166748047, 0.00036685168743133545, 0.00039336085319519043, 0.0004198700189590454, 0.0004463791847229004, 0.00047288835048675537, 0.0004993975162506104, 0.0005259066820144653, 0.0005524158477783203, 0.0005789250135421753, 0.0006054341793060303, 0.0006319433450698853, 0.0006584525108337402, 0.0006849616765975952, 0.0007114708423614502, 0.0007379800081253052, 0.0007644891738891602, 0.0007909983396530151, 0.0008175075054168701, 0.0008440166711807251, 0.0008705258369445801, 0.0008970350027084351, 0.00092354416847229, 0.000950053334236145, 0.0009765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 16.0, 16.0, 29.0, 36.0, 63.0, 103.0, 183.0, 302.0, 545.0, 845.0, 1346.0, 2356.0, 3731.0, 6174.0, 10013.0, 16206.0, 25110.0, 37892.0, 54871.0, 74617.0, 95134.0, 111656.0, 119401.0, 115745.0, 101948.0, 83032.0, 62704.0, 44275.0, 29627.0, 19206.0, 12196.0, 7528.0, 4610.0, 2778.0, 1646.0, 1072.0, 610.0, 352.0, 246.0, 117.0, 91.0, 49.0, 27.0, 19.0, 16.0, 5.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.56640625, -5.37896728515625, -5.1915283203125, -5.00408935546875, -4.816650390625, -4.62921142578125, -4.4417724609375, -4.25433349609375, -4.06689453125, -3.87945556640625, -3.6920166015625, -3.50457763671875, -3.317138671875, -3.12969970703125, -2.9422607421875, -2.75482177734375, -2.5673828125, -2.37994384765625, -2.1925048828125, -2.00506591796875, -1.817626953125, -1.63018798828125, -1.4427490234375, -1.25531005859375, -1.06787109375, -0.88043212890625, -0.6929931640625, -0.50555419921875, -0.318115234375, -0.13067626953125, 0.0567626953125, 0.24420166015625, 0.431640625, 0.61907958984375, 0.8065185546875, 0.99395751953125, 1.181396484375, 1.36883544921875, 1.5562744140625, 1.74371337890625, 1.93115234375, 2.11859130859375, 2.3060302734375, 2.49346923828125, 2.680908203125, 2.86834716796875, 3.0557861328125, 3.24322509765625, 3.4306640625, 3.61810302734375, 3.8055419921875, 3.99298095703125, 4.180419921875, 4.36785888671875, 4.5552978515625, 4.74273681640625, 4.93017578125, 5.11761474609375, 5.3050537109375, 5.49249267578125, 5.679931640625, 5.86737060546875, 6.0548095703125, 6.24224853515625, 6.4296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 10.0, 11.0, 18.0, 10.0, 20.0, 21.0, 31.0, 38.0, 33.0, 46.0, 60.0, 66.0, 55.0, 68.0, 54.0, 59.0, 59.0, 60.0, 39.0, 26.0, 38.0, 34.0, 31.0, 24.0, 19.0, 16.0, 14.0, 5.0, 9.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3203125, -3.21319580078125, -3.1060791015625, -2.99896240234375, -2.891845703125, -2.78472900390625, -2.6776123046875, -2.57049560546875, -2.46337890625, -2.35626220703125, -2.2491455078125, -2.14202880859375, -2.034912109375, -1.92779541015625, -1.8206787109375, -1.71356201171875, -1.6064453125, -1.49932861328125, -1.3922119140625, -1.28509521484375, -1.177978515625, -1.07086181640625, -0.9637451171875, -0.85662841796875, -0.74951171875, -0.64239501953125, -0.5352783203125, -0.42816162109375, -0.321044921875, -0.21392822265625, -0.1068115234375, 0.00030517578125, 0.107421875, 0.21453857421875, 0.3216552734375, 0.42877197265625, 0.535888671875, 0.64300537109375, 0.7501220703125, 0.85723876953125, 0.96435546875, 1.07147216796875, 1.1785888671875, 1.28570556640625, 1.392822265625, 1.49993896484375, 1.6070556640625, 1.71417236328125, 1.8212890625, 1.92840576171875, 2.0355224609375, 2.14263916015625, 2.249755859375, 2.35687255859375, 2.4639892578125, 2.57110595703125, 2.67822265625, 2.78533935546875, 2.8924560546875, 2.99957275390625, 3.106689453125, 3.21380615234375, 3.3209228515625, 3.42803955078125, 3.53515625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 7.0, 10.0, 17.0, 21.0, 22.0, 23.0, 25.0, 16.0, 29.0, 29.0, 40.0, 28.0, 52.0, 37.0, 43.0, 41.0, 36.0, 47.0, 35.0, 48.0, 41.0, 43.0, 39.0, 22.0, 43.0, 20.0, 17.0, 20.0, 24.0, 19.0, 13.0, 10.0, 13.0, 12.0, 7.0, 6.0, 8.0, 5.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.391257286071777, -13.896187782287598, -13.401119232177734, -12.906049728393555, -12.410980224609375, -11.915910720825195, -11.420842170715332, -10.925772666931152, -10.430704116821289, -9.93563461303711, -9.440566062927246, -8.945496559143066, -8.450427055358887, -7.955358028411865, -7.460289001464844, -6.965219497680664, -6.470149993896484, -5.975080966949463, -5.480011463165283, -4.984942436218262, -4.489872932434082, -3.9948039054870605, -3.499734878540039, -3.0046656131744385, -2.509596347808838, -2.0145270824432373, -1.5194579362869263, -1.0243887901306152, -0.5293195247650146, -0.03425025939941406, 0.4608187675476074, 0.955888032913208, 1.450958251953125, 1.9460275173187256, 2.441096782684326, 2.9361658096313477, 3.4312350749969482, 3.926304340362549, 4.42137336730957, 4.91644287109375, 5.4115118980407715, 5.906580924987793, 6.401650428771973, 6.896719455718994, 7.391788482666016, 7.886857986450195, 8.381927490234375, 8.876996040344238, 9.372065544128418, 9.867135047912598, 10.362203598022461, 10.85727310180664, 11.35234260559082, 11.847412109375, 12.342480659484863, 12.837550163269043, 13.332618713378906, 13.827688217163086, 14.32275676727295, 14.817826271057129, 15.312895774841309, 15.807964324951172, 16.30303382873535, 16.79810333251953, 17.29317283630371]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 3.0, 2.0, 3.0, 9.0, 15.0, 11.0, 4.0, 4.0, 14.0, 12.0, 23.0, 14.0, 25.0, 25.0, 22.0, 37.0, 31.0, 26.0, 35.0, 37.0, 37.0, 33.0, 29.0, 36.0, 31.0, 34.0, 32.0, 40.0, 32.0, 46.0, 36.0, 21.0, 37.0, 28.0, 27.0, 25.0, 12.0, 21.0, 17.0, 13.0, 13.0, 9.0, 7.0, 4.0, 7.0, 5.0, 9.0, 1.0, 1.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.196800231933594, -17.611371994018555, -17.02594566345215, -16.44051742553711, -15.855091094970703, -15.269662857055664, -14.684235572814941, -14.098808288574219, -13.513381004333496, -12.927953720092773, -12.34252643585205, -11.757099151611328, -11.171670913696289, -10.586244583129883, -10.000816345214844, -9.415389060974121, -8.829961776733398, -8.244534492492676, -7.659107208251953, -7.073679447174072, -6.48825216293335, -5.902824878692627, -5.317397117614746, -4.731969833374023, -4.146542549133301, -3.561115264892578, -2.9756877422332764, -2.3902602195739746, -1.804832935333252, -1.2194056510925293, -0.6339781284332275, -0.04855060577392578, 0.5368747711181641, 1.1223021745681763, 1.7077295780181885, 2.2931571006774902, 2.878584384918213, 3.4640116691589355, 4.049439430236816, 4.634866714477539, 5.220293998718262, 5.805721282958984, 6.391148567199707, 6.976576328277588, 7.5620036125183105, 8.147430419921875, 8.732858657836914, 9.318285942077637, 9.90371322631836, 10.489140510559082, 11.074567794799805, 11.659995079040527, 12.24542236328125, 12.830850601196289, 13.416277885437012, 14.001705169677734, 14.587132453918457, 15.17255973815918, 15.757987022399902, 16.343414306640625, 16.928842544555664, 17.51426887512207, 18.09969711303711, 18.685123443603516, 19.270551681518555]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 6.0, 0.0, 3.0, 3.0, 6.0, 6.0, 10.0, 9.0, 16.0, 18.0, 23.0, 39.0, 47.0, 49.0, 87.0, 99.0, 153.0, 163.0, 254.0, 301.0, 402.0, 512.0, 649.0, 791.0, 951.0, 1073.0, 1211.0, 1248.0, 1034512.0, 1184.0, 1146.0, 1043.0, 918.0, 761.0, 690.0, 501.0, 446.0, 309.0, 246.0, 183.0, 139.0, 108.0, 76.0, 63.0, 41.0, 33.0, 19.0, 21.0, 15.0, 8.0, 10.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-204.1968231201172, -197.27210998535156, -190.34739685058594, -183.4226837158203, -176.49795532226562, -169.5732421875, -162.64852905273438, -155.72381591796875, -148.79910278320312, -141.8743896484375, -134.94967651367188, -128.02496337890625, -121.1002426147461, -114.17552947998047, -107.25080871582031, -100.32609558105469, -93.40138244628906, -86.47666931152344, -79.55195617675781, -72.62723541259766, -65.70252227783203, -58.777809143066406, -51.853092193603516, -44.928375244140625, -38.003662109375, -31.078947067260742, -24.154232025146484, -17.229516983032227, -10.304801940917969, -3.3800888061523438, 3.544628143310547, 10.469345092773438, 17.394058227539062, 24.31877326965332, 31.243488311767578, 38.16820526123047, 45.092918395996094, 52.01763153076172, 58.94234848022461, 65.8670654296875, 72.79177856445312, 79.71649169921875, 86.64120483398438, 93.56592559814453, 100.49063873291016, 107.41535186767578, 114.34007263183594, 121.26478576660156, 128.1894989013672, 135.1142120361328, 142.03892517089844, 148.96363830566406, 155.88836669921875, 162.81307983398438, 169.73779296875, 176.66250610351562, 183.58721923828125, 190.51193237304688, 197.4366455078125, 204.36135864257812, 211.28607177734375, 218.21078491210938, 225.13551330566406, 232.0602264404297, 238.9849395751953]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [3.0, 2.0, 6.0, 3.0, 7.0, 16.0, 15.0, 19.0, 30.0, 48.0, 57.0, 92.0, 111.0, 159.0, 264.0, 322.0, 419.0, 586.0, 769.0, 1035.0, 1391.0, 1827.0, 2400.0, 3012.0, 3687.0, 4751.0, 5840.0, 7760.0, 13664.0, 51321324.0, 59825.0, 10381.0, 6893.0, 5337.0, 4328.0, 3461.0, 2731.0, 2207.0, 1724.0, 1265.0, 957.0, 694.0, 529.0, 388.0, 294.0, 195.0, 153.0, 113.0, 95.0, 55.0, 33.0, 28.0, 22.0, 10.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-128.9039306640625, -124.5826416015625, -120.26134490966797, -115.94005584716797, -111.61875915527344, -107.29747009277344, -102.97618103027344, -98.65489196777344, -94.3335952758789, -90.0123062133789, -85.69100952148438, -81.36972045898438, -77.04843139648438, -72.72713470458984, -68.40584564208984, -64.08454895019531, -59.76325988769531, -55.44196701049805, -51.12067413330078, -46.79938507080078, -42.478092193603516, -38.15679931640625, -33.83551025390625, -29.514217376708984, -25.19292449951172, -20.871631622314453, -16.55034065246582, -12.229048728942871, -7.907756805419922, -3.5864639282226562, 0.7348270416259766, 5.056118011474609, 9.377410888671875, 13.698702812194824, 18.019994735717773, 22.341285705566406, 26.662578582763672, 30.983871459960938, 35.30516052246094, 39.6264533996582, 43.94774627685547, 48.269039154052734, 52.59033203125, 56.91162109375, 61.232913970947266, 65.55420684814453, 69.87549591064453, 74.19679260253906, 78.51808166503906, 82.83937072753906, 87.1606674194336, 91.4819564819336, 95.80325317382812, 100.12454223632812, 104.44583129882812, 108.76712036132812, 113.08841705322266, 117.40970611572266, 121.73100280761719, 126.05229187011719, 130.3735809326172, 134.69488525390625, 139.01617431640625, 143.33746337890625, 147.65875244140625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 7.0, 5.0, 6.0, 11.0, 16.0, 31.0, 48.0, 67.0, 100.0, 160.0, 200.0, 276.0, 432.0, 672.0, 1040.0, 1528.0, 2596.0, 4377.0, 7818.0, 14250.0, 26420.0, 51916.0, 103574.0, 211711.0, 463547.0, 1692434.0, 2617698.0, 581561.0, 254270.0, 123366.0, 61446.0, 31153.0, 16528.0, 8996.0, 5033.0, 3002.0, 1739.0, 1159.0, 723.0, 459.0, 329.0, 192.0, 174.0, 103.0, 77.0, 63.0, 32.0, 21.0, 19.0, 18.0, 10.0, 10.0, 6.0, 3.0, 6.0, 0.0, 3.0], "bins": [-6.56640625, -6.3681640625, -6.169921875, -5.9716796875, -5.7734375, -5.5751953125, -5.376953125, -5.1787109375, -4.98046875, -4.7822265625, -4.583984375, -4.3857421875, -4.1875, -3.9892578125, -3.791015625, -3.5927734375, -3.39453125, -3.1962890625, -2.998046875, -2.7998046875, -2.6015625, -2.4033203125, -2.205078125, -2.0068359375, -1.80859375, -1.6103515625, -1.412109375, -1.2138671875, -1.015625, -0.8173828125, -0.619140625, -0.4208984375, -0.22265625, -0.0244140625, 0.173828125, 0.3720703125, 0.5703125, 0.7685546875, 0.966796875, 1.1650390625, 1.36328125, 1.5615234375, 1.759765625, 1.9580078125, 2.15625, 2.3544921875, 2.552734375, 2.7509765625, 2.94921875, 3.1474609375, 3.345703125, 3.5439453125, 3.7421875, 3.9404296875, 4.138671875, 4.3369140625, 4.53515625, 4.7333984375, 4.931640625, 5.1298828125, 5.328125, 5.5263671875, 5.724609375, 5.9228515625, 6.12109375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 0.0, 5.0, 10.0, 9.0, 17.0, 16.0, 19.0, 20.0, 35.0, 39.0, 25.0, 45.0, 42.0, 49.0, 65.0, 99.0, 379.0, 513.0, 187.0, 88.0, 48.0, 54.0, 50.0, 27.0, 37.0, 33.0, 24.0, 20.0, 16.0, 11.0, 10.0, 6.0, 5.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-15.3125, -14.920654296875, -14.52880859375, -14.136962890625, -13.7451171875, -13.353271484375, -12.96142578125, -12.569580078125, -12.177734375, -11.785888671875, -11.39404296875, -11.002197265625, -10.6103515625, -10.218505859375, -9.82666015625, -9.434814453125, -9.04296875, -8.651123046875, -8.25927734375, -7.867431640625, -7.4755859375, -7.083740234375, -6.69189453125, -6.300048828125, -5.908203125, -5.516357421875, -5.12451171875, -4.732666015625, -4.3408203125, -3.948974609375, -3.55712890625, -3.165283203125, -2.7734375, -2.381591796875, -1.98974609375, -1.597900390625, -1.2060546875, -0.814208984375, -0.42236328125, -0.030517578125, 0.361328125, 0.753173828125, 1.14501953125, 1.536865234375, 1.9287109375, 2.320556640625, 2.71240234375, 3.104248046875, 3.49609375, 3.887939453125, 4.27978515625, 4.671630859375, 5.0634765625, 5.455322265625, 5.84716796875, 6.239013671875, 6.630859375, 7.022705078125, 7.41455078125, 7.806396484375, 8.1982421875, 8.590087890625, 8.98193359375, 9.373779296875, 9.765625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 12.0, 5.0, 9.0, 7.0, 17.0, 22.0, 33.0, 39.0, 88.0, 110.0, 159.0, 249.0, 369.0, 616.0, 940.0, 1570.0, 2535.0, 4516.0, 7925.0, 15304.0, 30284.0, 62962.0, 137560.0, 308846.0, 824805.0, 3581663.0, 758175.0, 297395.0, 131891.0, 60290.0, 29071.0, 14658.0, 7940.0, 4494.0, 2592.0, 1600.0, 985.0, 557.0, 373.0, 265.0, 166.0, 117.0, 90.0, 40.0, 39.0, 24.0, 11.0, 8.0, 2.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.7890625, -4.64599609375, -4.5029296875, -4.35986328125, -4.216796875, -4.07373046875, -3.9306640625, -3.78759765625, -3.64453125, -3.50146484375, -3.3583984375, -3.21533203125, -3.072265625, -2.92919921875, -2.7861328125, -2.64306640625, -2.5, -2.35693359375, -2.2138671875, -2.07080078125, -1.927734375, -1.78466796875, -1.6416015625, -1.49853515625, -1.35546875, -1.21240234375, -1.0693359375, -0.92626953125, -0.783203125, -0.64013671875, -0.4970703125, -0.35400390625, -0.2109375, -0.06787109375, 0.0751953125, 0.21826171875, 0.361328125, 0.50439453125, 0.6474609375, 0.79052734375, 0.93359375, 1.07666015625, 1.2197265625, 1.36279296875, 1.505859375, 1.64892578125, 1.7919921875, 1.93505859375, 2.078125, 2.22119140625, 2.3642578125, 2.50732421875, 2.650390625, 2.79345703125, 2.9365234375, 3.07958984375, 3.22265625, 3.36572265625, 3.5087890625, 3.65185546875, 3.794921875, 3.93798828125, 4.0810546875, 4.22412109375, 4.3671875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 10.0, 8.0, 6.0, 24.0, 21.0, 27.0, 33.0, 40.0, 50.0, 51.0, 36.0, 43.0, 49.0, 110.0, 457.0, 407.0, 171.0, 101.0, 71.0, 59.0, 50.0, 34.0, 34.0, 33.0, 23.0, 16.0, 10.0, 12.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7421875, -8.4183349609375, -8.094482421875, -7.7706298828125, -7.44677734375, -7.1229248046875, -6.799072265625, -6.4752197265625, -6.1513671875, -5.8275146484375, -5.503662109375, -5.1798095703125, -4.85595703125, -4.5321044921875, -4.208251953125, -3.8843994140625, -3.560546875, -3.2366943359375, -2.912841796875, -2.5889892578125, -2.26513671875, -1.9412841796875, -1.617431640625, -1.2935791015625, -0.9697265625, -0.6458740234375, -0.322021484375, 0.0018310546875, 0.32568359375, 0.6495361328125, 0.973388671875, 1.2972412109375, 1.62109375, 1.9449462890625, 2.268798828125, 2.5926513671875, 2.91650390625, 3.2403564453125, 3.564208984375, 3.8880615234375, 4.2119140625, 4.5357666015625, 4.859619140625, 5.1834716796875, 5.50732421875, 5.8311767578125, 6.155029296875, 6.4788818359375, 6.802734375, 7.1265869140625, 7.450439453125, 7.7742919921875, 8.09814453125, 8.4219970703125, 8.745849609375, 9.0697021484375, 9.3935546875, 9.7174072265625, 10.041259765625, 10.3651123046875, 10.68896484375, 11.0128173828125, 11.336669921875, 11.6605224609375, 11.984375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 10.0, 7.0, 13.0, 14.0, 35.0, 30.0, 36.0, 66.0, 65.0, 98.0, 119.0, 146.0, 205.0, 295.0, 461.0, 620.0, 1021.0, 1549.0, 3036.0, 6350.0, 15830.0, 54157.0, 5885631.0, 263414.0, 34886.0, 11741.0, 4959.0, 2499.0, 1333.0, 805.0, 522.0, 404.0, 226.0, 221.0, 145.0, 116.0, 105.0, 72.0, 40.0, 46.0, 10.0, 20.0, 14.0, 14.0, 16.0, 12.0, 3.0, 6.0, 4.0, 1.0, 0.0, 3.0, 5.0], "bins": [-35.75, -34.69384765625, -33.6376953125, -32.58154296875, -31.525390625, -30.46923828125, -29.4130859375, -28.35693359375, -27.30078125, -26.24462890625, -25.1884765625, -24.13232421875, -23.076171875, -22.02001953125, -20.9638671875, -19.90771484375, -18.8515625, -17.79541015625, -16.7392578125, -15.68310546875, -14.626953125, -13.57080078125, -12.5146484375, -11.45849609375, -10.40234375, -9.34619140625, -8.2900390625, -7.23388671875, -6.177734375, -5.12158203125, -4.0654296875, -3.00927734375, -1.953125, -0.89697265625, 0.1591796875, 1.21533203125, 2.271484375, 3.32763671875, 4.3837890625, 5.43994140625, 6.49609375, 7.55224609375, 8.6083984375, 9.66455078125, 10.720703125, 11.77685546875, 12.8330078125, 13.88916015625, 14.9453125, 16.00146484375, 17.0576171875, 18.11376953125, 19.169921875, 20.22607421875, 21.2822265625, 22.33837890625, 23.39453125, 24.45068359375, 25.5068359375, 26.56298828125, 27.619140625, 28.67529296875, 29.7314453125, 30.78759765625, 31.84375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 7.0, 2.0, 3.0, 7.0, 9.0, 8.0, 11.0, 15.0, 14.0, 16.0, 25.0, 39.0, 43.0, 52.0, 49.0, 89.0, 186.0, 549.0, 359.0, 170.0, 98.0, 75.0, 45.0, 34.0, 19.0, 16.0, 25.0, 15.0, 9.0, 8.0, 8.0, 6.0, 3.0, 7.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.6953125, -12.3404541015625, -11.985595703125, -11.6307373046875, -11.27587890625, -10.9210205078125, -10.566162109375, -10.2113037109375, -9.8564453125, -9.5015869140625, -9.146728515625, -8.7918701171875, -8.43701171875, -8.0821533203125, -7.727294921875, -7.3724365234375, -7.017578125, -6.6627197265625, -6.307861328125, -5.9530029296875, -5.59814453125, -5.2432861328125, -4.888427734375, -4.5335693359375, -4.1787109375, -3.8238525390625, -3.468994140625, -3.1141357421875, -2.75927734375, -2.4044189453125, -2.049560546875, -1.6947021484375, -1.33984375, -0.9849853515625, -0.630126953125, -0.2752685546875, 0.07958984375, 0.4344482421875, 0.789306640625, 1.1441650390625, 1.4990234375, 1.8538818359375, 2.208740234375, 2.5635986328125, 2.91845703125, 3.2733154296875, 3.628173828125, 3.9830322265625, 4.337890625, 4.6927490234375, 5.047607421875, 5.4024658203125, 5.75732421875, 6.1121826171875, 6.467041015625, 6.8218994140625, 7.1767578125, 7.5316162109375, 7.886474609375, 8.2413330078125, 8.59619140625, 8.9510498046875, 9.305908203125, 9.6607666015625, 10.015625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 33.0, 221.0, 655.0, 59.0, 22.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-223.01712036132812, -212.94561767578125, -202.87411499023438, -192.80262756347656, -182.7311248779297, -172.6596221923828, -162.588134765625, -152.51663208007812, -142.44512939453125, -132.37362670898438, -122.30213165283203, -112.23063659667969, -102.15913391113281, -92.08763122558594, -82.0161361694336, -71.94464111328125, -61.873138427734375, -51.801639556884766, -41.730140686035156, -31.658641815185547, -21.587142944335938, -11.515644073486328, -1.4441452026367188, 8.627349853515625, 18.6988525390625, 28.77035140991211, 38.84185028076172, 48.91334915161133, 58.98484802246094, 69.05635070800781, 79.12784576416016, 89.1993408203125, 99.2708740234375, 109.34237670898438, 119.41387176513672, 129.48536682128906, 139.55686950683594, 149.6283721923828, 159.69985961914062, 169.7713623046875, 179.84286499023438, 189.91436767578125, 199.98587036132812, 210.05735778808594, 220.1288604736328, 230.2003631591797, 240.2718505859375, 250.34335327148438, 260.41485595703125, 270.4863586425781, 280.557861328125, 290.6293640136719, 300.70086669921875, 310.7723388671875, 320.8438415527344, 330.91534423828125, 340.9868469238281, 351.058349609375, 361.1298522949219, 371.20135498046875, 381.2728271484375, 391.3443298339844, 401.41583251953125, 411.4873352050781, 421.558837890625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 3.0, 6.0, 2.0, 7.0, 5.0, 11.0, 24.0, 37.0, 87.0, 262.0, 332.0, 108.0, 41.0, 22.0, 18.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-122.6688232421875, -119.075927734375, -115.4830322265625, -111.89013671875, -108.29723358154297, -104.70433807373047, -101.11144256591797, -97.51854705810547, -93.92564392089844, -90.33274841308594, -86.73985290527344, -83.14695739746094, -79.5540542602539, -75.9611587524414, -72.3682632446289, -68.7753677368164, -65.1824722290039, -61.589576721191406, -57.99667739868164, -54.40378189086914, -50.810882568359375, -47.217987060546875, -43.625091552734375, -40.032196044921875, -36.43929672241211, -32.84640121459961, -29.253501892089844, -25.660606384277344, -22.06770896911621, -18.474811553955078, -14.881916046142578, -11.289018630981445, -7.6961212158203125, -4.103224277496338, -0.5103273391723633, 3.082569122314453, 6.675466537475586, 10.268363952636719, 13.861259460449219, 17.45415687561035, 21.047054290771484, 24.639951705932617, 28.23284912109375, 31.82574462890625, 35.41864013671875, 39.011539459228516, 42.604434967041016, 46.19733428955078, 49.79022979736328, 53.38312530517578, 56.97602462768555, 60.56892013549805, 64.16181945800781, 67.75471496582031, 71.34761047363281, 74.94050598144531, 78.53340148925781, 82.12629699707031, 85.71919250488281, 89.31208801269531, 92.90499114990234, 96.49788665771484, 100.09078216552734, 103.68367767333984, 107.27658081054688]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 2.0, 6.0, 6.0, 7.0, 6.0, 10.0, 8.0, 14.0, 17.0, 25.0, 28.0, 35.0, 38.0, 59.0, 85.0, 96.0, 103.0, 151.0, 166.0, 266.0, 321.0, 414.0, 490.0, 734.0, 1051.0, 1546.0, 2382.0, 4039.0, 6707.0, 12374.0, 24987.0, 72851.0, 1048210.0, 2864738.0, 94704.0, 27795.0, 12622.0, 6513.0, 3808.0, 2475.0, 1611.0, 981.0, 646.0, 391.0, 261.0, 164.0, 129.0, 83.0, 50.0, 29.0, 18.0, 13.0, 10.0, 4.0, 6.0, 5.0], "bins": [-1.29296875, -1.2614898681640625, -1.230010986328125, -1.1985321044921875, -1.16705322265625, -1.1355743408203125, -1.104095458984375, -1.0726165771484375, -1.0411376953125, -1.0096588134765625, -0.978179931640625, -0.9467010498046875, -0.91522216796875, -0.8837432861328125, -0.852264404296875, -0.8207855224609375, -0.789306640625, -0.7578277587890625, -0.726348876953125, -0.6948699951171875, -0.66339111328125, -0.6319122314453125, -0.600433349609375, -0.5689544677734375, -0.5374755859375, -0.5059967041015625, -0.474517822265625, -0.4430389404296875, -0.41156005859375, -0.3800811767578125, -0.348602294921875, -0.3171234130859375, -0.28564453125, -0.2541656494140625, -0.222686767578125, -0.1912078857421875, -0.15972900390625, -0.1282501220703125, -0.096771240234375, -0.0652923583984375, -0.0338134765625, -0.0023345947265625, 0.029144287109375, 0.0606231689453125, 0.09210205078125, 0.1235809326171875, 0.155059814453125, 0.1865386962890625, 0.218017578125, 0.2494964599609375, 0.280975341796875, 0.3124542236328125, 0.34393310546875, 0.3754119873046875, 0.406890869140625, 0.4383697509765625, 0.4698486328125, 0.5013275146484375, 0.532806396484375, 0.5642852783203125, 0.59576416015625, 0.6272430419921875, 0.658721923828125, 0.6902008056640625, 0.7216796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 2.0, 4.0, 8.0, 9.0, 18.0, 35.0, 199.0, 384.0, 231.0, 42.0, 16.0, 15.0, 9.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1619873046875, -0.157989501953125, -0.15399169921875, -0.149993896484375, -0.14599609375, -0.141998291015625, -0.13800048828125, -0.134002685546875, -0.1300048828125, -0.126007080078125, -0.12200927734375, -0.118011474609375, -0.114013671875, -0.110015869140625, -0.10601806640625, -0.102020263671875, -0.0980224609375, -0.094024658203125, -0.09002685546875, -0.086029052734375, -0.08203125, -0.078033447265625, -0.07403564453125, -0.070037841796875, -0.0660400390625, -0.062042236328125, -0.05804443359375, -0.054046630859375, -0.050048828125, -0.046051025390625, -0.04205322265625, -0.038055419921875, -0.0340576171875, -0.030059814453125, -0.02606201171875, -0.022064208984375, -0.01806640625, -0.014068603515625, -0.01007080078125, -0.006072998046875, -0.0020751953125, 0.001922607421875, 0.00592041015625, 0.009918212890625, 0.013916015625, 0.017913818359375, 0.02191162109375, 0.025909423828125, 0.0299072265625, 0.033905029296875, 0.03790283203125, 0.041900634765625, 0.0458984375, 0.049896240234375, 0.05389404296875, 0.057891845703125, 0.0618896484375, 0.065887451171875, 0.06988525390625, 0.073883056640625, 0.077880859375, 0.081878662109375, 0.08587646484375, 0.089874267578125, 0.0938720703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 9.0, 10.0, 19.0, 24.0, 20.0, 48.0, 63.0, 74.0, 118.0, 176.0, 240.0, 424.0, 593.0, 1125.0, 2133.0, 4698.0, 10864.0, 31460.0, 108809.0, 550931.0, 2781530.0, 548049.0, 103443.0, 29095.0, 10557.0, 4589.0, 2271.0, 1166.0, 690.0, 368.0, 229.0, 167.0, 85.0, 60.0, 36.0, 24.0, 22.0, 16.0, 15.0, 4.0, 4.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0390625, -1.0070953369140625, -0.975128173828125, -0.9431610107421875, -0.91119384765625, -0.8792266845703125, -0.847259521484375, -0.8152923583984375, -0.7833251953125, -0.7513580322265625, -0.719390869140625, -0.6874237060546875, -0.65545654296875, -0.6234893798828125, -0.591522216796875, -0.5595550537109375, -0.527587890625, -0.4956207275390625, -0.463653564453125, -0.4316864013671875, -0.39971923828125, -0.3677520751953125, -0.335784912109375, -0.3038177490234375, -0.2718505859375, -0.2398834228515625, -0.207916259765625, -0.1759490966796875, -0.14398193359375, -0.1120147705078125, -0.080047607421875, -0.0480804443359375, -0.01611328125, 0.0158538818359375, 0.047821044921875, 0.0797882080078125, 0.11175537109375, 0.1437225341796875, 0.175689697265625, 0.2076568603515625, 0.2396240234375, 0.2715911865234375, 0.303558349609375, 0.3355255126953125, 0.36749267578125, 0.3994598388671875, 0.431427001953125, 0.4633941650390625, 0.495361328125, 0.5273284912109375, 0.559295654296875, 0.5912628173828125, 0.62322998046875, 0.6551971435546875, 0.687164306640625, 0.7191314697265625, 0.7510986328125, 0.7830657958984375, 0.815032958984375, 0.8470001220703125, 0.87896728515625, 0.9109344482421875, 0.942901611328125, 0.9748687744140625, 1.0068359375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 4.0, 7.0, 4.0, 12.0, 14.0, 14.0, 22.0, 21.0, 25.0, 33.0, 38.0, 45.0, 61.0, 69.0, 98.0, 138.0, 144.0, 175.0, 215.0, 297.0, 396.0, 614.0, 404.0, 290.0, 206.0, 165.0, 146.0, 88.0, 94.0, 60.0, 44.0, 39.0, 27.0, 23.0, 8.0, 7.0, 10.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2174072265625, -0.2105083465576172, -0.20360946655273438, -0.19671058654785156, -0.18981170654296875, -0.18291282653808594, -0.17601394653320312, -0.1691150665283203, -0.1622161865234375, -0.1553173065185547, -0.14841842651367188, -0.14151954650878906, -0.13462066650390625, -0.12772178649902344, -0.12082290649414062, -0.11392402648925781, -0.107025146484375, -0.10012626647949219, -0.09322738647460938, -0.08632850646972656, -0.07942962646484375, -0.07253074645996094, -0.06563186645507812, -0.05873298645019531, -0.0518341064453125, -0.04493522644042969, -0.038036346435546875, -0.031137466430664062, -0.02423858642578125, -0.017339706420898438, -0.010440826416015625, -0.0035419464111328125, 0.00335693359375, 0.010255813598632812, 0.017154693603515625, 0.024053573608398438, 0.03095245361328125, 0.03785133361816406, 0.044750213623046875, 0.05164909362792969, 0.0585479736328125, 0.06544685363769531, 0.07234573364257812, 0.07924461364746094, 0.08614349365234375, 0.09304237365722656, 0.09994125366210938, 0.10684013366699219, 0.113739013671875, 0.12063789367675781, 0.12753677368164062, 0.13443565368652344, 0.14133453369140625, 0.14823341369628906, 0.15513229370117188, 0.1620311737060547, 0.1689300537109375, 0.1758289337158203, 0.18272781372070312, 0.18962669372558594, 0.19652557373046875, 0.20342445373535156, 0.21032333374023438, 0.2172222137451172, 0.22412109375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 12.0, 8.0, 17.0, 19.0, 24.0, 42.0, 49.0, 63.0, 78.0, 102.0, 142.0, 123.0, 90.0, 65.0, 41.0, 34.0, 26.0, 11.0, 12.0, 5.0, 4.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.8650496006011963, -3.777703046798706, -3.690356731414795, -3.6030101776123047, -3.5156636238098145, -3.428317070007324, -3.340970754623413, -3.253624200820923, -3.1662778854370117, -3.0789313316345215, -2.9915850162506104, -2.90423846244812, -2.81689190864563, -2.7295455932617188, -2.6421990394592285, -2.5548524856567383, -2.467505931854248, -2.380159378051758, -2.2928130626678467, -2.2054665088653564, -2.118119955062866, -2.030773639678955, -1.9434270858764648, -1.8560805320739746, -1.768734097480774, -1.6813876628875732, -1.594041109085083, -1.5066946744918823, -1.4193482398986816, -1.3320016860961914, -1.2446552515029907, -1.15730881690979, -1.0699620246887207, -0.9826155304908752, -0.8952690362930298, -0.8079226016998291, -0.7205761075019836, -0.6332296133041382, -0.5458831787109375, -0.45853668451309204, -0.3711901903152466, -0.2838436961174011, -0.19649723172187805, -0.10915076732635498, -0.02180427312850952, 0.06554222106933594, 0.15288865566253662, 0.24023514986038208, 0.32758164405822754, 0.414928138256073, 0.5022746324539185, 0.5896210670471191, 0.6769675612449646, 0.7643140554428101, 0.8516604900360107, 0.9390069842338562, 1.0263534784317017, 1.1136999130249023, 1.2010464668273926, 1.2883929014205933, 1.375739336013794, 1.4630858898162842, 1.5504323244094849, 1.6377787590026855, 1.7251253128051758]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 6.0, 10.0, 8.0, 6.0, 9.0, 13.0, 12.0, 13.0, 14.0, 22.0, 20.0, 20.0, 35.0, 33.0, 37.0, 29.0, 49.0, 50.0, 47.0, 38.0, 33.0, 31.0, 36.0, 51.0, 53.0, 28.0, 44.0, 38.0, 27.0, 25.0, 17.0, 30.0, 22.0, 15.0, 15.0, 15.0, 9.0, 4.0, 7.0, 10.0, 5.0, 1.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.650987148284912, -1.5945276021957397, -1.5380679368972778, -1.4816083908081055, -1.425148844718933, -1.3686892986297607, -1.3122296333312988, -1.2557700872421265, -1.199310541152954, -1.1428509950637817, -1.0863913297653198, -1.0299317836761475, -0.9734722375869751, -0.917012631893158, -0.8605530261993408, -0.8040934801101685, -0.7476338148117065, -0.6911742091178894, -0.634714663028717, -0.5782550573348999, -0.5217955112457275, -0.4653359055519104, -0.40887629985809326, -0.3524167239665985, -0.29595714807510376, -0.239497572183609, -0.18303798139095306, -0.12657839059829712, -0.07011881470680237, -0.013659238815307617, 0.04280036687850952, 0.09925994277000427, 0.15571951866149902, 0.21217909455299377, 0.2686386704444885, 0.32509827613830566, 0.3815578520298004, 0.43801742792129517, 0.4944770336151123, 0.5509365797042847, 0.6073961853981018, 0.663855791091919, 0.7203153371810913, 0.7767749428749084, 0.8332345485687256, 0.889694094657898, 0.9461537003517151, 1.0026133060455322, 1.0590728521347046, 1.115532398223877, 1.1719920635223389, 1.2284516096115112, 1.2849111557006836, 1.3413708209991455, 1.3978303670883179, 1.4542899131774902, 1.5107495784759521, 1.5672091245651245, 1.6236687898635864, 1.6801283359527588, 1.7365878820419312, 1.7930474281311035, 1.8495070934295654, 1.9059666395187378, 1.9624261856079102]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 15.0, 18.0, 19.0, 40.0, 67.0, 111.0, 165.0, 276.0, 605.0, 1181.0, 2585.0, 7520.0, 34849.0, 530043.0, 429170.0, 30072.0, 6936.0, 2507.0, 1123.0, 538.0, 274.0, 156.0, 91.0, 53.0, 36.0, 38.0, 16.0, 14.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.416015625, -1.3687591552734375, -1.321502685546875, -1.2742462158203125, -1.22698974609375, -1.1797332763671875, -1.132476806640625, -1.0852203369140625, -1.0379638671875, -0.9907073974609375, -0.943450927734375, -0.8961944580078125, -0.84893798828125, -0.8016815185546875, -0.754425048828125, -0.7071685791015625, -0.659912109375, -0.6126556396484375, -0.565399169921875, -0.5181427001953125, -0.47088623046875, -0.4236297607421875, -0.376373291015625, -0.3291168212890625, -0.2818603515625, -0.2346038818359375, -0.187347412109375, -0.1400909423828125, -0.09283447265625, -0.0455780029296875, 0.001678466796875, 0.0489349365234375, 0.09619140625, 0.1434478759765625, 0.190704345703125, 0.2379608154296875, 0.28521728515625, 0.3324737548828125, 0.379730224609375, 0.4269866943359375, 0.4742431640625, 0.5214996337890625, 0.568756103515625, 0.6160125732421875, 0.66326904296875, 0.7105255126953125, 0.757781982421875, 0.8050384521484375, 0.852294921875, 0.8995513916015625, 0.946807861328125, 0.9940643310546875, 1.04132080078125, 1.0885772705078125, 1.135833740234375, 1.1830902099609375, 1.2303466796875, 1.2776031494140625, 1.324859619140625, 1.3721160888671875, 1.41937255859375, 1.4666290283203125, 1.513885498046875, 1.5611419677734375, 1.6083984375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 4.0, 6.0, 9.0, 5.0, 17.0, 23.0, 36.0, 72.0, 103.0, 110.0, 155.0, 134.0, 111.0, 76.0, 53.0, 29.0, 18.0, 15.0, 7.0, 3.0, 2.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15234375, -0.1483001708984375, -0.144256591796875, -0.1402130126953125, -0.13616943359375, -0.1321258544921875, -0.128082275390625, -0.1240386962890625, -0.1199951171875, -0.1159515380859375, -0.111907958984375, -0.1078643798828125, -0.10382080078125, -0.0997772216796875, -0.095733642578125, -0.0916900634765625, -0.087646484375, -0.0836029052734375, -0.079559326171875, -0.0755157470703125, -0.07147216796875, -0.0674285888671875, -0.063385009765625, -0.0593414306640625, -0.0552978515625, -0.0512542724609375, -0.047210693359375, -0.0431671142578125, -0.03912353515625, -0.0350799560546875, -0.031036376953125, -0.0269927978515625, -0.02294921875, -0.0189056396484375, -0.014862060546875, -0.0108184814453125, -0.00677490234375, -0.0027313232421875, 0.001312255859375, 0.0053558349609375, 0.0093994140625, 0.0134429931640625, 0.017486572265625, 0.0215301513671875, 0.02557373046875, 0.0296173095703125, 0.033660888671875, 0.0377044677734375, 0.041748046875, 0.0457916259765625, 0.049835205078125, 0.0538787841796875, 0.05792236328125, 0.0619659423828125, 0.066009521484375, 0.0700531005859375, 0.0740966796875, 0.0781402587890625, 0.082183837890625, 0.0862274169921875, 0.09027099609375, 0.0943145751953125, 0.098358154296875, 0.1024017333984375, 0.1064453125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 7.0, 13.0, 10.0, 24.0, 28.0, 30.0, 51.0, 68.0, 121.0, 162.0, 242.0, 435.0, 790.0, 1367.0, 2757.0, 6370.0, 19016.0, 89622.0, 625242.0, 246932.0, 36441.0, 10342.0, 4067.0, 1909.0, 995.0, 537.0, 310.0, 187.0, 135.0, 115.0, 67.0, 37.0, 41.0, 18.0, 17.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1181640625, -1.08056640625, -1.04296875, -1.00537109375, -0.9677734375, -0.93017578125, -0.892578125, -0.85498046875, -0.8173828125, -0.77978515625, -0.7421875, -0.70458984375, -0.6669921875, -0.62939453125, -0.591796875, -0.55419921875, -0.5166015625, -0.47900390625, -0.44140625, -0.40380859375, -0.3662109375, -0.32861328125, -0.291015625, -0.25341796875, -0.2158203125, -0.17822265625, -0.140625, -0.10302734375, -0.0654296875, -0.02783203125, 0.009765625, 0.04736328125, 0.0849609375, 0.12255859375, 0.16015625, 0.19775390625, 0.2353515625, 0.27294921875, 0.310546875, 0.34814453125, 0.3857421875, 0.42333984375, 0.4609375, 0.49853515625, 0.5361328125, 0.57373046875, 0.611328125, 0.64892578125, 0.6865234375, 0.72412109375, 0.76171875, 0.79931640625, 0.8369140625, 0.87451171875, 0.912109375, 0.94970703125, 0.9873046875, 1.02490234375, 1.0625, 1.10009765625, 1.1376953125, 1.17529296875, 1.212890625, 1.25048828125, 1.2880859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 7.0, 9.0, 6.0, 17.0, 11.0, 21.0, 16.0, 21.0, 27.0, 36.0, 30.0, 29.0, 43.0, 47.0, 48.0, 56.0, 45.0, 53.0, 51.0, 55.0, 42.0, 28.0, 44.0, 43.0, 36.0, 24.0, 31.0, 16.0, 25.0, 16.0, 15.0, 17.0, 7.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.6533203125, -0.6349334716796875, -0.616546630859375, -0.5981597900390625, -0.57977294921875, -0.5613861083984375, -0.542999267578125, -0.5246124267578125, -0.5062255859375, -0.4878387451171875, -0.469451904296875, -0.4510650634765625, -0.43267822265625, -0.4142913818359375, -0.395904541015625, -0.3775177001953125, -0.359130859375, -0.3407440185546875, -0.322357177734375, -0.3039703369140625, -0.28558349609375, -0.2671966552734375, -0.248809814453125, -0.2304229736328125, -0.2120361328125, -0.1936492919921875, -0.175262451171875, -0.1568756103515625, -0.13848876953125, -0.1201019287109375, -0.101715087890625, -0.0833282470703125, -0.06494140625, -0.0465545654296875, -0.028167724609375, -0.0097808837890625, 0.00860595703125, 0.0269927978515625, 0.045379638671875, 0.0637664794921875, 0.0821533203125, 0.1005401611328125, 0.118927001953125, 0.1373138427734375, 0.15570068359375, 0.1740875244140625, 0.192474365234375, 0.2108612060546875, 0.229248046875, 0.2476348876953125, 0.266021728515625, 0.2844085693359375, 0.30279541015625, 0.3211822509765625, 0.339569091796875, 0.3579559326171875, 0.3763427734375, 0.3947296142578125, 0.413116455078125, 0.4315032958984375, 0.44989013671875, 0.4682769775390625, 0.486663818359375, 0.5050506591796875, 0.5234375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 8.0, 5.0, 15.0, 18.0, 29.0, 59.0, 66.0, 152.0, 318.0, 969.0, 5229.0, 950711.0, 86874.0, 2881.0, 648.0, 243.0, 130.0, 67.0, 47.0, 19.0, 18.0, 15.0, 10.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.90625, -7.66558837890625, -7.4249267578125, -7.18426513671875, -6.943603515625, -6.70294189453125, -6.4622802734375, -6.22161865234375, -5.98095703125, -5.74029541015625, -5.4996337890625, -5.25897216796875, -5.018310546875, -4.77764892578125, -4.5369873046875, -4.29632568359375, -4.0556640625, -3.81500244140625, -3.5743408203125, -3.33367919921875, -3.093017578125, -2.85235595703125, -2.6116943359375, -2.37103271484375, -2.13037109375, -1.88970947265625, -1.6490478515625, -1.40838623046875, -1.167724609375, -0.92706298828125, -0.6864013671875, -0.44573974609375, -0.205078125, 0.03558349609375, 0.2762451171875, 0.51690673828125, 0.757568359375, 0.99822998046875, 1.2388916015625, 1.47955322265625, 1.72021484375, 1.96087646484375, 2.2015380859375, 2.44219970703125, 2.682861328125, 2.92352294921875, 3.1641845703125, 3.40484619140625, 3.6455078125, 3.88616943359375, 4.1268310546875, 4.36749267578125, 4.608154296875, 4.84881591796875, 5.0894775390625, 5.33013916015625, 5.57080078125, 5.81146240234375, 6.0521240234375, 6.29278564453125, 6.533447265625, 6.77410888671875, 7.0147705078125, 7.25543212890625, 7.49609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 9.0, 7.0, 8.0, 10.0, 18.0, 21.0, 43.0, 73.0, 86.0, 125.0, 169.0, 149.0, 114.0, 64.0, 47.0, 31.0, 17.0, 11.0, 4.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00023925304412841797, -0.00023365672677755356, -0.00022806040942668915, -0.00022246409207582474, -0.00021686777472496033, -0.00021127145737409592, -0.0002056751400232315, -0.0002000788226723671, -0.00019448250532150269, -0.00018888618797063828, -0.00018328987061977386, -0.00017769355326890945, -0.00017209723591804504, -0.00016650091856718063, -0.00016090460121631622, -0.0001553082838654518, -0.0001497119665145874, -0.000144115649163723, -0.00013851933181285858, -0.00013292301446199417, -0.00012732669711112976, -0.00012173037976026535, -0.00011613406240940094, -0.00011053774505853653, -0.00010494142770767212, -9.934511035680771e-05, -9.37487930059433e-05, -8.815247565507889e-05, -8.255615830421448e-05, -7.695984095335007e-05, -7.136352360248566e-05, -6.576720625162125e-05, -6.0170888900756836e-05, -5.4574571549892426e-05, -4.8978254199028015e-05, -4.3381936848163605e-05, -3.7785619497299194e-05, -3.2189302146434784e-05, -2.6592984795570374e-05, -2.0996667444705963e-05, -1.5400350093841553e-05, -9.804032742977142e-06, -4.207715392112732e-06, 1.3886019587516785e-06, 6.984919309616089e-06, 1.25812366604805e-05, 1.817755401134491e-05, 2.377387136220932e-05, 2.937018871307373e-05, 3.496650606393814e-05, 4.056282341480255e-05, 4.615914076566696e-05, 5.175545811653137e-05, 5.735177546739578e-05, 6.294809281826019e-05, 6.85444101691246e-05, 7.414072751998901e-05, 7.973704487085342e-05, 8.533336222171783e-05, 9.092967957258224e-05, 9.652599692344666e-05, 0.00010212231427431107, 0.00010771863162517548, 0.00011331494897603989, 0.0001189112663269043]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 8.0, 5.0, 1.0, 7.0, 3.0, 14.0, 9.0, 17.0, 19.0, 36.0, 61.0, 90.0, 122.0, 184.0, 319.0, 613.0, 1388.0, 4038.0, 18102.0, 595399.0, 405461.0, 16147.0, 3714.0, 1396.0, 580.0, 302.0, 200.0, 106.0, 60.0, 56.0, 24.0, 16.0, 16.0, 16.0, 11.0, 9.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.2734375, -3.17413330078125, -3.0748291015625, -2.97552490234375, -2.876220703125, -2.77691650390625, -2.6776123046875, -2.57830810546875, -2.47900390625, -2.37969970703125, -2.2803955078125, -2.18109130859375, -2.081787109375, -1.98248291015625, -1.8831787109375, -1.78387451171875, -1.6845703125, -1.58526611328125, -1.4859619140625, -1.38665771484375, -1.287353515625, -1.18804931640625, -1.0887451171875, -0.98944091796875, -0.89013671875, -0.79083251953125, -0.6915283203125, -0.59222412109375, -0.492919921875, -0.39361572265625, -0.2943115234375, -0.19500732421875, -0.095703125, 0.00360107421875, 0.1029052734375, 0.20220947265625, 0.301513671875, 0.40081787109375, 0.5001220703125, 0.59942626953125, 0.69873046875, 0.79803466796875, 0.8973388671875, 0.99664306640625, 1.095947265625, 1.19525146484375, 1.2945556640625, 1.39385986328125, 1.4931640625, 1.59246826171875, 1.6917724609375, 1.79107666015625, 1.890380859375, 1.98968505859375, 2.0889892578125, 2.18829345703125, 2.28759765625, 2.38690185546875, 2.4862060546875, 2.58551025390625, 2.684814453125, 2.78411865234375, 2.8834228515625, 2.98272705078125, 3.08203125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 1.0, 6.0, 10.0, 26.0, 33.0, 100.0, 195.0, 260.0, 214.0, 85.0, 39.0, 11.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84375, -1.77386474609375, -1.7039794921875, -1.63409423828125, -1.564208984375, -1.49432373046875, -1.4244384765625, -1.35455322265625, -1.28466796875, -1.21478271484375, -1.1448974609375, -1.07501220703125, -1.005126953125, -0.93524169921875, -0.8653564453125, -0.79547119140625, -0.7255859375, -0.65570068359375, -0.5858154296875, -0.51593017578125, -0.446044921875, -0.37615966796875, -0.3062744140625, -0.23638916015625, -0.16650390625, -0.09661865234375, -0.0267333984375, 0.04315185546875, 0.113037109375, 0.18292236328125, 0.2528076171875, 0.32269287109375, 0.392578125, 0.46246337890625, 0.5323486328125, 0.60223388671875, 0.672119140625, 0.74200439453125, 0.8118896484375, 0.88177490234375, 0.95166015625, 1.02154541015625, 1.0914306640625, 1.16131591796875, 1.231201171875, 1.30108642578125, 1.3709716796875, 1.44085693359375, 1.5107421875, 1.58062744140625, 1.6505126953125, 1.72039794921875, 1.790283203125, 1.86016845703125, 1.9300537109375, 1.99993896484375, 2.06982421875, 2.13970947265625, 2.2095947265625, 2.27947998046875, 2.349365234375, 2.41925048828125, 2.4891357421875, 2.55902099609375, 2.62890625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 16.0, 55.0, 156.0, 338.0, 245.0, 98.0, 39.0, 14.0, 9.0, 10.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.008712768554688, -17.489585876464844, -16.970458984375, -16.451332092285156, -15.932205200195312, -15.413078308105469, -14.893951416015625, -14.374824523925781, -13.855697631835938, -13.336570739746094, -12.81744384765625, -12.298316955566406, -11.779190063476562, -11.260063171386719, -10.740936279296875, -10.221809387207031, -9.702681541442871, -9.183554649353027, -8.664427757263184, -8.14530086517334, -7.626173973083496, -7.107047080993652, -6.58791971206665, -6.068792819976807, -5.549665927886963, -5.030539035797119, -4.511412143707275, -3.9922850131988525, -3.473158121109009, -2.954031229019165, -2.434904098510742, -1.9157772064208984, -1.3966503143310547, -0.8775233626365662, -0.35839641094207764, 0.16073060035705566, 0.6798574924468994, 1.1989843845367432, 1.718111515045166, 2.2372384071350098, 2.7563652992248535, 3.2754921913146973, 3.794619083404541, 4.313746452331543, 4.832873344421387, 5.3520002365112305, 5.871127128601074, 6.390254020690918, 6.909380912780762, 7.4285078048706055, 7.947634696960449, 8.466761589050293, 8.985888481140137, 9.50501537322998, 10.02414321899414, 10.543270111083984, 11.062397003173828, 11.581523895263672, 12.100650787353516, 12.61977767944336, 13.138904571533203, 13.658031463623047, 14.17715835571289, 14.696285247802734, 15.215412139892578]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 11.0, 5.0, 5.0, 9.0, 16.0, 39.0, 54.0, 76.0, 159.0, 158.0, 158.0, 113.0, 80.0, 52.0, 27.0, 14.0, 10.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.976655006408691, -13.551311492919922, -13.125967025756836, -12.700623512268066, -12.275279998779297, -11.849935531616211, -11.424592018127441, -10.999248504638672, -10.573904037475586, -10.148560523986816, -9.72321605682373, -9.297872543334961, -8.872528076171875, -8.447184562683105, -8.021841049194336, -7.596497058868408, -7.1711530685424805, -6.745809078216553, -6.320465087890625, -5.8951215744018555, -5.469777584075928, -5.04443359375, -4.6190900802612305, -4.193746089935303, -3.768402099609375, -3.3430581092834473, -2.9177143573760986, -2.49237060546875, -2.0670266151428223, -1.6416826248168945, -1.216338872909546, -0.7909951210021973, -0.36565208435058594, 0.059691786766052246, 0.48503565788269043, 0.9103795289993286, 1.3357234001159668, 1.7610673904418945, 2.186411142349243, 2.611754894256592, 3.0370988845825195, 3.4624428749084473, 3.887786626815796, 4.3131303787231445, 4.738474369049072, 5.163818359375, 5.5891618728637695, 6.014505863189697, 6.439849853515625, 6.865193843841553, 7.2905378341674805, 7.71588134765625, 8.141225814819336, 8.566569328308105, 8.991912841796875, 9.417257308959961, 9.84260082244873, 10.2679443359375, 10.693288803100586, 11.118632316589355, 11.543975830078125, 11.969320297241211, 12.39466381072998, 12.82000732421875, 13.245351791381836]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 9.0, 26.0, 44.0, 171.0, 1411.0, 133270.0, 4055506.0, 3380.0, 294.0, 76.0, 31.0, 18.0, 8.0, 9.0, 3.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.296875, -7.83984375, -7.3828125, -6.92578125, -6.46875, -6.01171875, -5.5546875, -5.09765625, -4.640625, -4.18359375, -3.7265625, -3.26953125, -2.8125, -2.35546875, -1.8984375, -1.44140625, -0.984375, -0.52734375, -0.0703125, 0.38671875, 0.84375, 1.30078125, 1.7578125, 2.21484375, 2.671875, 3.12890625, 3.5859375, 4.04296875, 4.5, 4.95703125, 5.4140625, 5.87109375, 6.328125, 6.78515625, 7.2421875, 7.69921875, 8.15625, 8.61328125, 9.0703125, 9.52734375, 9.984375, 10.44140625, 10.8984375, 11.35546875, 11.8125, 12.26953125, 12.7265625, 13.18359375, 13.640625, 14.09765625, 14.5546875, 15.01171875, 15.46875, 15.92578125, 16.3828125, 16.83984375, 17.296875, 17.75390625, 18.2109375, 18.66796875, 19.125, 19.58203125, 20.0390625, 20.49609375, 20.953125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 11.0, 2.0, 5.0, 3.0, 13.0, 19.0, 17.0, 32.0, 49.0, 50.0, 86.0, 99.0, 117.0, 99.0, 82.0, 85.0, 69.0, 51.0, 37.0, 26.0, 11.0, 9.0, 10.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1285400390625, -0.12523555755615234, -0.12193107604980469, -0.11862659454345703, -0.11532211303710938, -0.11201763153076172, -0.10871315002441406, -0.1054086685180664, -0.10210418701171875, -0.0987997055053711, -0.09549522399902344, -0.09219074249267578, -0.08888626098632812, -0.08558177947998047, -0.08227729797363281, -0.07897281646728516, -0.0756683349609375, -0.07236385345458984, -0.06905937194824219, -0.06575489044189453, -0.062450408935546875, -0.05914592742919922, -0.05584144592285156, -0.052536964416503906, -0.04923248291015625, -0.045928001403808594, -0.04262351989746094, -0.03931903839111328, -0.036014556884765625, -0.03271007537841797, -0.029405593872070312, -0.026101112365722656, -0.022796630859375, -0.019492149353027344, -0.016187667846679688, -0.012883186340332031, -0.009578704833984375, -0.006274223327636719, -0.0029697418212890625, 0.00033473968505859375, 0.00363922119140625, 0.006943702697753906, 0.010248184204101562, 0.013552665710449219, 0.016857147216796875, 0.02016162872314453, 0.023466110229492188, 0.026770591735839844, 0.0300750732421875, 0.033379554748535156, 0.03668403625488281, 0.03998851776123047, 0.043292999267578125, 0.04659748077392578, 0.04990196228027344, 0.053206443786621094, 0.05651092529296875, 0.059815406799316406, 0.06311988830566406, 0.06642436981201172, 0.06972885131835938, 0.07303333282470703, 0.07633781433105469, 0.07964229583740234, 0.08294677734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 17.0, 22.0, 54.0, 90.0, 216.0, 508.0, 2311.0, 34531.0, 3841955.0, 304917.0, 8651.0, 795.0, 155.0, 30.0, 16.0, 9.0, 7.0, 2.0, 0.0, 2.0], "bins": [-11.3203125, -11.105804443359375, -10.89129638671875, -10.676788330078125, -10.4622802734375, -10.247772216796875, -10.03326416015625, -9.818756103515625, -9.604248046875, -9.389739990234375, -9.17523193359375, -8.960723876953125, -8.7462158203125, -8.531707763671875, -8.31719970703125, -8.102691650390625, -7.88818359375, -7.673675537109375, -7.45916748046875, -7.244659423828125, -7.0301513671875, -6.815643310546875, -6.60113525390625, -6.386627197265625, -6.172119140625, -5.957611083984375, -5.74310302734375, -5.528594970703125, -5.3140869140625, -5.099578857421875, -4.88507080078125, -4.670562744140625, -4.4560546875, -4.241546630859375, -4.02703857421875, -3.812530517578125, -3.5980224609375, -3.383514404296875, -3.16900634765625, -2.954498291015625, -2.739990234375, -2.525482177734375, -2.31097412109375, -2.096466064453125, -1.8819580078125, -1.667449951171875, -1.45294189453125, -1.238433837890625, -1.02392578125, -0.809417724609375, -0.59490966796875, -0.380401611328125, -0.1658935546875, 0.048614501953125, 0.26312255859375, 0.477630615234375, 0.692138671875, 0.906646728515625, 1.12115478515625, 1.335662841796875, 1.5501708984375, 1.764678955078125, 1.97918701171875, 2.193695068359375, 2.408203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 10.0, 8.0, 8.0, 10.0, 11.0, 9.0, 17.0, 29.0, 26.0, 29.0, 36.0, 61.0, 91.0, 111.0, 142.0, 259.0, 691.0, 1229.0, 411.0, 211.0, 163.0, 117.0, 86.0, 62.0, 56.0, 38.0, 30.0, 26.0, 16.0, 18.0, 14.0, 12.0, 9.0, 4.0, 4.0, 8.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2376708984375, -0.23098182678222656, -0.22429275512695312, -0.2176036834716797, -0.21091461181640625, -0.2042255401611328, -0.19753646850585938, -0.19084739685058594, -0.1841583251953125, -0.17746925354003906, -0.17078018188476562, -0.1640911102294922, -0.15740203857421875, -0.1507129669189453, -0.14402389526367188, -0.13733482360839844, -0.130645751953125, -0.12395668029785156, -0.11726760864257812, -0.11057853698730469, -0.10388946533203125, -0.09720039367675781, -0.09051132202148438, -0.08382225036621094, -0.0771331787109375, -0.07044410705566406, -0.06375503540039062, -0.05706596374511719, -0.05037689208984375, -0.04368782043457031, -0.036998748779296875, -0.030309677124023438, -0.02362060546875, -0.016931533813476562, -0.010242462158203125, -0.0035533905029296875, 0.00313568115234375, 0.009824752807617188, 0.016513824462890625, 0.023202896118164062, 0.0298919677734375, 0.03658103942871094, 0.043270111083984375, 0.04995918273925781, 0.05664825439453125, 0.06333732604980469, 0.07002639770507812, 0.07671546936035156, 0.083404541015625, 0.09009361267089844, 0.09678268432617188, 0.10347175598144531, 0.11016082763671875, 0.11684989929199219, 0.12353897094726562, 0.13022804260253906, 0.1369171142578125, 0.14360618591308594, 0.15029525756835938, 0.1569843292236328, 0.16367340087890625, 0.1703624725341797, 0.17705154418945312, 0.18374061584472656, 0.1904296875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 135.0, 804.0, 64.0, 1.0, 2.0, 1.0, 1.0], "bins": [-49.348167419433594, -48.50278854370117, -47.65740966796875, -46.81203079223633, -45.966651916503906, -45.12126922607422, -44.2758903503418, -43.430511474609375, -42.58513259887695, -41.73975372314453, -40.89437484741211, -40.04899597167969, -39.20361328125, -38.35823440551758, -37.512855529785156, -36.667476654052734, -35.82209777832031, -34.97671890258789, -34.13134002685547, -33.28596115112305, -32.440582275390625, -31.59520149230957, -30.749820709228516, -29.904441833496094, -29.059062957763672, -28.21368408203125, -27.368305206298828, -26.522924423217773, -25.67754554748535, -24.83216667175293, -23.986785888671875, -23.141407012939453, -22.29602813720703, -21.45064926147461, -20.605270385742188, -19.759889602661133, -18.91451072692871, -18.06913185119629, -17.223751068115234, -16.378372192382812, -15.532992362976074, -14.687612533569336, -13.842233657836914, -12.996854782104492, -12.151474952697754, -11.306095123291016, -10.460716247558594, -9.615337371826172, -8.769957542419434, -7.9245781898498535, -7.079198837280273, -6.233819484710693, -5.388440132141113, -4.543060779571533, -3.697681427001953, -2.852302074432373, -2.006922721862793, -1.161543369293213, -0.3161640167236328, 0.5292153358459473, 1.3745946884155273, 2.2199740409851074, 3.0653533935546875, 3.9107327461242676, 4.756112098693848]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 6.0, 9.0, 9.0, 6.0, 7.0, 22.0, 31.0, 31.0, 57.0, 60.0, 71.0, 64.0, 94.0, 79.0, 70.0, 87.0, 66.0, 55.0, 47.0, 42.0, 26.0, 24.0, 17.0, 10.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.5356924533843994, -2.4734723567962646, -2.411252021789551, -2.349031925201416, -2.2868118286132812, -2.2245917320251465, -2.1623713970184326, -2.100151300430298, -2.037930965423584, -1.9757107496261597, -1.913490653038025, -1.8512704372406006, -1.7890503406524658, -1.7268301248550415, -1.6646099090576172, -1.6023898124694824, -1.5401697158813477, -1.4779495000839233, -1.4157294034957886, -1.3535091876983643, -1.2912890911102295, -1.2290688753128052, -1.1668486595153809, -1.104628562927246, -1.0424083471298218, -0.9801881909370422, -0.9179680347442627, -0.8557478189468384, -0.7935276627540588, -0.7313075065612793, -0.669087290763855, -0.6068671345710754, -0.5446470975875854, -0.4824269413948059, -0.420206755399704, -0.35798656940460205, -0.2957664132118225, -0.23354625701904297, -0.17132607102394104, -0.10910588502883911, -0.04688572883605957, 0.015334442257881165, 0.0775546133518219, 0.13977478444576263, 0.20199495553970337, 0.2642151117324829, 0.32643529772758484, 0.38865548372268677, 0.4508756399154663, 0.5130957961082458, 0.5753159523010254, 0.6375361680984497, 0.6997563242912292, 0.7619764804840088, 0.8241966962814331, 0.8864168524742126, 0.9486370086669922, 1.0108572244644165, 1.0730773210525513, 1.1352975368499756, 1.1975176334381104, 1.2597378492355347, 1.321958065032959, 1.3841781616210938, 1.446398377418518]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 0.0, 7.0, 13.0, 9.0, 15.0, 15.0, 29.0, 41.0, 39.0, 70.0, 97.0, 145.0, 232.0, 418.0, 589.0, 1076.0, 1951.0, 3748.0, 7787.0, 17549.0, 43447.0, 121715.0, 372033.0, 311783.0, 99785.0, 36574.0, 15138.0, 6667.0, 3375.0, 1697.0, 922.0, 542.0, 367.0, 218.0, 124.0, 104.0, 67.0, 42.0, 34.0, 24.0, 19.0, 18.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.103515625, -1.066619873046875, -1.02972412109375, -0.992828369140625, -0.9559326171875, -0.919036865234375, -0.88214111328125, -0.845245361328125, -0.808349609375, -0.771453857421875, -0.73455810546875, -0.697662353515625, -0.6607666015625, -0.623870849609375, -0.58697509765625, -0.550079345703125, -0.51318359375, -0.476287841796875, -0.43939208984375, -0.402496337890625, -0.3656005859375, -0.328704833984375, -0.29180908203125, -0.254913330078125, -0.218017578125, -0.181121826171875, -0.14422607421875, -0.107330322265625, -0.0704345703125, -0.033538818359375, 0.00335693359375, 0.040252685546875, 0.0771484375, 0.114044189453125, 0.15093994140625, 0.187835693359375, 0.2247314453125, 0.261627197265625, 0.29852294921875, 0.335418701171875, 0.372314453125, 0.409210205078125, 0.44610595703125, 0.483001708984375, 0.5198974609375, 0.556793212890625, 0.59368896484375, 0.630584716796875, 0.66748046875, 0.704376220703125, 0.74127197265625, 0.778167724609375, 0.8150634765625, 0.851959228515625, 0.88885498046875, 0.925750732421875, 0.962646484375, 0.999542236328125, 1.03643798828125, 1.073333740234375, 1.1102294921875, 1.147125244140625, 1.18402099609375, 1.220916748046875, 1.2578125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 11.0, 6.0, 8.0, 16.0, 17.0, 23.0, 29.0, 43.0, 44.0, 61.0, 58.0, 61.0, 88.0, 64.0, 78.0, 69.0, 60.0, 38.0, 47.0, 42.0, 37.0, 26.0, 22.0, 10.0, 7.0, 13.0, 5.0, 2.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0870361328125, -0.08407211303710938, -0.08110809326171875, -0.07814407348632812, -0.0751800537109375, -0.07221603393554688, -0.06925201416015625, -0.06628799438476562, -0.063323974609375, -0.060359954833984375, -0.05739593505859375, -0.054431915283203125, -0.0514678955078125, -0.048503875732421875, -0.04553985595703125, -0.042575836181640625, -0.03961181640625, -0.036647796630859375, -0.03368377685546875, -0.030719757080078125, -0.0277557373046875, -0.024791717529296875, -0.02182769775390625, -0.018863677978515625, -0.015899658203125, -0.012935638427734375, -0.00997161865234375, -0.007007598876953125, -0.0040435791015625, -0.001079559326171875, 0.00188446044921875, 0.004848480224609375, 0.0078125, 0.010776519775390625, 0.01374053955078125, 0.016704559326171875, 0.0196685791015625, 0.022632598876953125, 0.02559661865234375, 0.028560638427734375, 0.031524658203125, 0.034488677978515625, 0.03745269775390625, 0.040416717529296875, 0.0433807373046875, 0.046344757080078125, 0.04930877685546875, 0.052272796630859375, 0.05523681640625, 0.058200836181640625, 0.06116485595703125, 0.06412887573242188, 0.0670928955078125, 0.07005691528320312, 0.07302093505859375, 0.07598495483398438, 0.078948974609375, 0.08191299438476562, 0.08487701416015625, 0.08784103393554688, 0.0908050537109375, 0.09376907348632812, 0.09673309326171875, 0.09969711303710938, 0.1026611328125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 1.0, 8.0, 1.0, 9.0, 7.0, 6.0, 9.0, 11.0, 18.0, 19.0, 28.0, 31.0, 52.0, 94.0, 633.0, 12169.0, 993302.0, 40843.0, 987.0, 106.0, 53.0, 34.0, 37.0, 24.0, 11.0, 15.0, 10.0, 7.0, 10.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0390625, -5.85394287109375, -5.6688232421875, -5.48370361328125, -5.298583984375, -5.11346435546875, -4.9283447265625, -4.74322509765625, -4.55810546875, -4.37298583984375, -4.1878662109375, -4.00274658203125, -3.817626953125, -3.63250732421875, -3.4473876953125, -3.26226806640625, -3.0771484375, -2.89202880859375, -2.7069091796875, -2.52178955078125, -2.336669921875, -2.15155029296875, -1.9664306640625, -1.78131103515625, -1.59619140625, -1.41107177734375, -1.2259521484375, -1.04083251953125, -0.855712890625, -0.67059326171875, -0.4854736328125, -0.30035400390625, -0.115234375, 0.06988525390625, 0.2550048828125, 0.44012451171875, 0.625244140625, 0.81036376953125, 0.9954833984375, 1.18060302734375, 1.36572265625, 1.55084228515625, 1.7359619140625, 1.92108154296875, 2.106201171875, 2.29132080078125, 2.4764404296875, 2.66156005859375, 2.8466796875, 3.03179931640625, 3.2169189453125, 3.40203857421875, 3.587158203125, 3.77227783203125, 3.9573974609375, 4.14251708984375, 4.32763671875, 4.51275634765625, 4.6978759765625, 4.88299560546875, 5.068115234375, 5.25323486328125, 5.4383544921875, 5.62347412109375, 5.80859375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 3.0, 6.0, 7.0, 7.0, 9.0, 11.0, 17.0, 21.0, 24.0, 24.0, 26.0, 33.0, 42.0, 52.0, 36.0, 45.0, 49.0, 51.0, 53.0, 56.0, 44.0, 33.0, 46.0, 48.0, 43.0, 35.0, 25.0, 18.0, 26.0, 22.0, 26.0, 10.0, 13.0, 8.0, 8.0, 8.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.394775390625, -0.3811302185058594, -0.36748504638671875, -0.3538398742675781, -0.3401947021484375, -0.3265495300292969, -0.31290435791015625, -0.2992591857910156, -0.285614013671875, -0.2719688415527344, -0.25832366943359375, -0.24467849731445312, -0.2310333251953125, -0.21738815307617188, -0.20374298095703125, -0.19009780883789062, -0.17645263671875, -0.16280746459960938, -0.14916229248046875, -0.13551712036132812, -0.1218719482421875, -0.10822677612304688, -0.09458160400390625, -0.08093643188476562, -0.067291259765625, -0.053646087646484375, -0.04000091552734375, -0.026355743408203125, -0.0127105712890625, 0.000934600830078125, 0.01457977294921875, 0.028224945068359375, 0.0418701171875, 0.055515289306640625, 0.06916046142578125, 0.08280563354492188, 0.0964508056640625, 0.11009597778320312, 0.12374114990234375, 0.13738632202148438, 0.151031494140625, 0.16467666625976562, 0.17832183837890625, 0.19196701049804688, 0.2056121826171875, 0.21925735473632812, 0.23290252685546875, 0.24654769897460938, 0.26019287109375, 0.2738380432128906, 0.28748321533203125, 0.3011283874511719, 0.3147735595703125, 0.3284187316894531, 0.34206390380859375, 0.3557090759277344, 0.369354248046875, 0.3829994201660156, 0.39664459228515625, 0.4102897644042969, 0.4239349365234375, 0.4375801086425781, 0.45122528076171875, 0.4648704528808594, 0.478515625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 12.0, 10.0, 12.0, 25.0, 27.0, 70.0, 152.0, 1478.0, 966717.0, 79038.0, 709.0, 115.0, 65.0, 27.0, 28.0, 16.0, 7.0, 12.0, 7.0, 2.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.34375, -16.799560546875, -16.25537109375, -15.711181640625, -15.1669921875, -14.622802734375, -14.07861328125, -13.534423828125, -12.990234375, -12.446044921875, -11.90185546875, -11.357666015625, -10.8134765625, -10.269287109375, -9.72509765625, -9.180908203125, -8.63671875, -8.092529296875, -7.54833984375, -7.004150390625, -6.4599609375, -5.915771484375, -5.37158203125, -4.827392578125, -4.283203125, -3.739013671875, -3.19482421875, -2.650634765625, -2.1064453125, -1.562255859375, -1.01806640625, -0.473876953125, 0.0703125, 0.614501953125, 1.15869140625, 1.702880859375, 2.2470703125, 2.791259765625, 3.33544921875, 3.879638671875, 4.423828125, 4.968017578125, 5.51220703125, 6.056396484375, 6.6005859375, 7.144775390625, 7.68896484375, 8.233154296875, 8.77734375, 9.321533203125, 9.86572265625, 10.409912109375, 10.9541015625, 11.498291015625, 12.04248046875, 12.586669921875, 13.130859375, 13.675048828125, 14.21923828125, 14.763427734375, 15.3076171875, 15.851806640625, 16.39599609375, 16.940185546875, 17.484375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 7.0, 6.0, 15.0, 19.0, 49.0, 101.0, 271.0, 280.0, 115.0, 46.0, 24.0, 20.0, 12.0, 8.0, 10.0, 5.0, 6.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005211830139160156, -0.0005038455128669739, -0.00048650801181793213, -0.0004691705107688904, -0.00045183300971984863, -0.0004344955086708069, -0.00041715800762176514, -0.0003998205065727234, -0.00038248300552368164, -0.0003651455044746399, -0.00034780800342559814, -0.0003304705023765564, -0.00031313300132751465, -0.0002957955002784729, -0.00027845799922943115, -0.0002611204981803894, -0.00024378299713134766, -0.0002264454960823059, -0.00020910799503326416, -0.0001917704939842224, -0.00017443299293518066, -0.00015709549188613892, -0.00013975799083709717, -0.00012242048978805542, -0.00010508298873901367, -8.774548768997192e-05, -7.040798664093018e-05, -5.307048559188843e-05, -3.573298454284668e-05, -1.839548349380493e-05, -1.0579824447631836e-06, 1.6279518604278564e-05, 3.361701965332031e-05, 5.095452070236206e-05, 6.829202175140381e-05, 8.562952280044556e-05, 0.0001029670238494873, 0.00012030452489852905, 0.0001376420259475708, 0.00015497952699661255, 0.0001723170280456543, 0.00018965452909469604, 0.0002069920301437378, 0.00022432953119277954, 0.0002416670322418213, 0.00025900453329086304, 0.0002763420343399048, 0.00029367953538894653, 0.0003110170364379883, 0.00032835453748703003, 0.0003456920385360718, 0.0003630295395851135, 0.0003803670406341553, 0.000397704541683197, 0.00041504204273223877, 0.0004323795437812805, 0.00044971704483032227, 0.000467054545879364, 0.00048439204692840576, 0.0005017295479774475, 0.0005190670490264893, 0.000536404550075531, 0.0005537420511245728, 0.0005710795521736145, 0.0005884170532226562]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 8.0, 13.0, 24.0, 37.0, 34.0, 63.0, 88.0, 136.0, 224.0, 322.0, 507.0, 859.0, 1583.0, 3035.0, 7240.0, 18806.0, 68627.0, 677885.0, 210570.0, 36169.0, 12133.0, 4898.0, 2345.0, 1163.0, 677.0, 394.0, 225.0, 161.0, 105.0, 80.0, 33.0, 24.0, 18.0, 20.0, 8.0, 5.0, 3.0, 3.0, 5.0, 5.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.09765625, -3.96868896484375, -3.8397216796875, -3.71075439453125, -3.581787109375, -3.45281982421875, -3.3238525390625, -3.19488525390625, -3.06591796875, -2.93695068359375, -2.8079833984375, -2.67901611328125, -2.550048828125, -2.42108154296875, -2.2921142578125, -2.16314697265625, -2.0341796875, -1.90521240234375, -1.7762451171875, -1.64727783203125, -1.518310546875, -1.38934326171875, -1.2603759765625, -1.13140869140625, -1.00244140625, -0.87347412109375, -0.7445068359375, -0.61553955078125, -0.486572265625, -0.35760498046875, -0.2286376953125, -0.09967041015625, 0.029296875, 0.15826416015625, 0.2872314453125, 0.41619873046875, 0.545166015625, 0.67413330078125, 0.8031005859375, 0.93206787109375, 1.06103515625, 1.19000244140625, 1.3189697265625, 1.44793701171875, 1.576904296875, 1.70587158203125, 1.8348388671875, 1.96380615234375, 2.0927734375, 2.22174072265625, 2.3507080078125, 2.47967529296875, 2.608642578125, 2.73760986328125, 2.8665771484375, 2.99554443359375, 3.12451171875, 3.25347900390625, 3.3824462890625, 3.51141357421875, 3.640380859375, 3.76934814453125, 3.8983154296875, 4.02728271484375, 4.15625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 6.0, 5.0, 9.0, 14.0, 15.0, 29.0, 55.0, 98.0, 185.0, 236.0, 140.0, 76.0, 31.0, 25.0, 23.0, 16.0, 11.0, 6.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.490234375, -2.413116455078125, -2.33599853515625, -2.258880615234375, -2.1817626953125, -2.104644775390625, -2.02752685546875, -1.950408935546875, -1.873291015625, -1.796173095703125, -1.71905517578125, -1.641937255859375, -1.5648193359375, -1.487701416015625, -1.41058349609375, -1.333465576171875, -1.25634765625, -1.179229736328125, -1.10211181640625, -1.024993896484375, -0.9478759765625, -0.870758056640625, -0.79364013671875, -0.716522216796875, -0.639404296875, -0.562286376953125, -0.48516845703125, -0.408050537109375, -0.3309326171875, -0.253814697265625, -0.17669677734375, -0.099578857421875, -0.0224609375, 0.054656982421875, 0.13177490234375, 0.208892822265625, 0.2860107421875, 0.363128662109375, 0.44024658203125, 0.517364501953125, 0.594482421875, 0.671600341796875, 0.74871826171875, 0.825836181640625, 0.9029541015625, 0.980072021484375, 1.05718994140625, 1.134307861328125, 1.21142578125, 1.288543701171875, 1.36566162109375, 1.442779541015625, 1.5198974609375, 1.597015380859375, 1.67413330078125, 1.751251220703125, 1.828369140625, 1.905487060546875, 1.98260498046875, 2.059722900390625, 2.1368408203125, 2.213958740234375, 2.29107666015625, 2.368194580078125, 2.4453125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 30.0, 78.0, 191.0, 295.0, 251.0, 102.0, 25.0, 18.0, 4.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.916030883789062, -16.365196228027344, -15.814361572265625, -15.263526916503906, -14.712692260742188, -14.161857604980469, -13.61102294921875, -13.060188293457031, -12.509353637695312, -11.958518981933594, -11.407684326171875, -10.856849670410156, -10.306015014648438, -9.755180358886719, -9.204345703125, -8.653511047363281, -8.102676391601562, -7.551841735839844, -7.001007080078125, -6.450172424316406, -5.8993377685546875, -5.348503112792969, -4.79766845703125, -4.246833801269531, -3.6959991455078125, -3.1451644897460938, -2.594329833984375, -2.0434951782226562, -1.4926605224609375, -0.9418258666992188, -0.3909912109375, 0.15984344482421875, 0.7106781005859375, 1.2615127563476562, 1.812347412109375, 2.3631820678710938, 2.9140167236328125, 3.4648513793945312, 4.01568603515625, 4.566520690917969, 5.1173553466796875, 5.668190002441406, 6.219024658203125, 6.769859313964844, 7.3206939697265625, 7.871528625488281, 8.42236328125, 8.973197937011719, 9.524032592773438, 10.074867248535156, 10.625701904296875, 11.176536560058594, 11.727371215820312, 12.278205871582031, 12.82904052734375, 13.379875183105469, 13.930709838867188, 14.481544494628906, 15.032379150390625, 15.583213806152344, 16.134048461914062, 16.68488311767578, 17.2357177734375, 17.78655242919922, 18.337387084960938]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 6.0, 10.0, 13.0, 14.0, 23.0, 31.0, 36.0, 49.0, 66.0, 94.0, 70.0, 81.0, 85.0, 68.0, 67.0, 68.0, 50.0, 36.0, 31.0, 26.0, 26.0, 11.0, 15.0, 5.0, 4.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.705593109130859, -5.540289878845215, -5.3749871253967285, -5.209684371948242, -5.044381141662598, -4.879077911376953, -4.713775157928467, -4.5484724044799805, -4.383169174194336, -4.217865943908691, -4.052563190460205, -3.8872601985931396, -3.721957206726074, -3.556654214859009, -3.3913512229919434, -3.226048231124878, -3.0607452392578125, -2.895442247390747, -2.7301392555236816, -2.564836263656616, -2.399533271789551, -2.2342302799224854, -2.06892728805542, -1.9036242961883545, -1.738321304321289, -1.5730183124542236, -1.4077153205871582, -1.2424123287200928, -1.0771093368530273, -0.9118063449859619, -0.7465033531188965, -0.581200361251831, -0.41589784622192383, -0.2505948543548584, -0.08529186248779297, 0.08001112937927246, 0.2453141212463379, 0.4106171131134033, 0.5759201049804688, 0.7412230968475342, 0.9065260887145996, 1.071829080581665, 1.2371320724487305, 1.402435064315796, 1.5677380561828613, 1.7330410480499268, 1.8983440399169922, 2.0636470317840576, 2.228950023651123, 2.3942530155181885, 2.559556007385254, 2.7248589992523193, 2.8901619911193848, 3.05546498298645, 3.2207679748535156, 3.386070966720581, 3.5513739585876465, 3.716676950454712, 3.8819799423217773, 4.047283172607422, 4.212585926055908, 4.3778886795043945, 4.543191909790039, 4.708495140075684, 4.87379789352417]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 8.0, 6.0, 0.0, 10.0, 14.0, 6.0, 11.0, 15.0, 14.0, 34.0, 72.0, 178.0, 661.0, 3294.0, 33259.0, 3856183.0, 287459.0, 10807.0, 1370.0, 322.0, 146.0, 82.0, 41.0, 40.0, 43.0, 40.0, 29.0, 20.0, 19.0, 13.0, 6.0, 9.0, 15.0, 6.0, 10.0, 6.0, 4.0, 7.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0], "bins": [-7.90625, -7.68536376953125, -7.4644775390625, -7.24359130859375, -7.022705078125, -6.80181884765625, -6.5809326171875, -6.36004638671875, -6.13916015625, -5.91827392578125, -5.6973876953125, -5.47650146484375, -5.255615234375, -5.03472900390625, -4.8138427734375, -4.59295654296875, -4.3720703125, -4.15118408203125, -3.9302978515625, -3.70941162109375, -3.488525390625, -3.26763916015625, -3.0467529296875, -2.82586669921875, -2.60498046875, -2.38409423828125, -2.1632080078125, -1.94232177734375, -1.721435546875, -1.50054931640625, -1.2796630859375, -1.05877685546875, -0.837890625, -0.61700439453125, -0.3961181640625, -0.17523193359375, 0.045654296875, 0.26654052734375, 0.4874267578125, 0.70831298828125, 0.92919921875, 1.15008544921875, 1.3709716796875, 1.59185791015625, 1.812744140625, 2.03363037109375, 2.2545166015625, 2.47540283203125, 2.6962890625, 2.91717529296875, 3.1380615234375, 3.35894775390625, 3.579833984375, 3.80072021484375, 4.0216064453125, 4.24249267578125, 4.46337890625, 4.68426513671875, 4.9051513671875, 5.12603759765625, 5.346923828125, 5.56781005859375, 5.7886962890625, 6.00958251953125, 6.23046875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 7.0, 17.0, 21.0, 23.0, 39.0, 82.0, 85.0, 111.0, 110.0, 105.0, 113.0, 91.0, 67.0, 51.0, 31.0, 18.0, 16.0, 9.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0809326171875, -0.07589149475097656, -0.07085037231445312, -0.06580924987792969, -0.06076812744140625, -0.05572700500488281, -0.050685882568359375, -0.04564476013183594, -0.0406036376953125, -0.03556251525878906, -0.030521392822265625, -0.025480270385742188, -0.02043914794921875, -0.015398025512695312, -0.010356903076171875, -0.0053157806396484375, -0.000274658203125, 0.0047664642333984375, 0.009807586669921875, 0.014848709106445312, 0.01988983154296875, 0.024930953979492188, 0.029972076416015625, 0.03501319885253906, 0.0400543212890625, 0.04509544372558594, 0.050136566162109375, 0.05517768859863281, 0.06021881103515625, 0.06525993347167969, 0.07030105590820312, 0.07534217834472656, 0.08038330078125, 0.08542442321777344, 0.09046554565429688, 0.09550666809082031, 0.10054779052734375, 0.10558891296386719, 0.11063003540039062, 0.11567115783691406, 0.1207122802734375, 0.12575340270996094, 0.13079452514648438, 0.1358356475830078, 0.14087677001953125, 0.1459178924560547, 0.15095901489257812, 0.15600013732910156, 0.161041259765625, 0.16608238220214844, 0.17112350463867188, 0.1761646270751953, 0.18120574951171875, 0.1862468719482422, 0.19128799438476562, 0.19632911682128906, 0.2013702392578125, 0.20641136169433594, 0.21145248413085938, 0.2164936065673828, 0.22153472900390625, 0.2265758514404297, 0.23161697387695312, 0.23665809631347656, 0.24169921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 14.0, 44.0, 72.0, 180.0, 630.0, 50751.0, 4136869.0, 4962.0, 436.0, 149.0, 95.0, 34.0, 18.0, 10.0, 7.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.75, -7.208251953125, -6.66650390625, -6.124755859375, -5.5830078125, -5.041259765625, -4.49951171875, -3.957763671875, -3.416015625, -2.874267578125, -2.33251953125, -1.790771484375, -1.2490234375, -0.707275390625, -0.16552734375, 0.376220703125, 0.91796875, 1.459716796875, 2.00146484375, 2.543212890625, 3.0849609375, 3.626708984375, 4.16845703125, 4.710205078125, 5.251953125, 5.793701171875, 6.33544921875, 6.877197265625, 7.4189453125, 7.960693359375, 8.50244140625, 9.044189453125, 9.5859375, 10.127685546875, 10.66943359375, 11.211181640625, 11.7529296875, 12.294677734375, 12.83642578125, 13.378173828125, 13.919921875, 14.461669921875, 15.00341796875, 15.545166015625, 16.0869140625, 16.628662109375, 17.17041015625, 17.712158203125, 18.25390625, 18.795654296875, 19.33740234375, 19.879150390625, 20.4208984375, 20.962646484375, 21.50439453125, 22.046142578125, 22.587890625, 23.129638671875, 23.67138671875, 24.213134765625, 24.7548828125, 25.296630859375, 25.83837890625, 26.380126953125, 26.921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 10.0, 28.0, 31.0, 44.0, 73.0, 133.0, 223.0, 437.0, 1593.0, 783.0, 297.0, 150.0, 111.0, 53.0, 42.0, 26.0, 14.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.67626953125, -0.6611366271972656, -0.6460037231445312, -0.6308708190917969, -0.6157379150390625, -0.6006050109863281, -0.5854721069335938, -0.5703392028808594, -0.555206298828125, -0.5400733947753906, -0.5249404907226562, -0.5098075866699219, -0.4946746826171875, -0.4795417785644531, -0.46440887451171875, -0.4492759704589844, -0.43414306640625, -0.4190101623535156, -0.40387725830078125, -0.3887443542480469, -0.3736114501953125, -0.3584785461425781, -0.34334564208984375, -0.3282127380371094, -0.313079833984375, -0.2979469299316406, -0.28281402587890625, -0.2676811218261719, -0.2525482177734375, -0.23741531372070312, -0.22228240966796875, -0.20714950561523438, -0.1920166015625, -0.17688369750976562, -0.16175079345703125, -0.14661788940429688, -0.1314849853515625, -0.11635208129882812, -0.10121917724609375, -0.08608627319335938, -0.070953369140625, -0.055820465087890625, -0.04068756103515625, -0.025554656982421875, -0.0104217529296875, 0.004711151123046875, 0.01984405517578125, 0.034976959228515625, 0.05010986328125, 0.06524276733398438, 0.08037567138671875, 0.09550857543945312, 0.1106414794921875, 0.12577438354492188, 0.14090728759765625, 0.15604019165039062, 0.171173095703125, 0.18630599975585938, 0.20143890380859375, 0.21657180786132812, 0.2317047119140625, 0.24683761596679688, 0.26197052001953125, 0.2771034240722656, 0.292236328125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [7.0, 264.0, 728.0, 21.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3375675678253174, -1.2624499797821045, -0.1873323917388916, 0.8877851963043213, 1.9629027843475342, 3.038020372390747, 4.113138198852539, 5.188255310058594, 6.263373374938965, 7.338490962982178, 8.41360855102539, 9.488725662231445, 10.563843727111816, 11.638961791992188, 12.714078903198242, 13.789196014404297, 14.864314079284668, 15.939432144165039, 17.014549255371094, 18.08966636657715, 19.164783477783203, 20.23990249633789, 21.315019607543945, 22.39013671875, 23.465253829956055, 24.54037094116211, 25.615489959716797, 26.69060707092285, 27.765724182128906, 28.84084129333496, 29.915958404541016, 30.991077423095703, 32.066192626953125, 33.14131164550781, 34.216426849365234, 35.29154586791992, 36.366661071777344, 37.44178009033203, 38.51689910888672, 39.59201431274414, 40.66713333129883, 41.742252349853516, 42.81736755371094, 43.892486572265625, 44.96760559082031, 46.042720794677734, 47.11783981323242, 48.192955017089844, 49.26807403564453, 50.34319305419922, 51.41830825805664, 52.49342727661133, 53.56854248046875, 54.64366149902344, 55.718780517578125, 56.79389572143555, 57.869014739990234, 58.94413375854492, 60.019248962402344, 61.09436798095703, 62.16948699951172, 63.24460220336914, 64.31971740722656, 65.39483642578125, 66.46995544433594]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 4.0, 9.0, 17.0, 18.0, 24.0, 39.0, 44.0, 57.0, 49.0, 68.0, 84.0, 77.0, 73.0, 74.0, 77.0, 64.0, 62.0, 50.0, 33.0, 28.0, 21.0, 7.0, 10.0, 12.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7874598503112793, -2.7095694541931152, -2.631679058074951, -2.553788661956787, -2.475898265838623, -2.398008108139038, -2.320117712020874, -2.24222731590271, -2.164336919784546, -2.086446523666382, -2.0085561275482178, -1.9306658506393433, -1.8527754545211792, -1.7748850584030151, -1.6969947814941406, -1.6191043853759766, -1.5412139892578125, -1.4633235931396484, -1.3854331970214844, -1.3075429201126099, -1.2296525239944458, -1.1517621278762817, -1.0738718509674072, -0.9959814548492432, -0.9180910587310791, -0.840200662612915, -0.7623103260993958, -0.6844199895858765, -0.6065295934677124, -0.5286391973495483, -0.45074886083602905, -0.37285852432250977, -0.2949681282043457, -0.21707776188850403, -0.13918739557266235, -0.06129702925682068, 0.016593337059020996, 0.09448370337486267, 0.17237406969070435, 0.25026440620422363, 0.3281548023223877, 0.40604516863822937, 0.48393553495407104, 0.5618258714675903, 0.6397162675857544, 0.7176066637039185, 0.7954970002174377, 0.873387336730957, 0.9512777328491211, 1.0291681289672852, 1.1070585250854492, 1.1849488019943237, 1.2628391981124878, 1.3407295942306519, 1.4186198711395264, 1.4965102672576904, 1.5744006633758545, 1.6522910594940186, 1.7301814556121826, 1.8080717325210571, 1.8859621286392212, 1.9638525247573853, 2.0417428016662598, 2.119633197784424, 2.197523593902588]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 0.0, 3.0, 10.0, 4.0, 10.0, 10.0, 15.0, 11.0, 20.0, 13.0, 28.0, 34.0, 23.0, 22.0, 41.0, 42.0, 84.0, 281.0, 1930.0, 20877.0, 287481.0, 658859.0, 71798.0, 5801.0, 645.0, 158.0, 62.0, 42.0, 26.0, 25.0, 29.0, 29.0, 15.0, 22.0, 22.0, 16.0, 10.0, 15.0, 10.0, 11.0, 4.0, 6.0, 5.0, 4.0, 0.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.84765625, -2.74310302734375, -2.6385498046875, -2.53399658203125, -2.429443359375, -2.32489013671875, -2.2203369140625, -2.11578369140625, -2.01123046875, -1.90667724609375, -1.8021240234375, -1.69757080078125, -1.593017578125, -1.48846435546875, -1.3839111328125, -1.27935791015625, -1.1748046875, -1.07025146484375, -0.9656982421875, -0.86114501953125, -0.756591796875, -0.65203857421875, -0.5474853515625, -0.44293212890625, -0.33837890625, -0.23382568359375, -0.1292724609375, -0.02471923828125, 0.079833984375, 0.18438720703125, 0.2889404296875, 0.39349365234375, 0.498046875, 0.60260009765625, 0.7071533203125, 0.81170654296875, 0.916259765625, 1.02081298828125, 1.1253662109375, 1.22991943359375, 1.33447265625, 1.43902587890625, 1.5435791015625, 1.64813232421875, 1.752685546875, 1.85723876953125, 1.9617919921875, 2.06634521484375, 2.1708984375, 2.27545166015625, 2.3800048828125, 2.48455810546875, 2.589111328125, 2.69366455078125, 2.7982177734375, 2.90277099609375, 3.00732421875, 3.11187744140625, 3.2164306640625, 3.32098388671875, 3.425537109375, 3.53009033203125, 3.6346435546875, 3.73919677734375, 3.84375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 6.0, 8.0, 9.0, 14.0, 34.0, 27.0, 39.0, 50.0, 47.0, 49.0, 61.0, 65.0, 68.0, 68.0, 71.0, 61.0, 59.0, 51.0, 57.0, 41.0, 30.0, 25.0, 20.0, 10.0, 8.0, 7.0, 8.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11407470703125, -0.1097249984741211, -0.10537528991699219, -0.10102558135986328, -0.09667587280273438, -0.09232616424560547, -0.08797645568847656, -0.08362674713134766, -0.07927703857421875, -0.07492733001708984, -0.07057762145996094, -0.06622791290283203, -0.061878204345703125, -0.05752849578857422, -0.05317878723144531, -0.048829078674316406, -0.0444793701171875, -0.040129661560058594, -0.03577995300292969, -0.03143024444580078, -0.027080535888671875, -0.02273082733154297, -0.018381118774414062, -0.014031410217285156, -0.00968170166015625, -0.005331993103027344, -0.0009822845458984375, 0.0033674240112304688, 0.007717132568359375, 0.012066841125488281, 0.016416549682617188, 0.020766258239746094, 0.025115966796875, 0.029465675354003906, 0.03381538391113281, 0.03816509246826172, 0.042514801025390625, 0.04686450958251953, 0.05121421813964844, 0.055563926696777344, 0.05991363525390625, 0.06426334381103516, 0.06861305236816406, 0.07296276092529297, 0.07731246948242188, 0.08166217803955078, 0.08601188659667969, 0.0903615951538086, 0.0947113037109375, 0.0990610122680664, 0.10341072082519531, 0.10776042938232422, 0.11211013793945312, 0.11645984649658203, 0.12080955505371094, 0.12515926361083984, 0.12950897216796875, 0.13385868072509766, 0.13820838928222656, 0.14255809783935547, 0.14690780639648438, 0.15125751495361328, 0.1556072235107422, 0.1599569320678711, 0.164306640625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 9.0, 4.0, 12.0, 14.0, 19.0, 32.0, 42.0, 61.0, 123.0, 223.0, 449.0, 952.0, 2595.0, 8238.0, 31951.0, 154113.0, 490573.0, 278891.0, 59699.0, 13931.0, 3924.0, 1436.0, 582.0, 276.0, 152.0, 91.0, 53.0, 31.0, 22.0, 17.0, 17.0, 4.0, 6.0, 6.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.62890625, -2.56268310546875, -2.4964599609375, -2.43023681640625, -2.364013671875, -2.29779052734375, -2.2315673828125, -2.16534423828125, -2.09912109375, -2.03289794921875, -1.9666748046875, -1.90045166015625, -1.834228515625, -1.76800537109375, -1.7017822265625, -1.63555908203125, -1.5693359375, -1.50311279296875, -1.4368896484375, -1.37066650390625, -1.304443359375, -1.23822021484375, -1.1719970703125, -1.10577392578125, -1.03955078125, -0.97332763671875, -0.9071044921875, -0.84088134765625, -0.774658203125, -0.70843505859375, -0.6422119140625, -0.57598876953125, -0.509765625, -0.44354248046875, -0.3773193359375, -0.31109619140625, -0.244873046875, -0.17864990234375, -0.1124267578125, -0.04620361328125, 0.02001953125, 0.08624267578125, 0.1524658203125, 0.21868896484375, 0.284912109375, 0.35113525390625, 0.4173583984375, 0.48358154296875, 0.5498046875, 0.61602783203125, 0.6822509765625, 0.74847412109375, 0.814697265625, 0.88092041015625, 0.9471435546875, 1.01336669921875, 1.07958984375, 1.14581298828125, 1.2120361328125, 1.27825927734375, 1.344482421875, 1.41070556640625, 1.4769287109375, 1.54315185546875, 1.609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 5.0, 2.0, 7.0, 6.0, 11.0, 17.0, 18.0, 18.0, 19.0, 21.0, 16.0, 22.0, 31.0, 28.0, 40.0, 35.0, 38.0, 46.0, 36.0, 45.0, 41.0, 34.0, 52.0, 35.0, 34.0, 35.0, 32.0, 37.0, 33.0, 17.0, 30.0, 25.0, 16.0, 13.0, 21.0, 13.0, 17.0, 7.0, 12.0, 6.0, 5.0, 4.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.57421875, -0.5565643310546875, -0.538909912109375, -0.5212554931640625, -0.50360107421875, -0.4859466552734375, -0.468292236328125, -0.4506378173828125, -0.4329833984375, -0.4153289794921875, -0.397674560546875, -0.3800201416015625, -0.36236572265625, -0.3447113037109375, -0.327056884765625, -0.3094024658203125, -0.291748046875, -0.2740936279296875, -0.256439208984375, -0.2387847900390625, -0.22113037109375, -0.2034759521484375, -0.185821533203125, -0.1681671142578125, -0.1505126953125, -0.1328582763671875, -0.115203857421875, -0.0975494384765625, -0.07989501953125, -0.0622406005859375, -0.044586181640625, -0.0269317626953125, -0.00927734375, 0.0083770751953125, 0.026031494140625, 0.0436859130859375, 0.06134033203125, 0.0789947509765625, 0.096649169921875, 0.1143035888671875, 0.1319580078125, 0.1496124267578125, 0.167266845703125, 0.1849212646484375, 0.20257568359375, 0.2202301025390625, 0.237884521484375, 0.2555389404296875, 0.273193359375, 0.2908477783203125, 0.308502197265625, 0.3261566162109375, 0.34381103515625, 0.3614654541015625, 0.379119873046875, 0.3967742919921875, 0.4144287109375, 0.4320831298828125, 0.449737548828125, 0.4673919677734375, 0.48504638671875, 0.5027008056640625, 0.520355224609375, 0.5380096435546875, 0.5556640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 7.0, 15.0, 25.0, 32.0, 43.0, 70.0, 116.0, 188.0, 330.0, 686.0, 1804.0, 5425.0, 20949.0, 118015.0, 560332.0, 281354.0, 44659.0, 9591.0, 2811.0, 1021.0, 442.0, 239.0, 139.0, 71.0, 40.0, 37.0, 31.0, 22.0, 7.0, 12.0, 8.0, 10.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.669921875, -2.59722900390625, -2.5245361328125, -2.45184326171875, -2.379150390625, -2.30645751953125, -2.2337646484375, -2.16107177734375, -2.08837890625, -2.01568603515625, -1.9429931640625, -1.87030029296875, -1.797607421875, -1.72491455078125, -1.6522216796875, -1.57952880859375, -1.5068359375, -1.43414306640625, -1.3614501953125, -1.28875732421875, -1.216064453125, -1.14337158203125, -1.0706787109375, -0.99798583984375, -0.92529296875, -0.85260009765625, -0.7799072265625, -0.70721435546875, -0.634521484375, -0.56182861328125, -0.4891357421875, -0.41644287109375, -0.34375, -0.27105712890625, -0.1983642578125, -0.12567138671875, -0.052978515625, 0.01971435546875, 0.0924072265625, 0.16510009765625, 0.23779296875, 0.31048583984375, 0.3831787109375, 0.45587158203125, 0.528564453125, 0.60125732421875, 0.6739501953125, 0.74664306640625, 0.8193359375, 0.89202880859375, 0.9647216796875, 1.03741455078125, 1.110107421875, 1.18280029296875, 1.2554931640625, 1.32818603515625, 1.40087890625, 1.47357177734375, 1.5462646484375, 1.61895751953125, 1.691650390625, 1.76434326171875, 1.8370361328125, 1.90972900390625, 1.982421875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 8.0, 13.0, 12.0, 20.0, 24.0, 34.0, 53.0, 58.0, 95.0, 93.0, 110.0, 108.0, 97.0, 77.0, 52.0, 45.0, 19.0, 20.0, 14.0, 14.0, 9.0, 10.0, 3.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027680397033691406, -0.0002678297460079193, -0.00025885552167892456, -0.0002498812973499298, -0.00024090707302093506, -0.0002319328486919403, -0.00022295862436294556, -0.0002139844000339508, -0.00020501017570495605, -0.0001960359513759613, -0.00018706172704696655, -0.0001780875027179718, -0.00016911327838897705, -0.0001601390540599823, -0.00015116482973098755, -0.0001421906054019928, -0.00013321638107299805, -0.0001242421567440033, -0.00011526793241500854, -0.0001062937080860138, -9.731948375701904e-05, -8.834525942802429e-05, -7.937103509902954e-05, -7.039681077003479e-05, -6.142258644104004e-05, -5.244836211204529e-05, -4.347413778305054e-05, -3.4499913454055786e-05, -2.5525689125061035e-05, -1.6551464796066284e-05, -7.577240467071533e-06, 1.3969838619232178e-06, 1.0371208190917969e-05, 1.934543251991272e-05, 2.831965684890747e-05, 3.729388117790222e-05, 4.626810550689697e-05, 5.5242329835891724e-05, 6.421655416488647e-05, 7.319077849388123e-05, 8.216500282287598e-05, 9.113922715187073e-05, 0.00010011345148086548, 0.00010908767580986023, 0.00011806190013885498, 0.00012703612446784973, 0.00013601034879684448, 0.00014498457312583923, 0.00015395879745483398, 0.00016293302178382874, 0.00017190724611282349, 0.00018088147044181824, 0.000189855694770813, 0.00019882991909980774, 0.0002078041434288025, 0.00021677836775779724, 0.000225752592086792, 0.00023472681641578674, 0.0002437010407447815, 0.00025267526507377625, 0.000261649489402771, 0.00027062371373176575, 0.0002795979380607605, 0.00028857216238975525, 0.00029754638671875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 10.0, 5.0, 8.0, 4.0, 10.0, 9.0, 22.0, 10.0, 36.0, 52.0, 76.0, 111.0, 199.0, 356.0, 707.0, 1616.0, 5069.0, 20402.0, 144151.0, 652984.0, 188471.0, 25108.0, 5668.0, 1819.0, 739.0, 323.0, 208.0, 117.0, 82.0, 53.0, 37.0, 20.0, 19.0, 13.0, 12.0, 8.0, 5.0, 3.0, 1.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0], "bins": [-2.583984375, -2.506988525390625, -2.42999267578125, -2.352996826171875, -2.2760009765625, -2.199005126953125, -2.12200927734375, -2.045013427734375, -1.968017578125, -1.891021728515625, -1.81402587890625, -1.737030029296875, -1.6600341796875, -1.583038330078125, -1.50604248046875, -1.429046630859375, -1.35205078125, -1.275054931640625, -1.19805908203125, -1.121063232421875, -1.0440673828125, -0.967071533203125, -0.89007568359375, -0.813079833984375, -0.736083984375, -0.659088134765625, -0.58209228515625, -0.505096435546875, -0.4281005859375, -0.351104736328125, -0.27410888671875, -0.197113037109375, -0.1201171875, -0.043121337890625, 0.03387451171875, 0.110870361328125, 0.1878662109375, 0.264862060546875, 0.34185791015625, 0.418853759765625, 0.495849609375, 0.572845458984375, 0.64984130859375, 0.726837158203125, 0.8038330078125, 0.880828857421875, 0.95782470703125, 1.034820556640625, 1.11181640625, 1.188812255859375, 1.26580810546875, 1.342803955078125, 1.4197998046875, 1.496795654296875, 1.57379150390625, 1.650787353515625, 1.727783203125, 1.804779052734375, 1.88177490234375, 1.958770751953125, 2.0357666015625, 2.112762451171875, 2.18975830078125, 2.266754150390625, 2.34375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 10.0, 17.0, 15.0, 19.0, 31.0, 58.0, 82.0, 101.0, 99.0, 111.0, 100.0, 93.0, 80.0, 60.0, 42.0, 28.0, 14.0, 14.0, 10.0, 7.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1123046875, -1.075897216796875, -1.03948974609375, -1.003082275390625, -0.9666748046875, -0.930267333984375, -0.89385986328125, -0.857452392578125, -0.821044921875, -0.784637451171875, -0.74822998046875, -0.711822509765625, -0.6754150390625, -0.639007568359375, -0.60260009765625, -0.566192626953125, -0.52978515625, -0.493377685546875, -0.45697021484375, -0.420562744140625, -0.3841552734375, -0.347747802734375, -0.31134033203125, -0.274932861328125, -0.238525390625, -0.202117919921875, -0.16571044921875, -0.129302978515625, -0.0928955078125, -0.056488037109375, -0.02008056640625, 0.016326904296875, 0.052734375, 0.089141845703125, 0.12554931640625, 0.161956787109375, 0.1983642578125, 0.234771728515625, 0.27117919921875, 0.307586669921875, 0.343994140625, 0.380401611328125, 0.41680908203125, 0.453216552734375, 0.4896240234375, 0.526031494140625, 0.56243896484375, 0.598846435546875, 0.63525390625, 0.671661376953125, 0.70806884765625, 0.744476318359375, 0.7808837890625, 0.817291259765625, 0.85369873046875, 0.890106201171875, 0.926513671875, 0.962921142578125, 0.99932861328125, 1.035736083984375, 1.0721435546875, 1.108551025390625, 1.14495849609375, 1.181365966796875, 1.2177734375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 12.0, 68.0, 390.0, 436.0, 83.0, 18.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.533979415893555, -8.197861671447754, -6.861743927001953, -5.5256266593933105, -4.18950891494751, -2.853391170501709, -1.5172739028930664, -0.18115615844726562, 1.1549615859985352, 2.491079330444336, 3.8271968364715576, 5.163314342498779, 6.49943208694458, 7.835549831390381, 9.171667098999023, 10.507784843444824, 11.843902587890625, 13.180020332336426, 14.516138076782227, 15.852254867553711, 17.188373565673828, 18.524490356445312, 19.860607147216797, 21.196725845336914, 22.53284454345703, 23.868961334228516, 25.205080032348633, 26.541196823120117, 27.877315521240234, 29.21343231201172, 30.549549102783203, 31.88566780090332, 33.22178268432617, 34.557899475097656, 35.89401626586914, 37.23013687133789, 38.566253662109375, 39.90237045288086, 41.238487243652344, 42.574607849121094, 43.91072463989258, 45.24684143066406, 46.58295822143555, 47.9190788269043, 49.25519561767578, 50.591312408447266, 51.92742919921875, 53.2635498046875, 54.59966278076172, 55.9357795715332, 57.27189636230469, 58.60801696777344, 59.94413375854492, 61.280250549316406, 62.61636734008789, 63.952484130859375, 65.28860473632812, 66.62472534179688, 67.9608383178711, 69.29695892333984, 70.63307189941406, 71.96919250488281, 73.30531311035156, 74.64142608642578, 75.97754669189453]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 5.0, 4.0, 2.0, 2.0, 8.0, 5.0, 6.0, 13.0, 14.0, 19.0, 31.0, 28.0, 41.0, 44.0, 59.0, 57.0, 68.0, 73.0, 57.0, 72.0, 64.0, 58.0, 56.0, 57.0, 38.0, 29.0, 21.0, 26.0, 14.0, 9.0, 13.0, 2.0, 6.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.645059585571289, -4.440197944641113, -4.235335826873779, -4.030473709106445, -3.8256120681762695, -3.6207501888275146, -3.4158883094787598, -3.211026430130005, -3.00616455078125, -2.801302671432495, -2.5964407920837402, -2.3915789127349854, -2.1867170333862305, -1.9818551540374756, -1.7769932746887207, -1.5721313953399658, -1.367269515991211, -1.162407636642456, -0.9575457572937012, -0.7526838779449463, -0.5478219985961914, -0.3429601192474365, -0.13809823989868164, 0.06676363945007324, 0.2716255187988281, 0.476487398147583, 0.6813492774963379, 0.8862111568450928, 1.0910730361938477, 1.2959349155426025, 1.5007967948913574, 1.7056586742401123, 1.9105205535888672, 2.115382432937622, 2.320244312286377, 2.525106191635132, 2.7299680709838867, 2.9348299503326416, 3.1396918296813965, 3.3445537090301514, 3.5494155883789062, 3.754277467727661, 3.959139347076416, 4.16400146484375, 4.368863105773926, 4.573724746704102, 4.7785868644714355, 4.9834489822387695, 5.188310623168945, 5.393172264099121, 5.598034381866455, 5.802896499633789, 6.007758140563965, 6.212619781494141, 6.417481899261475, 6.622344017028809, 6.827205657958984, 7.03206729888916, 7.236929416656494, 7.441791534423828, 7.646653175354004, 7.85151481628418, 8.056377410888672, 8.261239051818848, 8.466100692749023]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 8.0, 15.0, 24.0, 37.0, 90.0, 279.0, 1109.0, 14584.0, 4038357.0, 135510.0, 3389.0, 550.0, 185.0, 79.0, 46.0, 14.0, 10.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1796875, -3.7913818359375, -3.403076171875, -3.0147705078125, -2.62646484375, -2.2381591796875, -1.849853515625, -1.4615478515625, -1.0732421875, -0.6849365234375, -0.296630859375, 0.0916748046875, 0.47998046875, 0.8682861328125, 1.256591796875, 1.6448974609375, 2.033203125, 2.4215087890625, 2.809814453125, 3.1981201171875, 3.58642578125, 3.9747314453125, 4.363037109375, 4.7513427734375, 5.1396484375, 5.5279541015625, 5.916259765625, 6.3045654296875, 6.69287109375, 7.0811767578125, 7.469482421875, 7.8577880859375, 8.24609375, 8.6343994140625, 9.022705078125, 9.4110107421875, 9.79931640625, 10.1876220703125, 10.575927734375, 10.9642333984375, 11.3525390625, 11.7408447265625, 12.129150390625, 12.5174560546875, 12.90576171875, 13.2940673828125, 13.682373046875, 14.0706787109375, 14.458984375, 14.8472900390625, 15.235595703125, 15.6239013671875, 16.01220703125, 16.4005126953125, 16.788818359375, 17.1771240234375, 17.5654296875, 17.9537353515625, 18.342041015625, 18.7303466796875, 19.11865234375, 19.5069580078125, 19.895263671875, 20.2835693359375, 20.671875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 1.0, 5.0, 5.0, 5.0, 14.0, 18.0, 20.0, 26.0, 42.0, 40.0, 50.0, 62.0, 62.0, 49.0, 64.0, 76.0, 71.0, 56.0, 65.0, 52.0, 40.0, 39.0, 36.0, 23.0, 20.0, 20.0, 11.0, 12.0, 8.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1353759765625, -0.13004112243652344, -0.12470626831054688, -0.11937141418457031, -0.11403656005859375, -0.10870170593261719, -0.10336685180664062, -0.09803199768066406, -0.0926971435546875, -0.08736228942871094, -0.08202743530273438, -0.07669258117675781, -0.07135772705078125, -0.06602287292480469, -0.060688018798828125, -0.05535316467285156, -0.050018310546875, -0.04468345642089844, -0.039348602294921875, -0.03401374816894531, -0.02867889404296875, -0.023344039916992188, -0.018009185791015625, -0.012674331665039062, -0.0073394775390625, -0.0020046234130859375, 0.003330230712890625, 0.008665084838867188, 0.01399993896484375, 0.019334793090820312, 0.024669647216796875, 0.030004501342773438, 0.03533935546875, 0.04067420959472656, 0.046009063720703125, 0.05134391784667969, 0.05667877197265625, 0.06201362609863281, 0.06734848022460938, 0.07268333435058594, 0.0780181884765625, 0.08335304260253906, 0.08868789672851562, 0.09402275085449219, 0.09935760498046875, 0.10469245910644531, 0.11002731323242188, 0.11536216735839844, 0.120697021484375, 0.12603187561035156, 0.13136672973632812, 0.1367015838623047, 0.14203643798828125, 0.1473712921142578, 0.15270614624023438, 0.15804100036621094, 0.1633758544921875, 0.16871070861816406, 0.17404556274414062, 0.1793804168701172, 0.18471527099609375, 0.1900501251220703, 0.19538497924804688, 0.20071983337402344, 0.2060546875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 11.0, 31.0, 54.0, 90.0, 127.0, 244.0, 486.0, 84251.0, 4107435.0, 885.0, 260.0, 187.0, 109.0, 68.0, 29.0, 16.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.625, -14.71435546875, -13.8037109375, -12.89306640625, -11.982421875, -11.07177734375, -10.1611328125, -9.25048828125, -8.33984375, -7.42919921875, -6.5185546875, -5.60791015625, -4.697265625, -3.78662109375, -2.8759765625, -1.96533203125, -1.0546875, -0.14404296875, 0.7666015625, 1.67724609375, 2.587890625, 3.49853515625, 4.4091796875, 5.31982421875, 6.23046875, 7.14111328125, 8.0517578125, 8.96240234375, 9.873046875, 10.78369140625, 11.6943359375, 12.60498046875, 13.515625, 14.42626953125, 15.3369140625, 16.24755859375, 17.158203125, 18.06884765625, 18.9794921875, 19.89013671875, 20.80078125, 21.71142578125, 22.6220703125, 23.53271484375, 24.443359375, 25.35400390625, 26.2646484375, 27.17529296875, 28.0859375, 28.99658203125, 29.9072265625, 30.81787109375, 31.728515625, 32.63916015625, 33.5498046875, 34.46044921875, 35.37109375, 36.28173828125, 37.1923828125, 38.10302734375, 39.013671875, 39.92431640625, 40.8349609375, 41.74560546875, 42.65625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 9.0, 32.0, 69.0, 195.0, 643.0, 2448.0, 468.0, 137.0, 38.0, 23.0, 12.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.029296875, -0.98333740234375, -0.9373779296875, -0.89141845703125, -0.845458984375, -0.79949951171875, -0.7535400390625, -0.70758056640625, -0.66162109375, -0.61566162109375, -0.5697021484375, -0.52374267578125, -0.477783203125, -0.43182373046875, -0.3858642578125, -0.33990478515625, -0.2939453125, -0.24798583984375, -0.2020263671875, -0.15606689453125, -0.110107421875, -0.06414794921875, -0.0181884765625, 0.02777099609375, 0.07373046875, 0.11968994140625, 0.1656494140625, 0.21160888671875, 0.257568359375, 0.30352783203125, 0.3494873046875, 0.39544677734375, 0.44140625, 0.48736572265625, 0.5333251953125, 0.57928466796875, 0.625244140625, 0.67120361328125, 0.7171630859375, 0.76312255859375, 0.80908203125, 0.85504150390625, 0.9010009765625, 0.94696044921875, 0.992919921875, 1.03887939453125, 1.0848388671875, 1.13079833984375, 1.1767578125, 1.22271728515625, 1.2686767578125, 1.31463623046875, 1.360595703125, 1.40655517578125, 1.4525146484375, 1.49847412109375, 1.54443359375, 1.59039306640625, 1.6363525390625, 1.68231201171875, 1.728271484375, 1.77423095703125, 1.8201904296875, 1.86614990234375, 1.912109375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 13.0, 88.0, 768.0, 124.0, 14.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.58824157714844, -42.15888595581055, -40.729530334472656, -39.3001708984375, -37.87081527709961, -36.44145965576172, -35.01210403442383, -33.58274841308594, -32.15338897705078, -30.72403335571289, -29.294675827026367, -27.865320205688477, -26.435962677001953, -25.006607055664062, -23.577251434326172, -22.14789390563965, -20.718538284301758, -19.289182662963867, -17.859825134277344, -16.430469512939453, -15.00111198425293, -13.571756362915039, -12.142399787902832, -10.713043212890625, -9.283686637878418, -7.854330062866211, -6.424973487854004, -4.995617389678955, -3.566260814666748, -2.136904239654541, -0.7075481414794922, 0.7218084335327148, 2.151165008544922, 3.580521583557129, 5.009878158569336, 6.439234256744385, 7.868590831756592, 9.29794692993164, 10.727303504943848, 12.156660079956055, 13.586016654968262, 15.015373229980469, 16.44472885131836, 17.874086380004883, 19.303442001342773, 20.732799530029297, 22.162155151367188, 23.591510772705078, 25.0208683013916, 26.450223922729492, 27.879581451416016, 29.308937072753906, 30.73829460144043, 32.16765213012695, 33.597007751464844, 35.026363372802734, 36.455718994140625, 37.885074615478516, 39.314430236816406, 40.74378967285156, 42.17314529418945, 43.602500915527344, 45.031856536865234, 46.461212158203125, 47.89057159423828]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 9.0, 16.0, 17.0, 30.0, 35.0, 45.0, 52.0, 66.0, 69.0, 87.0, 84.0, 93.0, 79.0, 61.0, 70.0, 53.0, 34.0, 36.0, 17.0, 17.0, 8.0, 6.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00689172744751, -3.8794171810150146, -3.7519426345825195, -3.6244678497314453, -3.49699330329895, -3.369518756866455, -3.242043972015381, -3.1145694255828857, -2.9870948791503906, -2.8596203327178955, -2.7321457862854004, -2.604671001434326, -2.477196455001831, -2.349721908569336, -2.2222471237182617, -2.0947725772857666, -1.9672980308532715, -1.8398234844207764, -1.7123488187789917, -1.584874153137207, -1.457399606704712, -1.3299250602722168, -1.2024503946304321, -1.0749757289886475, -0.9475011825561523, -0.8200265765190125, -0.6925519704818726, -0.5650773644447327, -0.4376027584075928, -0.3101281523704529, -0.182653546333313, -0.055178940296173096, 0.072296142578125, 0.1997707486152649, 0.3272453546524048, 0.4547199606895447, 0.5821945667266846, 0.7096691727638245, 0.8371437788009644, 0.9646183848381042, 1.0920929908752441, 1.2195675373077393, 1.347042202949524, 1.4745168685913086, 1.6019914150238037, 1.7294659614562988, 1.8569406270980835, 1.9844152927398682, 2.1118898391723633, 2.2393643856048584, 2.3668389320373535, 2.4943137168884277, 2.621788263320923, 2.749262809753418, 2.876737594604492, 3.0042121410369873, 3.1316866874694824, 3.2591612339019775, 3.3866357803344727, 3.514110565185547, 3.641585111618042, 3.769059658050537, 3.8965344429016113, 4.024008750915527, 4.151483535766602]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 7.0, 8.0, 10.0, 9.0, 20.0, 10.0, 16.0, 29.0, 26.0, 37.0, 48.0, 87.0, 130.0, 285.0, 504.0, 1084.0, 2649.0, 10690.0, 73798.0, 516290.0, 383521.0, 47618.0, 7587.0, 2143.0, 817.0, 445.0, 259.0, 117.0, 85.0, 47.0, 28.0, 26.0, 17.0, 15.0, 15.0, 23.0, 13.0, 12.0, 4.0, 9.0, 4.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.841796875, -3.713287353515625, -3.58477783203125, -3.456268310546875, -3.3277587890625, -3.199249267578125, -3.07073974609375, -2.942230224609375, -2.813720703125, -2.685211181640625, -2.55670166015625, -2.428192138671875, -2.2996826171875, -2.171173095703125, -2.04266357421875, -1.914154052734375, -1.78564453125, -1.657135009765625, -1.52862548828125, -1.400115966796875, -1.2716064453125, -1.143096923828125, -1.01458740234375, -0.886077880859375, -0.757568359375, -0.629058837890625, -0.50054931640625, -0.372039794921875, -0.2435302734375, -0.115020751953125, 0.01348876953125, 0.141998291015625, 0.2705078125, 0.399017333984375, 0.52752685546875, 0.656036376953125, 0.7845458984375, 0.913055419921875, 1.04156494140625, 1.170074462890625, 1.298583984375, 1.427093505859375, 1.55560302734375, 1.684112548828125, 1.8126220703125, 1.941131591796875, 2.06964111328125, 2.198150634765625, 2.32666015625, 2.455169677734375, 2.58367919921875, 2.712188720703125, 2.8406982421875, 2.969207763671875, 3.09771728515625, 3.226226806640625, 3.354736328125, 3.483245849609375, 3.61175537109375, 3.740264892578125, 3.8687744140625, 3.997283935546875, 4.12579345703125, 4.254302978515625, 4.3828125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 8.0, 17.0, 25.0, 34.0, 39.0, 47.0, 55.0, 64.0, 84.0, 97.0, 81.0, 83.0, 76.0, 63.0, 61.0, 53.0, 36.0, 26.0, 20.0, 11.0, 6.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.266845703125, -0.258087158203125, -0.24932861328125, -0.240570068359375, -0.2318115234375, -0.223052978515625, -0.21429443359375, -0.205535888671875, -0.19677734375, -0.188018798828125, -0.17926025390625, -0.170501708984375, -0.1617431640625, -0.152984619140625, -0.14422607421875, -0.135467529296875, -0.126708984375, -0.117950439453125, -0.10919189453125, -0.100433349609375, -0.0916748046875, -0.082916259765625, -0.07415771484375, -0.065399169921875, -0.056640625, -0.047882080078125, -0.03912353515625, -0.030364990234375, -0.0216064453125, -0.012847900390625, -0.00408935546875, 0.004669189453125, 0.013427734375, 0.022186279296875, 0.03094482421875, 0.039703369140625, 0.0484619140625, 0.057220458984375, 0.06597900390625, 0.074737548828125, 0.08349609375, 0.092254638671875, 0.10101318359375, 0.109771728515625, 0.1185302734375, 0.127288818359375, 0.13604736328125, 0.144805908203125, 0.153564453125, 0.162322998046875, 0.17108154296875, 0.179840087890625, 0.1885986328125, 0.197357177734375, 0.20611572265625, 0.214874267578125, 0.2236328125, 0.232391357421875, 0.24114990234375, 0.249908447265625, 0.2586669921875, 0.267425537109375, 0.27618408203125, 0.284942626953125, 0.293701171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 14.0, 10.0, 15.0, 17.0, 26.0, 39.0, 52.0, 94.0, 203.0, 533.0, 1590.0, 5334.0, 24171.0, 164001.0, 604320.0, 208113.0, 30630.0, 6434.0, 1782.0, 614.0, 245.0, 104.0, 54.0, 24.0, 26.0, 18.0, 18.0, 15.0, 8.0, 8.0, 12.0, 3.0, 2.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.109375, -3.00762939453125, -2.9058837890625, -2.80413818359375, -2.702392578125, -2.60064697265625, -2.4989013671875, -2.39715576171875, -2.29541015625, -2.19366455078125, -2.0919189453125, -1.99017333984375, -1.888427734375, -1.78668212890625, -1.6849365234375, -1.58319091796875, -1.4814453125, -1.37969970703125, -1.2779541015625, -1.17620849609375, -1.074462890625, -0.97271728515625, -0.8709716796875, -0.76922607421875, -0.66748046875, -0.56573486328125, -0.4639892578125, -0.36224365234375, -0.260498046875, -0.15875244140625, -0.0570068359375, 0.04473876953125, 0.146484375, 0.24822998046875, 0.3499755859375, 0.45172119140625, 0.553466796875, 0.65521240234375, 0.7569580078125, 0.85870361328125, 0.96044921875, 1.06219482421875, 1.1639404296875, 1.26568603515625, 1.367431640625, 1.46917724609375, 1.5709228515625, 1.67266845703125, 1.7744140625, 1.87615966796875, 1.9779052734375, 2.07965087890625, 2.181396484375, 2.28314208984375, 2.3848876953125, 2.48663330078125, 2.58837890625, 2.69012451171875, 2.7918701171875, 2.89361572265625, 2.995361328125, 3.09710693359375, 3.1988525390625, 3.30059814453125, 3.40234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 8.0, 11.0, 11.0, 16.0, 16.0, 25.0, 27.0, 22.0, 21.0, 29.0, 29.0, 31.0, 42.0, 35.0, 47.0, 33.0, 45.0, 38.0, 47.0, 32.0, 40.0, 44.0, 41.0, 34.0, 31.0, 31.0, 35.0, 16.0, 24.0, 20.0, 20.0, 14.0, 12.0, 11.0, 10.0, 16.0, 10.0, 3.0, 8.0, 6.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.83642578125, -0.8103103637695312, -0.7841949462890625, -0.7580795288085938, -0.731964111328125, -0.7058486938476562, -0.6797332763671875, -0.6536178588867188, -0.62750244140625, -0.6013870239257812, -0.5752716064453125, -0.5491561889648438, -0.523040771484375, -0.49692535400390625, -0.4708099365234375, -0.44469451904296875, -0.4185791015625, -0.39246368408203125, -0.3663482666015625, -0.34023284912109375, -0.314117431640625, -0.28800201416015625, -0.2618865966796875, -0.23577117919921875, -0.20965576171875, -0.18354034423828125, -0.1574249267578125, -0.13130950927734375, -0.105194091796875, -0.07907867431640625, -0.0529632568359375, -0.02684783935546875, -0.000732421875, 0.02538299560546875, 0.0514984130859375, 0.07761383056640625, 0.103729248046875, 0.12984466552734375, 0.1559600830078125, 0.18207550048828125, 0.20819091796875, 0.23430633544921875, 0.2604217529296875, 0.28653717041015625, 0.312652587890625, 0.33876800537109375, 0.3648834228515625, 0.39099884033203125, 0.4171142578125, 0.44322967529296875, 0.4693450927734375, 0.49546051025390625, 0.521575927734375, 0.5476913452148438, 0.5738067626953125, 0.5999221801757812, 0.62603759765625, 0.6521530151367188, 0.6782684326171875, 0.7043838500976562, 0.730499267578125, 0.7566146850585938, 0.7827301025390625, 0.8088455200195312, 0.8349609375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 4.0, 9.0, 17.0, 30.0, 48.0, 87.0, 135.0, 269.0, 553.0, 1254.0, 3308.0, 11445.0, 76354.0, 632188.0, 284546.0, 28573.0, 5986.0, 2079.0, 802.0, 356.0, 220.0, 107.0, 68.0, 46.0, 19.0, 12.0, 8.0, 8.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.435546875, -3.34210205078125, -3.2486572265625, -3.15521240234375, -3.061767578125, -2.96832275390625, -2.8748779296875, -2.78143310546875, -2.68798828125, -2.59454345703125, -2.5010986328125, -2.40765380859375, -2.314208984375, -2.22076416015625, -2.1273193359375, -2.03387451171875, -1.9404296875, -1.84698486328125, -1.7535400390625, -1.66009521484375, -1.566650390625, -1.47320556640625, -1.3797607421875, -1.28631591796875, -1.19287109375, -1.09942626953125, -1.0059814453125, -0.91253662109375, -0.819091796875, -0.72564697265625, -0.6322021484375, -0.53875732421875, -0.4453125, -0.35186767578125, -0.2584228515625, -0.16497802734375, -0.071533203125, 0.02191162109375, 0.1153564453125, 0.20880126953125, 0.30224609375, 0.39569091796875, 0.4891357421875, 0.58258056640625, 0.676025390625, 0.76947021484375, 0.8629150390625, 0.95635986328125, 1.0498046875, 1.14324951171875, 1.2366943359375, 1.33013916015625, 1.423583984375, 1.51702880859375, 1.6104736328125, 1.70391845703125, 1.79736328125, 1.89080810546875, 1.9842529296875, 2.07769775390625, 2.171142578125, 2.26458740234375, 2.3580322265625, 2.45147705078125, 2.544921875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 10.0, 24.0, 16.0, 31.0, 61.0, 74.0, 103.0, 137.0, 158.0, 119.0, 85.0, 59.0, 48.0, 22.0, 16.0, 14.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003528594970703125, -0.0003422647714614868, -0.00033167004585266113, -0.00032107532024383545, -0.00031048059463500977, -0.0002998858690261841, -0.0002892911434173584, -0.0002786964178085327, -0.00026810169219970703, -0.00025750696659088135, -0.00024691224098205566, -0.00023631751537322998, -0.0002257227897644043, -0.0002151280641555786, -0.00020453333854675293, -0.00019393861293792725, -0.00018334388732910156, -0.00017274916172027588, -0.0001621544361114502, -0.0001515597105026245, -0.00014096498489379883, -0.00013037025928497314, -0.00011977553367614746, -0.00010918080806732178, -9.85860824584961e-05, -8.799135684967041e-05, -7.739663124084473e-05, -6.680190563201904e-05, -5.620718002319336e-05, -4.5612454414367676e-05, -3.501772880554199e-05, -2.442300319671631e-05, -1.3828277587890625e-05, -3.2335519790649414e-06, 7.361173629760742e-06, 1.7955899238586426e-05, 2.855062484741211e-05, 3.914535045623779e-05, 4.9740076065063477e-05, 6.033480167388916e-05, 7.092952728271484e-05, 8.152425289154053e-05, 9.211897850036621e-05, 0.0001027137041091919, 0.00011330842971801758, 0.00012390315532684326, 0.00013449788093566895, 0.00014509260654449463, 0.0001556873321533203, 0.000166282057762146, 0.00017687678337097168, 0.00018747150897979736, 0.00019806623458862305, 0.00020866096019744873, 0.00021925568580627441, 0.0002298504114151001, 0.00024044513702392578, 0.00025103986263275146, 0.00026163458824157715, 0.00027222931385040283, 0.0002828240394592285, 0.0002934187650680542, 0.0003040134906768799, 0.00031460821628570557, 0.00032520294189453125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 3.0, 5.0, 12.0, 17.0, 16.0, 34.0, 46.0, 77.0, 167.0, 344.0, 707.0, 2084.0, 8328.0, 69633.0, 644571.0, 292141.0, 24166.0, 4037.0, 1148.0, 476.0, 189.0, 132.0, 77.0, 51.0, 19.0, 22.0, 7.0, 10.0, 9.0, 9.0, 8.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-4.2421875, -4.14300537109375, -4.0438232421875, -3.94464111328125, -3.845458984375, -3.74627685546875, -3.6470947265625, -3.54791259765625, -3.44873046875, -3.34954833984375, -3.2503662109375, -3.15118408203125, -3.052001953125, -2.95281982421875, -2.8536376953125, -2.75445556640625, -2.6552734375, -2.55609130859375, -2.4569091796875, -2.35772705078125, -2.258544921875, -2.15936279296875, -2.0601806640625, -1.96099853515625, -1.86181640625, -1.76263427734375, -1.6634521484375, -1.56427001953125, -1.465087890625, -1.36590576171875, -1.2667236328125, -1.16754150390625, -1.068359375, -0.96917724609375, -0.8699951171875, -0.77081298828125, -0.671630859375, -0.57244873046875, -0.4732666015625, -0.37408447265625, -0.27490234375, -0.17572021484375, -0.0765380859375, 0.02264404296875, 0.121826171875, 0.22100830078125, 0.3201904296875, 0.41937255859375, 0.5185546875, 0.61773681640625, 0.7169189453125, 0.81610107421875, 0.915283203125, 1.01446533203125, 1.1136474609375, 1.21282958984375, 1.31201171875, 1.41119384765625, 1.5103759765625, 1.60955810546875, 1.708740234375, 1.80792236328125, 1.9071044921875, 2.00628662109375, 2.10546875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 4.0, 6.0, 4.0, 10.0, 15.0, 24.0, 26.0, 38.0, 44.0, 86.0, 73.0, 96.0, 94.0, 82.0, 77.0, 80.0, 61.0, 47.0, 35.0, 27.0, 17.0, 13.0, 6.0, 9.0, 4.0, 8.0, 4.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.7080078125, -1.6679000854492188, -1.6277923583984375, -1.5876846313476562, -1.547576904296875, -1.5074691772460938, -1.4673614501953125, -1.4272537231445312, -1.38714599609375, -1.3470382690429688, -1.3069305419921875, -1.2668228149414062, -1.226715087890625, -1.1866073608398438, -1.1464996337890625, -1.1063919067382812, -1.0662841796875, -1.0261764526367188, -0.9860687255859375, -0.9459609985351562, -0.905853271484375, -0.8657455444335938, -0.8256378173828125, -0.7855300903320312, -0.74542236328125, -0.7053146362304688, -0.6652069091796875, -0.6250991821289062, -0.584991455078125, -0.5448837280273438, -0.5047760009765625, -0.46466827392578125, -0.424560546875, -0.38445281982421875, -0.3443450927734375, -0.30423736572265625, -0.264129638671875, -0.22402191162109375, -0.1839141845703125, -0.14380645751953125, -0.10369873046875, -0.06359100341796875, -0.0234832763671875, 0.01662445068359375, 0.056732177734375, 0.09683990478515625, 0.1369476318359375, 0.17705535888671875, 0.2171630859375, 0.25727081298828125, 0.2973785400390625, 0.33748626708984375, 0.377593994140625, 0.41770172119140625, 0.4578094482421875, 0.49791717529296875, 0.53802490234375, 0.5781326293945312, 0.6182403564453125, 0.6583480834960938, 0.698455810546875, 0.7385635375976562, 0.7786712646484375, 0.8187789916992188, 0.85888671875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 34.0, 141.0, 436.0, 318.0, 57.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.23845672607422, -17.749343872070312, -16.260231018066406, -14.7711181640625, -13.282005310058594, -11.792892456054688, -10.303780555725098, -8.814667701721191, -7.325554847717285, -5.836441993713379, -4.347329139709473, -2.8582167625427246, -1.3691039085388184, 0.12000894546508789, 1.609121322631836, 3.098234176635742, 4.587347030639648, 6.076459884643555, 7.565572738647461, 9.054685592651367, 10.543798446655273, 12.03291130065918, 13.52202320098877, 15.011136054992676, 16.500247955322266, 17.989360809326172, 19.478473663330078, 20.967586517333984, 22.45669937133789, 23.945812225341797, 25.434925079345703, 26.92403793334961, 28.413150787353516, 29.902263641357422, 31.391376495361328, 32.880489349365234, 34.36960220336914, 35.85871505737305, 37.34782791137695, 38.83694076538086, 40.326053619384766, 41.81516647338867, 43.30427932739258, 44.793392181396484, 46.28250503540039, 47.7716178894043, 49.2607307434082, 50.74984359741211, 52.23895263671875, 53.728065490722656, 55.21717834472656, 56.70629119873047, 58.195404052734375, 59.68451690673828, 61.17362976074219, 62.662742614746094, 64.15185546875, 65.6409683227539, 67.13008117675781, 68.61919403076172, 70.10830688476562, 71.59741973876953, 73.08653259277344, 74.57564544677734, 76.06475830078125]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 5.0, 5.0, 7.0, 11.0, 12.0, 23.0, 10.0, 21.0, 20.0, 23.0, 33.0, 40.0, 34.0, 50.0, 48.0, 42.0, 62.0, 49.0, 41.0, 38.0, 54.0, 54.0, 34.0, 42.0, 35.0, 32.0, 33.0, 26.0, 23.0, 14.0, 15.0, 18.0, 7.0, 10.0, 8.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.494129180908203, -6.2764458656311035, -6.058763027191162, -5.8410797119140625, -5.623396396636963, -5.405713081359863, -5.188030242919922, -4.970346927642822, -4.752663612365723, -4.534980297088623, -4.317297458648682, -4.099614143371582, -3.8819308280944824, -3.664247751235962, -3.4465646743774414, -3.228881359100342, -3.0111982822418213, -2.793515205383301, -2.575831890106201, -2.3581488132476807, -2.140465497970581, -1.9227824211120605, -1.7050992250442505, -1.4874160289764404, -1.2697328329086304, -1.0520496368408203, -0.8343664407730103, -0.616683304309845, -0.3990001082420349, -0.18131697177886963, 0.03636622428894043, 0.2540494203567505, 0.47173261642456055, 0.6894158124923706, 0.9070990085601807, 1.1247820854187012, 1.3424654006958008, 1.5601484775543213, 1.7778316736221313, 1.9955148696899414, 2.213198184967041, 2.4308812618255615, 2.648564577102661, 2.8662476539611816, 3.0839309692382812, 3.3016140460968018, 3.5192971229553223, 3.736980438232422, 3.9546635150909424, 4.172346591949463, 4.3900299072265625, 4.607713222503662, 4.8253960609436035, 5.043079376220703, 5.260762691497803, 5.478446006774902, 5.696128845214844, 5.913812160491943, 6.131494998931885, 6.349178314208984, 6.566861629486084, 6.784544944763184, 7.002227783203125, 7.219911098480225, 7.437594413757324]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 4.0, 8.0, 13.0, 29.0, 73.0, 150.0, 392.0, 1635.0, 12219.0, 594274.0, 3559695.0, 22443.0, 2367.0, 547.0, 204.0, 89.0, 52.0, 25.0, 26.0, 14.0, 8.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.443359375, -3.199371337890625, -2.95538330078125, -2.711395263671875, -2.4674072265625, -2.223419189453125, -1.97943115234375, -1.735443115234375, -1.491455078125, -1.247467041015625, -1.00347900390625, -0.759490966796875, -0.5155029296875, -0.271514892578125, -0.02752685546875, 0.216461181640625, 0.46044921875, 0.704437255859375, 0.94842529296875, 1.192413330078125, 1.4364013671875, 1.680389404296875, 1.92437744140625, 2.168365478515625, 2.412353515625, 2.656341552734375, 2.90032958984375, 3.144317626953125, 3.3883056640625, 3.632293701171875, 3.87628173828125, 4.120269775390625, 4.3642578125, 4.608245849609375, 4.85223388671875, 5.096221923828125, 5.3402099609375, 5.584197998046875, 5.82818603515625, 6.072174072265625, 6.316162109375, 6.560150146484375, 6.80413818359375, 7.048126220703125, 7.2921142578125, 7.536102294921875, 7.78009033203125, 8.024078369140625, 8.26806640625, 8.512054443359375, 8.75604248046875, 9.000030517578125, 9.2440185546875, 9.488006591796875, 9.73199462890625, 9.975982666015625, 10.219970703125, 10.463958740234375, 10.70794677734375, 10.951934814453125, 11.1959228515625, 11.439910888671875, 11.68389892578125, 11.927886962890625, 12.171875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 6.0, 9.0, 20.0, 19.0, 30.0, 36.0, 39.0, 63.0, 73.0, 64.0, 80.0, 68.0, 79.0, 86.0, 56.0, 56.0, 50.0, 45.0, 34.0, 34.0, 9.0, 12.0, 10.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2349853515625, -0.2261943817138672, -0.21740341186523438, -0.20861244201660156, -0.19982147216796875, -0.19103050231933594, -0.18223953247070312, -0.1734485626220703, -0.1646575927734375, -0.1558666229248047, -0.14707565307617188, -0.13828468322753906, -0.12949371337890625, -0.12070274353027344, -0.11191177368164062, -0.10312080383300781, -0.094329833984375, -0.08553886413574219, -0.07674789428710938, -0.06795692443847656, -0.05916595458984375, -0.05037498474121094, -0.041584014892578125, -0.03279304504394531, -0.0240020751953125, -0.015211105346679688, -0.006420135498046875, 0.0023708343505859375, 0.01116180419921875, 0.019952774047851562, 0.028743743896484375, 0.03753471374511719, 0.04632568359375, 0.05511665344238281, 0.06390762329101562, 0.07269859313964844, 0.08148956298828125, 0.09028053283691406, 0.09907150268554688, 0.10786247253417969, 0.1166534423828125, 0.1254444122314453, 0.13423538208007812, 0.14302635192871094, 0.15181732177734375, 0.16060829162597656, 0.16939926147460938, 0.1781902313232422, 0.186981201171875, 0.1957721710205078, 0.20456314086914062, 0.21335411071777344, 0.22214508056640625, 0.23093605041503906, 0.23972702026367188, 0.2485179901123047, 0.2573089599609375, 0.2660999298095703, 0.2748908996582031, 0.28368186950683594, 0.29247283935546875, 0.30126380920410156, 0.3100547790527344, 0.3188457489013672, 0.32763671875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 7.0, 12.0, 15.0, 47.0, 79.0, 186.0, 579.0, 5342.0, 4168900.0, 17522.0, 1020.0, 317.0, 114.0, 71.0, 34.0, 25.0, 3.0, 10.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2734375, -10.6331787109375, -9.992919921875, -9.3526611328125, -8.71240234375, -8.0721435546875, -7.431884765625, -6.7916259765625, -6.1513671875, -5.5111083984375, -4.870849609375, -4.2305908203125, -3.59033203125, -2.9500732421875, -2.309814453125, -1.6695556640625, -1.029296875, -0.3890380859375, 0.251220703125, 0.8914794921875, 1.53173828125, 2.1719970703125, 2.812255859375, 3.4525146484375, 4.0927734375, 4.7330322265625, 5.373291015625, 6.0135498046875, 6.65380859375, 7.2940673828125, 7.934326171875, 8.5745849609375, 9.21484375, 9.8551025390625, 10.495361328125, 11.1356201171875, 11.77587890625, 12.4161376953125, 13.056396484375, 13.6966552734375, 14.3369140625, 14.9771728515625, 15.617431640625, 16.2576904296875, 16.89794921875, 17.5382080078125, 18.178466796875, 18.8187255859375, 19.458984375, 20.0992431640625, 20.739501953125, 21.3797607421875, 22.02001953125, 22.6602783203125, 23.300537109375, 23.9407958984375, 24.5810546875, 25.2213134765625, 25.861572265625, 26.5018310546875, 27.14208984375, 27.7823486328125, 28.422607421875, 29.0628662109375, 29.703125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 19.0, 24.0, 45.0, 90.0, 208.0, 506.0, 1739.0, 856.0, 320.0, 126.0, 55.0, 41.0, 19.0, 7.0, 2.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52978515625, -0.49378204345703125, -0.4577789306640625, -0.42177581787109375, -0.385772705078125, -0.34976959228515625, -0.3137664794921875, -0.27776336669921875, -0.24176025390625, -0.20575714111328125, -0.1697540283203125, -0.13375091552734375, -0.097747802734375, -0.06174468994140625, -0.0257415771484375, 0.01026153564453125, 0.0462646484375, 0.08226776123046875, 0.1182708740234375, 0.15427398681640625, 0.190277099609375, 0.22628021240234375, 0.2622833251953125, 0.29828643798828125, 0.33428955078125, 0.37029266357421875, 0.4062957763671875, 0.44229888916015625, 0.478302001953125, 0.5143051147460938, 0.5503082275390625, 0.5863113403320312, 0.622314453125, 0.6583175659179688, 0.6943206787109375, 0.7303237915039062, 0.766326904296875, 0.8023300170898438, 0.8383331298828125, 0.8743362426757812, 0.91033935546875, 0.9463424682617188, 0.9823455810546875, 1.0183486938476562, 1.054351806640625, 1.0903549194335938, 1.1263580322265625, 1.1623611450195312, 1.1983642578125, 1.2343673706054688, 1.2703704833984375, 1.3063735961914062, 1.342376708984375, 1.3783798217773438, 1.4143829345703125, 1.4503860473632812, 1.48638916015625, 1.5223922729492188, 1.5583953857421875, 1.5943984985351562, 1.630401611328125, 1.6664047241210938, 1.7024078369140625, 1.7384109497070312, 1.7744140625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 38.0, 511.0, 406.0, 36.0, 9.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.10993194580078, -51.952728271484375, -50.795528411865234, -49.638328552246094, -48.48112487792969, -47.32392120361328, -46.16672134399414, -45.009521484375, -43.852317810058594, -42.69511413574219, -41.53791427612305, -40.380714416503906, -39.2235107421875, -38.066307067871094, -36.90910720825195, -35.75190734863281, -34.594703674316406, -33.4375, -32.28030014038086, -31.123098373413086, -29.965896606445312, -28.80869483947754, -27.651493072509766, -26.494291305541992, -25.33708953857422, -24.179887771606445, -23.022686004638672, -21.8654842376709, -20.708282470703125, -19.55108070373535, -18.393878936767578, -17.236677169799805, -16.079479217529297, -14.922277450561523, -13.76507568359375, -12.607873916625977, -11.450672149658203, -10.29347038269043, -9.136268615722656, -7.979066848754883, -6.821865081787109, -5.664663314819336, -4.5074615478515625, -3.350259780883789, -2.1930580139160156, -1.0358562469482422, 0.12134552001953125, 1.2785472869873047, 2.435749053955078, 3.5929508209228516, 4.750152587890625, 5.907354354858398, 7.064556121826172, 8.221757888793945, 9.378959655761719, 10.536161422729492, 11.693363189697266, 12.850564956665039, 14.007766723632812, 15.164968490600586, 16.32217025756836, 17.479372024536133, 18.636573791503906, 19.79377555847168, 20.950977325439453]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 13.0, 9.0, 8.0, 22.0, 24.0, 35.0, 33.0, 50.0, 66.0, 57.0, 73.0, 71.0, 69.0, 70.0, 65.0, 65.0, 69.0, 43.0, 32.0, 30.0, 26.0, 21.0, 10.0, 13.0, 7.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.728523254394531, -4.588433742523193, -4.4483442306518555, -4.308254718780518, -4.16816520690918, -4.028076171875, -3.887986660003662, -3.747897148132324, -3.6078076362609863, -3.4677181243896484, -3.3276286125183105, -3.1875393390655518, -3.047449827194214, -2.907360315322876, -2.767271041870117, -2.6271815299987793, -2.4870920181274414, -2.3470025062561035, -2.2069129943847656, -2.066823720932007, -1.926734209060669, -1.786644697189331, -1.6465553045272827, -1.5064659118652344, -1.3663763999938965, -1.2262868881225586, -1.0861974954605103, -0.9461080431938171, -0.806018590927124, -0.6659291386604309, -0.5258396863937378, -0.3857502341270447, -0.24566125869750977, -0.10557180643081665, 0.034517645835876465, 0.17460709810256958, 0.3146965503692627, 0.4547860026359558, 0.5948754549026489, 0.734964907169342, 0.8750543594360352, 1.015143871307373, 1.1552332639694214, 1.2953226566314697, 1.4354121685028076, 1.5755016803741455, 1.7155910730361938, 1.8556804656982422, 1.99576997756958, 2.135859489440918, 2.275949001312256, 2.4160382747650146, 2.5561277866363525, 2.6962172985076904, 2.836306571960449, 2.976396083831787, 3.116485595703125, 3.256575107574463, 3.396664619445801, 3.5367538928985596, 3.6768434047698975, 3.8169329166412354, 3.957022190093994, 4.097111701965332, 4.23720121383667]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 4.0, 8.0, 7.0, 15.0, 16.0, 19.0, 26.0, 41.0, 41.0, 55.0, 91.0, 104.0, 173.0, 253.0, 404.0, 721.0, 1509.0, 3935.0, 13462.0, 58796.0, 305040.0, 504920.0, 121870.0, 25635.0, 6619.0, 2269.0, 961.0, 515.0, 291.0, 218.0, 134.0, 101.0, 55.0, 67.0, 41.0, 27.0, 33.0, 19.0, 13.0, 10.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.6875, -3.576507568359375, -3.46551513671875, -3.354522705078125, -3.2435302734375, -3.132537841796875, -3.02154541015625, -2.910552978515625, -2.799560546875, -2.688568115234375, -2.57757568359375, -2.466583251953125, -2.3555908203125, -2.244598388671875, -2.13360595703125, -2.022613525390625, -1.91162109375, -1.800628662109375, -1.68963623046875, -1.578643798828125, -1.4676513671875, -1.356658935546875, -1.24566650390625, -1.134674072265625, -1.023681640625, -0.912689208984375, -0.80169677734375, -0.690704345703125, -0.5797119140625, -0.468719482421875, -0.35772705078125, -0.246734619140625, -0.1357421875, -0.024749755859375, 0.08624267578125, 0.197235107421875, 0.3082275390625, 0.419219970703125, 0.53021240234375, 0.641204833984375, 0.752197265625, 0.863189697265625, 0.97418212890625, 1.085174560546875, 1.1961669921875, 1.307159423828125, 1.41815185546875, 1.529144287109375, 1.64013671875, 1.751129150390625, 1.86212158203125, 1.973114013671875, 2.0841064453125, 2.195098876953125, 2.30609130859375, 2.417083740234375, 2.528076171875, 2.639068603515625, 2.75006103515625, 2.861053466796875, 2.9720458984375, 3.083038330078125, 3.19403076171875, 3.305023193359375, 3.416015625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 9.0, 8.0, 12.0, 19.0, 23.0, 27.0, 38.0, 37.0, 45.0, 46.0, 51.0, 74.0, 59.0, 63.0, 63.0, 69.0, 77.0, 54.0, 36.0, 31.0, 38.0, 41.0, 28.0, 15.0, 13.0, 8.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.33203125, -0.3219032287597656, -0.31177520751953125, -0.3016471862792969, -0.2915191650390625, -0.2813911437988281, -0.27126312255859375, -0.2611351013183594, -0.251007080078125, -0.24087905883789062, -0.23075103759765625, -0.22062301635742188, -0.2104949951171875, -0.20036697387695312, -0.19023895263671875, -0.18011093139648438, -0.16998291015625, -0.15985488891601562, -0.14972686767578125, -0.13959884643554688, -0.1294708251953125, -0.11934280395507812, -0.10921478271484375, -0.09908676147460938, -0.088958740234375, -0.07883071899414062, -0.06870269775390625, -0.058574676513671875, -0.0484466552734375, -0.038318634033203125, -0.02819061279296875, -0.018062591552734375, -0.0079345703125, 0.002193450927734375, 0.01232147216796875, 0.022449493408203125, 0.0325775146484375, 0.042705535888671875, 0.05283355712890625, 0.06296157836914062, 0.073089599609375, 0.08321762084960938, 0.09334564208984375, 0.10347366333007812, 0.1136016845703125, 0.12372970581054688, 0.13385772705078125, 0.14398574829101562, 0.15411376953125, 0.16424179077148438, 0.17436981201171875, 0.18449783325195312, 0.1946258544921875, 0.20475387573242188, 0.21488189697265625, 0.22500991821289062, 0.235137939453125, 0.24526596069335938, 0.25539398193359375, 0.2655220031738281, 0.2756500244140625, 0.2857780456542969, 0.29590606689453125, 0.3060340881347656, 0.316162109375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 13.0, 12.0, 27.0, 24.0, 66.0, 79.0, 130.0, 255.0, 455.0, 899.0, 1938.0, 4481.0, 11624.0, 37228.0, 138482.0, 420735.0, 309941.0, 83977.0, 23938.0, 8064.0, 3188.0, 1374.0, 718.0, 367.0, 168.0, 135.0, 77.0, 49.0, 37.0, 18.0, 12.0, 10.0, 2.0, 6.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.630859375, -2.557403564453125, -2.48394775390625, -2.410491943359375, -2.3370361328125, -2.263580322265625, -2.19012451171875, -2.116668701171875, -2.043212890625, -1.969757080078125, -1.89630126953125, -1.822845458984375, -1.7493896484375, -1.675933837890625, -1.60247802734375, -1.529022216796875, -1.45556640625, -1.382110595703125, -1.30865478515625, -1.235198974609375, -1.1617431640625, -1.088287353515625, -1.01483154296875, -0.941375732421875, -0.867919921875, -0.794464111328125, -0.72100830078125, -0.647552490234375, -0.5740966796875, -0.500640869140625, -0.42718505859375, -0.353729248046875, -0.2802734375, -0.206817626953125, -0.13336181640625, -0.059906005859375, 0.0135498046875, 0.087005615234375, 0.16046142578125, 0.233917236328125, 0.307373046875, 0.380828857421875, 0.45428466796875, 0.527740478515625, 0.6011962890625, 0.674652099609375, 0.74810791015625, 0.821563720703125, 0.89501953125, 0.968475341796875, 1.04193115234375, 1.115386962890625, 1.1888427734375, 1.262298583984375, 1.33575439453125, 1.409210205078125, 1.482666015625, 1.556121826171875, 1.62957763671875, 1.703033447265625, 1.7764892578125, 1.849945068359375, 1.92340087890625, 1.996856689453125, 2.0703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 8.0, 4.0, 6.0, 9.0, 11.0, 11.0, 10.0, 14.0, 20.0, 19.0, 25.0, 21.0, 29.0, 35.0, 36.0, 49.0, 35.0, 48.0, 40.0, 50.0, 37.0, 39.0, 36.0, 41.0, 29.0, 41.0, 26.0, 37.0, 35.0, 35.0, 32.0, 15.0, 30.0, 18.0, 14.0, 16.0, 12.0, 2.0, 1.0, 7.0, 3.0, 5.0, 5.0, 2.0, 3.0, 2.0, 4.0], "bins": [-1.3037109375, -1.2694625854492188, -1.2352142333984375, -1.2009658813476562, -1.166717529296875, -1.1324691772460938, -1.0982208251953125, -1.0639724731445312, -1.02972412109375, -0.9954757690429688, -0.9612274169921875, -0.9269790649414062, -0.892730712890625, -0.8584823608398438, -0.8242340087890625, -0.7899856567382812, -0.7557373046875, -0.7214889526367188, -0.6872406005859375, -0.6529922485351562, -0.618743896484375, -0.5844955444335938, -0.5502471923828125, -0.5159988403320312, -0.48175048828125, -0.44750213623046875, -0.4132537841796875, -0.37900543212890625, -0.344757080078125, -0.31050872802734375, -0.2762603759765625, -0.24201202392578125, -0.207763671875, -0.17351531982421875, -0.1392669677734375, -0.10501861572265625, -0.070770263671875, -0.03652191162109375, -0.0022735595703125, 0.03197479248046875, 0.06622314453125, 0.10047149658203125, 0.1347198486328125, 0.16896820068359375, 0.203216552734375, 0.23746490478515625, 0.2717132568359375, 0.30596160888671875, 0.3402099609375, 0.37445831298828125, 0.4087066650390625, 0.44295501708984375, 0.477203369140625, 0.5114517211914062, 0.5457000732421875, 0.5799484252929688, 0.61419677734375, 0.6484451293945312, 0.6826934814453125, 0.7169418334960938, 0.751190185546875, 0.7854385375976562, 0.8196868896484375, 0.8539352416992188, 0.88818359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 10.0, 7.0, 14.0, 10.0, 18.0, 31.0, 46.0, 52.0, 97.0, 136.0, 175.0, 282.0, 436.0, 680.0, 1216.0, 2215.0, 4767.0, 11350.0, 33002.0, 119041.0, 385624.0, 343644.0, 98618.0, 27857.0, 9964.0, 4172.0, 2111.0, 1100.0, 668.0, 394.0, 253.0, 159.0, 141.0, 81.0, 48.0, 34.0, 20.0, 29.0, 21.0, 5.0, 7.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3408203125, -1.2974700927734375, -1.254119873046875, -1.2107696533203125, -1.16741943359375, -1.1240692138671875, -1.080718994140625, -1.0373687744140625, -0.9940185546875, -0.9506683349609375, -0.907318115234375, -0.8639678955078125, -0.82061767578125, -0.7772674560546875, -0.733917236328125, -0.6905670166015625, -0.647216796875, -0.6038665771484375, -0.560516357421875, -0.5171661376953125, -0.47381591796875, -0.4304656982421875, -0.387115478515625, -0.3437652587890625, -0.3004150390625, -0.2570648193359375, -0.213714599609375, -0.1703643798828125, -0.12701416015625, -0.0836639404296875, -0.040313720703125, 0.0030364990234375, 0.04638671875, 0.0897369384765625, 0.133087158203125, 0.1764373779296875, 0.21978759765625, 0.2631378173828125, 0.306488037109375, 0.3498382568359375, 0.3931884765625, 0.4365386962890625, 0.479888916015625, 0.5232391357421875, 0.56658935546875, 0.6099395751953125, 0.653289794921875, 0.6966400146484375, 0.739990234375, 0.7833404541015625, 0.826690673828125, 0.8700408935546875, 0.91339111328125, 0.9567413330078125, 1.000091552734375, 1.0434417724609375, 1.0867919921875, 1.1301422119140625, 1.173492431640625, 1.2168426513671875, 1.26019287109375, 1.3035430908203125, 1.346893310546875, 1.3902435302734375, 1.43359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 7.0, 13.0, 11.0, 13.0, 15.0, 26.0, 29.0, 32.0, 44.0, 54.0, 58.0, 82.0, 100.0, 69.0, 66.0, 66.0, 54.0, 70.0, 42.0, 19.0, 24.0, 17.0, 21.0, 12.0, 10.0, 5.0, 10.0, 1.0, 1.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.00017642974853515625, -0.0001715049147605896, -0.00016658008098602295, -0.0001616552472114563, -0.00015673041343688965, -0.000151805579662323, -0.00014688074588775635, -0.0001419559121131897, -0.00013703107833862305, -0.0001321062445640564, -0.00012718141078948975, -0.0001222565770149231, -0.00011733174324035645, -0.0001124069094657898, -0.00010748207569122314, -0.0001025572419166565, -9.763240814208984e-05, -9.27075743675232e-05, -8.778274059295654e-05, -8.285790681838989e-05, -7.793307304382324e-05, -7.300823926925659e-05, -6.808340549468994e-05, -6.315857172012329e-05, -5.823373794555664e-05, -5.330890417098999e-05, -4.838407039642334e-05, -4.345923662185669e-05, -3.853440284729004e-05, -3.360956907272339e-05, -2.8684735298156738e-05, -2.3759901523590088e-05, -1.8835067749023438e-05, -1.3910233974456787e-05, -8.985400199890137e-06, -4.060566425323486e-06, 8.642673492431641e-07, 5.7891011238098145e-06, 1.0713934898376465e-05, 1.5638768672943115e-05, 2.0563602447509766e-05, 2.5488436222076416e-05, 3.0413269996643066e-05, 3.533810377120972e-05, 4.026293754577637e-05, 4.518777132034302e-05, 5.011260509490967e-05, 5.503743886947632e-05, 5.996227264404297e-05, 6.488710641860962e-05, 6.981194019317627e-05, 7.473677396774292e-05, 7.966160774230957e-05, 8.458644151687622e-05, 8.951127529144287e-05, 9.443610906600952e-05, 9.936094284057617e-05, 0.00010428577661514282, 0.00010921061038970947, 0.00011413544416427612, 0.00011906027793884277, 0.00012398511171340942, 0.00012890994548797607, 0.00013383477926254272, 0.00013875961303710938]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 10.0, 7.0, 13.0, 16.0, 24.0, 48.0, 115.0, 226.0, 565.0, 1499.0, 4737.0, 20282.0, 144192.0, 650952.0, 192130.0, 25379.0, 5441.0, 1723.0, 615.0, 314.0, 121.0, 62.0, 30.0, 17.0, 14.0, 7.0, 4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.408203125, -2.336456298828125, -2.26470947265625, -2.192962646484375, -2.1212158203125, -2.049468994140625, -1.97772216796875, -1.905975341796875, -1.834228515625, -1.762481689453125, -1.69073486328125, -1.618988037109375, -1.5472412109375, -1.475494384765625, -1.40374755859375, -1.332000732421875, -1.26025390625, -1.188507080078125, -1.11676025390625, -1.045013427734375, -0.9732666015625, -0.901519775390625, -0.82977294921875, -0.758026123046875, -0.686279296875, -0.614532470703125, -0.54278564453125, -0.471038818359375, -0.3992919921875, -0.327545166015625, -0.25579833984375, -0.184051513671875, -0.1123046875, -0.040557861328125, 0.03118896484375, 0.102935791015625, 0.1746826171875, 0.246429443359375, 0.31817626953125, 0.389923095703125, 0.461669921875, 0.533416748046875, 0.60516357421875, 0.676910400390625, 0.7486572265625, 0.820404052734375, 0.89215087890625, 0.963897705078125, 1.03564453125, 1.107391357421875, 1.17913818359375, 1.250885009765625, 1.3226318359375, 1.394378662109375, 1.46612548828125, 1.537872314453125, 1.609619140625, 1.681365966796875, 1.75311279296875, 1.824859619140625, 1.8966064453125, 1.968353271484375, 2.04010009765625, 2.111846923828125, 2.18359375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 7.0, 20.0, 23.0, 33.0, 38.0, 49.0, 81.0, 86.0, 107.0, 97.0, 88.0, 85.0, 62.0, 50.0, 39.0, 27.0, 25.0, 24.0, 9.0, 10.0, 9.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5302734375, -1.48486328125, -1.439453125, -1.39404296875, -1.3486328125, -1.30322265625, -1.2578125, -1.21240234375, -1.1669921875, -1.12158203125, -1.076171875, -1.03076171875, -0.9853515625, -0.93994140625, -0.89453125, -0.84912109375, -0.8037109375, -0.75830078125, -0.712890625, -0.66748046875, -0.6220703125, -0.57666015625, -0.53125, -0.48583984375, -0.4404296875, -0.39501953125, -0.349609375, -0.30419921875, -0.2587890625, -0.21337890625, -0.16796875, -0.12255859375, -0.0771484375, -0.03173828125, 0.013671875, 0.05908203125, 0.1044921875, 0.14990234375, 0.1953125, 0.24072265625, 0.2861328125, 0.33154296875, 0.376953125, 0.42236328125, 0.4677734375, 0.51318359375, 0.55859375, 0.60400390625, 0.6494140625, 0.69482421875, 0.740234375, 0.78564453125, 0.8310546875, 0.87646484375, 0.921875, 0.96728515625, 1.0126953125, 1.05810546875, 1.103515625, 1.14892578125, 1.1943359375, 1.23974609375, 1.28515625, 1.33056640625, 1.3759765625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 7.0, 11.0, 31.0, 94.0, 238.0, 339.0, 191.0, 63.0, 17.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.248069763183594, -48.1144905090332, -46.98091125488281, -45.84733200073242, -44.71375274658203, -43.58017349243164, -42.44659423828125, -41.313018798828125, -40.17943572998047, -39.04585647583008, -37.91227722167969, -36.7786979675293, -35.645118713378906, -34.511539459228516, -33.377960205078125, -32.244384765625, -31.11080551147461, -29.97722625732422, -28.843647003173828, -27.710067749023438, -26.576488494873047, -25.442909240722656, -24.3093318939209, -23.175752639770508, -22.042173385620117, -20.908594131469727, -19.775014877319336, -18.641435623168945, -17.507858276367188, -16.374279022216797, -15.240699768066406, -14.107120513916016, -12.97354507446289, -11.8399658203125, -10.70638656616211, -9.572808265686035, -8.439229011535645, -7.305649757385254, -6.1720709800720215, -5.038492202758789, -3.9049129486083984, -2.771333932876587, -1.6377549171447754, -0.5041759014129639, 0.6294031143188477, 1.7629823684692383, 2.8965611457824707, 4.030139923095703, 5.163719177246094, 6.297298431396484, 7.430877208709717, 8.56445598602295, 9.69803524017334, 10.83161449432373, 11.965192794799805, 13.098772048950195, 14.232351303100586, 15.365930557250977, 16.499509811401367, 17.633089065551758, 18.766666412353516, 19.900245666503906, 21.033824920654297, 22.167404174804688, 23.300983428955078]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 6.0, 4.0, 9.0, 10.0, 11.0, 22.0, 14.0, 19.0, 36.0, 36.0, 38.0, 33.0, 43.0, 57.0, 41.0, 48.0, 47.0, 59.0, 52.0, 57.0, 44.0, 55.0, 40.0, 40.0, 33.0, 24.0, 20.0, 26.0, 20.0, 12.0, 11.0, 9.0, 2.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-9.185792922973633, -8.92286205291748, -8.659931182861328, -8.397000312805176, -8.134069442749023, -7.871138095855713, -7.608206748962402, -7.34527587890625, -7.082345008850098, -6.819414138793945, -6.556483268737793, -6.293551921844482, -6.03062105178833, -5.767690181732178, -5.504758834838867, -5.241827964782715, -4.9788970947265625, -4.71596622467041, -4.453035354614258, -4.190104007720947, -3.927173137664795, -3.6642422676086426, -3.401311159133911, -3.1383800506591797, -2.8754491806030273, -2.612518310546875, -2.3495872020721436, -2.086656093597412, -1.8237252235412598, -1.5607942342758179, -1.297863245010376, -1.034932255744934, -0.7720017433166504, -0.5090707540512085, -0.2461397647857666, 0.016791224479675293, 0.2797222137451172, 0.5426532030105591, 0.805584192276001, 1.0685151815414429, 1.3314461708068848, 1.5943771600723267, 1.8573081493377686, 2.1202392578125, 2.3831701278686523, 2.6461009979248047, 2.909032106399536, 3.1719632148742676, 3.43489408493042, 3.6978249549865723, 3.9607560634613037, 4.223687171936035, 4.4866180419921875, 4.74954891204834, 5.012479782104492, 5.275411128997803, 5.538341999053955, 5.801272869110107, 6.064204216003418, 6.32713508605957, 6.590065956115723, 6.852996826171875, 7.115927696228027, 7.378859043121338, 7.64178991317749]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 12.0, 16.0, 26.0, 52.0, 91.0, 159.0, 297.0, 688.0, 1755.0, 5959.0, 33002.0, 855233.0, 3233293.0, 51661.0, 7903.0, 2235.0, 875.0, 442.0, 205.0, 128.0, 79.0, 57.0, 30.0, 22.0, 10.0, 13.0, 8.0, 8.0, 5.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.037109375, -2.886016845703125, -2.73492431640625, -2.583831787109375, -2.4327392578125, -2.281646728515625, -2.13055419921875, -1.979461669921875, -1.828369140625, -1.677276611328125, -1.52618408203125, -1.375091552734375, -1.2239990234375, -1.072906494140625, -0.92181396484375, -0.770721435546875, -0.61962890625, -0.468536376953125, -0.31744384765625, -0.166351318359375, -0.0152587890625, 0.135833740234375, 0.28692626953125, 0.438018798828125, 0.589111328125, 0.740203857421875, 0.89129638671875, 1.042388916015625, 1.1934814453125, 1.344573974609375, 1.49566650390625, 1.646759033203125, 1.7978515625, 1.948944091796875, 2.10003662109375, 2.251129150390625, 2.4022216796875, 2.553314208984375, 2.70440673828125, 2.855499267578125, 3.006591796875, 3.157684326171875, 3.30877685546875, 3.459869384765625, 3.6109619140625, 3.762054443359375, 3.91314697265625, 4.064239501953125, 4.21533203125, 4.366424560546875, 4.51751708984375, 4.668609619140625, 4.8197021484375, 4.970794677734375, 5.12188720703125, 5.272979736328125, 5.424072265625, 5.575164794921875, 5.72625732421875, 5.877349853515625, 6.0284423828125, 6.179534912109375, 6.33062744140625, 6.481719970703125, 6.6328125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 7.0, 7.0, 5.0, 11.0, 20.0, 23.0, 27.0, 37.0, 46.0, 48.0, 44.0, 53.0, 59.0, 56.0, 65.0, 59.0, 57.0, 49.0, 68.0, 50.0, 49.0, 31.0, 31.0, 25.0, 14.0, 15.0, 12.0, 6.0, 6.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.320068359375, -0.3100318908691406, -0.29999542236328125, -0.2899589538574219, -0.2799224853515625, -0.2698860168457031, -0.25984954833984375, -0.24981307983398438, -0.239776611328125, -0.22974014282226562, -0.21970367431640625, -0.20966720581054688, -0.1996307373046875, -0.18959426879882812, -0.17955780029296875, -0.16952133178710938, -0.15948486328125, -0.14944839477539062, -0.13941192626953125, -0.12937545776367188, -0.1193389892578125, -0.10930252075195312, -0.09926605224609375, -0.08922958374023438, -0.079193115234375, -0.06915664672851562, -0.05912017822265625, -0.049083709716796875, -0.0390472412109375, -0.029010772705078125, -0.01897430419921875, -0.008937835693359375, 0.0010986328125, 0.011135101318359375, 0.02117156982421875, 0.031208038330078125, 0.0412445068359375, 0.051280975341796875, 0.06131744384765625, 0.07135391235351562, 0.081390380859375, 0.09142684936523438, 0.10146331787109375, 0.11149978637695312, 0.1215362548828125, 0.13157272338867188, 0.14160919189453125, 0.15164566040039062, 0.16168212890625, 0.17171859741210938, 0.18175506591796875, 0.19179153442382812, 0.2018280029296875, 0.21186447143554688, 0.22190093994140625, 0.23193740844726562, 0.241973876953125, 0.2520103454589844, 0.26204681396484375, 0.2720832824707031, 0.2821197509765625, 0.2921562194824219, 0.30219268798828125, 0.3122291564941406, 0.322265625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 11.0, 15.0, 23.0, 27.0, 33.0, 51.0, 56.0, 90.0, 150.0, 689.0, 4163884.0, 28595.0, 313.0, 122.0, 75.0, 46.0, 34.0, 28.0, 18.0, 6.0, 9.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.6875, -45.645751953125, -44.60400390625, -43.562255859375, -42.5205078125, -41.478759765625, -40.43701171875, -39.395263671875, -38.353515625, -37.311767578125, -36.27001953125, -35.228271484375, -34.1865234375, -33.144775390625, -32.10302734375, -31.061279296875, -30.01953125, -28.977783203125, -27.93603515625, -26.894287109375, -25.8525390625, -24.810791015625, -23.76904296875, -22.727294921875, -21.685546875, -20.643798828125, -19.60205078125, -18.560302734375, -17.5185546875, -16.476806640625, -15.43505859375, -14.393310546875, -13.3515625, -12.309814453125, -11.26806640625, -10.226318359375, -9.1845703125, -8.142822265625, -7.10107421875, -6.059326171875, -5.017578125, -3.975830078125, -2.93408203125, -1.892333984375, -0.8505859375, 0.191162109375, 1.23291015625, 2.274658203125, 3.31640625, 4.358154296875, 5.39990234375, 6.441650390625, 7.4833984375, 8.525146484375, 9.56689453125, 10.608642578125, 11.650390625, 12.692138671875, 13.73388671875, 14.775634765625, 15.8173828125, 16.859130859375, 17.90087890625, 18.942626953125, 19.984375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 10.0, 40.0, 333.0, 3221.0, 434.0, 41.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.125, -5.99334716796875, -5.8616943359375, -5.73004150390625, -5.598388671875, -5.46673583984375, -5.3350830078125, -5.20343017578125, -5.07177734375, -4.94012451171875, -4.8084716796875, -4.67681884765625, -4.545166015625, -4.41351318359375, -4.2818603515625, -4.15020751953125, -4.0185546875, -3.88690185546875, -3.7552490234375, -3.62359619140625, -3.491943359375, -3.36029052734375, -3.2286376953125, -3.09698486328125, -2.96533203125, -2.83367919921875, -2.7020263671875, -2.57037353515625, -2.438720703125, -2.30706787109375, -2.1754150390625, -2.04376220703125, -1.912109375, -1.78045654296875, -1.6488037109375, -1.51715087890625, -1.385498046875, -1.25384521484375, -1.1221923828125, -0.99053955078125, -0.85888671875, -0.72723388671875, -0.5955810546875, -0.46392822265625, -0.332275390625, -0.20062255859375, -0.0689697265625, 0.06268310546875, 0.1943359375, 0.32598876953125, 0.4576416015625, 0.58929443359375, 0.720947265625, 0.85260009765625, 0.9842529296875, 1.11590576171875, 1.24755859375, 1.37921142578125, 1.5108642578125, 1.64251708984375, 1.774169921875, 1.90582275390625, 2.0374755859375, 2.16912841796875, 2.30078125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 23.0, 777.0, 204.0, 9.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.78047561645508, -38.81562423706055, -36.85077667236328, -34.88592529296875, -32.92107391357422, -30.956226348876953, -28.991374969482422, -27.026525497436523, -25.061676025390625, -23.096826553344727, -21.131977081298828, -19.167125701904297, -17.2022762298584, -15.2374267578125, -13.272576332092285, -11.30772590637207, -9.342876434326172, -7.378026485443115, -5.413176536560059, -3.448326587677002, -1.4834766387939453, 0.4813728332519531, 2.446223258972168, 4.411073684692383, 6.375923156738281, 8.34077262878418, 10.305623054504395, 12.27047348022461, 14.235322952270508, 16.200172424316406, 18.165023803710938, 20.129873275756836, 22.09471893310547, 24.059568405151367, 26.024417877197266, 27.989269256591797, 29.954118728637695, 31.918968200683594, 33.883819580078125, 35.848670959472656, 37.81351852416992, 39.77836990356445, 41.74321746826172, 43.70806884765625, 45.67292022705078, 47.63776779174805, 49.60261917114258, 51.567466735839844, 53.532318115234375, 55.497169494628906, 57.46201705932617, 59.4268684387207, 61.39171600341797, 63.3565673828125, 65.32141876220703, 67.28627014160156, 69.25111389160156, 71.2159652709961, 73.18081665039062, 75.14566040039062, 77.11051177978516, 79.07536315917969, 81.04021453857422, 83.00506591796875, 84.96991729736328]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 9.0, 6.0, 19.0, 26.0, 47.0, 76.0, 94.0, 108.0, 117.0, 109.0, 115.0, 111.0, 70.0, 38.0, 33.0, 17.0, 8.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.464579105377197, -7.1965651512146, -6.928551197052002, -6.660537242889404, -6.392522811889648, -6.124508857727051, -5.856494903564453, -5.5884809494018555, -5.320466995239258, -5.05245304107666, -4.7844390869140625, -4.516425132751465, -4.248411178588867, -3.9803969860076904, -3.7123827934265137, -3.444368839263916, -3.1763548851013184, -2.9083409309387207, -2.640326976776123, -2.3723127841949463, -2.1042988300323486, -1.836284875869751, -1.5682708024978638, -1.3002567291259766, -1.032242774963379, -0.7642287611961365, -0.49621474742889404, -0.2282007336616516, 0.03981328010559082, 0.3078272342681885, 0.5758413076400757, 0.8438553810119629, 1.1118698120117188, 1.3798837661743164, 1.6478978395462036, 1.9159119129180908, 2.1839258670806885, 2.451939821243286, 2.719954013824463, 2.9879679679870605, 3.255981922149658, 3.523995876312256, 3.7920098304748535, 4.060023784637451, 4.328038215637207, 4.596052169799805, 4.864066123962402, 5.132080078125, 5.400094032287598, 5.668107986450195, 5.936121940612793, 6.204135894775391, 6.472149848937988, 6.740163803100586, 7.008178234100342, 7.2761921882629395, 7.544206142425537, 7.812220096588135, 8.08023452758789, 8.348248481750488, 8.616262435913086, 8.884276390075684, 9.152290344238281, 9.420304298400879, 9.688318252563477]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 2.0, 4.0, 8.0, 17.0, 17.0, 23.0, 44.0, 60.0, 57.0, 104.0, 192.0, 280.0, 571.0, 1105.0, 2150.0, 5284.0, 14483.0, 46043.0, 156196.0, 391562.0, 292564.0, 93300.0, 28131.0, 9198.0, 3573.0, 1636.0, 814.0, 421.0, 233.0, 163.0, 80.0, 72.0, 38.0, 29.0, 24.0, 19.0, 22.0, 11.0, 3.0, 5.0, 1.0, 9.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.224609375, -2.1473388671875, -2.070068359375, -1.9927978515625, -1.91552734375, -1.8382568359375, -1.760986328125, -1.6837158203125, -1.6064453125, -1.5291748046875, -1.451904296875, -1.3746337890625, -1.29736328125, -1.2200927734375, -1.142822265625, -1.0655517578125, -0.98828125, -0.9110107421875, -0.833740234375, -0.7564697265625, -0.67919921875, -0.6019287109375, -0.524658203125, -0.4473876953125, -0.3701171875, -0.2928466796875, -0.215576171875, -0.1383056640625, -0.06103515625, 0.0162353515625, 0.093505859375, 0.1707763671875, 0.248046875, 0.3253173828125, 0.402587890625, 0.4798583984375, 0.55712890625, 0.6343994140625, 0.711669921875, 0.7889404296875, 0.8662109375, 0.9434814453125, 1.020751953125, 1.0980224609375, 1.17529296875, 1.2525634765625, 1.329833984375, 1.4071044921875, 1.484375, 1.5616455078125, 1.638916015625, 1.7161865234375, 1.79345703125, 1.8707275390625, 1.947998046875, 2.0252685546875, 2.1025390625, 2.1798095703125, 2.257080078125, 2.3343505859375, 2.41162109375, 2.4888916015625, 2.566162109375, 2.6434326171875, 2.720703125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 4.0, 10.0, 17.0, 17.0, 11.0, 22.0, 30.0, 25.0, 47.0, 34.0, 44.0, 44.0, 64.0, 63.0, 53.0, 51.0, 46.0, 56.0, 45.0, 50.0, 47.0, 40.0, 33.0, 33.0, 30.0, 23.0, 14.0, 14.0, 9.0, 6.0, 6.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.323486328125, -0.3138389587402344, -0.30419158935546875, -0.2945442199707031, -0.2848968505859375, -0.2752494812011719, -0.26560211181640625, -0.2559547424316406, -0.246307373046875, -0.23666000366210938, -0.22701263427734375, -0.21736526489257812, -0.2077178955078125, -0.19807052612304688, -0.18842315673828125, -0.17877578735351562, -0.16912841796875, -0.15948104858398438, -0.14983367919921875, -0.14018630981445312, -0.1305389404296875, -0.12089157104492188, -0.11124420166015625, -0.10159683227539062, -0.091949462890625, -0.08230209350585938, -0.07265472412109375, -0.06300735473632812, -0.0533599853515625, -0.043712615966796875, -0.03406524658203125, -0.024417877197265625, -0.0147705078125, -0.005123138427734375, 0.00452423095703125, 0.014171600341796875, 0.0238189697265625, 0.033466339111328125, 0.04311370849609375, 0.052761077880859375, 0.062408447265625, 0.07205581665039062, 0.08170318603515625, 0.09135055541992188, 0.1009979248046875, 0.11064529418945312, 0.12029266357421875, 0.12994003295898438, 0.13958740234375, 0.14923477172851562, 0.15888214111328125, 0.16852951049804688, 0.1781768798828125, 0.18782424926757812, 0.19747161865234375, 0.20711898803710938, 0.216766357421875, 0.22641372680664062, 0.23606109619140625, 0.24570846557617188, 0.2553558349609375, 0.2650032043457031, 0.27465057373046875, 0.2842979431152344, 0.2939453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 7.0, 8.0, 15.0, 23.0, 29.0, 46.0, 60.0, 79.0, 138.0, 181.0, 313.0, 505.0, 904.0, 1534.0, 2817.0, 5728.0, 12716.0, 32199.0, 92354.0, 250438.0, 357888.0, 184006.0, 63696.0, 23190.0, 9596.0, 4618.0, 2349.0, 1203.0, 674.0, 429.0, 253.0, 192.0, 120.0, 78.0, 48.0, 34.0, 22.0, 12.0, 13.0, 8.0, 10.0, 7.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.087890625, -2.0287933349609375, -1.969696044921875, -1.9105987548828125, -1.85150146484375, -1.7924041748046875, -1.733306884765625, -1.6742095947265625, -1.6151123046875, -1.5560150146484375, -1.496917724609375, -1.4378204345703125, -1.37872314453125, -1.3196258544921875, -1.260528564453125, -1.2014312744140625, -1.142333984375, -1.0832366943359375, -1.024139404296875, -0.9650421142578125, -0.90594482421875, -0.8468475341796875, -0.787750244140625, -0.7286529541015625, -0.6695556640625, -0.6104583740234375, -0.551361083984375, -0.4922637939453125, -0.43316650390625, -0.3740692138671875, -0.314971923828125, -0.2558746337890625, -0.19677734375, -0.1376800537109375, -0.078582763671875, -0.0194854736328125, 0.03961181640625, 0.0987091064453125, 0.157806396484375, 0.2169036865234375, 0.2760009765625, 0.3350982666015625, 0.394195556640625, 0.4532928466796875, 0.51239013671875, 0.5714874267578125, 0.630584716796875, 0.6896820068359375, 0.748779296875, 0.8078765869140625, 0.866973876953125, 0.9260711669921875, 0.98516845703125, 1.0442657470703125, 1.103363037109375, 1.1624603271484375, 1.2215576171875, 1.2806549072265625, 1.339752197265625, 1.3988494873046875, 1.45794677734375, 1.5170440673828125, 1.576141357421875, 1.6352386474609375, 1.6943359375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 10.0, 10.0, 12.0, 15.0, 15.0, 17.0, 18.0, 29.0, 14.0, 25.0, 28.0, 27.0, 39.0, 42.0, 41.0, 40.0, 41.0, 44.0, 52.0, 48.0, 48.0, 40.0, 43.0, 28.0, 31.0, 30.0, 30.0, 27.0, 21.0, 29.0, 16.0, 16.0, 12.0, 4.0, 10.0, 6.0, 6.0, 4.0, 6.0, 6.0, 3.0, 2.0, 1.0, 3.0, 3.0], "bins": [-1.443359375, -1.404510498046875, -1.36566162109375, -1.326812744140625, -1.2879638671875, -1.249114990234375, -1.21026611328125, -1.171417236328125, -1.132568359375, -1.093719482421875, -1.05487060546875, -1.016021728515625, -0.9771728515625, -0.938323974609375, -0.89947509765625, -0.860626220703125, -0.82177734375, -0.782928466796875, -0.74407958984375, -0.705230712890625, -0.6663818359375, -0.627532958984375, -0.58868408203125, -0.549835205078125, -0.510986328125, -0.472137451171875, -0.43328857421875, -0.394439697265625, -0.3555908203125, -0.316741943359375, -0.27789306640625, -0.239044189453125, -0.2001953125, -0.161346435546875, -0.12249755859375, -0.083648681640625, -0.0447998046875, -0.005950927734375, 0.03289794921875, 0.071746826171875, 0.110595703125, 0.149444580078125, 0.18829345703125, 0.227142333984375, 0.2659912109375, 0.304840087890625, 0.34368896484375, 0.382537841796875, 0.42138671875, 0.460235595703125, 0.49908447265625, 0.537933349609375, 0.5767822265625, 0.615631103515625, 0.65447998046875, 0.693328857421875, 0.732177734375, 0.771026611328125, 0.80987548828125, 0.848724365234375, 0.8875732421875, 0.926422119140625, 0.96527099609375, 1.004119873046875, 1.04296875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 10.0, 7.0, 9.0, 17.0, 17.0, 26.0, 34.0, 66.0, 95.0, 142.0, 273.0, 438.0, 800.0, 1617.0, 3267.0, 8462.0, 27569.0, 127179.0, 512353.0, 286607.0, 55127.0, 14527.0, 5113.0, 2259.0, 1065.0, 592.0, 320.0, 193.0, 129.0, 77.0, 54.0, 43.0, 19.0, 13.0, 16.0, 5.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.564453125, -1.515167236328125, -1.46588134765625, -1.416595458984375, -1.3673095703125, -1.318023681640625, -1.26873779296875, -1.219451904296875, -1.170166015625, -1.120880126953125, -1.07159423828125, -1.022308349609375, -0.9730224609375, -0.923736572265625, -0.87445068359375, -0.825164794921875, -0.77587890625, -0.726593017578125, -0.67730712890625, -0.628021240234375, -0.5787353515625, -0.529449462890625, -0.48016357421875, -0.430877685546875, -0.381591796875, -0.332305908203125, -0.28302001953125, -0.233734130859375, -0.1844482421875, -0.135162353515625, -0.08587646484375, -0.036590576171875, 0.0126953125, 0.061981201171875, 0.11126708984375, 0.160552978515625, 0.2098388671875, 0.259124755859375, 0.30841064453125, 0.357696533203125, 0.406982421875, 0.456268310546875, 0.50555419921875, 0.554840087890625, 0.6041259765625, 0.653411865234375, 0.70269775390625, 0.751983642578125, 0.80126953125, 0.850555419921875, 0.89984130859375, 0.949127197265625, 0.9984130859375, 1.047698974609375, 1.09698486328125, 1.146270751953125, 1.195556640625, 1.244842529296875, 1.29412841796875, 1.343414306640625, 1.3927001953125, 1.441986083984375, 1.49127197265625, 1.540557861328125, 1.58984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 8.0, 9.0, 3.0, 19.0, 16.0, 20.0, 15.0, 26.0, 42.0, 35.0, 46.0, 54.0, 60.0, 57.0, 63.0, 64.0, 61.0, 68.0, 51.0, 51.0, 48.0, 27.0, 24.0, 22.0, 21.0, 24.0, 9.0, 19.0, 5.0, 6.0, 6.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013589859008789062, -0.00013170763850212097, -0.00012751668691635132, -0.00012332573533058167, -0.00011913478374481201, -0.00011494383215904236, -0.0001107528805732727, -0.00010656192898750305, -0.0001023709774017334, -9.818002581596375e-05, -9.398907423019409e-05, -8.979812264442444e-05, -8.560717105865479e-05, -8.141621947288513e-05, -7.722526788711548e-05, -7.303431630134583e-05, -6.884336471557617e-05, -6.465241312980652e-05, -6.0461461544036865e-05, -5.627050995826721e-05, -5.207955837249756e-05, -4.7888606786727905e-05, -4.369765520095825e-05, -3.95067036151886e-05, -3.5315752029418945e-05, -3.112480044364929e-05, -2.693384885787964e-05, -2.2742897272109985e-05, -1.8551945686340332e-05, -1.4360994100570679e-05, -1.0170042514801025e-05, -5.979090929031372e-06, -1.7881393432617188e-06, 2.4028122425079346e-06, 6.593763828277588e-06, 1.0784715414047241e-05, 1.4975666999816895e-05, 1.9166618585586548e-05, 2.33575701713562e-05, 2.7548521757125854e-05, 3.173947334289551e-05, 3.593042492866516e-05, 4.0121376514434814e-05, 4.431232810020447e-05, 4.850327968597412e-05, 5.2694231271743774e-05, 5.688518285751343e-05, 6.107613444328308e-05, 6.526708602905273e-05, 6.945803761482239e-05, 7.364898920059204e-05, 7.78399407863617e-05, 8.203089237213135e-05, 8.6221843957901e-05, 9.041279554367065e-05, 9.460374712944031e-05, 9.879469871520996e-05, 0.00010298565030097961, 0.00010717660188674927, 0.00011136755347251892, 0.00011555850505828857, 0.00011974945664405823, 0.00012394040822982788, 0.00012813135981559753, 0.0001323223114013672]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 4.0, 9.0, 20.0, 24.0, 42.0, 58.0, 123.0, 193.0, 356.0, 606.0, 1277.0, 3165.0, 8865.0, 33537.0, 185904.0, 567272.0, 196334.0, 35535.0, 9183.0, 3235.0, 1382.0, 654.0, 343.0, 173.0, 85.0, 64.0, 44.0, 22.0, 16.0, 9.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4619140625, -1.412384033203125, -1.36285400390625, -1.313323974609375, -1.2637939453125, -1.214263916015625, -1.16473388671875, -1.115203857421875, -1.065673828125, -1.016143798828125, -0.96661376953125, -0.917083740234375, -0.8675537109375, -0.818023681640625, -0.76849365234375, -0.718963623046875, -0.66943359375, -0.619903564453125, -0.57037353515625, -0.520843505859375, -0.4713134765625, -0.421783447265625, -0.37225341796875, -0.322723388671875, -0.273193359375, -0.223663330078125, -0.17413330078125, -0.124603271484375, -0.0750732421875, -0.025543212890625, 0.02398681640625, 0.073516845703125, 0.123046875, 0.172576904296875, 0.22210693359375, 0.271636962890625, 0.3211669921875, 0.370697021484375, 0.42022705078125, 0.469757080078125, 0.519287109375, 0.568817138671875, 0.61834716796875, 0.667877197265625, 0.7174072265625, 0.766937255859375, 0.81646728515625, 0.865997314453125, 0.91552734375, 0.965057373046875, 1.01458740234375, 1.064117431640625, 1.1136474609375, 1.163177490234375, 1.21270751953125, 1.262237548828125, 1.311767578125, 1.361297607421875, 1.41082763671875, 1.460357666015625, 1.5098876953125, 1.559417724609375, 1.60894775390625, 1.658477783203125, 1.7080078125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 4.0, 7.0, 10.0, 14.0, 10.0, 19.0, 22.0, 31.0, 46.0, 65.0, 77.0, 83.0, 102.0, 84.0, 87.0, 79.0, 71.0, 49.0, 35.0, 30.0, 21.0, 11.0, 7.0, 7.0, 11.0, 1.0, 10.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.16796875, -1.130401611328125, -1.09283447265625, -1.055267333984375, -1.0177001953125, -0.980133056640625, -0.94256591796875, -0.904998779296875, -0.867431640625, -0.829864501953125, -0.79229736328125, -0.754730224609375, -0.7171630859375, -0.679595947265625, -0.64202880859375, -0.604461669921875, -0.56689453125, -0.529327392578125, -0.49176025390625, -0.454193115234375, -0.4166259765625, -0.379058837890625, -0.34149169921875, -0.303924560546875, -0.266357421875, -0.228790283203125, -0.19122314453125, -0.153656005859375, -0.1160888671875, -0.078521728515625, -0.04095458984375, -0.003387451171875, 0.0341796875, 0.071746826171875, 0.10931396484375, 0.146881103515625, 0.1844482421875, 0.222015380859375, 0.25958251953125, 0.297149658203125, 0.334716796875, 0.372283935546875, 0.40985107421875, 0.447418212890625, 0.4849853515625, 0.522552490234375, 0.56011962890625, 0.597686767578125, 0.63525390625, 0.672821044921875, 0.71038818359375, 0.747955322265625, 0.7855224609375, 0.823089599609375, 0.86065673828125, 0.898223876953125, 0.935791015625, 0.973358154296875, 1.01092529296875, 1.048492431640625, 1.0860595703125, 1.123626708984375, 1.16119384765625, 1.198760986328125, 1.236328125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 10.0, 7.0, 18.0, 22.0, 23.0, 59.0, 105.0, 160.0, 180.0, 166.0, 106.0, 63.0, 41.0, 19.0, 11.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.532722473144531, -9.853334426879883, -9.173946380615234, -8.49455738067627, -7.815169334411621, -7.135781288146973, -6.456392765045166, -5.777004241943359, -5.097616195678711, -4.4182281494140625, -3.738839626312256, -3.0594513416290283, -2.380063056945801, -1.7006747722625732, -1.0212864875793457, -0.34189796447753906, 0.3374900817871094, 1.016878366470337, 1.6962666511535645, 2.375654935836792, 3.0550432205200195, 3.734431505203247, 4.413819789886475, 5.093208312988281, 5.77259635925293, 6.451984405517578, 7.131372928619385, 7.810761451721191, 8.49014949798584, 9.169537544250488, 9.848926544189453, 10.528314590454102, 11.20770263671875, 11.887090682983398, 12.566478729248047, 13.245867729187012, 13.92525577545166, 14.604643821716309, 15.284032821655273, 15.963420867919922, 16.64280891418457, 17.32219696044922, 18.001585006713867, 18.680973052978516, 19.360363006591797, 20.039751052856445, 20.719139099121094, 21.398527145385742, 22.07791519165039, 22.75730323791504, 23.436691284179688, 24.116079330444336, 24.795467376708984, 25.474857330322266, 26.154245376586914, 26.833633422851562, 27.51302146911621, 28.19240951538086, 28.871797561645508, 29.551185607910156, 30.230575561523438, 30.909963607788086, 31.589351654052734, 32.26873779296875, 32.94812774658203]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 10.0, 11.0, 13.0, 18.0, 14.0, 17.0, 22.0, 38.0, 38.0, 50.0, 52.0, 60.0, 65.0, 62.0, 57.0, 71.0, 56.0, 61.0, 44.0, 47.0, 51.0, 26.0, 36.0, 19.0, 14.0, 11.0, 11.0, 6.0, 4.0, 3.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.445122718811035, -13.076869010925293, -12.70861530303955, -12.340361595153809, -11.972107887268066, -11.603854179382324, -11.235601425170898, -10.867347717285156, -10.499094009399414, -10.130840301513672, -9.76258659362793, -9.394332885742188, -9.026079177856445, -8.657825469970703, -8.289571762084961, -7.921318531036377, -7.553064346313477, -7.184810638427734, -6.816556930541992, -6.44830322265625, -6.080049514770508, -5.711795806884766, -5.343542575836182, -4.9752888679504395, -4.607035160064697, -4.238781452178955, -3.870527744293213, -3.50227427482605, -3.1340205669403076, -2.7657668590545654, -2.3975133895874023, -2.02925968170166, -1.6610050201416016, -1.2927513122558594, -0.9244977235794067, -0.5562441349029541, -0.18799042701721191, 0.18026328086853027, 0.5485167503356934, 0.9167704582214355, 1.2850241661071777, 1.65327787399292, 2.021531581878662, 2.389785051345825, 2.7580387592315674, 3.1262924671173096, 3.4945459365844727, 3.862799644470215, 4.231053352355957, 4.599307060241699, 4.967560768127441, 5.335814476013184, 5.704068183898926, 6.072321891784668, 6.440575122833252, 6.808828830718994, 7.177082538604736, 7.5453362464904785, 7.913589954376221, 8.281843185424805, 8.650096893310547, 9.018350601196289, 9.386604309082031, 9.754858016967773, 10.123111724853516]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 6.0, 9.0, 12.0, 12.0, 24.0, 26.0, 52.0, 84.0, 127.0, 202.0, 356.0, 764.0, 1467.0, 3427.0, 8914.0, 30042.0, 142838.0, 2256700.0, 1581739.0, 124418.0, 27712.0, 8718.0, 3439.0, 1537.0, 679.0, 411.0, 197.0, 143.0, 78.0, 46.0, 24.0, 22.0, 15.0, 10.0, 7.0, 8.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.44921875, -2.36163330078125, -2.2740478515625, -2.18646240234375, -2.098876953125, -2.01129150390625, -1.9237060546875, -1.83612060546875, -1.74853515625, -1.66094970703125, -1.5733642578125, -1.48577880859375, -1.398193359375, -1.31060791015625, -1.2230224609375, -1.13543701171875, -1.0478515625, -0.96026611328125, -0.8726806640625, -0.78509521484375, -0.697509765625, -0.60992431640625, -0.5223388671875, -0.43475341796875, -0.34716796875, -0.25958251953125, -0.1719970703125, -0.08441162109375, 0.003173828125, 0.09075927734375, 0.1783447265625, 0.26593017578125, 0.353515625, 0.44110107421875, 0.5286865234375, 0.61627197265625, 0.703857421875, 0.79144287109375, 0.8790283203125, 0.96661376953125, 1.05419921875, 1.14178466796875, 1.2293701171875, 1.31695556640625, 1.404541015625, 1.49212646484375, 1.5797119140625, 1.66729736328125, 1.7548828125, 1.84246826171875, 1.9300537109375, 2.01763916015625, 2.105224609375, 2.19281005859375, 2.2803955078125, 2.36798095703125, 2.45556640625, 2.54315185546875, 2.6307373046875, 2.71832275390625, 2.805908203125, 2.89349365234375, 2.9810791015625, 3.06866455078125, 3.15625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 11.0, 20.0, 30.0, 39.0, 40.0, 43.0, 55.0, 81.0, 57.0, 73.0, 84.0, 63.0, 69.0, 61.0, 58.0, 49.0, 45.0, 37.0, 26.0, 16.0, 17.0, 7.0, 5.0, 5.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.333251953125, -0.3203010559082031, -0.30735015869140625, -0.2943992614746094, -0.2814483642578125, -0.2684974670410156, -0.25554656982421875, -0.24259567260742188, -0.229644775390625, -0.21669387817382812, -0.20374298095703125, -0.19079208374023438, -0.1778411865234375, -0.16489028930664062, -0.15193939208984375, -0.13898849487304688, -0.12603759765625, -0.11308670043945312, -0.10013580322265625, -0.08718490600585938, -0.0742340087890625, -0.061283111572265625, -0.04833221435546875, -0.035381317138671875, -0.022430419921875, -0.009479522705078125, 0.00347137451171875, 0.016422271728515625, 0.0293731689453125, 0.042324066162109375, 0.05527496337890625, 0.06822586059570312, 0.0811767578125, 0.09412765502929688, 0.10707855224609375, 0.12002944946289062, 0.1329803466796875, 0.14593124389648438, 0.15888214111328125, 0.17183303833007812, 0.184783935546875, 0.19773483276367188, 0.21068572998046875, 0.22363662719726562, 0.2365875244140625, 0.24953842163085938, 0.26248931884765625, 0.2754402160644531, 0.28839111328125, 0.3013420104980469, 0.31429290771484375, 0.3272438049316406, 0.3401947021484375, 0.3531455993652344, 0.36609649658203125, 0.3790473937988281, 0.391998291015625, 0.4049491882324219, 0.41790008544921875, 0.4308509826660156, 0.4438018798828125, 0.4567527770996094, 0.46970367431640625, 0.4826545715332031, 0.49560546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 9.0, 7.0, 13.0, 27.0, 37.0, 65.0, 83.0, 148.0, 232.0, 485.0, 1014.0, 2737.0, 12114.0, 173691.0, 3822331.0, 166236.0, 11097.0, 2371.0, 807.0, 339.0, 171.0, 88.0, 65.0, 39.0, 39.0, 11.0, 9.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.60546875, -6.41937255859375, -6.2332763671875, -6.04718017578125, -5.861083984375, -5.67498779296875, -5.4888916015625, -5.30279541015625, -5.11669921875, -4.93060302734375, -4.7445068359375, -4.55841064453125, -4.372314453125, -4.18621826171875, -4.0001220703125, -3.81402587890625, -3.6279296875, -3.44183349609375, -3.2557373046875, -3.06964111328125, -2.883544921875, -2.69744873046875, -2.5113525390625, -2.32525634765625, -2.13916015625, -1.95306396484375, -1.7669677734375, -1.58087158203125, -1.394775390625, -1.20867919921875, -1.0225830078125, -0.83648681640625, -0.650390625, -0.46429443359375, -0.2781982421875, -0.09210205078125, 0.093994140625, 0.28009033203125, 0.4661865234375, 0.65228271484375, 0.83837890625, 1.02447509765625, 1.2105712890625, 1.39666748046875, 1.582763671875, 1.76885986328125, 1.9549560546875, 2.14105224609375, 2.3271484375, 2.51324462890625, 2.6993408203125, 2.88543701171875, 3.071533203125, 3.25762939453125, 3.4437255859375, 3.62982177734375, 3.81591796875, 4.00201416015625, 4.1881103515625, 4.37420654296875, 4.560302734375, 4.74639892578125, 4.9324951171875, 5.11859130859375, 5.3046875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 6.0, 4.0, 10.0, 13.0, 29.0, 41.0, 104.0, 154.0, 336.0, 752.0, 1324.0, 704.0, 297.0, 145.0, 65.0, 38.0, 22.0, 4.0, 10.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.099609375, -2.0489349365234375, -1.998260498046875, -1.9475860595703125, -1.89691162109375, -1.8462371826171875, -1.795562744140625, -1.7448883056640625, -1.6942138671875, -1.6435394287109375, -1.592864990234375, -1.5421905517578125, -1.49151611328125, -1.4408416748046875, -1.390167236328125, -1.3394927978515625, -1.288818359375, -1.2381439208984375, -1.187469482421875, -1.1367950439453125, -1.08612060546875, -1.0354461669921875, -0.984771728515625, -0.9340972900390625, -0.8834228515625, -0.8327484130859375, -0.782073974609375, -0.7313995361328125, -0.68072509765625, -0.6300506591796875, -0.579376220703125, -0.5287017822265625, -0.47802734375, -0.4273529052734375, -0.376678466796875, -0.3260040283203125, -0.27532958984375, -0.2246551513671875, -0.173980712890625, -0.1233062744140625, -0.0726318359375, -0.0219573974609375, 0.028717041015625, 0.0793914794921875, 0.13006591796875, 0.1807403564453125, 0.231414794921875, 0.2820892333984375, 0.332763671875, 0.3834381103515625, 0.434112548828125, 0.4847869873046875, 0.53546142578125, 0.5861358642578125, 0.636810302734375, 0.6874847412109375, 0.7381591796875, 0.7888336181640625, 0.839508056640625, 0.8901824951171875, 0.94085693359375, 0.9915313720703125, 1.042205810546875, 1.0928802490234375, 1.1435546875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 11.0, 13.0, 16.0, 33.0, 60.0, 89.0, 136.0, 141.0, 145.0, 124.0, 83.0, 56.0, 39.0, 14.0, 17.0, 4.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.631415367126465, -15.313575744628906, -14.995736122131348, -14.677896499633789, -14.36005687713623, -14.042217254638672, -13.724377632141113, -13.406538009643555, -13.08869743347168, -12.770857810974121, -12.453018188476562, -12.135178565979004, -11.817338943481445, -11.499499320983887, -11.181659698486328, -10.863819122314453, -10.545980453491211, -10.228140830993652, -9.910301208496094, -9.592461585998535, -9.274621963500977, -8.956782341003418, -8.63894271850586, -8.321102142333984, -8.003263473510742, -7.685423851013184, -7.367584228515625, -7.049744606018066, -6.731904983520508, -6.414065361022949, -6.096225261688232, -5.778385639190674, -5.460546493530273, -5.142706871032715, -4.824867248535156, -4.507027626037598, -4.189188003540039, -3.8713481426239014, -3.5535082817077637, -3.235668659210205, -2.9178290367126465, -2.599989414215088, -2.2821497917175293, -1.9643099308013916, -1.646470308303833, -1.3286306858062744, -1.0107909440994263, -0.6929512023925781, -0.37511157989501953, -0.05727189779281616, 0.2605677843093872, 0.5784074664115906, 0.896247148513794, 1.2140867710113525, 1.5319265127182007, 1.8497662544250488, 2.1676058769226074, 2.485445499420166, 2.8032851219177246, 3.1211249828338623, 3.438964605331421, 3.7568042278289795, 4.074644088745117, 4.392483711242676, 4.710323333740234]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 6.0, 6.0, 7.0, 13.0, 14.0, 20.0, 28.0, 34.0, 44.0, 54.0, 62.0, 86.0, 91.0, 77.0, 78.0, 58.0, 61.0, 69.0, 54.0, 41.0, 24.0, 30.0, 14.0, 14.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.696931838989258, -9.44190502166748, -9.186878204345703, -8.931851387023926, -8.676824569702148, -8.421797752380371, -8.166770935058594, -7.911744117736816, -7.656717300415039, -7.401690483093262, -7.146663665771484, -6.891636848449707, -6.63661003112793, -6.381583213806152, -6.126556396484375, -5.871529579162598, -5.61650276184082, -5.361475944519043, -5.106449127197266, -4.851422309875488, -4.596395492553711, -4.341368675231934, -4.086341857910156, -3.831315040588379, -3.5762882232666016, -3.321261405944824, -3.066234588623047, -2.8112077713012695, -2.556180953979492, -2.301154136657715, -2.0461273193359375, -1.7911005020141602, -1.536074161529541, -1.2810473442077637, -1.0260205268859863, -0.770993709564209, -0.5159668922424316, -0.2609400749206543, -0.005913257598876953, 0.2491135597229004, 0.5041403770446777, 0.7591671943664551, 1.0141940116882324, 1.2692208290100098, 1.524247646331787, 1.7792744636535645, 2.034301280975342, 2.289328098297119, 2.5443549156188965, 2.799381732940674, 3.054408550262451, 3.3094353675842285, 3.564462184906006, 3.819489002227783, 4.0745158195495605, 4.329542636871338, 4.584569454193115, 4.839596271514893, 5.09462308883667, 5.349649906158447, 5.604676723480225, 5.859703540802002, 6.114730358123779, 6.369757175445557, 6.624783992767334]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 9.0, 11.0, 15.0, 16.0, 20.0, 35.0, 64.0, 73.0, 114.0, 147.0, 248.0, 427.0, 669.0, 1242.0, 2491.0, 5493.0, 13280.0, 37827.0, 113530.0, 296981.0, 346574.0, 149074.0, 49645.0, 17109.0, 6837.0, 2980.0, 1524.0, 819.0, 460.0, 260.0, 184.0, 136.0, 68.0, 44.0, 32.0, 16.0, 28.0, 19.0, 12.0, 15.0, 6.0, 4.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.0390625, -1.96905517578125, -1.8990478515625, -1.82904052734375, -1.759033203125, -1.68902587890625, -1.6190185546875, -1.54901123046875, -1.47900390625, -1.40899658203125, -1.3389892578125, -1.26898193359375, -1.198974609375, -1.12896728515625, -1.0589599609375, -0.98895263671875, -0.9189453125, -0.84893798828125, -0.7789306640625, -0.70892333984375, -0.638916015625, -0.56890869140625, -0.4989013671875, -0.42889404296875, -0.35888671875, -0.28887939453125, -0.2188720703125, -0.14886474609375, -0.078857421875, -0.00885009765625, 0.0611572265625, 0.13116455078125, 0.201171875, 0.27117919921875, 0.3411865234375, 0.41119384765625, 0.481201171875, 0.55120849609375, 0.6212158203125, 0.69122314453125, 0.76123046875, 0.83123779296875, 0.9012451171875, 0.97125244140625, 1.041259765625, 1.11126708984375, 1.1812744140625, 1.25128173828125, 1.3212890625, 1.39129638671875, 1.4613037109375, 1.53131103515625, 1.601318359375, 1.67132568359375, 1.7413330078125, 1.81134033203125, 1.88134765625, 1.95135498046875, 2.0213623046875, 2.09136962890625, 2.161376953125, 2.23138427734375, 2.3013916015625, 2.37139892578125, 2.44140625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 13.0, 15.0, 32.0, 25.0, 44.0, 67.0, 59.0, 85.0, 88.0, 82.0, 80.0, 73.0, 82.0, 65.0, 55.0, 39.0, 29.0, 23.0, 17.0, 8.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51953125, -0.5037345886230469, -0.48793792724609375, -0.4721412658691406, -0.4563446044921875, -0.4405479431152344, -0.42475128173828125, -0.4089546203613281, -0.393157958984375, -0.3773612976074219, -0.36156463623046875, -0.3457679748535156, -0.3299713134765625, -0.3141746520996094, -0.29837799072265625, -0.2825813293457031, -0.26678466796875, -0.2509880065917969, -0.23519134521484375, -0.21939468383789062, -0.2035980224609375, -0.18780136108398438, -0.17200469970703125, -0.15620803833007812, -0.140411376953125, -0.12461471557617188, -0.10881805419921875, -0.09302139282226562, -0.0772247314453125, -0.061428070068359375, -0.04563140869140625, -0.029834747314453125, -0.0140380859375, 0.001758575439453125, 0.01755523681640625, 0.033351898193359375, 0.0491485595703125, 0.06494522094726562, 0.08074188232421875, 0.09653854370117188, 0.112335205078125, 0.12813186645507812, 0.14392852783203125, 0.15972518920898438, 0.1755218505859375, 0.19131851196289062, 0.20711517333984375, 0.22291183471679688, 0.23870849609375, 0.2545051574707031, 0.27030181884765625, 0.2860984802246094, 0.3018951416015625, 0.3176918029785156, 0.33348846435546875, 0.3492851257324219, 0.365081787109375, 0.3808784484863281, 0.39667510986328125, 0.4124717712402344, 0.4282684326171875, 0.4440650939941406, 0.45986175537109375, 0.4756584167480469, 0.491455078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 8.0, 15.0, 23.0, 27.0, 44.0, 48.0, 81.0, 118.0, 200.0, 268.0, 431.0, 657.0, 1040.0, 1738.0, 2787.0, 4897.0, 9023.0, 16691.0, 32682.0, 63450.0, 118172.0, 192613.0, 228218.0, 167949.0, 97679.0, 51768.0, 26565.0, 13593.0, 7217.0, 4097.0, 2376.0, 1441.0, 895.0, 570.0, 384.0, 244.0, 175.0, 104.0, 76.0, 59.0, 33.0, 27.0, 24.0, 13.0, 9.0, 8.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-1.1142578125, -1.079803466796875, -1.04534912109375, -1.010894775390625, -0.9764404296875, -0.941986083984375, -0.90753173828125, -0.873077392578125, -0.838623046875, -0.804168701171875, -0.76971435546875, -0.735260009765625, -0.7008056640625, -0.666351318359375, -0.63189697265625, -0.597442626953125, -0.56298828125, -0.528533935546875, -0.49407958984375, -0.459625244140625, -0.4251708984375, -0.390716552734375, -0.35626220703125, -0.321807861328125, -0.287353515625, -0.252899169921875, -0.21844482421875, -0.183990478515625, -0.1495361328125, -0.115081787109375, -0.08062744140625, -0.046173095703125, -0.01171875, 0.022735595703125, 0.05718994140625, 0.091644287109375, 0.1260986328125, 0.160552978515625, 0.19500732421875, 0.229461669921875, 0.263916015625, 0.298370361328125, 0.33282470703125, 0.367279052734375, 0.4017333984375, 0.436187744140625, 0.47064208984375, 0.505096435546875, 0.53955078125, 0.574005126953125, 0.60845947265625, 0.642913818359375, 0.6773681640625, 0.711822509765625, 0.74627685546875, 0.780731201171875, 0.815185546875, 0.849639892578125, 0.88409423828125, 0.918548583984375, 0.9530029296875, 0.987457275390625, 1.02191162109375, 1.056365966796875, 1.0908203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 8.0, 6.0, 4.0, 8.0, 7.0, 11.0, 8.0, 10.0, 17.0, 17.0, 24.0, 33.0, 21.0, 36.0, 30.0, 28.0, 38.0, 42.0, 41.0, 43.0, 45.0, 31.0, 42.0, 47.0, 42.0, 46.0, 26.0, 46.0, 22.0, 28.0, 29.0, 22.0, 29.0, 18.0, 14.0, 11.0, 18.0, 12.0, 7.0, 7.0, 8.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0], "bins": [-1.3076171875, -1.270782470703125, -1.23394775390625, -1.197113037109375, -1.1602783203125, -1.123443603515625, -1.08660888671875, -1.049774169921875, -1.012939453125, -0.976104736328125, -0.93927001953125, -0.902435302734375, -0.8656005859375, -0.828765869140625, -0.79193115234375, -0.755096435546875, -0.71826171875, -0.681427001953125, -0.64459228515625, -0.607757568359375, -0.5709228515625, -0.534088134765625, -0.49725341796875, -0.460418701171875, -0.423583984375, -0.386749267578125, -0.34991455078125, -0.313079833984375, -0.2762451171875, -0.239410400390625, -0.20257568359375, -0.165740966796875, -0.12890625, -0.092071533203125, -0.05523681640625, -0.018402099609375, 0.0184326171875, 0.055267333984375, 0.09210205078125, 0.128936767578125, 0.165771484375, 0.202606201171875, 0.23944091796875, 0.276275634765625, 0.3131103515625, 0.349945068359375, 0.38677978515625, 0.423614501953125, 0.46044921875, 0.497283935546875, 0.53411865234375, 0.570953369140625, 0.6077880859375, 0.644622802734375, 0.68145751953125, 0.718292236328125, 0.755126953125, 0.791961669921875, 0.82879638671875, 0.865631103515625, 0.9024658203125, 0.939300537109375, 0.97613525390625, 1.012969970703125, 1.0498046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 18.0, 8.0, 10.0, 23.0, 29.0, 49.0, 103.0, 114.0, 223.0, 402.0, 785.0, 1653.0, 3413.0, 8342.0, 22631.0, 75497.0, 324114.0, 443153.0, 116761.0, 31539.0, 11081.0, 4455.0, 2021.0, 958.0, 470.0, 287.0, 158.0, 91.0, 65.0, 31.0, 19.0, 18.0, 14.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.5634765625, -1.521392822265625, -1.47930908203125, -1.437225341796875, -1.3951416015625, -1.353057861328125, -1.31097412109375, -1.268890380859375, -1.226806640625, -1.184722900390625, -1.14263916015625, -1.100555419921875, -1.0584716796875, -1.016387939453125, -0.97430419921875, -0.932220458984375, -0.89013671875, -0.848052978515625, -0.80596923828125, -0.763885498046875, -0.7218017578125, -0.679718017578125, -0.63763427734375, -0.595550537109375, -0.553466796875, -0.511383056640625, -0.46929931640625, -0.427215576171875, -0.3851318359375, -0.343048095703125, -0.30096435546875, -0.258880615234375, -0.216796875, -0.174713134765625, -0.13262939453125, -0.090545654296875, -0.0484619140625, -0.006378173828125, 0.03570556640625, 0.077789306640625, 0.119873046875, 0.161956787109375, 0.20404052734375, 0.246124267578125, 0.2882080078125, 0.330291748046875, 0.37237548828125, 0.414459228515625, 0.45654296875, 0.498626708984375, 0.54071044921875, 0.582794189453125, 0.6248779296875, 0.666961669921875, 0.70904541015625, 0.751129150390625, 0.793212890625, 0.835296630859375, 0.87738037109375, 0.919464111328125, 0.9615478515625, 1.003631591796875, 1.04571533203125, 1.087799072265625, 1.1298828125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 6.0, 7.0, 7.0, 10.0, 14.0, 18.0, 23.0, 25.0, 28.0, 49.0, 61.0, 69.0, 82.0, 101.0, 113.0, 81.0, 69.0, 59.0, 43.0, 35.0, 22.0, 18.0, 16.0, 10.0, 10.0, 10.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00019884109497070312, -0.0001934543251991272, -0.00018806755542755127, -0.00018268078565597534, -0.00017729401588439941, -0.00017190724611282349, -0.00016652047634124756, -0.00016113370656967163, -0.0001557469367980957, -0.00015036016702651978, -0.00014497339725494385, -0.00013958662748336792, -0.000134199857711792, -0.00012881308794021606, -0.00012342631816864014, -0.00011803954839706421, -0.00011265277862548828, -0.00010726600885391235, -0.00010187923908233643, -9.64924693107605e-05, -9.110569953918457e-05, -8.571892976760864e-05, -8.033215999603271e-05, -7.494539022445679e-05, -6.955862045288086e-05, -6.417185068130493e-05, -5.8785080909729004e-05, -5.3398311138153076e-05, -4.801154136657715e-05, -4.262477159500122e-05, -3.723800182342529e-05, -3.1851232051849365e-05, -2.6464462280273438e-05, -2.107769250869751e-05, -1.5690922737121582e-05, -1.0304152965545654e-05, -4.9173831939697266e-06, 4.6938657760620117e-07, 5.856156349182129e-06, 1.1242926120758057e-05, 1.6629695892333984e-05, 2.2016465663909912e-05, 2.740323543548584e-05, 3.279000520706177e-05, 3.8176774978637695e-05, 4.356354475021362e-05, 4.895031452178955e-05, 5.433708429336548e-05, 5.9723854064941406e-05, 6.511062383651733e-05, 7.049739360809326e-05, 7.588416337966919e-05, 8.127093315124512e-05, 8.665770292282104e-05, 9.204447269439697e-05, 9.74312424659729e-05, 0.00010281801223754883, 0.00010820478200912476, 0.00011359155178070068, 0.00011897832155227661, 0.00012436509132385254, 0.00012975186109542847, 0.0001351386308670044, 0.00014052540063858032, 0.00014591217041015625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 7.0, 11.0, 9.0, 11.0, 31.0, 45.0, 73.0, 142.0, 210.0, 450.0, 983.0, 2365.0, 6885.0, 25708.0, 168935.0, 674096.0, 136034.0, 22393.0, 6204.0, 2106.0, 893.0, 430.0, 222.0, 136.0, 74.0, 53.0, 20.0, 13.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8349609375, -1.7726593017578125, -1.710357666015625, -1.6480560302734375, -1.58575439453125, -1.5234527587890625, -1.461151123046875, -1.3988494873046875, -1.3365478515625, -1.2742462158203125, -1.211944580078125, -1.1496429443359375, -1.08734130859375, -1.0250396728515625, -0.962738037109375, -0.9004364013671875, -0.838134765625, -0.7758331298828125, -0.713531494140625, -0.6512298583984375, -0.58892822265625, -0.5266265869140625, -0.464324951171875, -0.4020233154296875, -0.3397216796875, -0.2774200439453125, -0.215118408203125, -0.1528167724609375, -0.09051513671875, -0.0282135009765625, 0.034088134765625, 0.0963897705078125, 0.15869140625, 0.2209930419921875, 0.283294677734375, 0.3455963134765625, 0.40789794921875, 0.4701995849609375, 0.532501220703125, 0.5948028564453125, 0.6571044921875, 0.7194061279296875, 0.781707763671875, 0.8440093994140625, 0.90631103515625, 0.9686126708984375, 1.030914306640625, 1.0932159423828125, 1.155517578125, 1.2178192138671875, 1.280120849609375, 1.3424224853515625, 1.40472412109375, 1.4670257568359375, 1.529327392578125, 1.5916290283203125, 1.6539306640625, 1.7162322998046875, 1.778533935546875, 1.8408355712890625, 1.90313720703125, 1.9654388427734375, 2.027740478515625, 2.0900421142578125, 2.15234375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 2.0, 8.0, 4.0, 4.0, 15.0, 13.0, 15.0, 39.0, 46.0, 36.0, 53.0, 73.0, 93.0, 93.0, 90.0, 98.0, 75.0, 52.0, 45.0, 27.0, 25.0, 22.0, 18.0, 8.0, 9.0, 6.0, 7.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96484375, -0.932525634765625, -0.90020751953125, -0.867889404296875, -0.8355712890625, -0.803253173828125, -0.77093505859375, -0.738616943359375, -0.706298828125, -0.673980712890625, -0.64166259765625, -0.609344482421875, -0.5770263671875, -0.544708251953125, -0.51239013671875, -0.480072021484375, -0.44775390625, -0.415435791015625, -0.38311767578125, -0.350799560546875, -0.3184814453125, -0.286163330078125, -0.25384521484375, -0.221527099609375, -0.189208984375, -0.156890869140625, -0.12457275390625, -0.092254638671875, -0.0599365234375, -0.027618408203125, 0.00469970703125, 0.037017822265625, 0.0693359375, 0.101654052734375, 0.13397216796875, 0.166290283203125, 0.1986083984375, 0.230926513671875, 0.26324462890625, 0.295562744140625, 0.327880859375, 0.360198974609375, 0.39251708984375, 0.424835205078125, 0.4571533203125, 0.489471435546875, 0.52178955078125, 0.554107666015625, 0.58642578125, 0.618743896484375, 0.65106201171875, 0.683380126953125, 0.7156982421875, 0.748016357421875, 0.78033447265625, 0.812652587890625, 0.844970703125, 0.877288818359375, 0.90960693359375, 0.941925048828125, 0.9742431640625, 1.006561279296875, 1.03887939453125, 1.071197509765625, 1.103515625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 16.0, 17.0, 50.0, 81.0, 99.0, 153.0, 135.0, 134.0, 111.0, 79.0, 40.0, 32.0, 18.0, 12.0, 6.0, 3.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.92098045349121, -18.316871643066406, -17.7127628326416, -17.108654022216797, -16.50454330444336, -15.900434494018555, -15.29632568359375, -14.692216873168945, -14.08810806274414, -13.483999252319336, -12.879889488220215, -12.27578067779541, -11.671671867370605, -11.067562103271484, -10.46345329284668, -9.859344482421875, -9.255234718322754, -8.65112590789795, -8.047016143798828, -7.442907333374023, -6.838798522949219, -6.234689235687256, -5.630579948425293, -5.026471138000488, -4.422361850738525, -3.8182528018951416, -3.214143753051758, -2.610034465789795, -2.005925416946411, -1.4018163681030273, -0.7977070808410645, -0.19359827041625977, 0.4105110168457031, 1.014620065689087, 1.6187292337417603, 2.2228384017944336, 2.8269474506378174, 3.431056499481201, 4.035165786743164, 4.639274597167969, 5.243383884429932, 5.8474931716918945, 6.451601982116699, 7.055711269378662, 7.659820556640625, 8.26392936706543, 8.868038177490234, 9.472146987915039, 10.07625675201416, 10.680365562438965, 11.284475326538086, 11.88858413696289, 12.492692947387695, 13.0968017578125, 13.700911521911621, 14.305020332336426, 14.909130096435547, 15.513238906860352, 16.117347717285156, 16.721458435058594, 17.3255672454834, 17.929676055908203, 18.533784866333008, 19.137893676757812, 19.742002487182617]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 10.0, 6.0, 9.0, 15.0, 18.0, 19.0, 27.0, 35.0, 38.0, 49.0, 56.0, 50.0, 66.0, 61.0, 60.0, 55.0, 47.0, 62.0, 50.0, 47.0, 44.0, 43.0, 22.0, 27.0, 15.0, 20.0, 11.0, 12.0, 4.0, 9.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.667394638061523, -12.328136444091797, -11.988879203796387, -11.64962100982666, -11.31036376953125, -10.971105575561523, -10.631847381591797, -10.29258918762207, -9.95333194732666, -9.614073753356934, -9.274816513061523, -8.935558319091797, -8.59630012512207, -8.25704288482666, -7.917784690856934, -7.578526973724365, -7.239269256591797, -6.9000115394592285, -6.56075382232666, -6.221495628356934, -5.882237911224365, -5.542980194091797, -5.20372200012207, -4.864464282989502, -4.525206565856934, -4.185948848724365, -3.8466908931732178, -3.5074329376220703, -3.168175220489502, -2.8289175033569336, -2.489659547805786, -2.1504015922546387, -1.8111438751220703, -1.4718860387802124, -1.1326282024383545, -0.7933703660964966, -0.45411252975463867, -0.11485469341278076, 0.22440314292907715, 0.5636610984802246, 0.902918815612793, 1.2421766519546509, 1.5814344882965088, 1.9206923246383667, 2.2599501609802246, 2.599207878112793, 2.9384658336639404, 3.277723789215088, 3.6169815063476562, 3.9562392234802246, 4.295496940612793, 4.6347551345825195, 4.974012851715088, 5.313270568847656, 5.652528762817383, 5.991786479949951, 6.3310441970825195, 6.670301914215088, 7.009559631347656, 7.348817825317383, 7.688075542449951, 8.02733325958252, 8.366591453552246, 8.705848693847656, 9.045106887817383]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 2.0, 8.0, 9.0, 18.0, 24.0, 26.0, 39.0, 52.0, 63.0, 86.0, 136.0, 230.0, 404.0, 672.0, 1393.0, 3037.0, 7505.0, 23949.0, 117181.0, 3215739.0, 732902.0, 64265.0, 16228.0, 5575.0, 2246.0, 1118.0, 520.0, 318.0, 213.0, 106.0, 79.0, 52.0, 25.0, 20.0, 10.0, 10.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.375, -3.285797119140625, -3.19659423828125, -3.107391357421875, -3.0181884765625, -2.928985595703125, -2.83978271484375, -2.750579833984375, -2.661376953125, -2.572174072265625, -2.48297119140625, -2.393768310546875, -2.3045654296875, -2.215362548828125, -2.12615966796875, -2.036956787109375, -1.94775390625, -1.858551025390625, -1.76934814453125, -1.680145263671875, -1.5909423828125, -1.501739501953125, -1.41253662109375, -1.323333740234375, -1.234130859375, -1.144927978515625, -1.05572509765625, -0.966522216796875, -0.8773193359375, -0.788116455078125, -0.69891357421875, -0.609710693359375, -0.5205078125, -0.431304931640625, -0.34210205078125, -0.252899169921875, -0.1636962890625, -0.074493408203125, 0.01470947265625, 0.103912353515625, 0.193115234375, 0.282318115234375, 0.37152099609375, 0.460723876953125, 0.5499267578125, 0.639129638671875, 0.72833251953125, 0.817535400390625, 0.90673828125, 0.995941162109375, 1.08514404296875, 1.174346923828125, 1.2635498046875, 1.352752685546875, 1.44195556640625, 1.531158447265625, 1.620361328125, 1.709564208984375, 1.79876708984375, 1.887969970703125, 1.9771728515625, 2.066375732421875, 2.15557861328125, 2.244781494140625, 2.333984375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 6.0, 21.0, 34.0, 38.0, 38.0, 52.0, 64.0, 67.0, 70.0, 70.0, 85.0, 78.0, 78.0, 54.0, 52.0, 47.0, 37.0, 33.0, 18.0, 14.0, 9.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.490234375, -0.47586822509765625, -0.4615020751953125, -0.44713592529296875, -0.432769775390625, -0.41840362548828125, -0.4040374755859375, -0.38967132568359375, -0.37530517578125, -0.36093902587890625, -0.3465728759765625, -0.33220672607421875, -0.317840576171875, -0.30347442626953125, -0.2891082763671875, -0.27474212646484375, -0.2603759765625, -0.24600982666015625, -0.2316436767578125, -0.21727752685546875, -0.202911376953125, -0.18854522705078125, -0.1741790771484375, -0.15981292724609375, -0.14544677734375, -0.13108062744140625, -0.1167144775390625, -0.10234832763671875, -0.087982177734375, -0.07361602783203125, -0.0592498779296875, -0.04488372802734375, -0.030517578125, -0.01615142822265625, -0.0017852783203125, 0.01258087158203125, 0.026947021484375, 0.04131317138671875, 0.0556793212890625, 0.07004547119140625, 0.08441162109375, 0.09877777099609375, 0.1131439208984375, 0.12751007080078125, 0.141876220703125, 0.15624237060546875, 0.1706085205078125, 0.18497467041015625, 0.1993408203125, 0.21370697021484375, 0.2280731201171875, 0.24243927001953125, 0.256805419921875, 0.27117156982421875, 0.2855377197265625, 0.29990386962890625, 0.31427001953125, 0.32863616943359375, 0.3430023193359375, 0.35736846923828125, 0.371734619140625, 0.38610076904296875, 0.4004669189453125, 0.41483306884765625, 0.42919921875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 11.0, 7.0, 23.0, 17.0, 21.0, 26.0, 54.0, 80.0, 114.0, 206.0, 300.0, 557.0, 1050.0, 2172.0, 5095.0, 13876.0, 45858.0, 222062.0, 2680775.0, 1048272.0, 125629.0, 30697.0, 9817.0, 3752.0, 1719.0, 844.0, 449.0, 273.0, 140.0, 127.0, 72.0, 49.0, 37.0, 26.0, 19.0, 14.0, 13.0, 7.0, 6.0, 5.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.4609375, -2.39227294921875, -2.3236083984375, -2.25494384765625, -2.186279296875, -2.11761474609375, -2.0489501953125, -1.98028564453125, -1.91162109375, -1.84295654296875, -1.7742919921875, -1.70562744140625, -1.636962890625, -1.56829833984375, -1.4996337890625, -1.43096923828125, -1.3623046875, -1.29364013671875, -1.2249755859375, -1.15631103515625, -1.087646484375, -1.01898193359375, -0.9503173828125, -0.88165283203125, -0.81298828125, -0.74432373046875, -0.6756591796875, -0.60699462890625, -0.538330078125, -0.46966552734375, -0.4010009765625, -0.33233642578125, -0.263671875, -0.19500732421875, -0.1263427734375, -0.05767822265625, 0.010986328125, 0.07965087890625, 0.1483154296875, 0.21697998046875, 0.28564453125, 0.35430908203125, 0.4229736328125, 0.49163818359375, 0.560302734375, 0.62896728515625, 0.6976318359375, 0.76629638671875, 0.8349609375, 0.90362548828125, 0.9722900390625, 1.04095458984375, 1.109619140625, 1.17828369140625, 1.2469482421875, 1.31561279296875, 1.38427734375, 1.45294189453125, 1.5216064453125, 1.59027099609375, 1.658935546875, 1.72760009765625, 1.7962646484375, 1.86492919921875, 1.93359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 9.0, 13.0, 9.0, 18.0, 26.0, 48.0, 44.0, 79.0, 127.0, 199.0, 360.0, 591.0, 1129.0, 583.0, 275.0, 177.0, 129.0, 79.0, 51.0, 29.0, 21.0, 18.0, 13.0, 14.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58056640625, -0.5568389892578125, -0.533111572265625, -0.5093841552734375, -0.48565673828125, -0.4619293212890625, -0.438201904296875, -0.4144744873046875, -0.3907470703125, -0.3670196533203125, -0.343292236328125, -0.3195648193359375, -0.29583740234375, -0.2721099853515625, -0.248382568359375, -0.2246551513671875, -0.200927734375, -0.1772003173828125, -0.153472900390625, -0.1297454833984375, -0.10601806640625, -0.0822906494140625, -0.058563232421875, -0.0348358154296875, -0.0111083984375, 0.0126190185546875, 0.036346435546875, 0.0600738525390625, 0.08380126953125, 0.1075286865234375, 0.131256103515625, 0.1549835205078125, 0.1787109375, 0.2024383544921875, 0.226165771484375, 0.2498931884765625, 0.27362060546875, 0.2973480224609375, 0.321075439453125, 0.3448028564453125, 0.3685302734375, 0.3922576904296875, 0.415985107421875, 0.4397125244140625, 0.46343994140625, 0.4871673583984375, 0.510894775390625, 0.5346221923828125, 0.558349609375, 0.5820770263671875, 0.605804443359375, 0.6295318603515625, 0.65325927734375, 0.6769866943359375, 0.700714111328125, 0.7244415283203125, 0.7481689453125, 0.7718963623046875, 0.795623779296875, 0.8193511962890625, 0.84307861328125, 0.8668060302734375, 0.890533447265625, 0.9142608642578125, 0.93798828125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 18.0, 45.0, 116.0, 210.0, 274.0, 196.0, 94.0, 32.0, 16.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.535314559936523, -21.100561141967773, -20.665809631347656, -20.231056213378906, -19.79630470275879, -19.36155128479004, -18.926799774169922, -18.492046356201172, -18.057292938232422, -17.622539520263672, -17.187788009643555, -16.753034591674805, -16.318283081054688, -15.883529663085938, -15.448777198791504, -15.01402473449707, -14.579273223876953, -14.14452075958252, -13.709768295288086, -13.275014877319336, -12.840262413024902, -12.405509948730469, -11.970757484436035, -11.536005020141602, -11.101251602172852, -10.666499137878418, -10.231746673583984, -9.796993255615234, -9.3622407913208, -8.927488327026367, -8.492735862731934, -8.0579833984375, -7.623230934143066, -7.188478469848633, -6.753725528717041, -6.318973064422607, -5.884220600128174, -5.449467658996582, -5.014715194702148, -4.579962730407715, -4.145210266113281, -3.7104575634002686, -3.275705099105835, -2.8409523963928223, -2.4061999320983887, -1.971447229385376, -1.5366945266723633, -1.1019420623779297, -0.6671891212463379, -0.23243650794029236, 0.20231610536575317, 0.6370687484741211, 1.0718213319778442, 1.5065739154815674, 1.94132661819458, 2.3760790824890137, 2.8108317852020264, 3.245584487915039, 3.6803369522094727, 4.115089416503906, 4.549842357635498, 4.984594821929932, 5.419347763061523, 5.854100227355957, 6.288852691650391]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 6.0, 8.0, 9.0, 8.0, 10.0, 16.0, 13.0, 17.0, 25.0, 27.0, 30.0, 26.0, 42.0, 39.0, 43.0, 40.0, 49.0, 43.0, 53.0, 50.0, 39.0, 55.0, 44.0, 45.0, 39.0, 27.0, 28.0, 32.0, 18.0, 23.0, 19.0, 19.0, 11.0, 12.0, 11.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1007704734802246, -3.01249098777771, -2.9242117404937744, -2.8359322547912598, -2.747653007507324, -2.6593735218048096, -2.571094036102295, -2.4828147888183594, -2.394535541534424, -2.306256055831909, -2.2179768085479736, -2.129697322845459, -2.0414180755615234, -1.9531385898590088, -1.8648592233657837, -1.7765798568725586, -1.688300371170044, -1.6000210046768188, -1.5117416381835938, -1.423462152481079, -1.3351829051971436, -1.246903419494629, -1.1586240530014038, -1.0703446865081787, -0.9820653200149536, -0.8937859535217285, -0.8055065870285034, -0.7172271609306335, -0.6289477944374084, -0.5406684279441833, -0.4523890018463135, -0.3641096353530884, -0.2758302688598633, -0.187550887465477, -0.0992715060710907, -0.010992109775543213, 0.07728725671768188, 0.16556662321090698, 0.25384604930877686, 0.34212541580200195, 0.43040478229522705, 0.5186841487884521, 0.6069635152816772, 0.6952429413795471, 0.7835223078727722, 0.8718016743659973, 0.9600811004638672, 1.0483604669570923, 1.1366398334503174, 1.2249191999435425, 1.3131985664367676, 1.4014780521392822, 1.4897572994232178, 1.5780367851257324, 1.6663161516189575, 1.7545955181121826, 1.8428748846054077, 1.9311542510986328, 2.0194337368011475, 2.107712984085083, 2.1959924697875977, 2.284271717071533, 2.372551202774048, 2.4608306884765625, 2.549109935760498]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 6.0, 12.0, 21.0, 30.0, 30.0, 45.0, 72.0, 84.0, 156.0, 217.0, 343.0, 636.0, 991.0, 1786.0, 3444.0, 6692.0, 14665.0, 33751.0, 82159.0, 187305.0, 302116.0, 227786.0, 106095.0, 43556.0, 18653.0, 8358.0, 4220.0, 2169.0, 1231.0, 678.0, 407.0, 253.0, 158.0, 128.0, 80.0, 54.0, 42.0, 28.0, 23.0, 20.0, 10.0, 11.0, 5.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.01953125, -1.957672119140625, -1.89581298828125, -1.833953857421875, -1.7720947265625, -1.710235595703125, -1.64837646484375, -1.586517333984375, -1.524658203125, -1.462799072265625, -1.40093994140625, -1.339080810546875, -1.2772216796875, -1.215362548828125, -1.15350341796875, -1.091644287109375, -1.02978515625, -0.967926025390625, -0.90606689453125, -0.844207763671875, -0.7823486328125, -0.720489501953125, -0.65863037109375, -0.596771240234375, -0.534912109375, -0.473052978515625, -0.41119384765625, -0.349334716796875, -0.2874755859375, -0.225616455078125, -0.16375732421875, -0.101898193359375, -0.0400390625, 0.021820068359375, 0.08367919921875, 0.145538330078125, 0.2073974609375, 0.269256591796875, 0.33111572265625, 0.392974853515625, 0.454833984375, 0.516693115234375, 0.57855224609375, 0.640411376953125, 0.7022705078125, 0.764129638671875, 0.82598876953125, 0.887847900390625, 0.94970703125, 1.011566162109375, 1.07342529296875, 1.135284423828125, 1.1971435546875, 1.259002685546875, 1.32086181640625, 1.382720947265625, 1.444580078125, 1.506439208984375, 1.56829833984375, 1.630157470703125, 1.6920166015625, 1.753875732421875, 1.81573486328125, 1.877593994140625, 1.939453125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 7.0, 11.0, 16.0, 22.0, 34.0, 38.0, 43.0, 51.0, 69.0, 60.0, 71.0, 71.0, 72.0, 80.0, 60.0, 61.0, 47.0, 49.0, 33.0, 31.0, 30.0, 9.0, 4.0, 9.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.456298828125, -0.4423942565917969, -0.42848968505859375, -0.4145851135253906, -0.4006805419921875, -0.3867759704589844, -0.37287139892578125, -0.3589668273925781, -0.345062255859375, -0.3311576843261719, -0.31725311279296875, -0.3033485412597656, -0.2894439697265625, -0.2755393981933594, -0.26163482666015625, -0.24773025512695312, -0.23382568359375, -0.21992111206054688, -0.20601654052734375, -0.19211196899414062, -0.1782073974609375, -0.16430282592773438, -0.15039825439453125, -0.13649368286132812, -0.122589111328125, -0.10868453979492188, -0.09477996826171875, -0.08087539672851562, -0.0669708251953125, -0.053066253662109375, -0.03916168212890625, -0.025257110595703125, -0.0113525390625, 0.002552032470703125, 0.01645660400390625, 0.030361175537109375, 0.0442657470703125, 0.058170318603515625, 0.07207489013671875, 0.08597946166992188, 0.099884033203125, 0.11378860473632812, 0.12769317626953125, 0.14159774780273438, 0.1555023193359375, 0.16940689086914062, 0.18331146240234375, 0.19721603393554688, 0.21112060546875, 0.22502517700195312, 0.23892974853515625, 0.2528343200683594, 0.2667388916015625, 0.2806434631347656, 0.29454803466796875, 0.3084526062011719, 0.322357177734375, 0.3362617492675781, 0.35016632080078125, 0.3640708923339844, 0.3779754638671875, 0.3918800354003906, 0.40578460693359375, 0.4196891784667969, 0.43359375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 10.0, 6.0, 8.0, 11.0, 21.0, 41.0, 53.0, 67.0, 88.0, 134.0, 203.0, 308.0, 524.0, 902.0, 1406.0, 2471.0, 4534.0, 8628.0, 16862.0, 33800.0, 68506.0, 127343.0, 205084.0, 231005.0, 161833.0, 90576.0, 46028.0, 22808.0, 11513.0, 5987.0, 3101.0, 1829.0, 1043.0, 655.0, 391.0, 233.0, 172.0, 138.0, 72.0, 50.0, 34.0, 29.0, 13.0, 15.0, 7.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.154296875, -1.11846923828125, -1.0826416015625, -1.04681396484375, -1.010986328125, -0.97515869140625, -0.9393310546875, -0.90350341796875, -0.86767578125, -0.83184814453125, -0.7960205078125, -0.76019287109375, -0.724365234375, -0.68853759765625, -0.6527099609375, -0.61688232421875, -0.5810546875, -0.54522705078125, -0.5093994140625, -0.47357177734375, -0.437744140625, -0.40191650390625, -0.3660888671875, -0.33026123046875, -0.29443359375, -0.25860595703125, -0.2227783203125, -0.18695068359375, -0.151123046875, -0.11529541015625, -0.0794677734375, -0.04364013671875, -0.0078125, 0.02801513671875, 0.0638427734375, 0.09967041015625, 0.135498046875, 0.17132568359375, 0.2071533203125, 0.24298095703125, 0.27880859375, 0.31463623046875, 0.3504638671875, 0.38629150390625, 0.422119140625, 0.45794677734375, 0.4937744140625, 0.52960205078125, 0.5654296875, 0.60125732421875, 0.6370849609375, 0.67291259765625, 0.708740234375, 0.74456787109375, 0.7803955078125, 0.81622314453125, 0.85205078125, 0.88787841796875, 0.9237060546875, 0.95953369140625, 0.995361328125, 1.03118896484375, 1.0670166015625, 1.10284423828125, 1.138671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 4.0, 10.0, 11.0, 13.0, 9.0, 6.0, 14.0, 14.0, 16.0, 15.0, 26.0, 30.0, 34.0, 32.0, 33.0, 34.0, 26.0, 49.0, 43.0, 39.0, 38.0, 46.0, 38.0, 41.0, 37.0, 39.0, 30.0, 39.0, 22.0, 29.0, 21.0, 23.0, 18.0, 36.0, 13.0, 16.0, 6.0, 6.0, 9.0, 10.0, 2.0, 7.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0], "bins": [-1.1728515625, -1.1381683349609375, -1.103485107421875, -1.0688018798828125, -1.03411865234375, -0.9994354248046875, -0.964752197265625, -0.9300689697265625, -0.8953857421875, -0.8607025146484375, -0.826019287109375, -0.7913360595703125, -0.75665283203125, -0.7219696044921875, -0.687286376953125, -0.6526031494140625, -0.617919921875, -0.5832366943359375, -0.548553466796875, -0.5138702392578125, -0.47918701171875, -0.4445037841796875, -0.409820556640625, -0.3751373291015625, -0.3404541015625, -0.3057708740234375, -0.271087646484375, -0.2364044189453125, -0.20172119140625, -0.1670379638671875, -0.132354736328125, -0.0976715087890625, -0.06298828125, -0.0283050537109375, 0.006378173828125, 0.0410614013671875, 0.07574462890625, 0.1104278564453125, 0.145111083984375, 0.1797943115234375, 0.2144775390625, 0.2491607666015625, 0.283843994140625, 0.3185272216796875, 0.35321044921875, 0.3878936767578125, 0.422576904296875, 0.4572601318359375, 0.491943359375, 0.5266265869140625, 0.561309814453125, 0.5959930419921875, 0.63067626953125, 0.6653594970703125, 0.700042724609375, 0.7347259521484375, 0.7694091796875, 0.8040924072265625, 0.838775634765625, 0.8734588623046875, 0.90814208984375, 0.9428253173828125, 0.977508544921875, 1.0121917724609375, 1.046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 9.0, 6.0, 17.0, 30.0, 63.0, 108.0, 233.0, 470.0, 1008.0, 2745.0, 8236.0, 30890.0, 187458.0, 640891.0, 140018.0, 25278.0, 6907.0, 2405.0, 951.0, 392.0, 199.0, 103.0, 54.0, 37.0, 15.0, 14.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1796875, -2.1144866943359375, -2.049285888671875, -1.9840850830078125, -1.91888427734375, -1.8536834716796875, -1.788482666015625, -1.7232818603515625, -1.6580810546875, -1.5928802490234375, -1.527679443359375, -1.4624786376953125, -1.39727783203125, -1.3320770263671875, -1.266876220703125, -1.2016754150390625, -1.136474609375, -1.0712738037109375, -1.006072998046875, -0.9408721923828125, -0.87567138671875, -0.8104705810546875, -0.745269775390625, -0.6800689697265625, -0.6148681640625, -0.5496673583984375, -0.484466552734375, -0.4192657470703125, -0.35406494140625, -0.2888641357421875, -0.223663330078125, -0.1584625244140625, -0.09326171875, -0.0280609130859375, 0.037139892578125, 0.1023406982421875, 0.16754150390625, 0.2327423095703125, 0.297943115234375, 0.3631439208984375, 0.4283447265625, 0.4935455322265625, 0.558746337890625, 0.6239471435546875, 0.68914794921875, 0.7543487548828125, 0.819549560546875, 0.8847503662109375, 0.949951171875, 1.0151519775390625, 1.080352783203125, 1.1455535888671875, 1.21075439453125, 1.2759552001953125, 1.341156005859375, 1.4063568115234375, 1.4715576171875, 1.5367584228515625, 1.601959228515625, 1.6671600341796875, 1.73236083984375, 1.7975616455078125, 1.862762451171875, 1.9279632568359375, 1.9931640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 4.0, 5.0, 12.0, 8.0, 7.0, 9.0, 14.0, 30.0, 30.0, 47.0, 51.0, 55.0, 86.0, 101.0, 104.0, 88.0, 75.0, 71.0, 50.0, 31.0, 24.0, 19.0, 15.0, 13.0, 7.0, 7.0, 5.0, 4.0, 6.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00019347667694091797, -0.00018615461885929108, -0.00017883256077766418, -0.0001715105026960373, -0.0001641884446144104, -0.0001568663865327835, -0.00014954432845115662, -0.00014222227036952972, -0.00013490021228790283, -0.00012757815420627594, -0.00012025609612464905, -0.00011293403804302216, -0.00010561197996139526, -9.828992187976837e-05, -9.096786379814148e-05, -8.364580571651459e-05, -7.63237476348877e-05, -6.90016895532608e-05, -6.167963147163391e-05, -5.435757339000702e-05, -4.703551530838013e-05, -3.9713457226753235e-05, -3.239139914512634e-05, -2.506934106349945e-05, -1.774728298187256e-05, -1.0425224900245667e-05, -3.1031668186187744e-06, 4.218891263008118e-06, 1.154094934463501e-05, 1.8863007426261902e-05, 2.6185065507888794e-05, 3.3507123589515686e-05, 4.082918167114258e-05, 4.815123975276947e-05, 5.547329783439636e-05, 6.279535591602325e-05, 7.011741399765015e-05, 7.743947207927704e-05, 8.476153016090393e-05, 9.208358824253082e-05, 9.940564632415771e-05, 0.00010672770440578461, 0.0001140497624874115, 0.00012137182056903839, 0.00012869387865066528, 0.00013601593673229218, 0.00014333799481391907, 0.00015066005289554596, 0.00015798211097717285, 0.00016530416905879974, 0.00017262622714042664, 0.00017994828522205353, 0.00018727034330368042, 0.0001945924013853073, 0.0002019144594669342, 0.0002092365175485611, 0.000216558575630188, 0.00022388063371181488, 0.00023120269179344177, 0.00023852474987506866, 0.00024584680795669556, 0.00025316886603832245, 0.00026049092411994934, 0.00026781298220157623, 0.0002751350402832031]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 9.0, 8.0, 17.0, 11.0, 31.0, 44.0, 56.0, 89.0, 116.0, 202.0, 335.0, 645.0, 1219.0, 2611.0, 5583.0, 14043.0, 39785.0, 145121.0, 479978.0, 258531.0, 64058.0, 20863.0, 8030.0, 3520.0, 1586.0, 878.0, 447.0, 268.0, 159.0, 106.0, 72.0, 33.0, 22.0, 25.0, 14.0, 9.0, 7.0, 10.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.259765625, -1.21734619140625, -1.1749267578125, -1.13250732421875, -1.090087890625, -1.04766845703125, -1.0052490234375, -0.96282958984375, -0.92041015625, -0.87799072265625, -0.8355712890625, -0.79315185546875, -0.750732421875, -0.70831298828125, -0.6658935546875, -0.62347412109375, -0.5810546875, -0.53863525390625, -0.4962158203125, -0.45379638671875, -0.411376953125, -0.36895751953125, -0.3265380859375, -0.28411865234375, -0.24169921875, -0.19927978515625, -0.1568603515625, -0.11444091796875, -0.072021484375, -0.02960205078125, 0.0128173828125, 0.05523681640625, 0.09765625, 0.14007568359375, 0.1824951171875, 0.22491455078125, 0.267333984375, 0.30975341796875, 0.3521728515625, 0.39459228515625, 0.43701171875, 0.47943115234375, 0.5218505859375, 0.56427001953125, 0.606689453125, 0.64910888671875, 0.6915283203125, 0.73394775390625, 0.7763671875, 0.81878662109375, 0.8612060546875, 0.90362548828125, 0.946044921875, 0.98846435546875, 1.0308837890625, 1.07330322265625, 1.11572265625, 1.15814208984375, 1.2005615234375, 1.24298095703125, 1.285400390625, 1.32781982421875, 1.3702392578125, 1.41265869140625, 1.455078125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 6.0, 2.0, 7.0, 5.0, 5.0, 14.0, 18.0, 20.0, 22.0, 29.0, 40.0, 56.0, 66.0, 101.0, 102.0, 108.0, 88.0, 80.0, 64.0, 45.0, 31.0, 18.0, 17.0, 11.0, 10.0, 8.0, 6.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.185546875, -1.1433258056640625, -1.101104736328125, -1.0588836669921875, -1.01666259765625, -0.9744415283203125, -0.932220458984375, -0.8899993896484375, -0.8477783203125, -0.8055572509765625, -0.763336181640625, -0.7211151123046875, -0.67889404296875, -0.6366729736328125, -0.594451904296875, -0.5522308349609375, -0.510009765625, -0.4677886962890625, -0.425567626953125, -0.3833465576171875, -0.34112548828125, -0.2989044189453125, -0.256683349609375, -0.2144622802734375, -0.1722412109375, -0.1300201416015625, -0.087799072265625, -0.0455780029296875, -0.00335693359375, 0.0388641357421875, 0.081085205078125, 0.1233062744140625, 0.16552734375, 0.2077484130859375, 0.249969482421875, 0.2921905517578125, 0.33441162109375, 0.3766326904296875, 0.418853759765625, 0.4610748291015625, 0.5032958984375, 0.5455169677734375, 0.587738037109375, 0.6299591064453125, 0.67218017578125, 0.7144012451171875, 0.756622314453125, 0.7988433837890625, 0.841064453125, 0.8832855224609375, 0.925506591796875, 0.9677276611328125, 1.00994873046875, 1.0521697998046875, 1.094390869140625, 1.1366119384765625, 1.1788330078125, 1.2210540771484375, 1.263275146484375, 1.3054962158203125, 1.34771728515625, 1.3899383544921875, 1.432159423828125, 1.4743804931640625, 1.5166015625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 19.0, 50.0, 113.0, 198.0, 216.0, 191.0, 109.0, 48.0, 19.0, 15.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.15909194946289, -18.298742294311523, -17.438390731811523, -16.578041076660156, -15.717690467834473, -14.857339859008789, -13.996990203857422, -13.136639595031738, -12.276288986206055, -11.415938377380371, -10.555588722229004, -9.69523811340332, -8.834887504577637, -7.974537372589111, -7.114187240600586, -6.253836631774902, -5.393486976623535, -4.53313684463501, -3.672786235809326, -2.812436103820801, -1.9520857334136963, -1.0917353630065918, -0.2313852310180664, 0.6289653778076172, 1.4893155097961426, 2.349665880203247, 3.2100162506103516, 4.070366382598877, 4.930716514587402, 5.791067123413086, 6.651417255401611, 7.511767864227295, 8.37211799621582, 9.232468605041504, 10.092818260192871, 10.953168869018555, 11.813519477844238, 12.673870086669922, 13.534219741821289, 14.394570350646973, 15.254920959472656, 16.115270614624023, 16.975622177124023, 17.83597183227539, 18.696321487426758, 19.556673049926758, 20.417022705078125, 21.277374267578125, 22.13772201538086, 22.998071670532227, 23.858423233032227, 24.718772888183594, 25.57912254333496, 26.43947410583496, 27.299823760986328, 28.160175323486328, 29.020524978637695, 29.880874633789062, 30.741226196289062, 31.60157585144043, 32.4619255065918, 33.3222770690918, 34.18262481689453, 35.04297637939453, 35.90332794189453]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 2.0, 7.0, 6.0, 11.0, 9.0, 15.0, 13.0, 21.0, 28.0, 25.0, 20.0, 27.0, 41.0, 42.0, 43.0, 52.0, 44.0, 54.0, 43.0, 46.0, 42.0, 44.0, 40.0, 42.0, 34.0, 29.0, 29.0, 26.0, 24.0, 25.0, 28.0, 23.0, 9.0, 15.0, 8.0, 7.0, 2.0, 3.0, 7.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.809619903564453, -7.565699100494385, -7.321778297424316, -7.077857494354248, -6.83393669128418, -6.590015888214111, -6.346095085144043, -6.102173805236816, -5.858253479003906, -5.614332675933838, -5.3704118728637695, -5.126491069793701, -4.882570266723633, -4.6386494636535645, -4.394728660583496, -4.1508073806762695, -3.906886577606201, -3.662965774536133, -3.4190449714660645, -3.175124168395996, -2.9312033653259277, -2.6872825622558594, -2.443361520767212, -2.1994407176971436, -1.9555199146270752, -1.7115991115570068, -1.4676783084869385, -1.2237573862075806, -0.9798365831375122, -0.7359157800674438, -0.49199485778808594, -0.24807405471801758, -0.004152774810791016, 0.23976805806159973, 0.4836888909339905, 0.7276097536087036, 0.971530556678772, 1.2154513597488403, 1.4593722820281982, 1.7032930850982666, 1.947213888168335, 2.1911346912384033, 2.4350554943084717, 2.678976535797119, 2.9228973388671875, 3.166818141937256, 3.410738945007324, 3.6546597480773926, 3.898580551147461, 4.142501354217529, 4.386422157287598, 4.630342960357666, 4.874263763427734, 5.118184566497803, 5.362105369567871, 5.606026649475098, 5.849946975708008, 6.093867778778076, 6.3377885818481445, 6.581709384918213, 6.825630187988281, 7.06955099105835, 7.313471794128418, 7.5573930740356445, 7.801313877105713]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 11.0, 5.0, 6.0, 9.0, 23.0, 19.0, 22.0, 39.0, 73.0, 82.0, 111.0, 165.0, 244.0, 425.0, 710.0, 1232.0, 2357.0, 4910.0, 11667.0, 35918.0, 168183.0, 2980113.0, 854387.0, 93992.0, 23971.0, 8313.0, 3447.0, 1730.0, 878.0, 486.0, 263.0, 155.0, 110.0, 65.0, 39.0, 35.0, 25.0, 14.0, 15.0, 14.0, 5.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.873046875, -2.788116455078125, -2.70318603515625, -2.618255615234375, -2.5333251953125, -2.448394775390625, -2.36346435546875, -2.278533935546875, -2.193603515625, -2.108673095703125, -2.02374267578125, -1.938812255859375, -1.8538818359375, -1.768951416015625, -1.68402099609375, -1.599090576171875, -1.51416015625, -1.429229736328125, -1.34429931640625, -1.259368896484375, -1.1744384765625, -1.089508056640625, -1.00457763671875, -0.919647216796875, -0.834716796875, -0.749786376953125, -0.66485595703125, -0.579925537109375, -0.4949951171875, -0.410064697265625, -0.32513427734375, -0.240203857421875, -0.1552734375, -0.070343017578125, 0.01458740234375, 0.099517822265625, 0.1844482421875, 0.269378662109375, 0.35430908203125, 0.439239501953125, 0.524169921875, 0.609100341796875, 0.69403076171875, 0.778961181640625, 0.8638916015625, 0.948822021484375, 1.03375244140625, 1.118682861328125, 1.20361328125, 1.288543701171875, 1.37347412109375, 1.458404541015625, 1.5433349609375, 1.628265380859375, 1.71319580078125, 1.798126220703125, 1.883056640625, 1.967987060546875, 2.05291748046875, 2.137847900390625, 2.2227783203125, 2.307708740234375, 2.39263916015625, 2.477569580078125, 2.5625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 1.0, 4.0, 11.0, 10.0, 12.0, 13.0, 16.0, 20.0, 33.0, 42.0, 52.0, 58.0, 61.0, 72.0, 84.0, 71.0, 72.0, 58.0, 61.0, 52.0, 35.0, 39.0, 40.0, 22.0, 23.0, 11.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.439697265625, -0.4260101318359375, -0.412322998046875, -0.3986358642578125, -0.38494873046875, -0.3712615966796875, -0.357574462890625, -0.3438873291015625, -0.3302001953125, -0.3165130615234375, -0.302825927734375, -0.2891387939453125, -0.27545166015625, -0.2617645263671875, -0.248077392578125, -0.2343902587890625, -0.220703125, -0.2070159912109375, -0.193328857421875, -0.1796417236328125, -0.16595458984375, -0.1522674560546875, -0.138580322265625, -0.1248931884765625, -0.1112060546875, -0.0975189208984375, -0.083831787109375, -0.0701446533203125, -0.05645751953125, -0.0427703857421875, -0.029083251953125, -0.0153961181640625, -0.001708984375, 0.0119781494140625, 0.025665283203125, 0.0393524169921875, 0.05303955078125, 0.0667266845703125, 0.080413818359375, 0.0941009521484375, 0.1077880859375, 0.1214752197265625, 0.135162353515625, 0.1488494873046875, 0.16253662109375, 0.1762237548828125, 0.189910888671875, 0.2035980224609375, 0.21728515625, 0.2309722900390625, 0.244659423828125, 0.2583465576171875, 0.27203369140625, 0.2857208251953125, 0.299407958984375, 0.3130950927734375, 0.3267822265625, 0.3404693603515625, 0.354156494140625, 0.3678436279296875, 0.38153076171875, 0.3952178955078125, 0.408905029296875, 0.4225921630859375, 0.436279296875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 5.0, 9.0, 8.0, 14.0, 16.0, 27.0, 35.0, 57.0, 98.0, 153.0, 273.0, 531.0, 1042.0, 2374.0, 5871.0, 16451.0, 52858.0, 222127.0, 1991800.0, 1625616.0, 200845.0, 48931.0, 15146.0, 5596.0, 2220.0, 1012.0, 521.0, 244.0, 149.0, 86.0, 59.0, 38.0, 17.0, 15.0, 13.0, 18.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7890625, -1.72509765625, -1.6611328125, -1.59716796875, -1.533203125, -1.46923828125, -1.4052734375, -1.34130859375, -1.27734375, -1.21337890625, -1.1494140625, -1.08544921875, -1.021484375, -0.95751953125, -0.8935546875, -0.82958984375, -0.765625, -0.70166015625, -0.6376953125, -0.57373046875, -0.509765625, -0.44580078125, -0.3818359375, -0.31787109375, -0.25390625, -0.18994140625, -0.1259765625, -0.06201171875, 0.001953125, 0.06591796875, 0.1298828125, 0.19384765625, 0.2578125, 0.32177734375, 0.3857421875, 0.44970703125, 0.513671875, 0.57763671875, 0.6416015625, 0.70556640625, 0.76953125, 0.83349609375, 0.8974609375, 0.96142578125, 1.025390625, 1.08935546875, 1.1533203125, 1.21728515625, 1.28125, 1.34521484375, 1.4091796875, 1.47314453125, 1.537109375, 1.60107421875, 1.6650390625, 1.72900390625, 1.79296875, 1.85693359375, 1.9208984375, 1.98486328125, 2.048828125, 2.11279296875, 2.1767578125, 2.24072265625, 2.3046875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 6.0, 1.0, 0.0, 4.0, 7.0, 5.0, 10.0, 20.0, 26.0, 40.0, 39.0, 72.0, 114.0, 151.0, 279.0, 462.0, 841.0, 829.0, 439.0, 251.0, 155.0, 108.0, 67.0, 50.0, 34.0, 24.0, 12.0, 11.0, 10.0, 6.0, 4.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.09765625, -1.0687332153320312, -1.0398101806640625, -1.0108871459960938, -0.981964111328125, -0.9530410766601562, -0.9241180419921875, -0.8951950073242188, -0.86627197265625, -0.8373489379882812, -0.8084259033203125, -0.7795028686523438, -0.750579833984375, -0.7216567993164062, -0.6927337646484375, -0.6638107299804688, -0.6348876953125, -0.6059646606445312, -0.5770416259765625, -0.5481185913085938, -0.519195556640625, -0.49027252197265625, -0.4613494873046875, -0.43242645263671875, -0.40350341796875, -0.37458038330078125, -0.3456573486328125, -0.31673431396484375, -0.287811279296875, -0.25888824462890625, -0.2299652099609375, -0.20104217529296875, -0.172119140625, -0.14319610595703125, -0.1142730712890625, -0.08535003662109375, -0.056427001953125, -0.02750396728515625, 0.0014190673828125, 0.03034210205078125, 0.05926513671875, 0.08818817138671875, 0.1171112060546875, 0.14603424072265625, 0.174957275390625, 0.20388031005859375, 0.2328033447265625, 0.26172637939453125, 0.2906494140625, 0.31957244873046875, 0.3484954833984375, 0.37741851806640625, 0.406341552734375, 0.43526458740234375, 0.4641876220703125, 0.49311065673828125, 0.52203369140625, 0.5509567260742188, 0.5798797607421875, 0.6088027954101562, 0.637725830078125, 0.6666488647460938, 0.6955718994140625, 0.7244949340820312, 0.75341796875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 8.0, 24.0, 28.0, 57.0, 115.0, 147.0, 191.0, 150.0, 122.0, 63.0, 43.0, 20.0, 16.0, 6.0, 4.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.450633525848389, -4.122186660766602, -3.7937397956848145, -3.4652931690216064, -3.1368463039398193, -2.8083994388580322, -2.479952812194824, -2.151505947113037, -1.82305908203125, -1.494612216949463, -1.1661654710769653, -0.837718665599823, -0.5092718601226807, -0.18082499504089355, 0.147621750831604, 0.47606849670410156, 0.8045153617858887, 1.1329622268676758, 1.4614089727401733, 1.789855718612671, 2.118302583694458, 2.446749448776245, 2.775196075439453, 3.1036429405212402, 3.4320898056030273, 3.7605366706848145, 4.088983535766602, 4.417430400848389, 4.745877265930176, 5.074323654174805, 5.402770519256592, 5.731217384338379, 6.059663772583008, 6.388110637664795, 6.716557502746582, 7.045004367828369, 7.373451232910156, 7.701897621154785, 8.03034496307373, 8.35879135131836, 8.687238693237305, 9.015685081481934, 9.344132423400879, 9.672578811645508, 10.001026153564453, 10.329472541809082, 10.657919883728027, 10.986366271972656, 11.314812660217285, 11.643259048461914, 11.97170639038086, 12.300152778625488, 12.628600120544434, 12.957046508789062, 13.285493850708008, 13.613940238952637, 13.942386627197266, 14.270833015441895, 14.59928035736084, 14.927726745605469, 15.256174087524414, 15.584620475769043, 15.913067817687988, 16.241514205932617, 16.569961547851562]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 8.0, 6.0, 7.0, 13.0, 10.0, 18.0, 15.0, 18.0, 23.0, 27.0, 29.0, 27.0, 32.0, 44.0, 39.0, 41.0, 52.0, 53.0, 63.0, 53.0, 45.0, 50.0, 40.0, 37.0, 34.0, 42.0, 25.0, 35.0, 21.0, 17.0, 14.0, 21.0, 12.0, 8.0, 8.0, 7.0, 4.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7309255599975586, -2.617586851119995, -2.5042481422424316, -2.390909433364868, -2.2775707244873047, -2.164232015609741, -2.0508933067321777, -1.9375545978546143, -1.8242158889770508, -1.7108771800994873, -1.5975384712219238, -1.4841997623443604, -1.3708610534667969, -1.2575223445892334, -1.14418363571167, -1.0308449268341064, -0.917506217956543, -0.8041675090789795, -0.690828800201416, -0.5774900913238525, -0.46415138244628906, -0.3508126735687256, -0.2374739646911621, -0.12413525581359863, -0.010796546936035156, 0.10254216194152832, 0.2158808708190918, 0.3292195796966553, 0.44255828857421875, 0.5558969974517822, 0.6692357063293457, 0.7825744152069092, 0.8959131240844727, 1.0092518329620361, 1.1225905418395996, 1.235929250717163, 1.3492679595947266, 1.46260666847229, 1.5759453773498535, 1.689284086227417, 1.8026227951049805, 1.915961503982544, 2.0293002128601074, 2.142638921737671, 2.2559776306152344, 2.369316339492798, 2.4826550483703613, 2.595993757247925, 2.7093324661254883, 2.8226711750030518, 2.9360098838806152, 3.0493485927581787, 3.162687301635742, 3.2760260105133057, 3.389364719390869, 3.5027034282684326, 3.616042137145996, 3.7293808460235596, 3.842719554901123, 3.9560582637786865, 4.06939697265625, 4.182735443115234, 4.296074390411377, 4.4094133377075195, 4.522751808166504]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 5.0, 4.0, 9.0, 8.0, 16.0, 14.0, 21.0, 37.0, 37.0, 49.0, 88.0, 126.0, 190.0, 313.0, 456.0, 744.0, 1337.0, 2624.0, 5546.0, 12234.0, 29000.0, 73541.0, 207259.0, 403534.0, 192265.0, 69257.0, 27172.0, 11572.0, 5246.0, 2528.0, 1328.0, 765.0, 429.0, 268.0, 144.0, 129.0, 65.0, 55.0, 39.0, 30.0, 21.0, 17.0, 10.0, 9.0, 3.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0], "bins": [-2.30078125, -2.2376861572265625, -2.174591064453125, -2.1114959716796875, -2.04840087890625, -1.9853057861328125, -1.922210693359375, -1.8591156005859375, -1.7960205078125, -1.7329254150390625, -1.669830322265625, -1.6067352294921875, -1.54364013671875, -1.4805450439453125, -1.417449951171875, -1.3543548583984375, -1.291259765625, -1.2281646728515625, -1.165069580078125, -1.1019744873046875, -1.03887939453125, -0.9757843017578125, -0.912689208984375, -0.8495941162109375, -0.7864990234375, -0.7234039306640625, -0.660308837890625, -0.5972137451171875, -0.53411865234375, -0.4710235595703125, -0.407928466796875, -0.3448333740234375, -0.28173828125, -0.2186431884765625, -0.155548095703125, -0.0924530029296875, -0.02935791015625, 0.0337371826171875, 0.096832275390625, 0.1599273681640625, 0.2230224609375, 0.2861175537109375, 0.349212646484375, 0.4123077392578125, 0.47540283203125, 0.5384979248046875, 0.601593017578125, 0.6646881103515625, 0.727783203125, 0.7908782958984375, 0.853973388671875, 0.9170684814453125, 0.98016357421875, 1.0432586669921875, 1.106353759765625, 1.1694488525390625, 1.2325439453125, 1.2956390380859375, 1.358734130859375, 1.4218292236328125, 1.48492431640625, 1.5480194091796875, 1.611114501953125, 1.6742095947265625, 1.7373046875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 13.0, 8.0, 3.0, 11.0, 8.0, 19.0, 30.0, 30.0, 36.0, 48.0, 52.0, 67.0, 70.0, 71.0, 88.0, 56.0, 58.0, 67.0, 73.0, 51.0, 39.0, 24.0, 20.0, 24.0, 9.0, 9.0, 7.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4912109375, -0.4764671325683594, -0.46172332763671875, -0.4469795227050781, -0.4322357177734375, -0.4174919128417969, -0.40274810791015625, -0.3880043029785156, -0.373260498046875, -0.3585166931152344, -0.34377288818359375, -0.3290290832519531, -0.3142852783203125, -0.2995414733886719, -0.28479766845703125, -0.2700538635253906, -0.25531005859375, -0.24056625366210938, -0.22582244873046875, -0.21107864379882812, -0.1963348388671875, -0.18159103393554688, -0.16684722900390625, -0.15210342407226562, -0.137359619140625, -0.12261581420898438, -0.10787200927734375, -0.09312820434570312, -0.0783843994140625, -0.06364059448242188, -0.04889678955078125, -0.034152984619140625, -0.0194091796875, -0.004665374755859375, 0.01007843017578125, 0.024822235107421875, 0.0395660400390625, 0.054309844970703125, 0.06905364990234375, 0.08379745483398438, 0.098541259765625, 0.11328506469726562, 0.12802886962890625, 0.14277267456054688, 0.1575164794921875, 0.17226028442382812, 0.18700408935546875, 0.20174789428710938, 0.21649169921875, 0.23123550415039062, 0.24597930908203125, 0.2607231140136719, 0.2754669189453125, 0.2902107238769531, 0.30495452880859375, 0.3196983337402344, 0.334442138671875, 0.3491859436035156, 0.36392974853515625, 0.3786735534667969, 0.3934173583984375, 0.4081611633300781, 0.42290496826171875, 0.4376487731933594, 0.452392578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 7.0, 9.0, 11.0, 14.0, 20.0, 25.0, 31.0, 42.0, 64.0, 98.0, 131.0, 204.0, 303.0, 495.0, 816.0, 1371.0, 2524.0, 4912.0, 10110.0, 21264.0, 46294.0, 102770.0, 225322.0, 310893.0, 174170.0, 77723.0, 35481.0, 16516.0, 7833.0, 3944.0, 2058.0, 1145.0, 680.0, 402.0, 267.0, 192.0, 100.0, 76.0, 64.0, 49.0, 41.0, 19.0, 19.0, 8.0, 13.0, 6.0, 4.0, 2.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.25, -1.2087860107421875, -1.167572021484375, -1.1263580322265625, -1.08514404296875, -1.0439300537109375, -1.002716064453125, -0.9615020751953125, -0.9202880859375, -0.8790740966796875, -0.837860107421875, -0.7966461181640625, -0.75543212890625, -0.7142181396484375, -0.673004150390625, -0.6317901611328125, -0.590576171875, -0.5493621826171875, -0.508148193359375, -0.4669342041015625, -0.42572021484375, -0.3845062255859375, -0.343292236328125, -0.3020782470703125, -0.2608642578125, -0.2196502685546875, -0.178436279296875, -0.1372222900390625, -0.09600830078125, -0.0547943115234375, -0.013580322265625, 0.0276336669921875, 0.06884765625, 0.1100616455078125, 0.151275634765625, 0.1924896240234375, 0.23370361328125, 0.2749176025390625, 0.316131591796875, 0.3573455810546875, 0.3985595703125, 0.4397735595703125, 0.480987548828125, 0.5222015380859375, 0.56341552734375, 0.6046295166015625, 0.645843505859375, 0.6870574951171875, 0.728271484375, 0.7694854736328125, 0.810699462890625, 0.8519134521484375, 0.89312744140625, 0.9343414306640625, 0.975555419921875, 1.0167694091796875, 1.0579833984375, 1.0991973876953125, 1.140411376953125, 1.1816253662109375, 1.22283935546875, 1.2640533447265625, 1.305267333984375, 1.3464813232421875, 1.3876953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 13.0, 10.0, 7.0, 17.0, 23.0, 14.0, 28.0, 22.0, 25.0, 37.0, 35.0, 29.0, 40.0, 41.0, 41.0, 43.0, 48.0, 45.0, 53.0, 40.0, 35.0, 45.0, 43.0, 33.0, 33.0, 32.0, 23.0, 21.0, 14.0, 21.0, 12.0, 17.0, 14.0, 11.0, 10.0, 5.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0], "bins": [-1.5, -1.459075927734375, -1.41815185546875, -1.377227783203125, -1.3363037109375, -1.295379638671875, -1.25445556640625, -1.213531494140625, -1.172607421875, -1.131683349609375, -1.09075927734375, -1.049835205078125, -1.0089111328125, -0.967987060546875, -0.92706298828125, -0.886138916015625, -0.84521484375, -0.804290771484375, -0.76336669921875, -0.722442626953125, -0.6815185546875, -0.640594482421875, -0.59967041015625, -0.558746337890625, -0.517822265625, -0.476898193359375, -0.43597412109375, -0.395050048828125, -0.3541259765625, -0.313201904296875, -0.27227783203125, -0.231353759765625, -0.1904296875, -0.149505615234375, -0.10858154296875, -0.067657470703125, -0.0267333984375, 0.014190673828125, 0.05511474609375, 0.096038818359375, 0.136962890625, 0.177886962890625, 0.21881103515625, 0.259735107421875, 0.3006591796875, 0.341583251953125, 0.38250732421875, 0.423431396484375, 0.46435546875, 0.505279541015625, 0.54620361328125, 0.587127685546875, 0.6280517578125, 0.668975830078125, 0.70989990234375, 0.750823974609375, 0.791748046875, 0.832672119140625, 0.87359619140625, 0.914520263671875, 0.9554443359375, 0.996368408203125, 1.03729248046875, 1.078216552734375, 1.119140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 9.0, 16.0, 22.0, 17.0, 43.0, 62.0, 89.0, 133.0, 295.0, 609.0, 1436.0, 4383.0, 15176.0, 67284.0, 487993.0, 397428.0, 54190.0, 12928.0, 3895.0, 1354.0, 508.0, 266.0, 130.0, 76.0, 51.0, 37.0, 41.0, 14.0, 16.0, 10.0, 7.0, 5.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.755859375, -1.7008819580078125, -1.645904541015625, -1.5909271240234375, -1.53594970703125, -1.4809722900390625, -1.425994873046875, -1.3710174560546875, -1.3160400390625, -1.2610626220703125, -1.206085205078125, -1.1511077880859375, -1.09613037109375, -1.0411529541015625, -0.986175537109375, -0.9311981201171875, -0.876220703125, -0.8212432861328125, -0.766265869140625, -0.7112884521484375, -0.65631103515625, -0.6013336181640625, -0.546356201171875, -0.4913787841796875, -0.4364013671875, -0.3814239501953125, -0.326446533203125, -0.2714691162109375, -0.21649169921875, -0.1615142822265625, -0.106536865234375, -0.0515594482421875, 0.00341796875, 0.0583953857421875, 0.113372802734375, 0.1683502197265625, 0.22332763671875, 0.2783050537109375, 0.333282470703125, 0.3882598876953125, 0.4432373046875, 0.4982147216796875, 0.553192138671875, 0.6081695556640625, 0.66314697265625, 0.7181243896484375, 0.773101806640625, 0.8280792236328125, 0.883056640625, 0.9380340576171875, 0.993011474609375, 1.0479888916015625, 1.10296630859375, 1.1579437255859375, 1.212921142578125, 1.2678985595703125, 1.3228759765625, 1.3778533935546875, 1.432830810546875, 1.4878082275390625, 1.54278564453125, 1.5977630615234375, 1.652740478515625, 1.7077178955078125, 1.7626953125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 8.0, 9.0, 14.0, 34.0, 22.0, 26.0, 42.0, 117.0, 178.0, 207.0, 138.0, 61.0, 36.0, 35.0, 11.0, 17.0, 9.0, 2.0, 7.0, 6.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0004563331604003906, -0.000445537269115448, -0.00043474137783050537, -0.00042394548654556274, -0.0004131495952606201, -0.0004023537039756775, -0.00039155781269073486, -0.00038076192140579224, -0.0003699660301208496, -0.000359170138835907, -0.00034837424755096436, -0.00033757835626602173, -0.0003267824649810791, -0.0003159865736961365, -0.00030519068241119385, -0.0002943947911262512, -0.0002835988998413086, -0.00027280300855636597, -0.00026200711727142334, -0.0002512112259864807, -0.00024041533470153809, -0.00022961944341659546, -0.00021882355213165283, -0.0002080276608467102, -0.00019723176956176758, -0.00018643587827682495, -0.00017563998699188232, -0.0001648440957069397, -0.00015404820442199707, -0.00014325231313705444, -0.00013245642185211182, -0.00012166053056716919, -0.00011086463928222656, -0.00010006874799728394, -8.927285671234131e-05, -7.847696542739868e-05, -6.768107414245605e-05, -5.688518285751343e-05, -4.60892915725708e-05, -3.5293400287628174e-05, -2.4497509002685547e-05, -1.370161771774292e-05, -2.905726432800293e-06, 7.890164852142334e-06, 1.868605613708496e-05, 2.9481947422027588e-05, 4.0277838706970215e-05, 5.107372999191284e-05, 6.186962127685547e-05, 7.26655125617981e-05, 8.346140384674072e-05, 9.425729513168335e-05, 0.00010505318641662598, 0.0001158490777015686, 0.00012664496898651123, 0.00013744086027145386, 0.00014823675155639648, 0.0001590326428413391, 0.00016982853412628174, 0.00018062442541122437, 0.000191420316696167, 0.00020221620798110962, 0.00021301209926605225, 0.00022380799055099487, 0.0002346038818359375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 10.0, 24.0, 21.0, 41.0, 92.0, 129.0, 268.0, 461.0, 1329.0, 6136.0, 42884.0, 696117.0, 274231.0, 21603.0, 3475.0, 912.0, 364.0, 168.0, 94.0, 65.0, 33.0, 25.0, 21.0, 12.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.578125, -2.499603271484375, -2.42108154296875, -2.342559814453125, -2.2640380859375, -2.185516357421875, -2.10699462890625, -2.028472900390625, -1.949951171875, -1.871429443359375, -1.79290771484375, -1.714385986328125, -1.6358642578125, -1.557342529296875, -1.47882080078125, -1.400299072265625, -1.32177734375, -1.243255615234375, -1.16473388671875, -1.086212158203125, -1.0076904296875, -0.929168701171875, -0.85064697265625, -0.772125244140625, -0.693603515625, -0.615081787109375, -0.53656005859375, -0.458038330078125, -0.3795166015625, -0.300994873046875, -0.22247314453125, -0.143951416015625, -0.0654296875, 0.013092041015625, 0.09161376953125, 0.170135498046875, 0.2486572265625, 0.327178955078125, 0.40570068359375, 0.484222412109375, 0.562744140625, 0.641265869140625, 0.71978759765625, 0.798309326171875, 0.8768310546875, 0.955352783203125, 1.03387451171875, 1.112396240234375, 1.19091796875, 1.269439697265625, 1.34796142578125, 1.426483154296875, 1.5050048828125, 1.583526611328125, 1.66204833984375, 1.740570068359375, 1.819091796875, 1.897613525390625, 1.97613525390625, 2.054656982421875, 2.1331787109375, 2.211700439453125, 2.29022216796875, 2.368743896484375, 2.447265625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 7.0, 10.0, 20.0, 18.0, 29.0, 33.0, 64.0, 87.0, 115.0, 122.0, 151.0, 103.0, 79.0, 44.0, 34.0, 15.0, 18.0, 5.0, 7.0, 8.0, 7.0, 5.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.8994140625, -1.854949951171875, -1.81048583984375, -1.766021728515625, -1.7215576171875, -1.677093505859375, -1.63262939453125, -1.588165283203125, -1.543701171875, -1.499237060546875, -1.45477294921875, -1.410308837890625, -1.3658447265625, -1.321380615234375, -1.27691650390625, -1.232452392578125, -1.18798828125, -1.143524169921875, -1.09906005859375, -1.054595947265625, -1.0101318359375, -0.965667724609375, -0.92120361328125, -0.876739501953125, -0.832275390625, -0.787811279296875, -0.74334716796875, -0.698883056640625, -0.6544189453125, -0.609954833984375, -0.56549072265625, -0.521026611328125, -0.4765625, -0.432098388671875, -0.38763427734375, -0.343170166015625, -0.2987060546875, -0.254241943359375, -0.20977783203125, -0.165313720703125, -0.120849609375, -0.076385498046875, -0.03192138671875, 0.012542724609375, 0.0570068359375, 0.101470947265625, 0.14593505859375, 0.190399169921875, 0.23486328125, 0.279327392578125, 0.32379150390625, 0.368255615234375, 0.4127197265625, 0.457183837890625, 0.50164794921875, 0.546112060546875, 0.590576171875, 0.635040283203125, 0.67950439453125, 0.723968505859375, 0.7684326171875, 0.812896728515625, 0.85736083984375, 0.901824951171875, 0.9462890625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 15.0, 25.0, 47.0, 71.0, 117.0, 143.0, 169.0, 142.0, 105.0, 70.0, 44.0, 24.0, 20.0, 3.0, 5.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.369895935058594, -26.734100341796875, -26.098304748535156, -25.462509155273438, -24.82671356201172, -24.19091796875, -23.55512237548828, -22.919326782226562, -22.283531188964844, -21.647735595703125, -21.011940002441406, -20.376144409179688, -19.74034881591797, -19.10455322265625, -18.46875762939453, -17.832962036132812, -17.19716453552246, -16.561368942260742, -15.925573348999023, -15.289777755737305, -14.653982162475586, -14.018186569213867, -13.382390022277832, -12.746594429016113, -12.110798835754395, -11.475003242492676, -10.839207649230957, -10.203412055969238, -9.567615509033203, -8.931819915771484, -8.296024322509766, -7.660228729248047, -7.0244340896606445, -6.388638496398926, -5.752842903137207, -5.11704683303833, -4.481251239776611, -3.8454556465148926, -3.2096598148345947, -2.573863983154297, -1.9380683898925781, -1.3022726774215698, -0.6664769649505615, -0.030681252479553223, 0.6051144599914551, 1.2409100532531738, 1.8767058849334717, 2.5125017166137695, 3.1482973098754883, 3.784092903137207, 4.419888496398926, 5.055684566497803, 5.6914801597595215, 6.32727575302124, 6.963071823120117, 7.598867416381836, 8.234663009643555, 8.870458602905273, 9.506254196166992, 10.142049789428711, 10.77784538269043, 11.413640975952148, 12.049437522888184, 12.685233116149902, 13.321028709411621]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 8.0, 3.0, 5.0, 19.0, 9.0, 13.0, 9.0, 15.0, 22.0, 10.0, 18.0, 14.0, 22.0, 31.0, 26.0, 35.0, 33.0, 30.0, 47.0, 44.0, 40.0, 34.0, 45.0, 39.0, 41.0, 32.0, 36.0, 24.0, 38.0, 26.0, 31.0, 26.0, 19.0, 19.0, 22.0, 17.0, 18.0, 16.0, 17.0, 6.0, 6.0, 5.0, 7.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.17392635345459, -5.970163345336914, -5.7664008140563965, -5.562637805938721, -5.358874797821045, -5.155112266540527, -4.951349258422852, -4.747586250305176, -4.5438232421875, -4.340060234069824, -4.136297702789307, -3.932534694671631, -3.728771686553955, -3.5250089168548584, -3.3212461471557617, -3.117483139038086, -2.9137206077575684, -2.7099578380584717, -2.506194829940796, -2.302432060241699, -2.0986690521240234, -1.8949062824249268, -1.69114351272583, -1.4873806238174438, -1.2836177349090576, -1.0798548460006714, -0.8760920166969299, -0.6723291873931885, -0.46856629848480225, -0.264803409576416, -0.061040639877319336, 0.1427222490310669, 0.3464846611022949, 0.5502475500106812, 0.7540103793144226, 0.9577732086181641, 1.1615360975265503, 1.3652989864349365, 1.5690617561340332, 1.7728246450424194, 1.9765875339508057, 2.1803503036499023, 2.384113311767578, 2.587876081466675, 2.7916388511657715, 2.9954018592834473, 3.199164628982544, 3.4029273986816406, 3.6066904067993164, 3.810453176498413, 4.01421594619751, 4.2179789543151855, 4.421741962432861, 4.625504493713379, 4.829267501831055, 5.0330305099487305, 5.236793518066406, 5.440556526184082, 5.6443190574646, 5.848082065582275, 6.051845073699951, 6.255607604980469, 6.4593706130981445, 6.66313362121582, 6.866896152496338]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 5.0, 6.0, 7.0, 8.0, 13.0, 14.0, 25.0, 39.0, 66.0, 80.0, 141.0, 243.0, 383.0, 741.0, 1548.0, 3406.0, 9453.0, 34924.0, 258512.0, 3643064.0, 196889.0, 30180.0, 8583.0, 3078.0, 1322.0, 640.0, 363.0, 210.0, 104.0, 76.0, 48.0, 32.0, 24.0, 19.0, 7.0, 11.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-4.20703125, -4.088348388671875, -3.96966552734375, -3.850982666015625, -3.7322998046875, -3.613616943359375, -3.49493408203125, -3.376251220703125, -3.257568359375, -3.138885498046875, -3.02020263671875, -2.901519775390625, -2.7828369140625, -2.664154052734375, -2.54547119140625, -2.426788330078125, -2.30810546875, -2.189422607421875, -2.07073974609375, -1.952056884765625, -1.8333740234375, -1.714691162109375, -1.59600830078125, -1.477325439453125, -1.358642578125, -1.239959716796875, -1.12127685546875, -1.002593994140625, -0.8839111328125, -0.765228271484375, -0.64654541015625, -0.527862548828125, -0.4091796875, -0.290496826171875, -0.17181396484375, -0.053131103515625, 0.0655517578125, 0.184234619140625, 0.30291748046875, 0.421600341796875, 0.540283203125, 0.658966064453125, 0.77764892578125, 0.896331787109375, 1.0150146484375, 1.133697509765625, 1.25238037109375, 1.371063232421875, 1.48974609375, 1.608428955078125, 1.72711181640625, 1.845794677734375, 1.9644775390625, 2.083160400390625, 2.20184326171875, 2.320526123046875, 2.439208984375, 2.557891845703125, 2.67657470703125, 2.795257568359375, 2.9139404296875, 3.032623291015625, 3.15130615234375, 3.269989013671875, 3.388671875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 9.0, 6.0, 8.0, 11.0, 33.0, 38.0, 30.0, 35.0, 57.0, 68.0, 72.0, 61.0, 74.0, 80.0, 59.0, 61.0, 77.0, 54.0, 35.0, 27.0, 26.0, 23.0, 13.0, 16.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53076171875, -0.51544189453125, -0.5001220703125, -0.48480224609375, -0.469482421875, -0.45416259765625, -0.4388427734375, -0.42352294921875, -0.408203125, -0.39288330078125, -0.3775634765625, -0.36224365234375, -0.346923828125, -0.33160400390625, -0.3162841796875, -0.30096435546875, -0.28564453125, -0.27032470703125, -0.2550048828125, -0.23968505859375, -0.224365234375, -0.20904541015625, -0.1937255859375, -0.17840576171875, -0.1630859375, -0.14776611328125, -0.1324462890625, -0.11712646484375, -0.101806640625, -0.08648681640625, -0.0711669921875, -0.05584716796875, -0.04052734375, -0.02520751953125, -0.0098876953125, 0.00543212890625, 0.020751953125, 0.03607177734375, 0.0513916015625, 0.06671142578125, 0.08203125, 0.09735107421875, 0.1126708984375, 0.12799072265625, 0.143310546875, 0.15863037109375, 0.1739501953125, 0.18927001953125, 0.20458984375, 0.21990966796875, 0.2352294921875, 0.25054931640625, 0.265869140625, 0.28118896484375, 0.2965087890625, 0.31182861328125, 0.3271484375, 0.34246826171875, 0.3577880859375, 0.37310791015625, 0.388427734375, 0.40374755859375, 0.4190673828125, 0.43438720703125, 0.44970703125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 5.0, 4.0, 5.0, 6.0, 9.0, 6.0, 11.0, 13.0, 15.0, 20.0, 29.0, 28.0, 26.0, 28.0, 45.0, 53.0, 86.0, 231.0, 727.0, 4510.0, 45975.0, 3290573.0, 822809.0, 25267.0, 2822.0, 468.0, 154.0, 75.0, 38.0, 32.0, 32.0, 22.0, 20.0, 24.0, 16.0, 20.0, 14.0, 10.0, 6.0, 9.0, 8.0, 6.0, 4.0, 2.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-5.92578125, -5.75592041015625, -5.5860595703125, -5.41619873046875, -5.246337890625, -5.07647705078125, -4.9066162109375, -4.73675537109375, -4.56689453125, -4.39703369140625, -4.2271728515625, -4.05731201171875, -3.887451171875, -3.71759033203125, -3.5477294921875, -3.37786865234375, -3.2080078125, -3.03814697265625, -2.8682861328125, -2.69842529296875, -2.528564453125, -2.35870361328125, -2.1888427734375, -2.01898193359375, -1.84912109375, -1.67926025390625, -1.5093994140625, -1.33953857421875, -1.169677734375, -0.99981689453125, -0.8299560546875, -0.66009521484375, -0.490234375, -0.32037353515625, -0.1505126953125, 0.01934814453125, 0.189208984375, 0.35906982421875, 0.5289306640625, 0.69879150390625, 0.86865234375, 1.03851318359375, 1.2083740234375, 1.37823486328125, 1.548095703125, 1.71795654296875, 1.8878173828125, 2.05767822265625, 2.2275390625, 2.39739990234375, 2.5672607421875, 2.73712158203125, 2.906982421875, 3.07684326171875, 3.2467041015625, 3.41656494140625, 3.58642578125, 3.75628662109375, 3.9261474609375, 4.09600830078125, 4.265869140625, 4.43572998046875, 4.6055908203125, 4.77545166015625, 4.9453125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 14.0, 32.0, 33.0, 66.0, 117.0, 262.0, 727.0, 1822.0, 538.0, 238.0, 105.0, 46.0, 27.0, 18.0, 8.0, 10.0, 8.0, 1.0, 0.0, 2.0], "bins": [-2.46484375, -2.4168853759765625, -2.368927001953125, -2.3209686279296875, -2.27301025390625, -2.2250518798828125, -2.177093505859375, -2.1291351318359375, -2.0811767578125, -2.0332183837890625, -1.985260009765625, -1.9373016357421875, -1.88934326171875, -1.8413848876953125, -1.793426513671875, -1.7454681396484375, -1.697509765625, -1.6495513916015625, -1.601593017578125, -1.5536346435546875, -1.50567626953125, -1.4577178955078125, -1.409759521484375, -1.3618011474609375, -1.3138427734375, -1.2658843994140625, -1.217926025390625, -1.1699676513671875, -1.12200927734375, -1.0740509033203125, -1.026092529296875, -0.9781341552734375, -0.93017578125, -0.8822174072265625, -0.834259033203125, -0.7863006591796875, -0.73834228515625, -0.6903839111328125, -0.642425537109375, -0.5944671630859375, -0.5465087890625, -0.4985504150390625, -0.450592041015625, -0.4026336669921875, -0.35467529296875, -0.3067169189453125, -0.258758544921875, -0.2108001708984375, -0.162841796875, -0.1148834228515625, -0.066925048828125, -0.0189666748046875, 0.02899169921875, 0.0769500732421875, 0.124908447265625, 0.1728668212890625, 0.2208251953125, 0.2687835693359375, 0.316741943359375, 0.3647003173828125, 0.41265869140625, 0.4606170654296875, 0.508575439453125, 0.5565338134765625, 0.6044921875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 8.0, 2.0, 15.0, 7.0, 31.0, 48.0, 73.0, 121.0, 161.0, 163.0, 141.0, 113.0, 58.0, 30.0, 21.0, 8.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.662063598632812, -12.372052192687988, -12.08204174041748, -11.792030334472656, -11.502018928527832, -11.212007522583008, -10.9219970703125, -10.631985664367676, -10.341974258422852, -10.051962852478027, -9.76195240020752, -9.471940994262695, -9.181929588317871, -8.891918182373047, -8.601907730102539, -8.311896324157715, -8.021885871887207, -7.731874942779541, -7.441863536834717, -7.151852607727051, -6.861841201782227, -6.5718302726745605, -6.2818193435668945, -5.99180793762207, -5.701797008514404, -5.411786079406738, -5.121774673461914, -4.831763744354248, -4.541752815246582, -4.251741409301758, -3.961730480194092, -3.6717193126678467, -3.3817081451416016, -3.0916969776153564, -2.8016858100891113, -2.5116748809814453, -2.2216637134552, -1.931652545928955, -1.6416414976119995, -1.351630449295044, -1.0616192817687988, -0.7716081738471985, -0.48159706592559814, -0.1915859580039978, 0.09842514991760254, 0.38843631744384766, 0.6784473657608032, 0.9684584140777588, 1.258469581604004, 1.548480749130249, 1.8384917974472046, 2.12850284576416, 2.4185140132904053, 2.7085251808166504, 2.9985361099243164, 3.2885472774505615, 3.5785584449768066, 3.8685696125030518, 4.158580780029297, 4.448591709136963, 4.738602638244629, 5.028614044189453, 5.318624973297119, 5.608635902404785, 5.898647308349609]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 3.0, 2.0, 9.0, 11.0, 8.0, 12.0, 17.0, 21.0, 24.0, 32.0, 30.0, 26.0, 34.0, 33.0, 34.0, 33.0, 35.0, 54.0, 45.0, 50.0, 35.0, 47.0, 57.0, 43.0, 41.0, 33.0, 28.0, 28.0, 33.0, 33.0, 22.0, 15.0, 13.0, 14.0, 12.0, 14.0, 5.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-3.935969829559326, -3.825162410736084, -3.714354991912842, -3.6035475730895996, -3.4927401542663574, -3.3819327354431152, -3.271125078201294, -3.1603176593780518, -3.0495102405548096, -2.9387028217315674, -2.827895402908325, -2.717087984085083, -2.6062803268432617, -2.4954729080200195, -2.3846654891967773, -2.273858070373535, -2.163050651550293, -2.052243232727051, -1.9414358139038086, -1.8306282758712769, -1.7198208570480347, -1.6090134382247925, -1.4982059001922607, -1.3873984813690186, -1.2765910625457764, -1.1657836437225342, -1.054976224899292, -0.9441686868667603, -0.8333612680435181, -0.7225538492202759, -0.6117463707923889, -0.500938892364502, -0.39013147354125977, -0.2793240249156952, -0.16851657629013062, -0.05770912766456604, 0.053098320960998535, 0.16390573978424072, 0.2747132182121277, 0.38552069664001465, 0.49632811546325684, 0.607135534286499, 0.717943012714386, 0.828750491142273, 0.9395579099655151, 1.0503653287887573, 1.161172866821289, 1.2719802856445312, 1.3827877044677734, 1.4935951232910156, 1.6044025421142578, 1.7152100801467896, 1.8260174989700317, 1.936824917793274, 2.0476324558258057, 2.158439874649048, 2.26924729347229, 2.3800547122955322, 2.4908621311187744, 2.6016695499420166, 2.712477207183838, 2.82328462600708, 2.9340920448303223, 3.0448994636535645, 3.1557068824768066]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 4.0, 7.0, 11.0, 21.0, 17.0, 26.0, 36.0, 43.0, 76.0, 118.0, 178.0, 321.0, 540.0, 941.0, 2047.0, 4734.0, 12182.0, 34836.0, 107722.0, 388895.0, 349741.0, 94927.0, 31430.0, 11225.0, 4371.0, 1867.0, 863.0, 553.0, 283.0, 192.0, 109.0, 67.0, 49.0, 26.0, 23.0, 26.0, 9.0, 12.0, 4.0, 2.0, 4.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.505859375, -2.4298095703125, -2.353759765625, -2.2777099609375, -2.20166015625, -2.1256103515625, -2.049560546875, -1.9735107421875, -1.8974609375, -1.8214111328125, -1.745361328125, -1.6693115234375, -1.59326171875, -1.5172119140625, -1.441162109375, -1.3651123046875, -1.2890625, -1.2130126953125, -1.136962890625, -1.0609130859375, -0.98486328125, -0.9088134765625, -0.832763671875, -0.7567138671875, -0.6806640625, -0.6046142578125, -0.528564453125, -0.4525146484375, -0.37646484375, -0.3004150390625, -0.224365234375, -0.1483154296875, -0.072265625, 0.0037841796875, 0.079833984375, 0.1558837890625, 0.23193359375, 0.3079833984375, 0.384033203125, 0.4600830078125, 0.5361328125, 0.6121826171875, 0.688232421875, 0.7642822265625, 0.84033203125, 0.9163818359375, 0.992431640625, 1.0684814453125, 1.14453125, 1.2205810546875, 1.296630859375, 1.3726806640625, 1.44873046875, 1.5247802734375, 1.600830078125, 1.6768798828125, 1.7529296875, 1.8289794921875, 1.905029296875, 1.9810791015625, 2.05712890625, 2.1331787109375, 2.209228515625, 2.2852783203125, 2.361328125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 8.0, 10.0, 11.0, 16.0, 12.0, 28.0, 36.0, 36.0, 70.0, 54.0, 81.0, 72.0, 63.0, 86.0, 60.0, 67.0, 61.0, 54.0, 34.0, 34.0, 25.0, 24.0, 8.0, 9.0, 9.0, 6.0, 3.0, 5.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5986328125, -0.5823287963867188, -0.5660247802734375, -0.5497207641601562, -0.533416748046875, -0.5171127319335938, -0.5008087158203125, -0.48450469970703125, -0.46820068359375, -0.45189666748046875, -0.4355926513671875, -0.41928863525390625, -0.402984619140625, -0.38668060302734375, -0.3703765869140625, -0.35407257080078125, -0.3377685546875, -0.32146453857421875, -0.3051605224609375, -0.28885650634765625, -0.272552490234375, -0.25624847412109375, -0.2399444580078125, -0.22364044189453125, -0.20733642578125, -0.19103240966796875, -0.1747283935546875, -0.15842437744140625, -0.142120361328125, -0.12581634521484375, -0.1095123291015625, -0.09320831298828125, -0.076904296875, -0.06060028076171875, -0.0442962646484375, -0.02799224853515625, -0.011688232421875, 0.00461578369140625, 0.0209197998046875, 0.03722381591796875, 0.05352783203125, 0.06983184814453125, 0.0861358642578125, 0.10243988037109375, 0.118743896484375, 0.13504791259765625, 0.1513519287109375, 0.16765594482421875, 0.1839599609375, 0.20026397705078125, 0.2165679931640625, 0.23287200927734375, 0.249176025390625, 0.26548004150390625, 0.2817840576171875, 0.29808807373046875, 0.31439208984375, 0.33069610595703125, 0.3470001220703125, 0.36330413818359375, 0.379608154296875, 0.39591217041015625, 0.4122161865234375, 0.42852020263671875, 0.44482421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 10.0, 14.0, 26.0, 31.0, 46.0, 92.0, 124.0, 202.0, 324.0, 603.0, 1144.0, 2413.0, 5610.0, 13783.0, 35362.0, 95742.0, 289261.0, 382076.0, 139466.0, 49143.0, 18930.0, 7713.0, 3242.0, 1451.0, 727.0, 366.0, 226.0, 148.0, 64.0, 58.0, 45.0, 28.0, 29.0, 19.0, 12.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5234375, -1.4693603515625, -1.415283203125, -1.3612060546875, -1.30712890625, -1.2530517578125, -1.198974609375, -1.1448974609375, -1.0908203125, -1.0367431640625, -0.982666015625, -0.9285888671875, -0.87451171875, -0.8204345703125, -0.766357421875, -0.7122802734375, -0.658203125, -0.6041259765625, -0.550048828125, -0.4959716796875, -0.44189453125, -0.3878173828125, -0.333740234375, -0.2796630859375, -0.2255859375, -0.1715087890625, -0.117431640625, -0.0633544921875, -0.00927734375, 0.0447998046875, 0.098876953125, 0.1529541015625, 0.20703125, 0.2611083984375, 0.315185546875, 0.3692626953125, 0.42333984375, 0.4774169921875, 0.531494140625, 0.5855712890625, 0.6396484375, 0.6937255859375, 0.747802734375, 0.8018798828125, 0.85595703125, 0.9100341796875, 0.964111328125, 1.0181884765625, 1.072265625, 1.1263427734375, 1.180419921875, 1.2344970703125, 1.28857421875, 1.3426513671875, 1.396728515625, 1.4508056640625, 1.5048828125, 1.5589599609375, 1.613037109375, 1.6671142578125, 1.72119140625, 1.7752685546875, 1.829345703125, 1.8834228515625, 1.9375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 8.0, 8.0, 21.0, 9.0, 17.0, 28.0, 20.0, 18.0, 23.0, 34.0, 43.0, 43.0, 43.0, 48.0, 52.0, 52.0, 38.0, 40.0, 42.0, 51.0, 38.0, 44.0, 43.0, 33.0, 29.0, 25.0, 23.0, 19.0, 17.0, 20.0, 12.0, 11.0, 10.0, 12.0, 6.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.505859375, -1.4579315185546875, -1.410003662109375, -1.3620758056640625, -1.31414794921875, -1.2662200927734375, -1.218292236328125, -1.1703643798828125, -1.1224365234375, -1.0745086669921875, -1.026580810546875, -0.9786529541015625, -0.93072509765625, -0.8827972412109375, -0.834869384765625, -0.7869415283203125, -0.739013671875, -0.6910858154296875, -0.643157958984375, -0.5952301025390625, -0.54730224609375, -0.4993743896484375, -0.451446533203125, -0.4035186767578125, -0.3555908203125, -0.3076629638671875, -0.259735107421875, -0.2118072509765625, -0.16387939453125, -0.1159515380859375, -0.068023681640625, -0.0200958251953125, 0.02783203125, 0.0757598876953125, 0.123687744140625, 0.1716156005859375, 0.21954345703125, 0.2674713134765625, 0.315399169921875, 0.3633270263671875, 0.4112548828125, 0.4591827392578125, 0.507110595703125, 0.5550384521484375, 0.60296630859375, 0.6508941650390625, 0.698822021484375, 0.7467498779296875, 0.794677734375, 0.8426055908203125, 0.890533447265625, 0.9384613037109375, 0.98638916015625, 1.0343170166015625, 1.082244873046875, 1.1301727294921875, 1.1781005859375, 1.2260284423828125, 1.273956298828125, 1.3218841552734375, 1.36981201171875, 1.4177398681640625, 1.465667724609375, 1.5135955810546875, 1.5615234375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 6.0, 9.0, 11.0, 22.0, 28.0, 56.0, 88.0, 140.0, 243.0, 441.0, 929.0, 2020.0, 4903.0, 14086.0, 45783.0, 173559.0, 496786.0, 224076.0, 57417.0, 17354.0, 5918.0, 2374.0, 1037.0, 559.0, 314.0, 156.0, 76.0, 53.0, 29.0, 27.0, 15.0, 12.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75732421875, -0.7277297973632812, -0.6981353759765625, -0.6685409545898438, -0.638946533203125, -0.6093521118164062, -0.5797576904296875, -0.5501632690429688, -0.52056884765625, -0.49097442626953125, -0.4613800048828125, -0.43178558349609375, -0.402191162109375, -0.37259674072265625, -0.3430023193359375, -0.31340789794921875, -0.2838134765625, -0.25421905517578125, -0.2246246337890625, -0.19503021240234375, -0.165435791015625, -0.13584136962890625, -0.1062469482421875, -0.07665252685546875, -0.04705810546875, -0.01746368408203125, 0.0121307373046875, 0.04172515869140625, 0.071319580078125, 0.10091400146484375, 0.1305084228515625, 0.16010284423828125, 0.189697265625, 0.21929168701171875, 0.2488861083984375, 0.27848052978515625, 0.308074951171875, 0.33766937255859375, 0.3672637939453125, 0.39685821533203125, 0.42645263671875, 0.45604705810546875, 0.4856414794921875, 0.5152359008789062, 0.544830322265625, 0.5744247436523438, 0.6040191650390625, 0.6336135864257812, 0.6632080078125, 0.6928024291992188, 0.7223968505859375, 0.7519912719726562, 0.781585693359375, 0.8111801147460938, 0.8407745361328125, 0.8703689575195312, 0.89996337890625, 0.9295578002929688, 0.9591522216796875, 0.9887466430664062, 1.018341064453125, 1.0479354858398438, 1.0775299072265625, 1.1071243286132812, 1.13671875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 4.0, 4.0, 7.0, 8.0, 8.0, 16.0, 20.0, 27.0, 34.0, 45.0, 83.0, 113.0, 163.0, 138.0, 94.0, 69.0, 42.0, 31.0, 28.0, 16.0, 9.0, 11.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022649765014648438, -0.00022001191973686218, -0.00021352618932724, -0.0002070404589176178, -0.0002005547285079956, -0.0001940689980983734, -0.00018758326768875122, -0.00018109753727912903, -0.00017461180686950684, -0.00016812607645988464, -0.00016164034605026245, -0.00015515461564064026, -0.00014866888523101807, -0.00014218315482139587, -0.00013569742441177368, -0.0001292116940021515, -0.0001227259635925293, -0.0001162402331829071, -0.00010975450277328491, -0.00010326877236366272, -9.678304195404053e-05, -9.029731154441833e-05, -8.381158113479614e-05, -7.732585072517395e-05, -7.084012031555176e-05, -6.435438990592957e-05, -5.786865949630737e-05, -5.138292908668518e-05, -4.489719867706299e-05, -3.8411468267440796e-05, -3.1925737857818604e-05, -2.544000744819641e-05, -1.895427703857422e-05, -1.2468546628952026e-05, -5.982816219329834e-06, 5.029141902923584e-07, 6.988644599914551e-06, 1.3474375009536743e-05, 1.9960105419158936e-05, 2.6445835828781128e-05, 3.293156623840332e-05, 3.941729664802551e-05, 4.5903027057647705e-05, 5.23887574672699e-05, 5.887448787689209e-05, 6.536021828651428e-05, 7.184594869613647e-05, 7.833167910575867e-05, 8.481740951538086e-05, 9.130313992500305e-05, 9.778887033462524e-05, 0.00010427460074424744, 0.00011076033115386963, 0.00011724606156349182, 0.00012373179197311401, 0.0001302175223827362, 0.0001367032527923584, 0.0001431889832019806, 0.00014967471361160278, 0.00015616044402122498, 0.00016264617443084717, 0.00016913190484046936, 0.00017561763525009155, 0.00018210336565971375, 0.00018858909606933594]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 8.0, 4.0, 6.0, 17.0, 29.0, 40.0, 81.0, 108.0, 162.0, 305.0, 701.0, 1574.0, 3824.0, 10978.0, 34643.0, 141150.0, 570746.0, 214763.0, 46778.0, 14119.0, 4871.0, 1891.0, 813.0, 402.0, 231.0, 118.0, 82.0, 39.0, 18.0, 22.0, 12.0, 8.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99462890625, -0.9631729125976562, -0.9317169189453125, -0.9002609252929688, -0.868804931640625, -0.8373489379882812, -0.8058929443359375, -0.7744369506835938, -0.74298095703125, -0.7115249633789062, -0.6800689697265625, -0.6486129760742188, -0.617156982421875, -0.5857009887695312, -0.5542449951171875, -0.5227890014648438, -0.4913330078125, -0.45987701416015625, -0.4284210205078125, -0.39696502685546875, -0.365509033203125, -0.33405303955078125, -0.3025970458984375, -0.27114105224609375, -0.23968505859375, -0.20822906494140625, -0.1767730712890625, -0.14531707763671875, -0.113861083984375, -0.08240509033203125, -0.0509490966796875, -0.01949310302734375, 0.011962890625, 0.04341888427734375, 0.0748748779296875, 0.10633087158203125, 0.137786865234375, 0.16924285888671875, 0.2006988525390625, 0.23215484619140625, 0.26361083984375, 0.29506683349609375, 0.3265228271484375, 0.35797882080078125, 0.389434814453125, 0.42089080810546875, 0.4523468017578125, 0.48380279541015625, 0.5152587890625, 0.5467147827148438, 0.5781707763671875, 0.6096267700195312, 0.641082763671875, 0.6725387573242188, 0.7039947509765625, 0.7354507446289062, 0.76690673828125, 0.7983627319335938, 0.8298187255859375, 0.8612747192382812, 0.892730712890625, 0.9241867065429688, 0.9556427001953125, 0.9870986938476562, 1.0185546875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 2.0, 4.0, 3.0, 8.0, 5.0, 10.0, 8.0, 9.0, 9.0, 13.0, 20.0, 26.0, 23.0, 45.0, 41.0, 63.0, 70.0, 80.0, 80.0, 82.0, 70.0, 68.0, 45.0, 44.0, 26.0, 32.0, 22.0, 17.0, 21.0, 16.0, 9.0, 9.0, 3.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.666015625, -0.6442184448242188, -0.6224212646484375, -0.6006240844726562, -0.578826904296875, -0.5570297241210938, -0.5352325439453125, -0.5134353637695312, -0.49163818359375, -0.46984100341796875, -0.4480438232421875, -0.42624664306640625, -0.404449462890625, -0.38265228271484375, -0.3608551025390625, -0.33905792236328125, -0.3172607421875, -0.29546356201171875, -0.2736663818359375, -0.25186920166015625, -0.230072021484375, -0.20827484130859375, -0.1864776611328125, -0.16468048095703125, -0.14288330078125, -0.12108612060546875, -0.0992889404296875, -0.07749176025390625, -0.055694580078125, -0.03389739990234375, -0.0121002197265625, 0.00969696044921875, 0.031494140625, 0.05329132080078125, 0.0750885009765625, 0.09688568115234375, 0.118682861328125, 0.14048004150390625, 0.1622772216796875, 0.18407440185546875, 0.20587158203125, 0.22766876220703125, 0.2494659423828125, 0.27126312255859375, 0.293060302734375, 0.31485748291015625, 0.3366546630859375, 0.35845184326171875, 0.3802490234375, 0.40204620361328125, 0.4238433837890625, 0.44564056396484375, 0.467437744140625, 0.48923492431640625, 0.5110321044921875, 0.5328292846679688, 0.55462646484375, 0.5764236450195312, 0.5982208251953125, 0.6200180053710938, 0.641815185546875, 0.6636123657226562, 0.6854095458984375, 0.7072067260742188, 0.72900390625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 15.0, 34.0, 99.0, 149.0, 205.0, 183.0, 165.0, 76.0, 41.0, 22.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0], "bins": [-40.049278259277344, -39.290897369384766, -38.53251647949219, -37.77413558959961, -37.01575469970703, -36.25736999511719, -35.498992919921875, -34.74060821533203, -33.98222732543945, -33.223846435546875, -32.4654655456543, -31.70708465576172, -30.948701858520508, -30.19032096862793, -29.43194007873535, -28.673559188842773, -27.915178298950195, -27.156797409057617, -26.39841651916504, -25.640033721923828, -24.88165283203125, -24.123271942138672, -23.364891052246094, -22.606510162353516, -21.848129272460938, -21.08974838256836, -20.33136749267578, -19.572986602783203, -18.814603805541992, -18.056222915649414, -17.297842025756836, -16.539461135864258, -15.781079292297363, -15.022698402404785, -14.26431655883789, -13.505935668945312, -12.747554779052734, -11.98917293548584, -11.230792045593262, -10.472410202026367, -9.714029312133789, -8.955648422241211, -8.197266578674316, -7.438885688781738, -6.680504322052002, -5.922122955322266, -5.1637420654296875, -4.405360698699951, -3.646979331970215, -2.8885979652404785, -2.1302168369293213, -1.371835708618164, -0.6134543418884277, 0.1449270248413086, 0.9033079147338867, 1.661689281463623, 2.4200706481933594, 3.1784520149230957, 3.936833143234253, 4.69521427154541, 5.4535956382751465, 6.211977005004883, 6.970357894897461, 7.728739261627197, 8.487120628356934]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 6.0, 5.0, 9.0, 13.0, 16.0, 15.0, 20.0, 18.0, 18.0, 34.0, 48.0, 41.0, 31.0, 39.0, 40.0, 50.0, 58.0, 45.0, 23.0, 50.0, 44.0, 33.0, 45.0, 33.0, 41.0, 41.0, 38.0, 24.0, 19.0, 21.0, 14.0, 14.0, 9.0, 10.0, 11.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.520538330078125, -7.292177200317383, -7.063816070556641, -6.83545446395874, -6.607093334197998, -6.378732204437256, -6.1503705978393555, -5.922009468078613, -5.693648338317871, -5.465287208557129, -5.236926078796387, -5.008564472198486, -4.780203342437744, -4.551842212677002, -4.323480606079102, -4.095119476318359, -3.866758346557617, -3.638397216796875, -3.4100358486175537, -3.1816744804382324, -2.9533133506774902, -2.724952220916748, -2.4965908527374268, -2.2682294845581055, -2.0398683547973633, -1.8115071058273315, -1.5831458568572998, -1.354784607887268, -1.1264233589172363, -0.8980621099472046, -0.6697008609771729, -0.4413396120071411, -0.21297836303710938, 0.015382885932922363, 0.2437441349029541, 0.47210538387298584, 0.7004666328430176, 0.9288278818130493, 1.157189130783081, 1.3855503797531128, 1.6139116287231445, 1.8422728776931763, 2.070634126663208, 2.2989954948425293, 2.5273566246032715, 2.7557177543640137, 2.984079122543335, 3.2124404907226562, 3.4408016204833984, 3.6691627502441406, 3.897524118423462, 4.125885486602783, 4.354246616363525, 4.582607746124268, 4.810969352722168, 5.03933048248291, 5.267691612243652, 5.4960527420043945, 5.724413871765137, 5.952775478363037, 6.181136608123779, 6.4094977378845215, 6.637859344482422, 6.866220474243164, 7.094581604003906]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 11.0, 6.0, 10.0, 24.0, 52.0, 76.0, 172.0, 366.0, 858.0, 2900.0, 12156.0, 99685.0, 3930266.0, 129171.0, 13966.0, 3004.0, 888.0, 320.0, 148.0, 88.0, 48.0, 26.0, 20.0, 8.0, 6.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3203125, -6.098876953125, -5.87744140625, -5.656005859375, -5.4345703125, -5.213134765625, -4.99169921875, -4.770263671875, -4.548828125, -4.327392578125, -4.10595703125, -3.884521484375, -3.6630859375, -3.441650390625, -3.22021484375, -2.998779296875, -2.77734375, -2.555908203125, -2.33447265625, -2.113037109375, -1.8916015625, -1.670166015625, -1.44873046875, -1.227294921875, -1.005859375, -0.784423828125, -0.56298828125, -0.341552734375, -0.1201171875, 0.101318359375, 0.32275390625, 0.544189453125, 0.765625, 0.987060546875, 1.20849609375, 1.429931640625, 1.6513671875, 1.872802734375, 2.09423828125, 2.315673828125, 2.537109375, 2.758544921875, 2.97998046875, 3.201416015625, 3.4228515625, 3.644287109375, 3.86572265625, 4.087158203125, 4.30859375, 4.530029296875, 4.75146484375, 4.972900390625, 5.1943359375, 5.415771484375, 5.63720703125, 5.858642578125, 6.080078125, 6.301513671875, 6.52294921875, 6.744384765625, 6.9658203125, 7.187255859375, 7.40869140625, 7.630126953125, 7.8515625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 7.0, 4.0, 8.0, 19.0, 16.0, 17.0, 26.0, 41.0, 45.0, 56.0, 56.0, 61.0, 78.0, 72.0, 78.0, 60.0, 63.0, 61.0, 55.0, 50.0, 34.0, 17.0, 26.0, 11.0, 9.0, 4.0, 12.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.60791015625, -0.5913581848144531, -0.5748062133789062, -0.5582542419433594, -0.5417022705078125, -0.5251502990722656, -0.5085983276367188, -0.4920463562011719, -0.475494384765625, -0.4589424133300781, -0.44239044189453125, -0.4258384704589844, -0.4092864990234375, -0.3927345275878906, -0.37618255615234375, -0.3596305847167969, -0.34307861328125, -0.3265266418457031, -0.30997467041015625, -0.2934226989746094, -0.2768707275390625, -0.2603187561035156, -0.24376678466796875, -0.22721481323242188, -0.210662841796875, -0.19411087036132812, -0.17755889892578125, -0.16100692749023438, -0.1444549560546875, -0.12790298461914062, -0.11135101318359375, -0.09479904174804688, -0.0782470703125, -0.061695098876953125, -0.04514312744140625, -0.028591156005859375, -0.0120391845703125, 0.004512786865234375, 0.02106475830078125, 0.037616729736328125, 0.054168701171875, 0.07072067260742188, 0.08727264404296875, 0.10382461547851562, 0.1203765869140625, 0.13692855834960938, 0.15348052978515625, 0.17003250122070312, 0.18658447265625, 0.20313644409179688, 0.21968841552734375, 0.23624038696289062, 0.2527923583984375, 0.2693443298339844, 0.28589630126953125, 0.3024482727050781, 0.319000244140625, 0.3355522155761719, 0.35210418701171875, 0.3686561584472656, 0.3852081298828125, 0.4017601013183594, 0.41831207275390625, 0.4348640441894531, 0.451416015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 9.0, 9.0, 16.0, 23.0, 55.0, 76.0, 100.0, 188.0, 290.0, 495.0, 780.0, 1518.0, 3254.0, 7749.0, 19926.0, 61692.0, 301845.0, 3375942.0, 321164.0, 63879.0, 20497.0, 7840.0, 3347.0, 1637.0, 770.0, 429.0, 260.0, 181.0, 111.0, 79.0, 44.0, 23.0, 16.0, 14.0, 9.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.771484375, -2.686248779296875, -2.60101318359375, -2.515777587890625, -2.4305419921875, -2.345306396484375, -2.26007080078125, -2.174835205078125, -2.089599609375, -2.004364013671875, -1.91912841796875, -1.833892822265625, -1.7486572265625, -1.663421630859375, -1.57818603515625, -1.492950439453125, -1.40771484375, -1.322479248046875, -1.23724365234375, -1.152008056640625, -1.0667724609375, -0.981536865234375, -0.89630126953125, -0.811065673828125, -0.725830078125, -0.640594482421875, -0.55535888671875, -0.470123291015625, -0.3848876953125, -0.299652099609375, -0.21441650390625, -0.129180908203125, -0.0439453125, 0.041290283203125, 0.12652587890625, 0.211761474609375, 0.2969970703125, 0.382232666015625, 0.46746826171875, 0.552703857421875, 0.637939453125, 0.723175048828125, 0.80841064453125, 0.893646240234375, 0.9788818359375, 1.064117431640625, 1.14935302734375, 1.234588623046875, 1.31982421875, 1.405059814453125, 1.49029541015625, 1.575531005859375, 1.6607666015625, 1.746002197265625, 1.83123779296875, 1.916473388671875, 2.001708984375, 2.086944580078125, 2.17218017578125, 2.257415771484375, 2.3426513671875, 2.427886962890625, 2.51312255859375, 2.598358154296875, 2.68359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 9.0, 10.0, 17.0, 22.0, 32.0, 52.0, 79.0, 148.0, 314.0, 1108.0, 1650.0, 295.0, 120.0, 91.0, 45.0, 22.0, 18.0, 10.0, 17.0, 7.0, 5.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.171875, -1.126861572265625, -1.08184814453125, -1.036834716796875, -0.9918212890625, -0.946807861328125, -0.90179443359375, -0.856781005859375, -0.811767578125, -0.766754150390625, -0.72174072265625, -0.676727294921875, -0.6317138671875, -0.586700439453125, -0.54168701171875, -0.496673583984375, -0.45166015625, -0.406646728515625, -0.36163330078125, -0.316619873046875, -0.2716064453125, -0.226593017578125, -0.18157958984375, -0.136566162109375, -0.091552734375, -0.046539306640625, -0.00152587890625, 0.043487548828125, 0.0885009765625, 0.133514404296875, 0.17852783203125, 0.223541259765625, 0.2685546875, 0.313568115234375, 0.35858154296875, 0.403594970703125, 0.4486083984375, 0.493621826171875, 0.53863525390625, 0.583648681640625, 0.628662109375, 0.673675537109375, 0.71868896484375, 0.763702392578125, 0.8087158203125, 0.853729248046875, 0.89874267578125, 0.943756103515625, 0.98876953125, 1.033782958984375, 1.07879638671875, 1.123809814453125, 1.1688232421875, 1.213836669921875, 1.25885009765625, 1.303863525390625, 1.348876953125, 1.393890380859375, 1.43890380859375, 1.483917236328125, 1.5289306640625, 1.573944091796875, 1.61895751953125, 1.663970947265625, 1.708984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 4.0, 5.0, 13.0, 23.0, 51.0, 120.0, 174.0, 226.0, 196.0, 91.0, 53.0, 20.0, 12.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.02601146697998, -9.665599822998047, -9.30518913269043, -8.944777488708496, -8.584366798400879, -8.223955154418945, -7.86354398727417, -7.5031328201293945, -7.142721652984619, -6.782310485839844, -6.421899318695068, -6.061488151550293, -5.701076507568359, -5.340665817260742, -4.980254173278809, -4.619843006134033, -4.259431838989258, -3.8990206718444824, -3.538609504699707, -3.1781980991363525, -2.817786931991577, -2.4573757648468018, -2.0969643592834473, -1.7365531921386719, -1.3761420249938965, -1.015730857849121, -0.6553195714950562, -0.2949082851409912, 0.06550288200378418, 0.42591404914855957, 0.7863254547119141, 1.1467366218566895, 1.5071487426757812, 1.8675599098205566, 2.227971076965332, 2.5883824825286865, 2.948793649673462, 3.3092048168182373, 3.669616222381592, 4.030027389526367, 4.390438556671143, 4.750849723815918, 5.111260890960693, 5.471672058105469, 5.832083702087402, 6.1924943923950195, 6.552906036376953, 6.9133172035217285, 7.273728370666504, 7.634139537811279, 7.994550704956055, 8.354962348937988, 8.715373039245605, 9.075784683227539, 9.436195373535156, 9.79660701751709, 10.157018661499023, 10.517430305480957, 10.877840995788574, 11.238252639770508, 11.598663330078125, 11.959074974060059, 12.319486618041992, 12.67989730834961, 13.040307998657227]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 9.0, 8.0, 7.0, 8.0, 7.0, 15.0, 11.0, 15.0, 18.0, 22.0, 25.0, 28.0, 29.0, 39.0, 31.0, 48.0, 36.0, 35.0, 41.0, 47.0, 46.0, 42.0, 47.0, 42.0, 43.0, 43.0, 24.0, 25.0, 17.0, 29.0, 22.0, 27.0, 23.0, 17.0, 13.0, 6.0, 12.0, 9.0, 14.0, 6.0, 4.0, 5.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.227794885635376, -3.1318273544311523, -3.0358598232269287, -2.939892292022705, -2.8439247608184814, -2.747957229614258, -2.651989459991455, -2.5560219287872314, -2.460054397583008, -2.364086866378784, -2.2681193351745605, -2.172151803970337, -2.0761842727661133, -1.9802166223526, -1.8842490911483765, -1.7882814407348633, -1.6923140287399292, -1.5963464975357056, -1.500378966331482, -1.4044113159179688, -1.3084437847137451, -1.2124762535095215, -1.1165087223052979, -1.0205411911010742, -0.9245736002922058, -0.8286060690879822, -0.7326384782791138, -0.6366709470748901, -0.5407034158706665, -0.4447358250617981, -0.34876829385757446, -0.25280070304870605, -0.15683317184448242, -0.060865618288517, 0.035101935267448425, 0.13106948137283325, 0.22703704237937927, 0.3230046033859253, 0.4189721345901489, 0.5149397253990173, 0.610907256603241, 0.7068747878074646, 0.802842378616333, 0.8988099098205566, 0.9947774410247803, 1.090744972229004, 1.1867125034332275, 1.2826801538467407, 1.3786476850509644, 1.474615216255188, 1.5705827474594116, 1.6665503978729248, 1.7625179290771484, 1.858485460281372, 1.9544529914855957, 2.0504205226898193, 2.146388053894043, 2.2423555850982666, 2.3383231163024902, 2.434290647506714, 2.5302581787109375, 2.6262259483337402, 2.7221932411193848, 2.8181610107421875, 2.914128541946411]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 3.0, 2.0, 9.0, 8.0, 13.0, 13.0, 20.0, 22.0, 30.0, 47.0, 43.0, 89.0, 109.0, 146.0, 215.0, 292.0, 476.0, 726.0, 1090.0, 1920.0, 3274.0, 5830.0, 11290.0, 22226.0, 45082.0, 92241.0, 188168.0, 300845.0, 188161.0, 92546.0, 45677.0, 22348.0, 11227.0, 5831.0, 3271.0, 1832.0, 1141.0, 698.0, 482.0, 333.0, 209.0, 176.0, 110.0, 82.0, 54.0, 47.0, 30.0, 18.0, 19.0, 10.0, 12.0, 5.0, 4.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.82421875, -1.7663116455078125, -1.708404541015625, -1.6504974365234375, -1.59259033203125, -1.5346832275390625, -1.476776123046875, -1.4188690185546875, -1.3609619140625, -1.3030548095703125, -1.245147705078125, -1.1872406005859375, -1.12933349609375, -1.0714263916015625, -1.013519287109375, -0.9556121826171875, -0.897705078125, -0.8397979736328125, -0.781890869140625, -0.7239837646484375, -0.66607666015625, -0.6081695556640625, -0.550262451171875, -0.4923553466796875, -0.4344482421875, -0.3765411376953125, -0.318634033203125, -0.2607269287109375, -0.20281982421875, -0.1449127197265625, -0.087005615234375, -0.0290985107421875, 0.02880859375, 0.0867156982421875, 0.144622802734375, 0.2025299072265625, 0.26043701171875, 0.3183441162109375, 0.376251220703125, 0.4341583251953125, 0.4920654296875, 0.5499725341796875, 0.607879638671875, 0.6657867431640625, 0.72369384765625, 0.7816009521484375, 0.839508056640625, 0.8974151611328125, 0.955322265625, 1.0132293701171875, 1.071136474609375, 1.1290435791015625, 1.18695068359375, 1.2448577880859375, 1.302764892578125, 1.3606719970703125, 1.4185791015625, 1.4764862060546875, 1.534393310546875, 1.5923004150390625, 1.65020751953125, 1.7081146240234375, 1.766021728515625, 1.8239288330078125, 1.8818359375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 11.0, 2.0, 9.0, 13.0, 21.0, 22.0, 24.0, 31.0, 47.0, 46.0, 59.0, 62.0, 68.0, 59.0, 54.0, 66.0, 70.0, 58.0, 61.0, 46.0, 31.0, 34.0, 22.0, 25.0, 20.0, 11.0, 6.0, 5.0, 7.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.63427734375, -0.6172523498535156, -0.6002273559570312, -0.5832023620605469, -0.5661773681640625, -0.5491523742675781, -0.5321273803710938, -0.5151023864746094, -0.498077392578125, -0.4810523986816406, -0.46402740478515625, -0.4470024108886719, -0.4299774169921875, -0.4129524230957031, -0.39592742919921875, -0.3789024353027344, -0.36187744140625, -0.3448524475097656, -0.32782745361328125, -0.3108024597167969, -0.2937774658203125, -0.2767524719238281, -0.25972747802734375, -0.24270248413085938, -0.225677490234375, -0.20865249633789062, -0.19162750244140625, -0.17460250854492188, -0.1575775146484375, -0.14055252075195312, -0.12352752685546875, -0.10650253295898438, -0.0894775390625, -0.07245254516601562, -0.05542755126953125, -0.038402557373046875, -0.0213775634765625, -0.004352569580078125, 0.01267242431640625, 0.029697418212890625, 0.046722412109375, 0.06374740600585938, 0.08077239990234375, 0.09779739379882812, 0.1148223876953125, 0.13184738159179688, 0.14887237548828125, 0.16589736938476562, 0.18292236328125, 0.19994735717773438, 0.21697235107421875, 0.23399734497070312, 0.2510223388671875, 0.2680473327636719, 0.28507232666015625, 0.3020973205566406, 0.319122314453125, 0.3361473083496094, 0.35317230224609375, 0.3701972961425781, 0.3872222900390625, 0.4042472839355469, 0.42127227783203125, 0.4382972717285156, 0.455322265625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 11.0, 11.0, 11.0, 20.0, 19.0, 42.0, 42.0, 75.0, 108.0, 150.0, 247.0, 403.0, 606.0, 1106.0, 2001.0, 4078.0, 9055.0, 21076.0, 51187.0, 124818.0, 293059.0, 310063.0, 133358.0, 55032.0, 22878.0, 9643.0, 4334.0, 2139.0, 1084.0, 642.0, 450.0, 253.0, 170.0, 111.0, 79.0, 62.0, 38.0, 34.0, 14.0, 14.0, 11.0, 13.0, 4.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.796875, -1.74249267578125, -1.6881103515625, -1.63372802734375, -1.579345703125, -1.52496337890625, -1.4705810546875, -1.41619873046875, -1.36181640625, -1.30743408203125, -1.2530517578125, -1.19866943359375, -1.144287109375, -1.08990478515625, -1.0355224609375, -0.98114013671875, -0.9267578125, -0.87237548828125, -0.8179931640625, -0.76361083984375, -0.709228515625, -0.65484619140625, -0.6004638671875, -0.54608154296875, -0.49169921875, -0.43731689453125, -0.3829345703125, -0.32855224609375, -0.274169921875, -0.21978759765625, -0.1654052734375, -0.11102294921875, -0.056640625, -0.00225830078125, 0.0521240234375, 0.10650634765625, 0.160888671875, 0.21527099609375, 0.2696533203125, 0.32403564453125, 0.37841796875, 0.43280029296875, 0.4871826171875, 0.54156494140625, 0.595947265625, 0.65032958984375, 0.7047119140625, 0.75909423828125, 0.8134765625, 0.86785888671875, 0.9222412109375, 0.97662353515625, 1.031005859375, 1.08538818359375, 1.1397705078125, 1.19415283203125, 1.24853515625, 1.30291748046875, 1.3572998046875, 1.41168212890625, 1.466064453125, 1.52044677734375, 1.5748291015625, 1.62921142578125, 1.68359375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 4.0, 13.0, 8.0, 14.0, 14.0, 18.0, 12.0, 34.0, 36.0, 33.0, 31.0, 36.0, 47.0, 44.0, 43.0, 53.0, 50.0, 62.0, 42.0, 42.0, 37.0, 50.0, 43.0, 27.0, 31.0, 31.0, 27.0, 11.0, 23.0, 15.0, 16.0, 17.0, 9.0, 6.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8349609375, -1.7741241455078125, -1.713287353515625, -1.6524505615234375, -1.59161376953125, -1.5307769775390625, -1.469940185546875, -1.4091033935546875, -1.3482666015625, -1.2874298095703125, -1.226593017578125, -1.1657562255859375, -1.10491943359375, -1.0440826416015625, -0.983245849609375, -0.9224090576171875, -0.861572265625, -0.8007354736328125, -0.739898681640625, -0.6790618896484375, -0.61822509765625, -0.5573883056640625, -0.496551513671875, -0.4357147216796875, -0.3748779296875, -0.3140411376953125, -0.253204345703125, -0.1923675537109375, -0.13153076171875, -0.0706939697265625, -0.009857177734375, 0.0509796142578125, 0.11181640625, 0.1726531982421875, 0.233489990234375, 0.2943267822265625, 0.35516357421875, 0.4160003662109375, 0.476837158203125, 0.5376739501953125, 0.5985107421875, 0.6593475341796875, 0.720184326171875, 0.7810211181640625, 0.84185791015625, 0.9026947021484375, 0.963531494140625, 1.0243682861328125, 1.085205078125, 1.1460418701171875, 1.206878662109375, 1.2677154541015625, 1.32855224609375, 1.3893890380859375, 1.450225830078125, 1.5110626220703125, 1.5718994140625, 1.6327362060546875, 1.693572998046875, 1.7544097900390625, 1.81524658203125, 1.8760833740234375, 1.936920166015625, 1.9977569580078125, 2.05859375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 3.0, 8.0, 15.0, 24.0, 24.0, 44.0, 99.0, 136.0, 242.0, 451.0, 891.0, 2075.0, 4965.0, 14126.0, 52277.0, 307486.0, 555447.0, 79226.0, 19711.0, 6461.0, 2480.0, 1106.0, 522.0, 284.0, 165.0, 103.0, 60.0, 36.0, 23.0, 22.0, 9.0, 4.0, 5.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.81640625, -1.756134033203125, -1.69586181640625, -1.635589599609375, -1.5753173828125, -1.515045166015625, -1.45477294921875, -1.394500732421875, -1.334228515625, -1.273956298828125, -1.21368408203125, -1.153411865234375, -1.0931396484375, -1.032867431640625, -0.97259521484375, -0.912322998046875, -0.85205078125, -0.791778564453125, -0.73150634765625, -0.671234130859375, -0.6109619140625, -0.550689697265625, -0.49041748046875, -0.430145263671875, -0.369873046875, -0.309600830078125, -0.24932861328125, -0.189056396484375, -0.1287841796875, -0.068511962890625, -0.00823974609375, 0.052032470703125, 0.1123046875, 0.172576904296875, 0.23284912109375, 0.293121337890625, 0.3533935546875, 0.413665771484375, 0.47393798828125, 0.534210205078125, 0.594482421875, 0.654754638671875, 0.71502685546875, 0.775299072265625, 0.8355712890625, 0.895843505859375, 0.95611572265625, 1.016387939453125, 1.07666015625, 1.136932373046875, 1.19720458984375, 1.257476806640625, 1.3177490234375, 1.378021240234375, 1.43829345703125, 1.498565673828125, 1.558837890625, 1.619110107421875, 1.67938232421875, 1.739654541015625, 1.7999267578125, 1.860198974609375, 1.92047119140625, 1.980743408203125, 2.041015625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 8.0, 6.0, 14.0, 13.0, 29.0, 34.0, 38.0, 40.0, 72.0, 114.0, 170.0, 153.0, 98.0, 64.0, 48.0, 36.0, 24.0, 19.0, 17.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030159950256347656, -0.0002921484410762787, -0.0002826973795890808, -0.00027324631810188293, -0.00026379525661468506, -0.0002543441951274872, -0.0002448931336402893, -0.00023544207215309143, -0.00022599101066589355, -0.00021653994917869568, -0.0002070888876914978, -0.00019763782620429993, -0.00018818676471710205, -0.00017873570322990417, -0.0001692846417427063, -0.00015983358025550842, -0.00015038251876831055, -0.00014093145728111267, -0.0001314803957939148, -0.00012202933430671692, -0.00011257827281951904, -0.00010312721133232117, -9.367614984512329e-05, -8.422508835792542e-05, -7.477402687072754e-05, -6.532296538352966e-05, -5.587190389633179e-05, -4.642084240913391e-05, -3.6969780921936035e-05, -2.751871943473816e-05, -1.8067657947540283e-05, -8.616596460342407e-06, 8.344650268554688e-07, 1.0285526514053345e-05, 1.973658800125122e-05, 2.9187649488449097e-05, 3.863871097564697e-05, 4.808977246284485e-05, 5.7540833950042725e-05, 6.69918954372406e-05, 7.644295692443848e-05, 8.589401841163635e-05, 9.534507989883423e-05, 0.0001047961413860321, 0.00011424720287322998, 0.00012369826436042786, 0.00013314932584762573, 0.0001426003873348236, 0.00015205144882202148, 0.00016150251030921936, 0.00017095357179641724, 0.0001804046332836151, 0.000189855694770813, 0.00019930675625801086, 0.00020875781774520874, 0.00021820887923240662, 0.0002276599407196045, 0.00023711100220680237, 0.00024656206369400024, 0.0002560131251811981, 0.000265464186668396, 0.00027491524815559387, 0.00028436630964279175, 0.0002938173711299896, 0.0003032684326171875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 10.0, 13.0, 26.0, 43.0, 67.0, 122.0, 233.0, 460.0, 1047.0, 3189.0, 12579.0, 77701.0, 737772.0, 183402.0, 23905.0, 5156.0, 1576.0, 626.0, 261.0, 121.0, 96.0, 51.0, 23.0, 17.0, 17.0, 9.0, 4.0, 8.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.97265625, -2.886962890625, -2.80126953125, -2.715576171875, -2.6298828125, -2.544189453125, -2.45849609375, -2.372802734375, -2.287109375, -2.201416015625, -2.11572265625, -2.030029296875, -1.9443359375, -1.858642578125, -1.77294921875, -1.687255859375, -1.6015625, -1.515869140625, -1.43017578125, -1.344482421875, -1.2587890625, -1.173095703125, -1.08740234375, -1.001708984375, -0.916015625, -0.830322265625, -0.74462890625, -0.658935546875, -0.5732421875, -0.487548828125, -0.40185546875, -0.316162109375, -0.23046875, -0.144775390625, -0.05908203125, 0.026611328125, 0.1123046875, 0.197998046875, 0.28369140625, 0.369384765625, 0.455078125, 0.540771484375, 0.62646484375, 0.712158203125, 0.7978515625, 0.883544921875, 0.96923828125, 1.054931640625, 1.140625, 1.226318359375, 1.31201171875, 1.397705078125, 1.4833984375, 1.569091796875, 1.65478515625, 1.740478515625, 1.826171875, 1.911865234375, 1.99755859375, 2.083251953125, 2.1689453125, 2.254638671875, 2.34033203125, 2.426025390625, 2.51171875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 18.0, 12.0, 18.0, 18.0, 32.0, 65.0, 97.0, 156.0, 229.0, 102.0, 82.0, 44.0, 41.0, 18.0, 17.0, 9.0, 9.0, 6.0, 10.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3359375, -2.261383056640625, -2.18682861328125, -2.112274169921875, -2.0377197265625, -1.963165283203125, -1.88861083984375, -1.814056396484375, -1.739501953125, -1.664947509765625, -1.59039306640625, -1.515838623046875, -1.4412841796875, -1.366729736328125, -1.29217529296875, -1.217620849609375, -1.14306640625, -1.068511962890625, -0.99395751953125, -0.919403076171875, -0.8448486328125, -0.770294189453125, -0.69573974609375, -0.621185302734375, -0.546630859375, -0.472076416015625, -0.39752197265625, -0.322967529296875, -0.2484130859375, -0.173858642578125, -0.09930419921875, -0.024749755859375, 0.0498046875, 0.124359130859375, 0.19891357421875, 0.273468017578125, 0.3480224609375, 0.422576904296875, 0.49713134765625, 0.571685791015625, 0.646240234375, 0.720794677734375, 0.79534912109375, 0.869903564453125, 0.9444580078125, 1.019012451171875, 1.09356689453125, 1.168121337890625, 1.24267578125, 1.317230224609375, 1.39178466796875, 1.466339111328125, 1.5408935546875, 1.615447998046875, 1.69000244140625, 1.764556884765625, 1.839111328125, 1.913665771484375, 1.98822021484375, 2.062774658203125, 2.1373291015625, 2.211883544921875, 2.28643798828125, 2.360992431640625, 2.435546875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 13.0, 6.0, 24.0, 20.0, 47.0, 62.0, 74.0, 103.0, 109.0, 112.0, 87.0, 97.0, 67.0, 55.0, 46.0, 26.0, 16.0, 13.0, 7.0, 6.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-26.143619537353516, -25.552173614501953, -24.96072769165039, -24.369281768798828, -23.777835845947266, -23.186389923095703, -22.59494400024414, -22.003498077392578, -21.412052154541016, -20.820606231689453, -20.22916030883789, -19.637714385986328, -19.046268463134766, -18.454822540283203, -17.86337661743164, -17.271930694580078, -16.680484771728516, -16.089038848876953, -15.49759292602539, -14.906147003173828, -14.314701080322266, -13.723255157470703, -13.13180923461914, -12.540363311767578, -11.948917388916016, -11.357471466064453, -10.76602554321289, -10.174579620361328, -9.583133697509766, -8.991687774658203, -8.40024185180664, -7.808795928955078, -7.217350006103516, -6.625904083251953, -6.034458160400391, -5.443012237548828, -4.851566314697266, -4.260120391845703, -3.6686744689941406, -3.077228546142578, -2.4857826232910156, -1.8943367004394531, -1.3028907775878906, -0.7114448547363281, -0.11999893188476562, 0.4714469909667969, 1.0628929138183594, 1.6543388366699219, 2.2457847595214844, 2.837230682373047, 3.4286766052246094, 4.020122528076172, 4.611568450927734, 5.203014373779297, 5.794460296630859, 6.385906219482422, 6.977352142333984, 7.568798065185547, 8.16024398803711, 8.751689910888672, 9.343135833740234, 9.934581756591797, 10.52602767944336, 11.117473602294922, 11.708919525146484]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 8.0, 9.0, 13.0, 12.0, 15.0, 19.0, 24.0, 25.0, 26.0, 28.0, 30.0, 27.0, 34.0, 33.0, 38.0, 42.0, 63.0, 44.0, 48.0, 42.0, 35.0, 35.0, 37.0, 35.0, 36.0, 33.0, 40.0, 34.0, 21.0, 23.0, 15.0, 16.0, 13.0, 11.0, 3.0, 6.0, 12.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.034894943237305, -10.70212173461914, -10.369349479675293, -10.036576271057129, -9.703804016113281, -9.371030807495117, -9.038257598876953, -8.705484390258789, -8.372712135314941, -8.039938926696777, -7.70716667175293, -7.374393463134766, -7.04162073135376, -6.708847999572754, -6.37607479095459, -6.043302059173584, -5.710529327392578, -5.377756595611572, -5.044983863830566, -4.712210655212402, -4.3794379234313965, -4.046665191650391, -3.7138922214508057, -3.3811192512512207, -3.048346519470215, -2.715573787689209, -2.382800817489624, -2.050027847290039, -1.7172551155090332, -1.3844822645187378, -1.0517094135284424, -0.7189364433288574, -0.38616275787353516, -0.053389906883239746, 0.27938294410705566, 0.6121557950973511, 0.9449286460876465, 1.277701497077942, 1.6104743480682373, 1.9432473182678223, 2.276020050048828, 2.608792781829834, 2.941565752029419, 3.274338722229004, 3.6071114540100098, 3.9398841857910156, 4.27265739440918, 4.6054301261901855, 4.938202857971191, 5.270975589752197, 5.603748321533203, 5.936521530151367, 6.269294261932373, 6.602066993713379, 6.934840202331543, 7.267612934112549, 7.600385665893555, 7.9331583976745605, 8.265931129455566, 8.59870433807373, 8.931476593017578, 9.264249801635742, 9.597023010253906, 9.92979621887207, 10.262568473815918]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 7.0, 6.0, 10.0, 14.0, 9.0, 25.0, 29.0, 43.0, 66.0, 104.0, 147.0, 246.0, 461.0, 738.0, 1326.0, 2726.0, 5492.0, 12816.0, 35309.0, 146460.0, 3331152.0, 545262.0, 73342.0, 21973.0, 8444.0, 3854.0, 1873.0, 974.0, 529.0, 307.0, 178.0, 111.0, 74.0, 54.0, 30.0, 20.0, 13.0, 11.0, 14.0, 7.0, 7.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.683013916015625, -2.58282470703125, -2.482635498046875, -2.3824462890625, -2.282257080078125, -2.18206787109375, -2.081878662109375, -1.981689453125, -1.881500244140625, -1.78131103515625, -1.681121826171875, -1.5809326171875, -1.480743408203125, -1.38055419921875, -1.280364990234375, -1.18017578125, -1.079986572265625, -0.97979736328125, -0.879608154296875, -0.7794189453125, -0.679229736328125, -0.57904052734375, -0.478851318359375, -0.378662109375, -0.278472900390625, -0.17828369140625, -0.078094482421875, 0.0220947265625, 0.122283935546875, 0.22247314453125, 0.322662353515625, 0.4228515625, 0.523040771484375, 0.62322998046875, 0.723419189453125, 0.8236083984375, 0.923797607421875, 1.02398681640625, 1.124176025390625, 1.224365234375, 1.324554443359375, 1.42474365234375, 1.524932861328125, 1.6251220703125, 1.725311279296875, 1.82550048828125, 1.925689697265625, 2.02587890625, 2.126068115234375, 2.22625732421875, 2.326446533203125, 2.4266357421875, 2.526824951171875, 2.62701416015625, 2.727203369140625, 2.827392578125, 2.927581787109375, 3.02777099609375, 3.127960205078125, 3.2281494140625, 3.328338623046875, 3.42852783203125, 3.528717041015625, 3.62890625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 5.0, 13.0, 19.0, 14.0, 25.0, 31.0, 23.0, 35.0, 38.0, 47.0, 44.0, 69.0, 51.0, 59.0, 56.0, 81.0, 56.0, 57.0, 49.0, 45.0, 37.0, 28.0, 27.0, 32.0, 14.0, 6.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65966796875, -0.6422653198242188, -0.6248626708984375, -0.6074600219726562, -0.590057373046875, -0.5726547241210938, -0.5552520751953125, -0.5378494262695312, -0.52044677734375, -0.5030441284179688, -0.4856414794921875, -0.46823883056640625, -0.450836181640625, -0.43343353271484375, -0.4160308837890625, -0.39862823486328125, -0.3812255859375, -0.36382293701171875, -0.3464202880859375, -0.32901763916015625, -0.311614990234375, -0.29421234130859375, -0.2768096923828125, -0.25940704345703125, -0.24200439453125, -0.22460174560546875, -0.2071990966796875, -0.18979644775390625, -0.172393798828125, -0.15499114990234375, -0.1375885009765625, -0.12018585205078125, -0.102783203125, -0.08538055419921875, -0.0679779052734375, -0.05057525634765625, -0.033172607421875, -0.01576995849609375, 0.0016326904296875, 0.01903533935546875, 0.03643798828125, 0.05384063720703125, 0.0712432861328125, 0.08864593505859375, 0.106048583984375, 0.12345123291015625, 0.1408538818359375, 0.15825653076171875, 0.1756591796875, 0.19306182861328125, 0.2104644775390625, 0.22786712646484375, 0.245269775390625, 0.26267242431640625, 0.2800750732421875, 0.29747772216796875, 0.31488037109375, 0.33228302001953125, 0.3496856689453125, 0.36708831787109375, 0.384490966796875, 0.40189361572265625, 0.4192962646484375, 0.43669891357421875, 0.4541015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 6.0, 14.0, 17.0, 26.0, 46.0, 65.0, 115.0, 147.0, 249.0, 422.0, 699.0, 1320.0, 2384.0, 4364.0, 9138.0, 20351.0, 50988.0, 160383.0, 1266590.0, 2383202.0, 192581.0, 57768.0, 22712.0, 10082.0, 4766.0, 2497.0, 1379.0, 759.0, 462.0, 250.0, 178.0, 101.0, 72.0, 38.0, 33.0, 19.0, 8.0, 12.0, 8.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.341796875, -2.2750091552734375, -2.208221435546875, -2.1414337158203125, -2.07464599609375, -2.0078582763671875, -1.941070556640625, -1.8742828369140625, -1.8074951171875, -1.7407073974609375, -1.673919677734375, -1.6071319580078125, -1.54034423828125, -1.4735565185546875, -1.406768798828125, -1.3399810791015625, -1.273193359375, -1.2064056396484375, -1.139617919921875, -1.0728302001953125, -1.00604248046875, -0.9392547607421875, -0.872467041015625, -0.8056793212890625, -0.7388916015625, -0.6721038818359375, -0.605316162109375, -0.5385284423828125, -0.47174072265625, -0.4049530029296875, -0.338165283203125, -0.2713775634765625, -0.20458984375, -0.1378021240234375, -0.071014404296875, -0.0042266845703125, 0.06256103515625, 0.1293487548828125, 0.196136474609375, 0.2629241943359375, 0.3297119140625, 0.3964996337890625, 0.463287353515625, 0.5300750732421875, 0.59686279296875, 0.6636505126953125, 0.730438232421875, 0.7972259521484375, 0.864013671875, 0.9308013916015625, 0.997589111328125, 1.0643768310546875, 1.13116455078125, 1.1979522705078125, 1.264739990234375, 1.3315277099609375, 1.3983154296875, 1.4651031494140625, 1.531890869140625, 1.5986785888671875, 1.66546630859375, 1.7322540283203125, 1.799041748046875, 1.8658294677734375, 1.9326171875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 9.0, 9.0, 10.0, 17.0, 17.0, 19.0, 31.0, 63.0, 69.0, 139.0, 230.0, 595.0, 1724.0, 524.0, 239.0, 133.0, 80.0, 54.0, 32.0, 28.0, 18.0, 8.0, 9.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3056640625, -1.258087158203125, -1.21051025390625, -1.162933349609375, -1.1153564453125, -1.067779541015625, -1.02020263671875, -0.972625732421875, -0.925048828125, -0.877471923828125, -0.82989501953125, -0.782318115234375, -0.7347412109375, -0.687164306640625, -0.63958740234375, -0.592010498046875, -0.54443359375, -0.496856689453125, -0.44927978515625, -0.401702880859375, -0.3541259765625, -0.306549072265625, -0.25897216796875, -0.211395263671875, -0.163818359375, -0.116241455078125, -0.06866455078125, -0.021087646484375, 0.0264892578125, 0.074066162109375, 0.12164306640625, 0.169219970703125, 0.216796875, 0.264373779296875, 0.31195068359375, 0.359527587890625, 0.4071044921875, 0.454681396484375, 0.50225830078125, 0.549835205078125, 0.597412109375, 0.644989013671875, 0.69256591796875, 0.740142822265625, 0.7877197265625, 0.835296630859375, 0.88287353515625, 0.930450439453125, 0.97802734375, 1.025604248046875, 1.07318115234375, 1.120758056640625, 1.1683349609375, 1.215911865234375, 1.26348876953125, 1.311065673828125, 1.358642578125, 1.406219482421875, 1.45379638671875, 1.501373291015625, 1.5489501953125, 1.596527099609375, 1.64410400390625, 1.691680908203125, 1.7392578125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 6.0, 23.0, 72.0, 246.0, 323.0, 223.0, 79.0, 24.0, 10.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.864779472351074, -5.06349515914917, -4.262210369110107, -3.460926055908203, -2.6596415042877197, -1.8583569526672363, -1.057072639465332, -0.25578784942626953, 0.5454964637756348, 1.3467810153961182, 2.1480655670166016, 2.949349880218506, 3.7506344318389893, 4.551918983459473, 5.353203296661377, 6.1544880867004395, 6.955772399902344, 7.757056713104248, 8.558341026306152, 9.359625816345215, 10.160910606384277, 10.962194442749023, 11.763479232788086, 12.564764022827148, 13.366048812866211, 14.167333602905273, 14.96861743927002, 15.769902229309082, 16.571186065673828, 17.37247085571289, 18.173755645751953, 18.975040435791016, 19.776323318481445, 20.577608108520508, 21.37889289855957, 22.18017578125, 22.981460571289062, 23.782745361328125, 24.584030151367188, 25.38531494140625, 26.186599731445312, 26.987884521484375, 27.789169311523438, 28.5904541015625, 29.39173698425293, 30.193021774291992, 30.994306564331055, 31.795591354370117, 32.59687423706055, 33.39815902709961, 34.19944381713867, 35.000728607177734, 35.8020133972168, 36.60329818725586, 37.404579162597656, 38.20586395263672, 39.00715255737305, 39.80843734741211, 40.60972213745117, 41.411006927490234, 42.2122917175293, 43.01357650756836, 43.814857482910156, 44.61614227294922, 45.41742706298828]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 12.0, 12.0, 17.0, 12.0, 11.0, 14.0, 18.0, 18.0, 19.0, 27.0, 31.0, 28.0, 33.0, 27.0, 30.0, 34.0, 28.0, 41.0, 49.0, 49.0, 22.0, 39.0, 46.0, 25.0, 31.0, 27.0, 23.0, 33.0, 29.0, 27.0, 19.0, 15.0, 19.0, 10.0, 14.0, 15.0, 15.0, 13.0, 10.0, 9.0, 5.0, 8.0, 8.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.676394462585449, -3.5574376583099365, -3.4384806156158447, -3.319523811340332, -3.2005670070648193, -3.0816102027893066, -2.962653160095215, -2.843696355819702, -2.7247395515441895, -2.6057827472686768, -2.486825704574585, -2.3678689002990723, -2.2489120960235596, -2.129955291748047, -2.010998249053955, -1.8920414447784424, -1.7730844020843506, -1.6541274785995483, -1.5351706743240356, -1.4162137508392334, -1.2972569465637207, -1.1783000230789185, -1.0593430995941162, -0.9403862357139587, -0.8214293718338013, -0.7024725079536438, -0.5835156440734863, -0.4645587205886841, -0.3456018567085266, -0.22664499282836914, -0.1076880693435669, 0.011268794536590576, 0.13022565841674805, 0.2491825371980667, 0.3681394159793854, 0.48709630966186523, 0.6060531735420227, 0.7250100374221802, 0.8439669609069824, 0.9629238247871399, 1.0818806886672974, 1.2008376121520996, 1.3197944164276123, 1.4387513399124146, 1.5577082633972168, 1.6766650676727295, 1.7956219911575317, 1.914578914642334, 2.0335357189178467, 2.1524925231933594, 2.271449565887451, 2.390406370162964, 2.5093631744384766, 2.6283202171325684, 2.747277021408081, 2.8662338256835938, 2.9851908683776855, 3.1041476726531982, 3.22310471534729, 3.3420615196228027, 3.4610183238983154, 3.579975128173828, 3.69893217086792, 3.8178889751434326, 3.9368457794189453]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 8.0, 8.0, 18.0, 17.0, 28.0, 37.0, 87.0, 118.0, 170.0, 300.0, 484.0, 830.0, 1477.0, 2739.0, 5395.0, 11117.0, 24479.0, 55576.0, 121637.0, 224591.0, 263886.0, 176835.0, 86428.0, 38324.0, 17140.0, 8023.0, 4028.0, 1994.0, 1092.0, 622.0, 360.0, 252.0, 139.0, 94.0, 63.0, 48.0, 23.0, 25.0, 14.0, 10.0, 6.0, 8.0, 7.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8896484375, -1.8311004638671875, -1.772552490234375, -1.7140045166015625, -1.65545654296875, -1.5969085693359375, -1.538360595703125, -1.4798126220703125, -1.4212646484375, -1.3627166748046875, -1.304168701171875, -1.2456207275390625, -1.18707275390625, -1.1285247802734375, -1.069976806640625, -1.0114288330078125, -0.952880859375, -0.8943328857421875, -0.835784912109375, -0.7772369384765625, -0.71868896484375, -0.6601409912109375, -0.601593017578125, -0.5430450439453125, -0.4844970703125, -0.4259490966796875, -0.367401123046875, -0.3088531494140625, -0.25030517578125, -0.1917572021484375, -0.133209228515625, -0.0746612548828125, -0.01611328125, 0.0424346923828125, 0.100982666015625, 0.1595306396484375, 0.21807861328125, 0.2766265869140625, 0.335174560546875, 0.3937225341796875, 0.4522705078125, 0.5108184814453125, 0.569366455078125, 0.6279144287109375, 0.68646240234375, 0.7450103759765625, 0.803558349609375, 0.8621063232421875, 0.920654296875, 0.9792022705078125, 1.037750244140625, 1.0962982177734375, 1.15484619140625, 1.2133941650390625, 1.271942138671875, 1.3304901123046875, 1.3890380859375, 1.4475860595703125, 1.506134033203125, 1.5646820068359375, 1.62322998046875, 1.6817779541015625, 1.740325927734375, 1.7988739013671875, 1.857421875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 4.0, 7.0, 12.0, 18.0, 10.0, 25.0, 21.0, 32.0, 38.0, 48.0, 42.0, 54.0, 40.0, 55.0, 66.0, 66.0, 67.0, 59.0, 43.0, 46.0, 46.0, 54.0, 29.0, 30.0, 26.0, 14.0, 15.0, 6.0, 12.0, 8.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.716796875, -0.6980705261230469, -0.6793441772460938, -0.6606178283691406, -0.6418914794921875, -0.6231651306152344, -0.6044387817382812, -0.5857124328613281, -0.566986083984375, -0.5482597351074219, -0.5295333862304688, -0.5108070373535156, -0.4920806884765625, -0.4733543395996094, -0.45462799072265625, -0.4359016418457031, -0.41717529296875, -0.3984489440917969, -0.37972259521484375, -0.3609962463378906, -0.3422698974609375, -0.3235435485839844, -0.30481719970703125, -0.2860908508300781, -0.267364501953125, -0.24863815307617188, -0.22991180419921875, -0.21118545532226562, -0.1924591064453125, -0.17373275756835938, -0.15500640869140625, -0.13628005981445312, -0.1175537109375, -0.09882736206054688, -0.08010101318359375, -0.061374664306640625, -0.0426483154296875, -0.023921966552734375, -0.00519561767578125, 0.013530731201171875, 0.032257080078125, 0.050983428955078125, 0.06970977783203125, 0.08843612670898438, 0.1071624755859375, 0.12588882446289062, 0.14461517333984375, 0.16334152221679688, 0.18206787109375, 0.20079421997070312, 0.21952056884765625, 0.23824691772460938, 0.2569732666015625, 0.2756996154785156, 0.29442596435546875, 0.3131523132324219, 0.331878662109375, 0.3506050109863281, 0.36933135986328125, 0.3880577087402344, 0.4067840576171875, 0.4255104064941406, 0.44423675537109375, 0.4629631042480469, 0.481689453125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 10.0, 8.0, 14.0, 21.0, 26.0, 33.0, 51.0, 85.0, 108.0, 165.0, 248.0, 382.0, 671.0, 1208.0, 2385.0, 4634.0, 10688.0, 25039.0, 61169.0, 141743.0, 263465.0, 272060.0, 149739.0, 65706.0, 26865.0, 11480.0, 4992.0, 2395.0, 1258.0, 687.0, 407.0, 244.0, 190.0, 118.0, 78.0, 51.0, 36.0, 30.0, 21.0, 22.0, 6.0, 3.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.80078125, -1.7478790283203125, -1.694976806640625, -1.6420745849609375, -1.58917236328125, -1.5362701416015625, -1.483367919921875, -1.4304656982421875, -1.3775634765625, -1.3246612548828125, -1.271759033203125, -1.2188568115234375, -1.16595458984375, -1.1130523681640625, -1.060150146484375, -1.0072479248046875, -0.954345703125, -0.9014434814453125, -0.848541259765625, -0.7956390380859375, -0.74273681640625, -0.6898345947265625, -0.636932373046875, -0.5840301513671875, -0.5311279296875, -0.4782257080078125, -0.425323486328125, -0.3724212646484375, -0.31951904296875, -0.2666168212890625, -0.213714599609375, -0.1608123779296875, -0.10791015625, -0.0550079345703125, -0.002105712890625, 0.0507965087890625, 0.10369873046875, 0.1566009521484375, 0.209503173828125, 0.2624053955078125, 0.3153076171875, 0.3682098388671875, 0.421112060546875, 0.4740142822265625, 0.52691650390625, 0.5798187255859375, 0.632720947265625, 0.6856231689453125, 0.738525390625, 0.7914276123046875, 0.844329833984375, 0.8972320556640625, 0.95013427734375, 1.0030364990234375, 1.055938720703125, 1.1088409423828125, 1.1617431640625, 1.2146453857421875, 1.267547607421875, 1.3204498291015625, 1.37335205078125, 1.4262542724609375, 1.479156494140625, 1.5320587158203125, 1.5849609375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 3.0, 7.0, 3.0, 3.0, 9.0, 9.0, 8.0, 23.0, 23.0, 15.0, 30.0, 29.0, 36.0, 41.0, 47.0, 45.0, 42.0, 40.0, 45.0, 50.0, 64.0, 40.0, 48.0, 44.0, 33.0, 36.0, 42.0, 25.0, 25.0, 27.0, 31.0, 12.0, 8.0, 9.0, 8.0, 12.0, 10.0, 7.0, 9.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.732421875, -2.65924072265625, -2.5860595703125, -2.51287841796875, -2.439697265625, -2.36651611328125, -2.2933349609375, -2.22015380859375, -2.14697265625, -2.07379150390625, -2.0006103515625, -1.92742919921875, -1.854248046875, -1.78106689453125, -1.7078857421875, -1.63470458984375, -1.5615234375, -1.48834228515625, -1.4151611328125, -1.34197998046875, -1.268798828125, -1.19561767578125, -1.1224365234375, -1.04925537109375, -0.97607421875, -0.90289306640625, -0.8297119140625, -0.75653076171875, -0.683349609375, -0.61016845703125, -0.5369873046875, -0.46380615234375, -0.390625, -0.31744384765625, -0.2442626953125, -0.17108154296875, -0.097900390625, -0.02471923828125, 0.0484619140625, 0.12164306640625, 0.19482421875, 0.26800537109375, 0.3411865234375, 0.41436767578125, 0.487548828125, 0.56072998046875, 0.6339111328125, 0.70709228515625, 0.7802734375, 0.85345458984375, 0.9266357421875, 0.99981689453125, 1.072998046875, 1.14617919921875, 1.2193603515625, 1.29254150390625, 1.36572265625, 1.43890380859375, 1.5120849609375, 1.58526611328125, 1.658447265625, 1.73162841796875, 1.8048095703125, 1.87799072265625, 1.951171875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 8.0, 4.0, 3.0, 11.0, 19.0, 24.0, 34.0, 28.0, 56.0, 96.0, 146.0, 231.0, 402.0, 788.0, 1383.0, 3050.0, 6800.0, 17478.0, 52700.0, 166783.0, 393050.0, 267486.0, 90144.0, 28926.0, 10290.0, 4237.0, 2032.0, 1038.0, 528.0, 291.0, 163.0, 105.0, 86.0, 44.0, 18.0, 32.0, 19.0, 9.0, 5.0, 3.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81640625, -0.780487060546875, -0.74456787109375, -0.708648681640625, -0.6727294921875, -0.636810302734375, -0.60089111328125, -0.564971923828125, -0.529052734375, -0.493133544921875, -0.45721435546875, -0.421295166015625, -0.3853759765625, -0.349456787109375, -0.31353759765625, -0.277618408203125, -0.24169921875, -0.205780029296875, -0.16986083984375, -0.133941650390625, -0.0980224609375, -0.062103271484375, -0.02618408203125, 0.009735107421875, 0.045654296875, 0.081573486328125, 0.11749267578125, 0.153411865234375, 0.1893310546875, 0.225250244140625, 0.26116943359375, 0.297088623046875, 0.3330078125, 0.368927001953125, 0.40484619140625, 0.440765380859375, 0.4766845703125, 0.512603759765625, 0.54852294921875, 0.584442138671875, 0.620361328125, 0.656280517578125, 0.69219970703125, 0.728118896484375, 0.7640380859375, 0.799957275390625, 0.83587646484375, 0.871795654296875, 0.90771484375, 0.943634033203125, 0.97955322265625, 1.015472412109375, 1.0513916015625, 1.087310791015625, 1.12322998046875, 1.159149169921875, 1.195068359375, 1.230987548828125, 1.26690673828125, 1.302825927734375, 1.3387451171875, 1.374664306640625, 1.41058349609375, 1.446502685546875, 1.482421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 4.0, 4.0, 6.0, 4.0, 11.0, 3.0, 16.0, 18.0, 23.0, 24.0, 35.0, 43.0, 61.0, 64.0, 72.0, 72.0, 76.0, 65.0, 67.0, 67.0, 56.0, 39.0, 34.0, 32.0, 27.0, 16.0, 19.0, 9.0, 11.0, 4.0, 4.0, 0.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018477439880371094, -0.00017854012548923492, -0.0001723058521747589, -0.0001660715788602829, -0.00015983730554580688, -0.00015360303223133087, -0.00014736875891685486, -0.00014113448560237885, -0.00013490021228790283, -0.00012866593897342682, -0.0001224316656589508, -0.00011619739234447479, -0.00010996311902999878, -0.00010372884571552277, -9.749457240104675e-05, -9.126029908657074e-05, -8.502602577209473e-05, -7.879175245761871e-05, -7.25574791431427e-05, -6.632320582866669e-05, -6.0088932514190674e-05, -5.385465919971466e-05, -4.762038588523865e-05, -4.1386112570762634e-05, -3.515183925628662e-05, -2.8917565941810608e-05, -2.2683292627334595e-05, -1.644901931285858e-05, -1.0214745998382568e-05, -3.980472683906555e-06, 2.253800630569458e-06, 8.488073945045471e-06, 1.4722347259521484e-05, 2.0956620573997498e-05, 2.719089388847351e-05, 3.3425167202949524e-05, 3.965944051742554e-05, 4.589371383190155e-05, 5.2127987146377563e-05, 5.836226046085358e-05, 6.459653377532959e-05, 7.08308070898056e-05, 7.706508040428162e-05, 8.329935371875763e-05, 8.953362703323364e-05, 9.576790034770966e-05, 0.00010200217366218567, 0.00010823644697666168, 0.0001144707202911377, 0.00012070499360561371, 0.00012693926692008972, 0.00013317354023456573, 0.00013940781354904175, 0.00014564208686351776, 0.00015187636017799377, 0.0001581106334924698, 0.0001643449068069458, 0.00017057918012142181, 0.00017681345343589783, 0.00018304772675037384, 0.00018928200006484985, 0.00019551627337932587, 0.00020175054669380188, 0.0002079848200082779, 0.0002142190933227539]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 6.0, 14.0, 18.0, 26.0, 45.0, 111.0, 205.0, 473.0, 1256.0, 4063.0, 19787.0, 144421.0, 619526.0, 220953.0, 29298.0, 5567.0, 1662.0, 585.0, 279.0, 125.0, 48.0, 25.0, 17.0, 23.0, 11.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5009765625, -1.4373931884765625, -1.373809814453125, -1.3102264404296875, -1.24664306640625, -1.1830596923828125, -1.119476318359375, -1.0558929443359375, -0.9923095703125, -0.9287261962890625, -0.865142822265625, -0.8015594482421875, -0.73797607421875, -0.6743927001953125, -0.610809326171875, -0.5472259521484375, -0.483642578125, -0.4200592041015625, -0.356475830078125, -0.2928924560546875, -0.22930908203125, -0.1657257080078125, -0.102142333984375, -0.0385589599609375, 0.0250244140625, 0.0886077880859375, 0.152191162109375, 0.2157745361328125, 0.27935791015625, 0.3429412841796875, 0.406524658203125, 0.4701080322265625, 0.53369140625, 0.5972747802734375, 0.660858154296875, 0.7244415283203125, 0.78802490234375, 0.8516082763671875, 0.915191650390625, 0.9787750244140625, 1.0423583984375, 1.1059417724609375, 1.169525146484375, 1.2331085205078125, 1.29669189453125, 1.3602752685546875, 1.423858642578125, 1.4874420166015625, 1.551025390625, 1.6146087646484375, 1.678192138671875, 1.7417755126953125, 1.80535888671875, 1.8689422607421875, 1.932525634765625, 1.9961090087890625, 2.0596923828125, 2.1232757568359375, 2.186859130859375, 2.2504425048828125, 2.31402587890625, 2.3776092529296875, 2.441192626953125, 2.5047760009765625, 2.568359375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 3.0, 6.0, 8.0, 7.0, 11.0, 25.0, 29.0, 41.0, 54.0, 61.0, 83.0, 100.0, 112.0, 102.0, 81.0, 68.0, 62.0, 30.0, 33.0, 30.0, 18.0, 13.0, 6.0, 3.0, 4.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6904296875, -1.6334686279296875, -1.576507568359375, -1.5195465087890625, -1.46258544921875, -1.4056243896484375, -1.348663330078125, -1.2917022705078125, -1.2347412109375, -1.1777801513671875, -1.120819091796875, -1.0638580322265625, -1.00689697265625, -0.9499359130859375, -0.892974853515625, -0.8360137939453125, -0.779052734375, -0.7220916748046875, -0.665130615234375, -0.6081695556640625, -0.55120849609375, -0.4942474365234375, -0.437286376953125, -0.3803253173828125, -0.3233642578125, -0.2664031982421875, -0.209442138671875, -0.1524810791015625, -0.09552001953125, -0.0385589599609375, 0.018402099609375, 0.0753631591796875, 0.13232421875, 0.1892852783203125, 0.246246337890625, 0.3032073974609375, 0.36016845703125, 0.4171295166015625, 0.474090576171875, 0.5310516357421875, 0.5880126953125, 0.6449737548828125, 0.701934814453125, 0.7588958740234375, 0.81585693359375, 0.8728179931640625, 0.929779052734375, 0.9867401123046875, 1.043701171875, 1.1006622314453125, 1.157623291015625, 1.2145843505859375, 1.27154541015625, 1.3285064697265625, 1.385467529296875, 1.4424285888671875, 1.4993896484375, 1.5563507080078125, 1.613311767578125, 1.6702728271484375, 1.72723388671875, 1.7841949462890625, 1.841156005859375, 1.8981170654296875, 1.955078125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 26.0, 52.0, 131.0, 221.0, 241.0, 186.0, 82.0, 37.0, 19.0, 9.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.51769256591797, -63.180030822753906, -61.842369079589844, -60.50471115112305, -59.167049407958984, -57.82938766479492, -56.491729736328125, -55.15406799316406, -53.81640625, -52.47874450683594, -51.141082763671875, -49.80342483520508, -48.465763092041016, -47.12810134887695, -45.790443420410156, -44.452781677246094, -43.11511993408203, -41.77745819091797, -40.439796447753906, -39.10213851928711, -37.76447677612305, -36.426815032958984, -35.08915710449219, -33.751495361328125, -32.41383361816406, -31.076171875, -29.73851203918457, -28.40085220336914, -27.063190460205078, -25.725528717041016, -24.387868881225586, -23.050209045410156, -21.712547302246094, -20.37488555908203, -19.0372257232666, -17.699565887451172, -16.36190414428711, -15.024243354797363, -13.686582565307617, -12.348921775817871, -11.011260986328125, -9.673600196838379, -8.335939407348633, -6.998278617858887, -5.660617828369141, -4.3229570388793945, -2.9852962493896484, -1.6476354598999023, -0.30997467041015625, 1.0276861190795898, 2.365346908569336, 3.703007698059082, 5.040668487548828, 6.378329277038574, 7.71599006652832, 9.053650856018066, 10.391311645507812, 11.728972434997559, 13.066633224487305, 14.40429401397705, 15.741954803466797, 17.07961654663086, 18.41727638244629, 19.75493621826172, 21.09259796142578]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 7.0, 4.0, 9.0, 14.0, 18.0, 7.0, 19.0, 14.0, 29.0, 27.0, 30.0, 29.0, 30.0, 48.0, 42.0, 43.0, 50.0, 40.0, 59.0, 48.0, 34.0, 48.0, 56.0, 33.0, 47.0, 25.0, 39.0, 25.0, 16.0, 21.0, 26.0, 9.0, 11.0, 8.0, 10.0, 10.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.099786758422852, -11.729218482971191, -11.358649253845215, -10.988080978393555, -10.617511749267578, -10.246943473815918, -9.876375198364258, -9.505805969238281, -9.135237693786621, -8.764669418334961, -8.394100189208984, -8.023531913757324, -7.652963161468506, -7.2823944091796875, -6.911826133728027, -6.541257381439209, -6.170688629150391, -5.800119876861572, -5.429551124572754, -5.058982849121094, -4.688414096832275, -4.317845344543457, -3.9472768306732178, -3.5767083168029785, -3.20613956451416, -2.835570812225342, -2.4650022983551025, -2.0944337844848633, -1.723865032196045, -1.3532963991165161, -0.9827277660369873, -0.612159252166748, -0.24158954620361328, 0.12897908687591553, 0.49954771995544434, 0.8701163530349731, 1.240684986114502, 1.6112536191940308, 1.9818222522735596, 2.352390766143799, 2.722959518432617, 3.0935282707214355, 3.464096784591675, 3.834665298461914, 4.205234050750732, 4.575802803039551, 4.946371078491211, 5.316939830780029, 5.687508583068848, 6.058077335357666, 6.428646087646484, 6.7992143630981445, 7.169783115386963, 7.540351867675781, 7.910920143127441, 8.281488418579102, 8.652057647705078, 9.022625923156738, 9.393195152282715, 9.763763427734375, 10.134332656860352, 10.504900932312012, 10.875469207763672, 11.246038436889648, 11.616606712341309]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 3.0, 11.0, 7.0, 17.0, 21.0, 29.0, 46.0, 64.0, 87.0, 165.0, 272.0, 539.0, 992.0, 2293.0, 6382.0, 28523.0, 4006648.0, 126739.0, 14105.0, 4050.0, 1549.0, 745.0, 362.0, 221.0, 127.0, 94.0, 44.0, 39.0, 28.0, 17.0, 13.0, 11.0, 5.0, 6.0, 2.0, 3.0, 3.0, 7.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.703125, -5.52374267578125, -5.3443603515625, -5.16497802734375, -4.985595703125, -4.80621337890625, -4.6268310546875, -4.44744873046875, -4.26806640625, -4.08868408203125, -3.9093017578125, -3.72991943359375, -3.550537109375, -3.37115478515625, -3.1917724609375, -3.01239013671875, -2.8330078125, -2.65362548828125, -2.4742431640625, -2.29486083984375, -2.115478515625, -1.93609619140625, -1.7567138671875, -1.57733154296875, -1.39794921875, -1.21856689453125, -1.0391845703125, -0.85980224609375, -0.680419921875, -0.50103759765625, -0.3216552734375, -0.14227294921875, 0.037109375, 0.21649169921875, 0.3958740234375, 0.57525634765625, 0.754638671875, 0.93402099609375, 1.1134033203125, 1.29278564453125, 1.47216796875, 1.65155029296875, 1.8309326171875, 2.01031494140625, 2.189697265625, 2.36907958984375, 2.5484619140625, 2.72784423828125, 2.9072265625, 3.08660888671875, 3.2659912109375, 3.44537353515625, 3.624755859375, 3.80413818359375, 3.9835205078125, 4.16290283203125, 4.34228515625, 4.52166748046875, 4.7010498046875, 4.88043212890625, 5.059814453125, 5.23919677734375, 5.4185791015625, 5.59796142578125, 5.77734375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 6.0, 8.0, 10.0, 16.0, 13.0, 15.0, 27.0, 31.0, 23.0, 33.0, 33.0, 51.0, 63.0, 38.0, 40.0, 42.0, 54.0, 45.0, 51.0, 54.0, 53.0, 29.0, 35.0, 36.0, 33.0, 29.0, 25.0, 14.0, 20.0, 10.0, 16.0, 8.0, 4.0, 6.0, 4.0, 5.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.61279296875, -0.5956153869628906, -0.5784378051757812, -0.5612602233886719, -0.5440826416015625, -0.5269050598144531, -0.5097274780273438, -0.4925498962402344, -0.475372314453125, -0.4581947326660156, -0.44101715087890625, -0.4238395690917969, -0.4066619873046875, -0.3894844055175781, -0.37230682373046875, -0.3551292419433594, -0.33795166015625, -0.3207740783691406, -0.30359649658203125, -0.2864189147949219, -0.2692413330078125, -0.2520637512207031, -0.23488616943359375, -0.21770858764648438, -0.200531005859375, -0.18335342407226562, -0.16617584228515625, -0.14899826049804688, -0.1318206787109375, -0.11464309692382812, -0.09746551513671875, -0.08028793334960938, -0.0631103515625, -0.045932769775390625, -0.02875518798828125, -0.011577606201171875, 0.0055999755859375, 0.022777557373046875, 0.03995513916015625, 0.057132720947265625, 0.074310302734375, 0.09148788452148438, 0.10866546630859375, 0.12584304809570312, 0.1430206298828125, 0.16019821166992188, 0.17737579345703125, 0.19455337524414062, 0.21173095703125, 0.22890853881835938, 0.24608612060546875, 0.2632637023925781, 0.2804412841796875, 0.2976188659667969, 0.31479644775390625, 0.3319740295410156, 0.349151611328125, 0.3663291931152344, 0.38350677490234375, 0.4006843566894531, 0.4178619384765625, 0.4350395202636719, 0.45221710205078125, 0.4693946838378906, 0.486572265625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 17.0, 28.0, 49.0, 90.0, 154.0, 244.0, 443.0, 906.0, 2038.0, 5004.0, 14438.0, 61843.0, 3882280.0, 186196.0, 26989.0, 8038.0, 2861.0, 1333.0, 566.0, 329.0, 182.0, 109.0, 60.0, 37.0, 26.0, 12.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.30859375, -3.204345703125, -3.10009765625, -2.995849609375, -2.8916015625, -2.787353515625, -2.68310546875, -2.578857421875, -2.474609375, -2.370361328125, -2.26611328125, -2.161865234375, -2.0576171875, -1.953369140625, -1.84912109375, -1.744873046875, -1.640625, -1.536376953125, -1.43212890625, -1.327880859375, -1.2236328125, -1.119384765625, -1.01513671875, -0.910888671875, -0.806640625, -0.702392578125, -0.59814453125, -0.493896484375, -0.3896484375, -0.285400390625, -0.18115234375, -0.076904296875, 0.02734375, 0.131591796875, 0.23583984375, 0.340087890625, 0.4443359375, 0.548583984375, 0.65283203125, 0.757080078125, 0.861328125, 0.965576171875, 1.06982421875, 1.174072265625, 1.2783203125, 1.382568359375, 1.48681640625, 1.591064453125, 1.6953125, 1.799560546875, 1.90380859375, 2.008056640625, 2.1123046875, 2.216552734375, 2.32080078125, 2.425048828125, 2.529296875, 2.633544921875, 2.73779296875, 2.842041015625, 2.9462890625, 3.050537109375, 3.15478515625, 3.259033203125, 3.36328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 3.0, 9.0, 10.0, 9.0, 15.0, 27.0, 45.0, 57.0, 80.0, 239.0, 3115.0, 179.0, 82.0, 51.0, 36.0, 25.0, 19.0, 11.0, 10.0, 4.0, 3.0, 6.0, 3.0, 1.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3857421875, -0.3711090087890625, -0.356475830078125, -0.3418426513671875, -0.32720947265625, -0.3125762939453125, -0.297943115234375, -0.2833099365234375, -0.2686767578125, -0.2540435791015625, -0.239410400390625, -0.2247772216796875, -0.21014404296875, -0.1955108642578125, -0.180877685546875, -0.1662445068359375, -0.151611328125, -0.1369781494140625, -0.122344970703125, -0.1077117919921875, -0.09307861328125, -0.0784454345703125, -0.063812255859375, -0.0491790771484375, -0.0345458984375, -0.0199127197265625, -0.005279541015625, 0.0093536376953125, 0.02398681640625, 0.0386199951171875, 0.053253173828125, 0.0678863525390625, 0.08251953125, 0.0971527099609375, 0.111785888671875, 0.1264190673828125, 0.14105224609375, 0.1556854248046875, 0.170318603515625, 0.1849517822265625, 0.1995849609375, 0.2142181396484375, 0.228851318359375, 0.2434844970703125, 0.25811767578125, 0.2727508544921875, 0.287384033203125, 0.3020172119140625, 0.316650390625, 0.3312835693359375, 0.345916748046875, 0.3605499267578125, 0.37518310546875, 0.3898162841796875, 0.404449462890625, 0.4190826416015625, 0.4337158203125, 0.4483489990234375, 0.462982177734375, 0.4776153564453125, 0.49224853515625, 0.5068817138671875, 0.521514892578125, 0.5361480712890625, 0.55078125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 15.0, 33.0, 34.0, 59.0, 94.0, 114.0, 134.0, 132.0, 126.0, 79.0, 69.0, 47.0, 26.0, 18.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.540987968444824, -2.4557275772094727, -2.370467185974121, -2.2852065563201904, -2.199946165084839, -2.1146857738494873, -2.0294251441955566, -1.944164752960205, -1.8589043617248535, -1.773643970489502, -1.6883834600448608, -1.6031229496002197, -1.5178625583648682, -1.4326021671295166, -1.3473416566848755, -1.2620811462402344, -1.1768207550048828, -1.0915603637695312, -1.0062998533248901, -0.9210394024848938, -0.8357789516448975, -0.7505185008049011, -0.6652580499649048, -0.5799975991249084, -0.4947371482849121, -0.40947669744491577, -0.32421624660491943, -0.2389557957649231, -0.15369534492492676, -0.06843489408493042, 0.016825556755065918, 0.10208600759506226, 0.1873464584350586, 0.27260690927505493, 0.35786736011505127, 0.4431278109550476, 0.528388261795044, 0.6136487126350403, 0.6989091634750366, 0.784169614315033, 0.8694300651550293, 0.9546905159950256, 1.039950966835022, 1.125211477279663, 1.2104718685150146, 1.2957322597503662, 1.3809927701950073, 1.4662532806396484, 1.551513671875, 1.6367740631103516, 1.7220345735549927, 1.8072950839996338, 1.8925554752349854, 1.977815866470337, 2.0630764961242676, 2.148336887359619, 2.2335972785949707, 2.3188576698303223, 2.404118061065674, 2.4893786907196045, 2.574639081954956, 2.6598994731903076, 2.7451601028442383, 2.83042049407959, 2.9156808853149414]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 10.0, 8.0, 6.0, 12.0, 22.0, 25.0, 29.0, 34.0, 27.0, 33.0, 40.0, 42.0, 41.0, 42.0, 43.0, 46.0, 40.0, 46.0, 49.0, 37.0, 41.0, 41.0, 35.0, 46.0, 28.0, 21.0, 28.0, 23.0, 18.0, 16.0, 17.0, 13.0, 9.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4903054237365723, -1.4488273859024048, -1.4073494672775269, -1.3658714294433594, -1.3243935108184814, -1.282915472984314, -1.241437554359436, -1.1999595165252686, -1.1584815979003906, -1.1170035600662231, -1.0755256414413452, -1.0340476036071777, -0.9925696849822998, -0.9510917067527771, -0.9096137285232544, -0.8681356906890869, -0.8266577124595642, -0.7851797342300415, -0.7437017560005188, -0.7022237777709961, -0.6607457995414734, -0.6192678213119507, -0.5777897834777832, -0.5363118648529053, -0.4948338568210602, -0.4533558785915375, -0.41187790036201477, -0.3703998923301697, -0.328921914100647, -0.28744393587112427, -0.24596595764160156, -0.20448797941207886, -0.16301000118255615, -0.12153202295303345, -0.08005403727293015, -0.03857605159282684, 0.002901926636695862, 0.04437990486621857, 0.08585789799690247, 0.12733587622642517, 0.16881385445594788, 0.21029183268547058, 0.2517698109149933, 0.2932478189468384, 0.3347257971763611, 0.3762037754058838, 0.4176817536354065, 0.4591597318649292, 0.5006377100944519, 0.5421156883239746, 0.5835936665534973, 0.62507164478302, 0.6665496230125427, 0.7080276012420654, 0.7495056390762329, 0.7909835577011108, 0.8324615955352783, 0.873939573764801, 0.9154175519943237, 0.9568955302238464, 0.9983735084533691, 1.0398515462875366, 1.0813294649124146, 1.122807502746582, 1.16428542137146]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 13.0, 9.0, 10.0, 18.0, 27.0, 39.0, 47.0, 89.0, 146.0, 229.0, 408.0, 724.0, 1327.0, 2547.0, 5141.0, 10535.0, 22116.0, 45527.0, 90616.0, 167172.0, 237988.0, 210620.0, 125781.0, 64931.0, 32028.0, 15341.0, 7469.0, 3599.0, 1742.0, 992.0, 493.0, 304.0, 201.0, 114.0, 70.0, 51.0, 26.0, 13.0, 17.0, 12.0, 5.0, 7.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.5693359375, -1.5228424072265625, -1.476348876953125, -1.4298553466796875, -1.38336181640625, -1.3368682861328125, -1.290374755859375, -1.2438812255859375, -1.1973876953125, -1.1508941650390625, -1.104400634765625, -1.0579071044921875, -1.01141357421875, -0.9649200439453125, -0.918426513671875, -0.8719329833984375, -0.825439453125, -0.7789459228515625, -0.732452392578125, -0.6859588623046875, -0.63946533203125, -0.5929718017578125, -0.546478271484375, -0.4999847412109375, -0.4534912109375, -0.4069976806640625, -0.360504150390625, -0.3140106201171875, -0.26751708984375, -0.2210235595703125, -0.174530029296875, -0.1280364990234375, -0.08154296875, -0.0350494384765625, 0.011444091796875, 0.0579376220703125, 0.10443115234375, 0.1509246826171875, 0.197418212890625, 0.2439117431640625, 0.2904052734375, 0.3368988037109375, 0.383392333984375, 0.4298858642578125, 0.47637939453125, 0.5228729248046875, 0.569366455078125, 0.6158599853515625, 0.662353515625, 0.7088470458984375, 0.755340576171875, 0.8018341064453125, 0.84832763671875, 0.8948211669921875, 0.941314697265625, 0.9878082275390625, 1.0343017578125, 1.0807952880859375, 1.127288818359375, 1.1737823486328125, 1.22027587890625, 1.2667694091796875, 1.313262939453125, 1.3597564697265625, 1.40625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 9.0, 12.0, 10.0, 13.0, 15.0, 25.0, 27.0, 29.0, 32.0, 39.0, 30.0, 42.0, 56.0, 38.0, 66.0, 49.0, 57.0, 56.0, 40.0, 54.0, 53.0, 36.0, 36.0, 29.0, 23.0, 26.0, 24.0, 13.0, 20.0, 7.0, 15.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69189453125, -0.6720809936523438, -0.6522674560546875, -0.6324539184570312, -0.612640380859375, -0.5928268432617188, -0.5730133056640625, -0.5531997680664062, -0.53338623046875, -0.5135726928710938, -0.4937591552734375, -0.47394561767578125, -0.454132080078125, -0.43431854248046875, -0.4145050048828125, -0.39469146728515625, -0.3748779296875, -0.35506439208984375, -0.3352508544921875, -0.31543731689453125, -0.295623779296875, -0.27581024169921875, -0.2559967041015625, -0.23618316650390625, -0.21636962890625, -0.19655609130859375, -0.1767425537109375, -0.15692901611328125, -0.137115478515625, -0.11730194091796875, -0.0974884033203125, -0.07767486572265625, -0.057861328125, -0.03804779052734375, -0.0182342529296875, 0.00157928466796875, 0.021392822265625, 0.04120635986328125, 0.0610198974609375, 0.08083343505859375, 0.10064697265625, 0.12046051025390625, 0.1402740478515625, 0.16008758544921875, 0.179901123046875, 0.19971466064453125, 0.2195281982421875, 0.23934173583984375, 0.2591552734375, 0.27896881103515625, 0.2987823486328125, 0.31859588623046875, 0.338409423828125, 0.35822296142578125, 0.3780364990234375, 0.39785003662109375, 0.41766357421875, 0.43747711181640625, 0.4572906494140625, 0.47710418701171875, 0.496917724609375, 0.5167312622070312, 0.5365447998046875, 0.5563583374023438, 0.576171875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 9.0, 13.0, 17.0, 26.0, 35.0, 50.0, 72.0, 86.0, 129.0, 192.0, 252.0, 416.0, 647.0, 1169.0, 2246.0, 4939.0, 12002.0, 30297.0, 79565.0, 199751.0, 357159.0, 215740.0, 86419.0, 33144.0, 12983.0, 5462.0, 2421.0, 1269.0, 698.0, 405.0, 276.0, 192.0, 137.0, 95.0, 59.0, 40.0, 42.0, 30.0, 14.0, 11.0, 12.0, 12.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5390625, -1.486968994140625, -1.43487548828125, -1.382781982421875, -1.3306884765625, -1.278594970703125, -1.22650146484375, -1.174407958984375, -1.122314453125, -1.070220947265625, -1.01812744140625, -0.966033935546875, -0.9139404296875, -0.861846923828125, -0.80975341796875, -0.757659912109375, -0.70556640625, -0.653472900390625, -0.60137939453125, -0.549285888671875, -0.4971923828125, -0.445098876953125, -0.39300537109375, -0.340911865234375, -0.288818359375, -0.236724853515625, -0.18463134765625, -0.132537841796875, -0.0804443359375, -0.028350830078125, 0.02374267578125, 0.075836181640625, 0.1279296875, 0.180023193359375, 0.23211669921875, 0.284210205078125, 0.3363037109375, 0.388397216796875, 0.44049072265625, 0.492584228515625, 0.544677734375, 0.596771240234375, 0.64886474609375, 0.700958251953125, 0.7530517578125, 0.805145263671875, 0.85723876953125, 0.909332275390625, 0.96142578125, 1.013519287109375, 1.06561279296875, 1.117706298828125, 1.1697998046875, 1.221893310546875, 1.27398681640625, 1.326080322265625, 1.378173828125, 1.430267333984375, 1.48236083984375, 1.534454345703125, 1.5865478515625, 1.638641357421875, 1.69073486328125, 1.742828369140625, 1.794921875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 3.0, 5.0, 8.0, 7.0, 15.0, 12.0, 19.0, 16.0, 17.0, 24.0, 18.0, 26.0, 31.0, 39.0, 45.0, 34.0, 32.0, 36.0, 41.0, 38.0, 48.0, 39.0, 52.0, 44.0, 39.0, 48.0, 39.0, 33.0, 33.0, 23.0, 19.0, 18.0, 15.0, 14.0, 9.0, 7.0, 7.0, 10.0, 5.0, 10.0, 4.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.5078125, -2.432098388671875, -2.35638427734375, -2.280670166015625, -2.2049560546875, -2.129241943359375, -2.05352783203125, -1.977813720703125, -1.902099609375, -1.826385498046875, -1.75067138671875, -1.674957275390625, -1.5992431640625, -1.523529052734375, -1.44781494140625, -1.372100830078125, -1.29638671875, -1.220672607421875, -1.14495849609375, -1.069244384765625, -0.9935302734375, -0.917816162109375, -0.84210205078125, -0.766387939453125, -0.690673828125, -0.614959716796875, -0.53924560546875, -0.463531494140625, -0.3878173828125, -0.312103271484375, -0.23638916015625, -0.160675048828125, -0.0849609375, -0.009246826171875, 0.06646728515625, 0.142181396484375, 0.2178955078125, 0.293609619140625, 0.36932373046875, 0.445037841796875, 0.520751953125, 0.596466064453125, 0.67218017578125, 0.747894287109375, 0.8236083984375, 0.899322509765625, 0.97503662109375, 1.050750732421875, 1.12646484375, 1.202178955078125, 1.27789306640625, 1.353607177734375, 1.4293212890625, 1.505035400390625, 1.58074951171875, 1.656463623046875, 1.732177734375, 1.807891845703125, 1.88360595703125, 1.959320068359375, 2.0350341796875, 2.110748291015625, 2.18646240234375, 2.262176513671875, 2.337890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 6.0, 10.0, 12.0, 20.0, 36.0, 48.0, 71.0, 135.0, 244.0, 451.0, 906.0, 1873.0, 4507.0, 13006.0, 45117.0, 181906.0, 495198.0, 224754.0, 55257.0, 15506.0, 5218.0, 2122.0, 1001.0, 467.0, 286.0, 162.0, 89.0, 57.0, 30.0, 26.0, 13.0, 9.0, 8.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.05859375, -1.0239715576171875, -0.989349365234375, -0.9547271728515625, -0.92010498046875, -0.8854827880859375, -0.850860595703125, -0.8162384033203125, -0.7816162109375, -0.7469940185546875, -0.712371826171875, -0.6777496337890625, -0.64312744140625, -0.6085052490234375, -0.573883056640625, -0.5392608642578125, -0.504638671875, -0.4700164794921875, -0.435394287109375, -0.4007720947265625, -0.36614990234375, -0.3315277099609375, -0.296905517578125, -0.2622833251953125, -0.2276611328125, -0.1930389404296875, -0.158416748046875, -0.1237945556640625, -0.08917236328125, -0.0545501708984375, -0.019927978515625, 0.0146942138671875, 0.04931640625, 0.0839385986328125, 0.118560791015625, 0.1531829833984375, 0.18780517578125, 0.2224273681640625, 0.257049560546875, 0.2916717529296875, 0.3262939453125, 0.3609161376953125, 0.395538330078125, 0.4301605224609375, 0.46478271484375, 0.4994049072265625, 0.534027099609375, 0.5686492919921875, 0.603271484375, 0.6378936767578125, 0.672515869140625, 0.7071380615234375, 0.74176025390625, 0.7763824462890625, 0.811004638671875, 0.8456268310546875, 0.8802490234375, 0.9148712158203125, 0.949493408203125, 0.9841156005859375, 1.01873779296875, 1.0533599853515625, 1.087982177734375, 1.1226043701171875, 1.1572265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 7.0, 7.0, 4.0, 8.0, 16.0, 23.0, 16.0, 28.0, 30.0, 31.0, 30.0, 42.0, 44.0, 44.0, 54.0, 58.0, 54.0, 66.0, 73.0, 55.0, 53.0, 40.0, 46.0, 32.0, 24.0, 18.0, 16.0, 10.0, 19.0, 11.0, 5.0, 7.0, 5.0, 9.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.00014901161193847656, -0.0001446940004825592, -0.00014037638902664185, -0.0001360587775707245, -0.00013174116611480713, -0.00012742355465888977, -0.0001231059432029724, -0.00011878833174705505, -0.0001144707202911377, -0.00011015310883522034, -0.00010583549737930298, -0.00010151788592338562, -9.720027446746826e-05, -9.28826630115509e-05, -8.856505155563354e-05, -8.424744009971619e-05, -7.992982864379883e-05, -7.561221718788147e-05, -7.129460573196411e-05, -6.697699427604675e-05, -6.26593828201294e-05, -5.8341771364212036e-05, -5.402415990829468e-05, -4.970654845237732e-05, -4.538893699645996e-05, -4.10713255405426e-05, -3.6753714084625244e-05, -3.2436102628707886e-05, -2.8118491172790527e-05, -2.380087971687317e-05, -1.948326826095581e-05, -1.5165656805038452e-05, -1.0848045349121094e-05, -6.530433893203735e-06, -2.212822437286377e-06, 2.1047890186309814e-06, 6.42240047454834e-06, 1.0740011930465698e-05, 1.5057623386383057e-05, 1.9375234842300415e-05, 2.3692846298217773e-05, 2.8010457754135132e-05, 3.232806921005249e-05, 3.664568066596985e-05, 4.096329212188721e-05, 4.5280903577804565e-05, 4.9598515033721924e-05, 5.391612648963928e-05, 5.823373794555664e-05, 6.2551349401474e-05, 6.686896085739136e-05, 7.118657231330872e-05, 7.550418376922607e-05, 7.982179522514343e-05, 8.413940668106079e-05, 8.845701813697815e-05, 9.277462959289551e-05, 9.709224104881287e-05, 0.00010140985250473022, 0.00010572746396064758, 0.00011004507541656494, 0.0001143626868724823, 0.00011868029832839966, 0.00012299790978431702, 0.00012731552124023438]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 8.0, 9.0, 15.0, 30.0, 53.0, 72.0, 167.0, 247.0, 465.0, 909.0, 2019.0, 5143.0, 18872.0, 102770.0, 529731.0, 318931.0, 51602.0, 10936.0, 3529.0, 1445.0, 712.0, 366.0, 204.0, 118.0, 64.0, 45.0, 28.0, 21.0, 14.0, 8.0, 9.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3017578125, -1.2565765380859375, -1.211395263671875, -1.1662139892578125, -1.12103271484375, -1.0758514404296875, -1.030670166015625, -0.9854888916015625, -0.9403076171875, -0.8951263427734375, -0.849945068359375, -0.8047637939453125, -0.75958251953125, -0.7144012451171875, -0.669219970703125, -0.6240386962890625, -0.578857421875, -0.5336761474609375, -0.488494873046875, -0.4433135986328125, -0.39813232421875, -0.3529510498046875, -0.307769775390625, -0.2625885009765625, -0.2174072265625, -0.1722259521484375, -0.127044677734375, -0.0818634033203125, -0.03668212890625, 0.0084991455078125, 0.053680419921875, 0.0988616943359375, 0.14404296875, 0.1892242431640625, 0.234405517578125, 0.2795867919921875, 0.32476806640625, 0.3699493408203125, 0.415130615234375, 0.4603118896484375, 0.5054931640625, 0.5506744384765625, 0.595855712890625, 0.6410369873046875, 0.68621826171875, 0.7313995361328125, 0.776580810546875, 0.8217620849609375, 0.866943359375, 0.9121246337890625, 0.957305908203125, 1.0024871826171875, 1.04766845703125, 1.0928497314453125, 1.138031005859375, 1.1832122802734375, 1.2283935546875, 1.2735748291015625, 1.318756103515625, 1.3639373779296875, 1.40911865234375, 1.4542999267578125, 1.499481201171875, 1.5446624755859375, 1.58984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 8.0, 2.0, 4.0, 4.0, 7.0, 8.0, 15.0, 21.0, 36.0, 42.0, 57.0, 93.0, 101.0, 113.0, 123.0, 93.0, 78.0, 51.0, 49.0, 36.0, 21.0, 11.0, 15.0, 9.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.5703125, -2.5142364501953125, -2.458160400390625, -2.4020843505859375, -2.34600830078125, -2.2899322509765625, -2.233856201171875, -2.1777801513671875, -2.1217041015625, -2.0656280517578125, -2.009552001953125, -1.9534759521484375, -1.89739990234375, -1.8413238525390625, -1.785247802734375, -1.7291717529296875, -1.673095703125, -1.6170196533203125, -1.560943603515625, -1.5048675537109375, -1.44879150390625, -1.3927154541015625, -1.336639404296875, -1.2805633544921875, -1.2244873046875, -1.1684112548828125, -1.112335205078125, -1.0562591552734375, -1.00018310546875, -0.9441070556640625, -0.888031005859375, -0.8319549560546875, -0.77587890625, -0.7198028564453125, -0.663726806640625, -0.6076507568359375, -0.55157470703125, -0.4954986572265625, -0.439422607421875, -0.3833465576171875, -0.3272705078125, -0.2711944580078125, -0.215118408203125, -0.1590423583984375, -0.10296630859375, -0.0468902587890625, 0.009185791015625, 0.0652618408203125, 0.121337890625, 0.1774139404296875, 0.233489990234375, 0.2895660400390625, 0.34564208984375, 0.4017181396484375, 0.457794189453125, 0.5138702392578125, 0.5699462890625, 0.6260223388671875, 0.682098388671875, 0.7381744384765625, 0.79425048828125, 0.8503265380859375, 0.906402587890625, 0.9624786376953125, 1.0185546875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 9.0, 31.0, 77.0, 171.0, 282.0, 222.0, 113.0, 61.0, 22.0, 9.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.69205093383789, -27.388267517089844, -26.084484100341797, -24.78070068359375, -23.476917266845703, -22.173133850097656, -20.86935043334961, -19.565567016601562, -18.261783599853516, -16.95800018310547, -15.654216766357422, -14.350433349609375, -13.046649932861328, -11.742866516113281, -10.439083099365234, -9.135299682617188, -7.831516265869141, -6.527732849121094, -5.223949432373047, -3.920166015625, -2.616382598876953, -1.3125991821289062, -0.008815765380859375, 1.2949676513671875, 2.5987510681152344, 3.9025344848632812, 5.206317901611328, 6.510101318359375, 7.813884735107422, 9.117668151855469, 10.421451568603516, 11.725234985351562, 13.02901840209961, 14.332801818847656, 15.636585235595703, 16.94036865234375, 18.244152069091797, 19.547935485839844, 20.85171890258789, 22.155502319335938, 23.459285736083984, 24.76306915283203, 26.066852569580078, 27.370635986328125, 28.674419403076172, 29.97820281982422, 31.281986236572266, 32.58576965332031, 33.88955307006836, 35.193336486816406, 36.49711990356445, 37.8009033203125, 39.10468673706055, 40.408470153808594, 41.71225357055664, 43.01603698730469, 44.319820404052734, 45.62360382080078, 46.92738723754883, 48.231170654296875, 49.53495407104492, 50.83873748779297, 52.142520904541016, 53.44630432128906, 54.75008773803711]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 6.0, 1.0, 5.0, 4.0, 8.0, 3.0, 11.0, 13.0, 12.0, 28.0, 21.0, 25.0, 28.0, 40.0, 39.0, 40.0, 47.0, 47.0, 60.0, 47.0, 61.0, 64.0, 48.0, 53.0, 38.0, 45.0, 51.0, 28.0, 24.0, 31.0, 15.0, 18.0, 7.0, 13.0, 3.0, 5.0, 6.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.377784729003906, -15.882405281066895, -15.387025833129883, -14.891645431518555, -14.396265983581543, -13.900886535644531, -13.40550708770752, -12.910127639770508, -12.41474723815918, -11.919367790222168, -11.423988342285156, -10.928607940673828, -10.433228492736816, -9.937849044799805, -9.442469596862793, -8.947090148925781, -8.45171070098877, -7.956331253051758, -7.460951328277588, -6.965571880340576, -6.470191955566406, -5.9748125076293945, -5.479433059692383, -4.984053611755371, -4.488673686981201, -3.9932940006256104, -3.4979143142700195, -3.002534866333008, -2.507155179977417, -2.011775493621826, -1.5163960456848145, -1.0210163593292236, -0.5256366729736328, -0.030257046222686768, 0.4651225805282593, 0.9605021476745605, 1.4558818340301514, 1.9512615203857422, 2.446640968322754, 2.9420206546783447, 3.4374003410339355, 3.9327800273895264, 4.428159713745117, 4.923539161682129, 5.418918609619141, 5.9142985343933105, 6.409677982330322, 6.905057907104492, 7.400437355041504, 7.895816802978516, 8.391196250915527, 8.886575698852539, 9.381956100463867, 9.877335548400879, 10.37271499633789, 10.868094444274902, 11.363473892211914, 11.858853340148926, 12.354232788085938, 12.849613189697266, 13.344992637634277, 13.840372085571289, 14.3357515335083, 14.831130981445312, 15.32651138305664]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 8.0, 13.0, 20.0, 22.0, 23.0, 57.0, 85.0, 120.0, 179.0, 302.0, 517.0, 907.0, 1833.0, 4536.0, 14778.0, 93687.0, 4015426.0, 45460.0, 9596.0, 3306.0, 1521.0, 736.0, 413.0, 246.0, 162.0, 117.0, 67.0, 28.0, 36.0, 19.0, 8.0, 7.0, 5.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9921875, -2.88275146484375, -2.7733154296875, -2.66387939453125, -2.554443359375, -2.44500732421875, -2.3355712890625, -2.22613525390625, -2.11669921875, -2.00726318359375, -1.8978271484375, -1.78839111328125, -1.678955078125, -1.56951904296875, -1.4600830078125, -1.35064697265625, -1.2412109375, -1.13177490234375, -1.0223388671875, -0.91290283203125, -0.803466796875, -0.69403076171875, -0.5845947265625, -0.47515869140625, -0.36572265625, -0.25628662109375, -0.1468505859375, -0.03741455078125, 0.072021484375, 0.18145751953125, 0.2908935546875, 0.40032958984375, 0.509765625, 0.61920166015625, 0.7286376953125, 0.83807373046875, 0.947509765625, 1.05694580078125, 1.1663818359375, 1.27581787109375, 1.38525390625, 1.49468994140625, 1.6041259765625, 1.71356201171875, 1.822998046875, 1.93243408203125, 2.0418701171875, 2.15130615234375, 2.2607421875, 2.37017822265625, 2.4796142578125, 2.58905029296875, 2.698486328125, 2.80792236328125, 2.9173583984375, 3.02679443359375, 3.13623046875, 3.24566650390625, 3.3551025390625, 3.46453857421875, 3.573974609375, 3.68341064453125, 3.7928466796875, 3.90228271484375, 4.01171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 6.0, 9.0, 11.0, 12.0, 12.0, 19.0, 23.0, 32.0, 28.0, 25.0, 41.0, 46.0, 49.0, 55.0, 64.0, 46.0, 64.0, 47.0, 54.0, 55.0, 42.0, 33.0, 34.0, 43.0, 28.0, 26.0, 23.0, 15.0, 14.0, 5.0, 13.0, 9.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.76513671875, -0.7455863952636719, -0.7260360717773438, -0.7064857482910156, -0.6869354248046875, -0.6673851013183594, -0.6478347778320312, -0.6282844543457031, -0.608734130859375, -0.5891838073730469, -0.5696334838867188, -0.5500831604003906, -0.5305328369140625, -0.5109825134277344, -0.49143218994140625, -0.4718818664550781, -0.45233154296875, -0.4327812194824219, -0.41323089599609375, -0.3936805725097656, -0.3741302490234375, -0.3545799255371094, -0.33502960205078125, -0.3154792785644531, -0.295928955078125, -0.2763786315917969, -0.25682830810546875, -0.23727798461914062, -0.2177276611328125, -0.19817733764648438, -0.17862701416015625, -0.15907669067382812, -0.1395263671875, -0.11997604370117188, -0.10042572021484375, -0.08087539672851562, -0.0613250732421875, -0.041774749755859375, -0.02222442626953125, -0.002674102783203125, 0.016876220703125, 0.036426544189453125, 0.05597686767578125, 0.07552719116210938, 0.0950775146484375, 0.11462783813476562, 0.13417816162109375, 0.15372848510742188, 0.17327880859375, 0.19282913208007812, 0.21237945556640625, 0.23192977905273438, 0.2514801025390625, 0.2710304260253906, 0.29058074951171875, 0.3101310729980469, 0.329681396484375, 0.3492317199707031, 0.36878204345703125, 0.3883323669433594, 0.4078826904296875, 0.4274330139160156, 0.44698333740234375, 0.4665336608886719, 0.486083984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 11.0, 7.0, 17.0, 18.0, 35.0, 34.0, 48.0, 80.0, 105.0, 174.0, 299.0, 450.0, 756.0, 1373.0, 2686.0, 5724.0, 13922.0, 42034.0, 223618.0, 3779433.0, 83179.0, 23263.0, 8784.0, 3755.0, 1812.0, 1011.0, 596.0, 370.0, 238.0, 162.0, 89.0, 54.0, 45.0, 25.0, 24.0, 12.0, 15.0, 9.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1796875, -2.1178436279296875, -2.055999755859375, -1.9941558837890625, -1.93231201171875, -1.8704681396484375, -1.808624267578125, -1.7467803955078125, -1.6849365234375, -1.6230926513671875, -1.561248779296875, -1.4994049072265625, -1.43756103515625, -1.3757171630859375, -1.313873291015625, -1.2520294189453125, -1.190185546875, -1.1283416748046875, -1.066497802734375, -1.0046539306640625, -0.94281005859375, -0.8809661865234375, -0.819122314453125, -0.7572784423828125, -0.6954345703125, -0.6335906982421875, -0.571746826171875, -0.5099029541015625, -0.44805908203125, -0.3862152099609375, -0.324371337890625, -0.2625274658203125, -0.20068359375, -0.1388397216796875, -0.076995849609375, -0.0151519775390625, 0.04669189453125, 0.1085357666015625, 0.170379638671875, 0.2322235107421875, 0.2940673828125, 0.3559112548828125, 0.417755126953125, 0.4795989990234375, 0.54144287109375, 0.6032867431640625, 0.665130615234375, 0.7269744873046875, 0.788818359375, 0.8506622314453125, 0.912506103515625, 0.9743499755859375, 1.03619384765625, 1.0980377197265625, 1.159881591796875, 1.2217254638671875, 1.2835693359375, 1.3454132080078125, 1.407257080078125, 1.4691009521484375, 1.53094482421875, 1.5927886962890625, 1.654632568359375, 1.7164764404296875, 1.7783203125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 6.0, 10.0, 22.0, 19.0, 54.0, 87.0, 235.0, 3332.0, 151.0, 66.0, 31.0, 26.0, 12.0, 7.0, 6.0, 7.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95263671875, -0.9256362915039062, -0.8986358642578125, -0.8716354370117188, -0.844635009765625, -0.8176345825195312, -0.7906341552734375, -0.7636337280273438, -0.73663330078125, -0.7096328735351562, -0.6826324462890625, -0.6556320190429688, -0.628631591796875, -0.6016311645507812, -0.5746307373046875, -0.5476303100585938, -0.5206298828125, -0.49362945556640625, -0.4666290283203125, -0.43962860107421875, -0.412628173828125, -0.38562774658203125, -0.3586273193359375, -0.33162689208984375, -0.30462646484375, -0.27762603759765625, -0.2506256103515625, -0.22362518310546875, -0.196624755859375, -0.16962432861328125, -0.1426239013671875, -0.11562347412109375, -0.088623046875, -0.06162261962890625, -0.0346221923828125, -0.00762176513671875, 0.019378662109375, 0.04637908935546875, 0.0733795166015625, 0.10037994384765625, 0.12738037109375, 0.15438079833984375, 0.1813812255859375, 0.20838165283203125, 0.235382080078125, 0.26238250732421875, 0.2893829345703125, 0.31638336181640625, 0.3433837890625, 0.37038421630859375, 0.3973846435546875, 0.42438507080078125, 0.451385498046875, 0.47838592529296875, 0.5053863525390625, 0.5323867797851562, 0.55938720703125, 0.5863876342773438, 0.6133880615234375, 0.6403884887695312, 0.667388916015625, 0.6943893432617188, 0.7213897705078125, 0.7483901977539062, 0.775390625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 8.0, 25.0, 28.0, 45.0, 94.0, 129.0, 173.0, 153.0, 145.0, 81.0, 63.0, 28.0, 15.0, 4.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7443273067474365, -2.642873525619507, -2.541419744491577, -2.4399657249450684, -2.3385119438171387, -2.237058162689209, -2.1356043815612793, -2.0341506004333496, -1.9326967000961304, -1.8312429189682007, -1.7297890186309814, -1.6283352375030518, -1.526881456375122, -1.4254275560379028, -1.3239737749099731, -1.222519874572754, -1.1210660934448242, -1.0196123123168945, -0.9181584119796753, -0.8167046308517456, -0.7152507901191711, -0.6137969493865967, -0.512343168258667, -0.41088932752609253, -0.30943548679351807, -0.2079816609621048, -0.10652783513069153, -0.005074024200439453, 0.09637981653213501, 0.19783365726470947, 0.29928743839263916, 0.4007412791252136, 0.5021953582763672, 0.6036491990089417, 0.7051030397415161, 0.8065568208694458, 0.9080106616020203, 1.0094645023345947, 1.1109182834625244, 1.212372064590454, 1.3138259649276733, 1.415279746055603, 1.5167336463928223, 1.618187427520752, 1.7196412086486816, 1.8210951089859009, 1.9225488901138306, 2.02400279045105, 2.1254565715789795, 2.226910352706909, 2.328364133834839, 2.4298181533813477, 2.5312719345092773, 2.632725715637207, 2.7341794967651367, 2.8356332778930664, 2.937087059020996, 3.038540840148926, 3.1399946212768555, 3.241448402404785, 3.342902421951294, 3.4443562030792236, 3.5458099842071533, 3.647263765335083, 3.748717784881592]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 4.0, 5.0, 8.0, 5.0, 13.0, 10.0, 12.0, 19.0, 17.0, 16.0, 27.0, 28.0, 17.0, 41.0, 35.0, 43.0, 39.0, 57.0, 46.0, 59.0, 57.0, 43.0, 42.0, 47.0, 37.0, 38.0, 37.0, 28.0, 30.0, 30.0, 17.0, 13.0, 17.0, 12.0, 11.0, 5.0, 6.0, 3.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1311805248260498, -1.0932921171188354, -1.055403709411621, -1.0175151824951172, -0.9796267747879028, -0.9417383670806885, -0.9038499593734741, -0.865961492061615, -0.8280730247497559, -0.7901846170425415, -0.7522961497306824, -0.714407742023468, -0.6765192747116089, -0.6386308670043945, -0.6007424592971802, -0.562853991985321, -0.5249655842781067, -0.48707714676856995, -0.4491887092590332, -0.41130030155181885, -0.3734118342399597, -0.33552342653274536, -0.2976349890232086, -0.2597465515136719, -0.22185811400413513, -0.1839696764945984, -0.14608123898506165, -0.1081928163766861, -0.07030437886714935, -0.03241594135761261, 0.0054724812507629395, 0.04336091876029968, 0.08124935626983643, 0.11913779377937317, 0.1570262312889099, 0.19491465389728546, 0.2328030914068222, 0.27069151401519775, 0.3085799515247345, 0.34646838903427124, 0.384356826543808, 0.4222452640533447, 0.46013370156288147, 0.4980221390724182, 0.5359105467796326, 0.5737990140914917, 0.611687421798706, 0.6495758295059204, 0.6874642968177795, 0.7253527045249939, 0.763241171836853, 0.8011295795440674, 0.8390180468559265, 0.8769064545631409, 0.914794921875, 0.9526833295822144, 0.9905717372894287, 1.028460144996643, 1.0663485527038574, 1.1042370796203613, 1.1421254873275757, 1.18001389503479, 1.2179023027420044, 1.2557907104492188, 1.2936792373657227]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 2.0, 8.0, 2.0, 13.0, 9.0, 19.0, 33.0, 58.0, 55.0, 122.0, 204.0, 324.0, 654.0, 1328.0, 2836.0, 6337.0, 14975.0, 36284.0, 89451.0, 196438.0, 293281.0, 223604.0, 106461.0, 44176.0, 17950.0, 7487.0, 3266.0, 1443.0, 748.0, 392.0, 223.0, 132.0, 89.0, 55.0, 36.0, 20.0, 14.0, 11.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.9697265625, -1.918701171875, -1.86767578125, -1.816650390625, -1.765625, -1.714599609375, -1.66357421875, -1.612548828125, -1.5615234375, -1.510498046875, -1.45947265625, -1.408447265625, -1.357421875, -1.306396484375, -1.25537109375, -1.204345703125, -1.1533203125, -1.102294921875, -1.05126953125, -1.000244140625, -0.94921875, -0.898193359375, -0.84716796875, -0.796142578125, -0.7451171875, -0.694091796875, -0.64306640625, -0.592041015625, -0.541015625, -0.489990234375, -0.43896484375, -0.387939453125, -0.3369140625, -0.285888671875, -0.23486328125, -0.183837890625, -0.1328125, -0.081787109375, -0.03076171875, 0.020263671875, 0.0712890625, 0.122314453125, 0.17333984375, 0.224365234375, 0.275390625, 0.326416015625, 0.37744140625, 0.428466796875, 0.4794921875, 0.530517578125, 0.58154296875, 0.632568359375, 0.68359375, 0.734619140625, 0.78564453125, 0.836669921875, 0.8876953125, 0.938720703125, 0.98974609375, 1.040771484375, 1.091796875, 1.142822265625, 1.19384765625, 1.244873046875, 1.2958984375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 8.0, 8.0, 9.0, 17.0, 18.0, 16.0, 15.0, 34.0, 24.0, 28.0, 38.0, 43.0, 55.0, 53.0, 50.0, 60.0, 45.0, 45.0, 47.0, 52.0, 48.0, 43.0, 39.0, 33.0, 34.0, 24.0, 18.0, 17.0, 18.0, 14.0, 12.0, 8.0, 5.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.72021484375, -0.7009048461914062, -0.6815948486328125, -0.6622848510742188, -0.642974853515625, -0.6236648559570312, -0.6043548583984375, -0.5850448608398438, -0.56573486328125, -0.5464248657226562, -0.5271148681640625, -0.5078048706054688, -0.488494873046875, -0.46918487548828125, -0.4498748779296875, -0.43056488037109375, -0.4112548828125, -0.39194488525390625, -0.3726348876953125, -0.35332489013671875, -0.334014892578125, -0.31470489501953125, -0.2953948974609375, -0.27608489990234375, -0.25677490234375, -0.23746490478515625, -0.2181549072265625, -0.19884490966796875, -0.179534912109375, -0.16022491455078125, -0.1409149169921875, -0.12160491943359375, -0.102294921875, -0.08298492431640625, -0.0636749267578125, -0.04436492919921875, -0.025054931640625, -0.00574493408203125, 0.0135650634765625, 0.03287506103515625, 0.05218505859375, 0.07149505615234375, 0.0908050537109375, 0.11011505126953125, 0.129425048828125, 0.14873504638671875, 0.1680450439453125, 0.18735504150390625, 0.2066650390625, 0.22597503662109375, 0.2452850341796875, 0.26459503173828125, 0.283905029296875, 0.30321502685546875, 0.3225250244140625, 0.34183502197265625, 0.36114501953125, 0.38045501708984375, 0.3997650146484375, 0.41907501220703125, 0.438385009765625, 0.45769500732421875, 0.4770050048828125, 0.49631500244140625, 0.515625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 17.0, 16.0, 43.0, 45.0, 110.0, 222.0, 447.0, 1038.0, 2920.0, 12028.0, 87388.0, 622433.0, 282201.0, 31018.0, 5652.0, 1669.0, 657.0, 296.0, 140.0, 85.0, 47.0, 32.0, 24.0, 9.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.646484375, -2.539581298828125, -2.43267822265625, -2.325775146484375, -2.2188720703125, -2.111968994140625, -2.00506591796875, -1.898162841796875, -1.791259765625, -1.684356689453125, -1.57745361328125, -1.470550537109375, -1.3636474609375, -1.256744384765625, -1.14984130859375, -1.042938232421875, -0.93603515625, -0.829132080078125, -0.72222900390625, -0.615325927734375, -0.5084228515625, -0.401519775390625, -0.29461669921875, -0.187713623046875, -0.080810546875, 0.026092529296875, 0.13299560546875, 0.239898681640625, 0.3468017578125, 0.453704833984375, 0.56060791015625, 0.667510986328125, 0.7744140625, 0.881317138671875, 0.98822021484375, 1.095123291015625, 1.2020263671875, 1.308929443359375, 1.41583251953125, 1.522735595703125, 1.629638671875, 1.736541748046875, 1.84344482421875, 1.950347900390625, 2.0572509765625, 2.164154052734375, 2.27105712890625, 2.377960205078125, 2.48486328125, 2.591766357421875, 2.69866943359375, 2.805572509765625, 2.9124755859375, 3.019378662109375, 3.12628173828125, 3.233184814453125, 3.340087890625, 3.446990966796875, 3.55389404296875, 3.660797119140625, 3.7677001953125, 3.874603271484375, 3.98150634765625, 4.088409423828125, 4.1953125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 3.0, 11.0, 5.0, 9.0, 11.0, 11.0, 15.0, 14.0, 11.0, 24.0, 20.0, 16.0, 22.0, 26.0, 25.0, 33.0, 27.0, 36.0, 30.0, 23.0, 37.0, 37.0, 33.0, 33.0, 41.0, 41.0, 31.0, 32.0, 35.0, 32.0, 36.0, 30.0, 23.0, 23.0, 30.0, 27.0, 18.0, 7.0, 13.0, 10.0, 16.0, 9.0, 7.0, 2.0, 5.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-2.22265625, -2.1578369140625, -2.093017578125, -2.0281982421875, -1.96337890625, -1.8985595703125, -1.833740234375, -1.7689208984375, -1.7041015625, -1.6392822265625, -1.574462890625, -1.5096435546875, -1.44482421875, -1.3800048828125, -1.315185546875, -1.2503662109375, -1.185546875, -1.1207275390625, -1.055908203125, -0.9910888671875, -0.92626953125, -0.8614501953125, -0.796630859375, -0.7318115234375, -0.6669921875, -0.6021728515625, -0.537353515625, -0.4725341796875, -0.40771484375, -0.3428955078125, -0.278076171875, -0.2132568359375, -0.1484375, -0.0836181640625, -0.018798828125, 0.0460205078125, 0.11083984375, 0.1756591796875, 0.240478515625, 0.3052978515625, 0.3701171875, 0.4349365234375, 0.499755859375, 0.5645751953125, 0.62939453125, 0.6942138671875, 0.759033203125, 0.8238525390625, 0.888671875, 0.9534912109375, 1.018310546875, 1.0831298828125, 1.14794921875, 1.2127685546875, 1.277587890625, 1.3424072265625, 1.4072265625, 1.4720458984375, 1.536865234375, 1.6016845703125, 1.66650390625, 1.7313232421875, 1.796142578125, 1.8609619140625, 1.92578125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 13.0, 28.0, 40.0, 66.0, 110.0, 301.0, 708.0, 2649.0, 19660.0, 433037.0, 563109.0, 24426.0, 3024.0, 781.0, 300.0, 132.0, 71.0, 32.0, 26.0, 14.0, 6.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.03515625, -2.9629669189453125, -2.890777587890625, -2.8185882568359375, -2.74639892578125, -2.6742095947265625, -2.602020263671875, -2.5298309326171875, -2.4576416015625, -2.3854522705078125, -2.313262939453125, -2.2410736083984375, -2.16888427734375, -2.0966949462890625, -2.024505615234375, -1.9523162841796875, -1.880126953125, -1.8079376220703125, -1.735748291015625, -1.6635589599609375, -1.59136962890625, -1.5191802978515625, -1.446990966796875, -1.3748016357421875, -1.3026123046875, -1.2304229736328125, -1.158233642578125, -1.0860443115234375, -1.01385498046875, -0.9416656494140625, -0.869476318359375, -0.7972869873046875, -0.72509765625, -0.6529083251953125, -0.580718994140625, -0.5085296630859375, -0.43634033203125, -0.3641510009765625, -0.291961669921875, -0.2197723388671875, -0.1475830078125, -0.0753936767578125, -0.003204345703125, 0.0689849853515625, 0.14117431640625, 0.2133636474609375, 0.285552978515625, 0.3577423095703125, 0.429931640625, 0.5021209716796875, 0.574310302734375, 0.6464996337890625, 0.71868896484375, 0.7908782958984375, 0.863067626953125, 0.9352569580078125, 1.0074462890625, 1.0796356201171875, 1.151824951171875, 1.2240142822265625, 1.29620361328125, 1.3683929443359375, 1.440582275390625, 1.5127716064453125, 1.5849609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 13.0, 23.0, 25.0, 41.0, 49.0, 67.0, 93.0, 125.0, 116.0, 111.0, 108.0, 68.0, 46.0, 27.0, 20.0, 24.0, 7.0, 9.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00021719932556152344, -0.0002092607319355011, -0.00020132213830947876, -0.00019338354468345642, -0.00018544495105743408, -0.00017750635743141174, -0.0001695677638053894, -0.00016162917017936707, -0.00015369057655334473, -0.0001457519829273224, -0.00013781338930130005, -0.0001298747956752777, -0.00012193620204925537, -0.00011399760842323303, -0.0001060590147972107, -9.812042117118835e-05, -9.018182754516602e-05, -8.224323391914368e-05, -7.430464029312134e-05, -6.6366046667099e-05, -5.842745304107666e-05, -5.048885941505432e-05, -4.255026578903198e-05, -3.4611672163009644e-05, -2.6673078536987305e-05, -1.8734484910964966e-05, -1.0795891284942627e-05, -2.857297658920288e-06, 5.081295967102051e-06, 1.301988959312439e-05, 2.095848321914673e-05, 2.8897076845169067e-05, 3.6835670471191406e-05, 4.4774264097213745e-05, 5.2712857723236084e-05, 6.065145134925842e-05, 6.859004497528076e-05, 7.65286386013031e-05, 8.446723222732544e-05, 9.240582585334778e-05, 0.00010034441947937012, 0.00010828301310539246, 0.0001162216067314148, 0.00012416020035743713, 0.00013209879398345947, 0.0001400373876094818, 0.00014797598123550415, 0.0001559145748615265, 0.00016385316848754883, 0.00017179176211357117, 0.0001797303557395935, 0.00018766894936561584, 0.00019560754299163818, 0.00020354613661766052, 0.00021148473024368286, 0.0002194233238697052, 0.00022736191749572754, 0.00023530051112174988, 0.00024323910474777222, 0.00025117769837379456, 0.0002591162919998169, 0.00026705488562583923, 0.00027499347925186157, 0.0002829320728778839, 0.00029087066650390625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 13.0, 7.0, 7.0, 12.0, 26.0, 41.0, 78.0, 132.0, 311.0, 665.0, 1994.0, 8965.0, 100852.0, 802014.0, 119700.0, 10106.0, 2189.0, 782.0, 299.0, 135.0, 78.0, 49.0, 37.0, 14.0, 13.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.1953125, -2.1298370361328125, -2.064361572265625, -1.9988861083984375, -1.93341064453125, -1.8679351806640625, -1.802459716796875, -1.7369842529296875, -1.6715087890625, -1.6060333251953125, -1.540557861328125, -1.4750823974609375, -1.40960693359375, -1.3441314697265625, -1.278656005859375, -1.2131805419921875, -1.147705078125, -1.0822296142578125, -1.016754150390625, -0.9512786865234375, -0.88580322265625, -0.8203277587890625, -0.754852294921875, -0.6893768310546875, -0.6239013671875, -0.5584259033203125, -0.492950439453125, -0.4274749755859375, -0.36199951171875, -0.2965240478515625, -0.231048583984375, -0.1655731201171875, -0.10009765625, -0.0346221923828125, 0.030853271484375, 0.0963287353515625, 0.16180419921875, 0.2272796630859375, 0.292755126953125, 0.3582305908203125, 0.4237060546875, 0.4891815185546875, 0.554656982421875, 0.6201324462890625, 0.68560791015625, 0.7510833740234375, 0.816558837890625, 0.8820343017578125, 0.947509765625, 1.0129852294921875, 1.078460693359375, 1.1439361572265625, 1.20941162109375, 1.2748870849609375, 1.340362548828125, 1.4058380126953125, 1.4713134765625, 1.5367889404296875, 1.602264404296875, 1.6677398681640625, 1.73321533203125, 1.7986907958984375, 1.864166259765625, 1.9296417236328125, 1.9951171875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 3.0, 8.0, 10.0, 18.0, 28.0, 47.0, 61.0, 106.0, 119.0, 141.0, 151.0, 89.0, 76.0, 57.0, 37.0, 13.0, 13.0, 16.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.029296875, -2.9669570922851562, -2.9046173095703125, -2.8422775268554688, -2.779937744140625, -2.7175979614257812, -2.6552581787109375, -2.5929183959960938, -2.53057861328125, -2.4682388305664062, -2.4058990478515625, -2.3435592651367188, -2.281219482421875, -2.2188796997070312, -2.1565399169921875, -2.0942001342773438, -2.0318603515625, -1.9695205688476562, -1.9071807861328125, -1.8448410034179688, -1.782501220703125, -1.7201614379882812, -1.6578216552734375, -1.5954818725585938, -1.53314208984375, -1.4708023071289062, -1.4084625244140625, -1.3461227416992188, -1.283782958984375, -1.2214431762695312, -1.1591033935546875, -1.0967636108398438, -1.034423828125, -0.9720840454101562, -0.9097442626953125, -0.8474044799804688, -0.785064697265625, -0.7227249145507812, -0.6603851318359375, -0.5980453491210938, -0.53570556640625, -0.47336578369140625, -0.4110260009765625, -0.34868621826171875, -0.286346435546875, -0.22400665283203125, -0.1616668701171875, -0.09932708740234375, -0.0369873046875, 0.02535247802734375, 0.0876922607421875, 0.15003204345703125, 0.212371826171875, 0.27471160888671875, 0.3370513916015625, 0.39939117431640625, 0.46173095703125, 0.5240707397460938, 0.5864105224609375, 0.6487503051757812, 0.711090087890625, 0.7734298706054688, 0.8357696533203125, 0.8981094360351562, 0.96044921875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 15.0, 34.0, 87.0, 140.0, 190.0, 218.0, 144.0, 91.0, 43.0, 18.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.71631622314453, -28.68522834777832, -27.65414047241211, -26.6230525970459, -25.591964721679688, -24.56087875366211, -23.5297908782959, -22.498703002929688, -21.467615127563477, -20.436527252197266, -19.405439376831055, -18.374351501464844, -17.343265533447266, -16.312175750732422, -15.281089782714844, -14.250001907348633, -13.218914031982422, -12.187826156616211, -11.15673828125, -10.125651359558105, -9.094563484191895, -8.063475608825684, -7.032388210296631, -6.001300811767578, -4.970212936401367, -3.9391252994537354, -2.9080376625061035, -1.8769500255584717, -0.8458623886108398, 0.1852254867553711, 1.2163128852844238, 2.2474002838134766, 3.2784881591796875, 4.309576034545898, 5.340663433074951, 6.371750831604004, 7.402838706970215, 8.433926582336426, 9.46501350402832, 10.496101379394531, 11.527189254760742, 12.558277130126953, 13.589365005493164, 14.620451927185059, 15.65153980255127, 16.682628631591797, 17.713714599609375, 18.744802474975586, 19.775890350341797, 20.806978225708008, 21.83806610107422, 22.86915397644043, 23.90024185180664, 24.93132781982422, 25.96241569519043, 26.99350357055664, 28.02459144592285, 29.055679321289062, 30.086767196655273, 31.117855072021484, 32.14894104003906, 33.180030822753906, 34.211116790771484, 35.24220275878906, 36.273292541503906]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 8.0, 10.0, 15.0, 16.0, 18.0, 32.0, 22.0, 27.0, 23.0, 39.0, 34.0, 35.0, 37.0, 30.0, 44.0, 40.0, 59.0, 47.0, 53.0, 38.0, 50.0, 39.0, 33.0, 30.0, 41.0, 26.0, 23.0, 22.0, 10.0, 17.0, 7.0, 11.0, 16.0, 8.0, 3.0, 4.0, 7.0, 0.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.212970733642578, -11.826147079467773, -11.439323425292969, -11.052499771118164, -10.665675163269043, -10.278851509094238, -9.892027854919434, -9.505204200744629, -9.118379592895508, -8.731555938720703, -8.344732284545898, -7.9579081535339355, -7.571084022521973, -7.184260368347168, -6.797436714172363, -6.410613059997559, -6.023789405822754, -5.636965751647949, -5.250141620635986, -4.863317966461182, -4.476493835449219, -4.089670181274414, -3.7028465270996094, -3.3160226345062256, -2.929198741912842, -2.542374849319458, -2.155550956726074, -1.7687273025512695, -1.3819034099578857, -0.995079517364502, -0.6082558631896973, -0.22143197059631348, 0.1653909683227539, 0.5522148013114929, 0.9390386343002319, 1.3258624076843262, 1.71268630027771, 2.0995101928710938, 2.4863338470458984, 2.8731577396392822, 3.259981632232666, 3.64680552482605, 4.033629417419434, 4.420453071594238, 4.807276725769043, 5.194100856781006, 5.5809245109558105, 5.967748641967773, 6.354572296142578, 6.741395950317383, 7.128220081329346, 7.51504373550415, 7.901867866516113, 8.288691520690918, 8.675515174865723, 9.062338829040527, 9.449163436889648, 9.835987091064453, 10.222810745239258, 10.609634399414062, 10.996459007263184, 11.383282661437988, 11.770106315612793, 12.156929969787598, 12.543753623962402]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 5.0, 8.0, 11.0, 14.0, 24.0, 21.0, 40.0, 45.0, 79.0, 99.0, 184.0, 266.0, 470.0, 748.0, 1323.0, 2562.0, 5082.0, 11871.0, 38376.0, 4010575.0, 88000.0, 19337.0, 7319.0, 3486.0, 1828.0, 963.0, 550.0, 363.0, 203.0, 126.0, 91.0, 55.0, 54.0, 23.0, 15.0, 13.0, 12.0, 12.0, 4.0, 9.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.466796875, -2.383819580078125, -2.30084228515625, -2.217864990234375, -2.1348876953125, -2.051910400390625, -1.96893310546875, -1.885955810546875, -1.802978515625, -1.720001220703125, -1.63702392578125, -1.554046630859375, -1.4710693359375, -1.388092041015625, -1.30511474609375, -1.222137451171875, -1.13916015625, -1.056182861328125, -0.97320556640625, -0.890228271484375, -0.8072509765625, -0.724273681640625, -0.64129638671875, -0.558319091796875, -0.475341796875, -0.392364501953125, -0.30938720703125, -0.226409912109375, -0.1434326171875, -0.060455322265625, 0.02252197265625, 0.105499267578125, 0.1884765625, 0.271453857421875, 0.35443115234375, 0.437408447265625, 0.5203857421875, 0.603363037109375, 0.68634033203125, 0.769317626953125, 0.852294921875, 0.935272216796875, 1.01824951171875, 1.101226806640625, 1.1842041015625, 1.267181396484375, 1.35015869140625, 1.433135986328125, 1.51611328125, 1.599090576171875, 1.68206787109375, 1.765045166015625, 1.8480224609375, 1.930999755859375, 2.01397705078125, 2.096954345703125, 2.179931640625, 2.262908935546875, 2.34588623046875, 2.428863525390625, 2.5118408203125, 2.594818115234375, 2.67779541015625, 2.760772705078125, 2.84375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 9.0, 18.0, 15.0, 13.0, 19.0, 23.0, 25.0, 35.0, 41.0, 52.0, 59.0, 55.0, 46.0, 53.0, 59.0, 69.0, 51.0, 58.0, 42.0, 45.0, 42.0, 32.0, 26.0, 24.0, 23.0, 12.0, 15.0, 8.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.8935546875, -0.8707275390625, -0.847900390625, -0.8250732421875, -0.80224609375, -0.7794189453125, -0.756591796875, -0.7337646484375, -0.7109375, -0.6881103515625, -0.665283203125, -0.6424560546875, -0.61962890625, -0.5968017578125, -0.573974609375, -0.5511474609375, -0.5283203125, -0.5054931640625, -0.482666015625, -0.4598388671875, -0.43701171875, -0.4141845703125, -0.391357421875, -0.3685302734375, -0.345703125, -0.3228759765625, -0.300048828125, -0.2772216796875, -0.25439453125, -0.2315673828125, -0.208740234375, -0.1859130859375, -0.1630859375, -0.1402587890625, -0.117431640625, -0.0946044921875, -0.07177734375, -0.0489501953125, -0.026123046875, -0.0032958984375, 0.01953125, 0.0423583984375, 0.065185546875, 0.0880126953125, 0.11083984375, 0.1336669921875, 0.156494140625, 0.1793212890625, 0.2021484375, 0.2249755859375, 0.247802734375, 0.2706298828125, 0.29345703125, 0.3162841796875, 0.339111328125, 0.3619384765625, 0.384765625, 0.4075927734375, 0.430419921875, 0.4532470703125, 0.47607421875, 0.4989013671875, 0.521728515625, 0.5445556640625, 0.5673828125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 6.0, 5.0, 6.0, 3.0, 3.0, 16.0, 24.0, 24.0, 25.0, 47.0, 37.0, 62.0, 89.0, 154.0, 255.0, 407.0, 828.0, 1852.0, 4677.0, 15771.0, 80506.0, 4007072.0, 61840.0, 12861.0, 4151.0, 1646.0, 788.0, 415.0, 227.0, 139.0, 74.0, 65.0, 56.0, 30.0, 23.0, 17.0, 13.0, 16.0, 7.0, 14.0, 10.0, 6.0, 2.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.38671875, -2.305633544921875, -2.22454833984375, -2.143463134765625, -2.0623779296875, -1.981292724609375, -1.90020751953125, -1.819122314453125, -1.738037109375, -1.656951904296875, -1.57586669921875, -1.494781494140625, -1.4136962890625, -1.332611083984375, -1.25152587890625, -1.170440673828125, -1.08935546875, -1.008270263671875, -0.92718505859375, -0.846099853515625, -0.7650146484375, -0.683929443359375, -0.60284423828125, -0.521759033203125, -0.440673828125, -0.359588623046875, -0.27850341796875, -0.197418212890625, -0.1163330078125, -0.035247802734375, 0.04583740234375, 0.126922607421875, 0.2080078125, 0.289093017578125, 0.37017822265625, 0.451263427734375, 0.5323486328125, 0.613433837890625, 0.69451904296875, 0.775604248046875, 0.856689453125, 0.937774658203125, 1.01885986328125, 1.099945068359375, 1.1810302734375, 1.262115478515625, 1.34320068359375, 1.424285888671875, 1.50537109375, 1.586456298828125, 1.66754150390625, 1.748626708984375, 1.8297119140625, 1.910797119140625, 1.99188232421875, 2.072967529296875, 2.154052734375, 2.235137939453125, 2.31622314453125, 2.397308349609375, 2.4783935546875, 2.559478759765625, 2.64056396484375, 2.721649169921875, 2.802734375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 9.0, 17.0, 21.0, 38.0, 73.0, 3436.0, 307.0, 72.0, 39.0, 21.0, 14.0, 9.0, 10.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80615234375, -0.7823944091796875, -0.758636474609375, -0.7348785400390625, -0.71112060546875, -0.6873626708984375, -0.663604736328125, -0.6398468017578125, -0.6160888671875, -0.5923309326171875, -0.568572998046875, -0.5448150634765625, -0.52105712890625, -0.4972991943359375, -0.473541259765625, -0.4497833251953125, -0.426025390625, -0.4022674560546875, -0.378509521484375, -0.3547515869140625, -0.33099365234375, -0.3072357177734375, -0.283477783203125, -0.2597198486328125, -0.2359619140625, -0.2122039794921875, -0.188446044921875, -0.1646881103515625, -0.14093017578125, -0.1171722412109375, -0.093414306640625, -0.0696563720703125, -0.0458984375, -0.0221405029296875, 0.001617431640625, 0.0253753662109375, 0.04913330078125, 0.0728912353515625, 0.096649169921875, 0.1204071044921875, 0.1441650390625, 0.1679229736328125, 0.191680908203125, 0.2154388427734375, 0.23919677734375, 0.2629547119140625, 0.286712646484375, 0.3104705810546875, 0.334228515625, 0.3579864501953125, 0.381744384765625, 0.4055023193359375, 0.42926025390625, 0.4530181884765625, 0.476776123046875, 0.5005340576171875, 0.5242919921875, 0.5480499267578125, 0.571807861328125, 0.5955657958984375, 0.61932373046875, 0.6430816650390625, 0.666839599609375, 0.6905975341796875, 0.71435546875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 22.0, 37.0, 83.0, 154.0, 207.0, 173.0, 143.0, 94.0, 32.0, 16.0, 14.0, 6.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5912890434265137, -3.4899652004241943, -3.388641119003296, -3.2873172760009766, -3.1859934329986572, -3.084669589996338, -2.9833455085754395, -2.88202166557312, -2.780697822570801, -2.6793739795684814, -2.578049898147583, -2.4767260551452637, -2.3754022121429443, -2.274078369140625, -2.1727542877197266, -2.0714304447174072, -1.9701064825057983, -1.8687825202941895, -1.7674586772918701, -1.6661347150802612, -1.564810872077942, -1.463486909866333, -1.3621630668640137, -1.2608391046524048, -1.159515142440796, -1.058191180229187, -0.9568673372268677, -0.8555433750152588, -0.7542195320129395, -0.6528955698013306, -0.5515716671943665, -0.45024776458740234, -0.348923921585083, -0.2476000189781189, -0.1462761014699936, -0.044952183961868286, 0.056371718645095825, 0.15769565105438232, 0.25901955366134644, 0.36034345626831055, 0.46166735887527466, 0.5629912614822388, 0.6643151640892029, 0.765639066696167, 0.8669630289077759, 0.96828693151474, 1.069610834121704, 1.1709346771240234, 1.2722586393356323, 1.3735826015472412, 1.4749064445495605, 1.5762304067611694, 1.6775542497634888, 1.7788782119750977, 1.880202054977417, 1.9815260171890259, 2.0828499794006348, 2.184173822402954, 2.2854979038238525, 2.386821746826172, 2.488145589828491, 2.5894694328308105, 2.690793514251709, 2.7921173572540283, 2.8934412002563477]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 13.0, 6.0, 28.0, 22.0, 28.0, 35.0, 40.0, 51.0, 49.0, 66.0, 84.0, 62.0, 70.0, 72.0, 54.0, 56.0, 54.0, 36.0, 43.0, 33.0, 24.0, 17.0, 15.0, 16.0, 12.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8931628465652466, -1.8450496196746826, -1.7969363927841187, -1.7488231658935547, -1.7007099390029907, -1.6525967121124268, -1.6044834852218628, -1.5563702583312988, -1.5082570314407349, -1.460143804550171, -1.412030577659607, -1.363917350769043, -1.315804123878479, -1.267690896987915, -1.219577670097351, -1.171464443206787, -1.1233513355255127, -1.0752381086349487, -1.0271248817443848, -0.9790116548538208, -0.9308984279632568, -0.8827852010726929, -0.8346719741821289, -0.7865587472915649, -0.738445520401001, -0.690332293510437, -0.642219066619873, -0.5941058397293091, -0.5459926128387451, -0.49787938594818115, -0.4497661888599396, -0.4016529619693756, -0.35353970527648926, -0.3054264783859253, -0.25731325149536133, -0.20920003950595856, -0.1610868126153946, -0.11297358572483063, -0.06486037373542786, -0.01674714684486389, 0.03136608004570007, 0.07947930693626404, 0.127592533826828, 0.17570574581623077, 0.22381897270679474, 0.2719321846961975, 0.3200454115867615, 0.36815863847732544, 0.4162718653678894, 0.46438509225845337, 0.5124983191490173, 0.5606115460395813, 0.6087247729301453, 0.6568379998207092, 0.7049511671066284, 0.7530643939971924, 0.8011776208877563, 0.8492908477783203, 0.8974040746688843, 0.9455173015594482, 0.9936305284500122, 1.0417437553405762, 1.0898569822311401, 1.137970209121704, 1.186083436012268]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 12.0, 12.0, 13.0, 31.0, 41.0, 50.0, 91.0, 134.0, 208.0, 349.0, 666.0, 1111.0, 2119.0, 4069.0, 8125.0, 16840.0, 35536.0, 75053.0, 149863.0, 241385.0, 236329.0, 141347.0, 69723.0, 33442.0, 15836.0, 7681.0, 3955.0, 1969.0, 1051.0, 589.0, 329.0, 196.0, 119.0, 89.0, 57.0, 42.0, 29.0, 16.0, 14.0, 7.0, 7.0, 4.0, 2.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.142578125, -1.103118896484375, -1.06365966796875, -1.024200439453125, -0.9847412109375, -0.945281982421875, -0.90582275390625, -0.866363525390625, -0.826904296875, -0.787445068359375, -0.74798583984375, -0.708526611328125, -0.6690673828125, -0.629608154296875, -0.59014892578125, -0.550689697265625, -0.51123046875, -0.471771240234375, -0.43231201171875, -0.392852783203125, -0.3533935546875, -0.313934326171875, -0.27447509765625, -0.235015869140625, -0.195556640625, -0.156097412109375, -0.11663818359375, -0.077178955078125, -0.0377197265625, 0.001739501953125, 0.04119873046875, 0.080657958984375, 0.1201171875, 0.159576416015625, 0.19903564453125, 0.238494873046875, 0.2779541015625, 0.317413330078125, 0.35687255859375, 0.396331787109375, 0.435791015625, 0.475250244140625, 0.51470947265625, 0.554168701171875, 0.5936279296875, 0.633087158203125, 0.67254638671875, 0.712005615234375, 0.75146484375, 0.790924072265625, 0.83038330078125, 0.869842529296875, 0.9093017578125, 0.948760986328125, 0.98822021484375, 1.027679443359375, 1.067138671875, 1.106597900390625, 1.14605712890625, 1.185516357421875, 1.2249755859375, 1.264434814453125, 1.30389404296875, 1.343353271484375, 1.3828125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 9.0, 4.0, 5.0, 9.0, 11.0, 15.0, 15.0, 14.0, 24.0, 35.0, 31.0, 34.0, 53.0, 56.0, 43.0, 55.0, 49.0, 53.0, 59.0, 57.0, 51.0, 38.0, 50.0, 43.0, 40.0, 41.0, 23.0, 21.0, 12.0, 16.0, 13.0, 10.0, 2.0, 3.0, 6.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90869140625, -0.8851470947265625, -0.861602783203125, -0.8380584716796875, -0.81451416015625, -0.7909698486328125, -0.767425537109375, -0.7438812255859375, -0.7203369140625, -0.6967926025390625, -0.673248291015625, -0.6497039794921875, -0.62615966796875, -0.6026153564453125, -0.579071044921875, -0.5555267333984375, -0.531982421875, -0.5084381103515625, -0.484893798828125, -0.4613494873046875, -0.43780517578125, -0.4142608642578125, -0.390716552734375, -0.3671722412109375, -0.3436279296875, -0.3200836181640625, -0.296539306640625, -0.2729949951171875, -0.24945068359375, -0.2259063720703125, -0.202362060546875, -0.1788177490234375, -0.1552734375, -0.1317291259765625, -0.108184814453125, -0.0846405029296875, -0.06109619140625, -0.0375518798828125, -0.014007568359375, 0.0095367431640625, 0.0330810546875, 0.0566253662109375, 0.080169677734375, 0.1037139892578125, 0.12725830078125, 0.1508026123046875, 0.174346923828125, 0.1978912353515625, 0.221435546875, 0.2449798583984375, 0.268524169921875, 0.2920684814453125, 0.31561279296875, 0.3391571044921875, 0.362701416015625, 0.3862457275390625, 0.4097900390625, 0.4333343505859375, 0.456878662109375, 0.4804229736328125, 0.50396728515625, 0.5275115966796875, 0.551055908203125, 0.5746002197265625, 0.59814453125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 5.0, 4.0, 7.0, 14.0, 18.0, 26.0, 31.0, 49.0, 70.0, 89.0, 129.0, 170.0, 278.0, 398.0, 688.0, 1099.0, 2245.0, 5502.0, 18040.0, 71089.0, 307893.0, 472317.0, 123746.0, 29335.0, 8415.0, 3117.0, 1472.0, 794.0, 472.0, 332.0, 202.0, 129.0, 112.0, 86.0, 46.0, 40.0, 36.0, 11.0, 14.0, 12.0, 3.0, 5.0, 3.0, 1.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.775390625, -1.71240234375, -1.6494140625, -1.58642578125, -1.5234375, -1.46044921875, -1.3974609375, -1.33447265625, -1.271484375, -1.20849609375, -1.1455078125, -1.08251953125, -1.01953125, -0.95654296875, -0.8935546875, -0.83056640625, -0.767578125, -0.70458984375, -0.6416015625, -0.57861328125, -0.515625, -0.45263671875, -0.3896484375, -0.32666015625, -0.263671875, -0.20068359375, -0.1376953125, -0.07470703125, -0.01171875, 0.05126953125, 0.1142578125, 0.17724609375, 0.240234375, 0.30322265625, 0.3662109375, 0.42919921875, 0.4921875, 0.55517578125, 0.6181640625, 0.68115234375, 0.744140625, 0.80712890625, 0.8701171875, 0.93310546875, 0.99609375, 1.05908203125, 1.1220703125, 1.18505859375, 1.248046875, 1.31103515625, 1.3740234375, 1.43701171875, 1.5, 1.56298828125, 1.6259765625, 1.68896484375, 1.751953125, 1.81494140625, 1.8779296875, 1.94091796875, 2.00390625, 2.06689453125, 2.1298828125, 2.19287109375, 2.255859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 8.0, 4.0, 10.0, 13.0, 10.0, 13.0, 16.0, 26.0, 20.0, 25.0, 24.0, 27.0, 34.0, 38.0, 35.0, 39.0, 39.0, 38.0, 46.0, 53.0, 39.0, 48.0, 51.0, 50.0, 51.0, 32.0, 27.0, 27.0, 24.0, 22.0, 23.0, 10.0, 15.0, 13.0, 9.0, 6.0, 7.0, 6.0, 6.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.703125, -2.6201171875, -2.537109375, -2.4541015625, -2.37109375, -2.2880859375, -2.205078125, -2.1220703125, -2.0390625, -1.9560546875, -1.873046875, -1.7900390625, -1.70703125, -1.6240234375, -1.541015625, -1.4580078125, -1.375, -1.2919921875, -1.208984375, -1.1259765625, -1.04296875, -0.9599609375, -0.876953125, -0.7939453125, -0.7109375, -0.6279296875, -0.544921875, -0.4619140625, -0.37890625, -0.2958984375, -0.212890625, -0.1298828125, -0.046875, 0.0361328125, 0.119140625, 0.2021484375, 0.28515625, 0.3681640625, 0.451171875, 0.5341796875, 0.6171875, 0.7001953125, 0.783203125, 0.8662109375, 0.94921875, 1.0322265625, 1.115234375, 1.1982421875, 1.28125, 1.3642578125, 1.447265625, 1.5302734375, 1.61328125, 1.6962890625, 1.779296875, 1.8623046875, 1.9453125, 2.0283203125, 2.111328125, 2.1943359375, 2.27734375, 2.3603515625, 2.443359375, 2.5263671875, 2.609375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 8.0, 6.0, 11.0, 9.0, 12.0, 20.0, 34.0, 49.0, 67.0, 94.0, 170.0, 294.0, 629.0, 1763.0, 6585.0, 43354.0, 620711.0, 341967.0, 25436.0, 4663.0, 1422.0, 574.0, 257.0, 151.0, 82.0, 59.0, 30.0, 27.0, 18.0, 13.0, 11.0, 8.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.87890625, -1.8217620849609375, -1.764617919921875, -1.7074737548828125, -1.65032958984375, -1.5931854248046875, -1.536041259765625, -1.4788970947265625, -1.4217529296875, -1.3646087646484375, -1.307464599609375, -1.2503204345703125, -1.19317626953125, -1.1360321044921875, -1.078887939453125, -1.0217437744140625, -0.964599609375, -0.9074554443359375, -0.850311279296875, -0.7931671142578125, -0.73602294921875, -0.6788787841796875, -0.621734619140625, -0.5645904541015625, -0.5074462890625, -0.4503021240234375, -0.393157958984375, -0.3360137939453125, -0.27886962890625, -0.2217254638671875, -0.164581298828125, -0.1074371337890625, -0.05029296875, 0.0068511962890625, 0.063995361328125, 0.1211395263671875, 0.17828369140625, 0.2354278564453125, 0.292572021484375, 0.3497161865234375, 0.4068603515625, 0.4640045166015625, 0.521148681640625, 0.5782928466796875, 0.63543701171875, 0.6925811767578125, 0.749725341796875, 0.8068695068359375, 0.864013671875, 0.9211578369140625, 0.978302001953125, 1.0354461669921875, 1.09259033203125, 1.1497344970703125, 1.206878662109375, 1.2640228271484375, 1.3211669921875, 1.3783111572265625, 1.435455322265625, 1.4925994873046875, 1.54974365234375, 1.6068878173828125, 1.664031982421875, 1.7211761474609375, 1.7783203125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 4.0, 6.0, 6.0, 11.0, 15.0, 13.0, 24.0, 26.0, 31.0, 32.0, 61.0, 55.0, 61.0, 92.0, 89.0, 100.0, 68.0, 57.0, 49.0, 40.0, 26.0, 30.0, 21.0, 28.0, 14.0, 10.0, 5.0, 6.0, 2.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00018846988677978516, -0.00018289871513843536, -0.00017732754349708557, -0.00017175637185573578, -0.00016618520021438599, -0.0001606140285730362, -0.0001550428569316864, -0.0001494716852903366, -0.00014390051364898682, -0.00013832934200763702, -0.00013275817036628723, -0.00012718699872493744, -0.00012161582708358765, -0.00011604465544223785, -0.00011047348380088806, -0.00010490231215953827, -9.933114051818848e-05, -9.375996887683868e-05, -8.818879723548889e-05, -8.26176255941391e-05, -7.70464539527893e-05, -7.147528231143951e-05, -6.590411067008972e-05, -6.033293902873993e-05, -5.476176738739014e-05, -4.9190595746040344e-05, -4.361942410469055e-05, -3.804825246334076e-05, -3.247708082199097e-05, -2.6905909180641174e-05, -2.1334737539291382e-05, -1.576356589794159e-05, -1.0192394256591797e-05, -4.621222615242004e-06, 9.499490261077881e-07, 6.5211206674575806e-06, 1.2092292308807373e-05, 1.7663463950157166e-05, 2.3234635591506958e-05, 2.880580723285675e-05, 3.437697887420654e-05, 3.9948150515556335e-05, 4.551932215690613e-05, 5.109049379825592e-05, 5.666166543960571e-05, 6.22328370809555e-05, 6.78040087223053e-05, 7.337518036365509e-05, 7.894635200500488e-05, 8.451752364635468e-05, 9.008869528770447e-05, 9.565986692905426e-05, 0.00010123103857040405, 0.00010680221021175385, 0.00011237338185310364, 0.00011794455349445343, 0.00012351572513580322, 0.00012908689677715302, 0.0001346580684185028, 0.0001402292400598526, 0.0001458004117012024, 0.00015137158334255219, 0.00015694275498390198, 0.00016251392662525177, 0.00016808509826660156]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 8.0, 6.0, 3.0, 14.0, 21.0, 36.0, 63.0, 114.0, 223.0, 463.0, 1307.0, 4500.0, 25316.0, 501983.0, 483393.0, 24400.0, 4375.0, 1321.0, 535.0, 210.0, 104.0, 55.0, 31.0, 21.0, 15.0, 13.0, 2.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6904296875, -1.6199798583984375, -1.549530029296875, -1.4790802001953125, -1.40863037109375, -1.3381805419921875, -1.267730712890625, -1.1972808837890625, -1.1268310546875, -1.0563812255859375, -0.985931396484375, -0.9154815673828125, -0.84503173828125, -0.7745819091796875, -0.704132080078125, -0.6336822509765625, -0.563232421875, -0.4927825927734375, -0.422332763671875, -0.3518829345703125, -0.28143310546875, -0.2109832763671875, -0.140533447265625, -0.0700836181640625, 0.0003662109375, 0.0708160400390625, 0.141265869140625, 0.2117156982421875, 0.28216552734375, 0.3526153564453125, 0.423065185546875, 0.4935150146484375, 0.56396484375, 0.6344146728515625, 0.704864501953125, 0.7753143310546875, 0.84576416015625, 0.9162139892578125, 0.986663818359375, 1.0571136474609375, 1.1275634765625, 1.1980133056640625, 1.268463134765625, 1.3389129638671875, 1.40936279296875, 1.4798126220703125, 1.550262451171875, 1.6207122802734375, 1.691162109375, 1.7616119384765625, 1.832061767578125, 1.9025115966796875, 1.97296142578125, 2.0434112548828125, 2.113861083984375, 2.1843109130859375, 2.2547607421875, 2.3252105712890625, 2.395660400390625, 2.4661102294921875, 2.53656005859375, 2.6070098876953125, 2.677459716796875, 2.7479095458984375, 2.818359375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 4.0, 1.0, 5.0, 2.0, 6.0, 6.0, 10.0, 23.0, 29.0, 45.0, 77.0, 96.0, 116.0, 113.0, 127.0, 99.0, 75.0, 49.0, 36.0, 20.0, 16.0, 16.0, 12.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.150390625, -2.0916900634765625, -2.032989501953125, -1.9742889404296875, -1.91558837890625, -1.8568878173828125, -1.798187255859375, -1.7394866943359375, -1.6807861328125, -1.6220855712890625, -1.563385009765625, -1.5046844482421875, -1.44598388671875, -1.3872833251953125, -1.328582763671875, -1.2698822021484375, -1.211181640625, -1.1524810791015625, -1.093780517578125, -1.0350799560546875, -0.97637939453125, -0.9176788330078125, -0.858978271484375, -0.8002777099609375, -0.7415771484375, -0.6828765869140625, -0.624176025390625, -0.5654754638671875, -0.50677490234375, -0.4480743408203125, -0.389373779296875, -0.3306732177734375, -0.27197265625, -0.2132720947265625, -0.154571533203125, -0.0958709716796875, -0.03717041015625, 0.0215301513671875, 0.080230712890625, 0.1389312744140625, 0.1976318359375, 0.2563323974609375, 0.315032958984375, 0.3737335205078125, 0.43243408203125, 0.4911346435546875, 0.549835205078125, 0.6085357666015625, 0.667236328125, 0.7259368896484375, 0.784637451171875, 0.8433380126953125, 0.90203857421875, 0.9607391357421875, 1.019439697265625, 1.0781402587890625, 1.1368408203125, 1.1955413818359375, 1.254241943359375, 1.3129425048828125, 1.37164306640625, 1.4303436279296875, 1.489044189453125, 1.5477447509765625, 1.6064453125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 26.0, 53.0, 157.0, 341.0, 265.0, 116.0, 35.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.659332275390625, -33.06303024291992, -31.466724395751953, -29.87042236328125, -28.27411651611328, -26.677814483642578, -25.081510543823242, -23.485206604003906, -21.88890266418457, -20.292598724365234, -18.6962947845459, -17.099990844726562, -15.503687858581543, -13.907383918762207, -12.311080932617188, -10.714776992797852, -9.118473052978516, -7.52216911315918, -5.925865650177002, -4.329562187194824, -2.7332582473754883, -1.1369543075561523, 0.4593486785888672, 2.055652618408203, 3.651956558227539, 5.248260498046875, 6.844563961029053, 8.44086742401123, 10.037171363830566, 11.633475303649902, 13.229778289794922, 14.826082229614258, 16.422386169433594, 18.01869010925293, 19.614994049072266, 21.21129608154297, 22.807601928710938, 24.40390396118164, 26.000207901000977, 27.596511840820312, 29.19281578063965, 30.789119720458984, 32.38542175292969, 33.981727600097656, 35.57802963256836, 37.17433547973633, 38.77063751220703, 40.366943359375, 41.9632453918457, 43.559547424316406, 45.155853271484375, 46.75215530395508, 48.34846115112305, 49.94476318359375, 51.54106903076172, 53.13737106323242, 54.733673095703125, 56.32997512817383, 57.9262809753418, 59.5225830078125, 61.11888885498047, 62.71519088745117, 64.31149291992188, 65.90779876708984, 67.50410461425781]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 3.0, 6.0, 7.0, 8.0, 10.0, 25.0, 15.0, 16.0, 25.0, 21.0, 32.0, 39.0, 41.0, 45.0, 53.0, 51.0, 52.0, 46.0, 58.0, 48.0, 51.0, 53.0, 52.0, 38.0, 31.0, 35.0, 15.0, 18.0, 17.0, 12.0, 23.0, 9.0, 13.0, 11.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-15.073604583740234, -14.643697738647461, -14.213790893554688, -13.783884048461914, -13.353976249694824, -12.92406940460205, -12.494162559509277, -12.064255714416504, -11.634347915649414, -11.20444107055664, -10.774534225463867, -10.344627380371094, -9.914719581604004, -9.48481273651123, -9.054905891418457, -8.624999046325684, -8.19509220123291, -7.765185356140137, -7.335278034210205, -6.905371189117432, -6.4754638671875, -6.045557022094727, -5.615650177001953, -5.18574333190918, -4.755836009979248, -4.325929164886475, -3.896021842956543, -3.4661149978637695, -3.036207914352417, -2.6063008308410645, -2.176393985748291, -1.7464869022369385, -1.3165807723999023, -0.8866737484931946, -0.4567667245864868, -0.026859760284423828, 0.4030473232269287, 0.8329544067382812, 1.2628612518310547, 1.6927683353424072, 2.1226754188537598, 2.5525825023651123, 2.982489585876465, 3.4123964309692383, 3.842303514480591, 4.272210597991943, 4.702117443084717, 5.132024765014648, 5.561931610107422, 5.991838455200195, 6.421745777130127, 6.8516526222229, 7.281559944152832, 7.7114667892456055, 8.141373634338379, 8.571280479431152, 9.001188278198242, 9.431095123291016, 9.861001968383789, 10.290908813476562, 10.720816612243652, 11.150723457336426, 11.5806303024292, 12.010537147521973, 12.440443992614746]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 10.0, 3.0, 9.0, 15.0, 15.0, 20.0, 30.0, 38.0, 57.0, 71.0, 111.0, 212.0, 317.0, 533.0, 980.0, 1919.0, 4132.0, 10943.0, 40741.0, 3676199.0, 405380.0, 34870.0, 9985.0, 3660.0, 1704.0, 895.0, 511.0, 299.0, 192.0, 122.0, 81.0, 63.0, 37.0, 29.0, 26.0, 21.0, 9.0, 9.0, 11.0, 7.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26953125, -2.196197509765625, -2.12286376953125, -2.049530029296875, -1.9761962890625, -1.902862548828125, -1.82952880859375, -1.756195068359375, -1.682861328125, -1.609527587890625, -1.53619384765625, -1.462860107421875, -1.3895263671875, -1.316192626953125, -1.24285888671875, -1.169525146484375, -1.09619140625, -1.022857666015625, -0.94952392578125, -0.876190185546875, -0.8028564453125, -0.729522705078125, -0.65618896484375, -0.582855224609375, -0.509521484375, -0.436187744140625, -0.36285400390625, -0.289520263671875, -0.2161865234375, -0.142852783203125, -0.06951904296875, 0.003814697265625, 0.0771484375, 0.150482177734375, 0.22381591796875, 0.297149658203125, 0.3704833984375, 0.443817138671875, 0.51715087890625, 0.590484619140625, 0.663818359375, 0.737152099609375, 0.81048583984375, 0.883819580078125, 0.9571533203125, 1.030487060546875, 1.10382080078125, 1.177154541015625, 1.25048828125, 1.323822021484375, 1.39715576171875, 1.470489501953125, 1.5438232421875, 1.617156982421875, 1.69049072265625, 1.763824462890625, 1.837158203125, 1.910491943359375, 1.98382568359375, 2.057159423828125, 2.1304931640625, 2.203826904296875, 2.27716064453125, 2.350494384765625, 2.423828125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 6.0, 4.0, 9.0, 11.0, 11.0, 18.0, 16.0, 20.0, 30.0, 28.0, 27.0, 44.0, 47.0, 54.0, 52.0, 55.0, 56.0, 61.0, 55.0, 58.0, 49.0, 50.0, 48.0, 32.0, 32.0, 27.0, 16.0, 20.0, 16.0, 15.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.703125, -0.67877197265625, -0.6544189453125, -0.63006591796875, -0.605712890625, -0.58135986328125, -0.5570068359375, -0.53265380859375, -0.50830078125, -0.48394775390625, -0.4595947265625, -0.43524169921875, -0.410888671875, -0.38653564453125, -0.3621826171875, -0.33782958984375, -0.3134765625, -0.28912353515625, -0.2647705078125, -0.24041748046875, -0.216064453125, -0.19171142578125, -0.1673583984375, -0.14300537109375, -0.11865234375, -0.09429931640625, -0.0699462890625, -0.04559326171875, -0.021240234375, 0.00311279296875, 0.0274658203125, 0.05181884765625, 0.076171875, 0.10052490234375, 0.1248779296875, 0.14923095703125, 0.173583984375, 0.19793701171875, 0.2222900390625, 0.24664306640625, 0.27099609375, 0.29534912109375, 0.3197021484375, 0.34405517578125, 0.368408203125, 0.39276123046875, 0.4171142578125, 0.44146728515625, 0.4658203125, 0.49017333984375, 0.5145263671875, 0.53887939453125, 0.563232421875, 0.58758544921875, 0.6119384765625, 0.63629150390625, 0.66064453125, 0.68499755859375, 0.7093505859375, 0.73370361328125, 0.758056640625, 0.78240966796875, 0.8067626953125, 0.83111572265625, 0.85546875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 8.0, 18.0, 13.0, 18.0, 31.0, 29.0, 43.0, 54.0, 71.0, 83.0, 108.0, 144.0, 274.0, 1352.0, 20971.0, 4126387.0, 41596.0, 2033.0, 355.0, 159.0, 121.0, 77.0, 81.0, 64.0, 48.0, 33.0, 24.0, 16.0, 16.0, 9.0, 12.0, 7.0, 4.0, 4.0, 4.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.828125, -6.61859130859375, -6.4090576171875, -6.19952392578125, -5.989990234375, -5.78045654296875, -5.5709228515625, -5.36138916015625, -5.15185546875, -4.94232177734375, -4.7327880859375, -4.52325439453125, -4.313720703125, -4.10418701171875, -3.8946533203125, -3.68511962890625, -3.4755859375, -3.26605224609375, -3.0565185546875, -2.84698486328125, -2.637451171875, -2.42791748046875, -2.2183837890625, -2.00885009765625, -1.79931640625, -1.58978271484375, -1.3802490234375, -1.17071533203125, -0.961181640625, -0.75164794921875, -0.5421142578125, -0.33258056640625, -0.123046875, 0.08648681640625, 0.2960205078125, 0.50555419921875, 0.715087890625, 0.92462158203125, 1.1341552734375, 1.34368896484375, 1.55322265625, 1.76275634765625, 1.9722900390625, 2.18182373046875, 2.391357421875, 2.60089111328125, 2.8104248046875, 3.01995849609375, 3.2294921875, 3.43902587890625, 3.6485595703125, 3.85809326171875, 4.067626953125, 4.27716064453125, 4.4866943359375, 4.69622802734375, 4.90576171875, 5.11529541015625, 5.3248291015625, 5.53436279296875, 5.743896484375, 5.95343017578125, 6.1629638671875, 6.37249755859375, 6.58203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 16.0, 32.0, 160.0, 3305.0, 437.0, 73.0, 28.0, 14.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0205078125, -0.9409637451171875, -0.861419677734375, -0.7818756103515625, -0.70233154296875, -0.6227874755859375, -0.543243408203125, -0.4636993408203125, -0.3841552734375, -0.3046112060546875, -0.225067138671875, -0.1455230712890625, -0.06597900390625, 0.0135650634765625, 0.093109130859375, 0.1726531982421875, 0.252197265625, 0.3317413330078125, 0.411285400390625, 0.4908294677734375, 0.57037353515625, 0.6499176025390625, 0.729461669921875, 0.8090057373046875, 0.8885498046875, 0.9680938720703125, 1.047637939453125, 1.1271820068359375, 1.20672607421875, 1.2862701416015625, 1.365814208984375, 1.4453582763671875, 1.52490234375, 1.6044464111328125, 1.683990478515625, 1.7635345458984375, 1.84307861328125, 1.9226226806640625, 2.002166748046875, 2.0817108154296875, 2.1612548828125, 2.2407989501953125, 2.320343017578125, 2.3998870849609375, 2.47943115234375, 2.5589752197265625, 2.638519287109375, 2.7180633544921875, 2.797607421875, 2.8771514892578125, 2.956695556640625, 3.0362396240234375, 3.11578369140625, 3.1953277587890625, 3.274871826171875, 3.3544158935546875, 3.4339599609375, 3.5135040283203125, 3.593048095703125, 3.6725921630859375, 3.75213623046875, 3.8316802978515625, 3.911224365234375, 3.9907684326171875, 4.0703125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 32.0, 77.0, 169.0, 324.0, 231.0, 90.0, 43.0, 15.0, 10.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.60890007019043, -7.257029056549072, -6.905158519744873, -6.553287506103516, -6.201416492462158, -5.849545478820801, -5.497674942016602, -5.145803928375244, -4.793932914733887, -4.442061901092529, -4.09019136428833, -3.7383203506469727, -3.3864493370056152, -3.034578561782837, -2.6827077865600586, -2.330836772918701, -1.978966236114502, -1.627095341682434, -1.2752244472503662, -0.9233536720275879, -0.57148277759552, -0.21961188316345215, 0.13225889205932617, 0.4841299057006836, 0.8360006809234619, 1.1878715753555298, 1.5397424697875977, 1.891613245010376, 2.2434840202331543, 2.5953550338745117, 2.94722580909729, 3.2990968227386475, 3.650967597961426, 4.002838611602783, 4.354709148406982, 4.70658016204834, 5.058451175689697, 5.410322189331055, 5.762192726135254, 6.114063739776611, 6.465934753417969, 6.817805767059326, 7.169676303863525, 7.521547317504883, 7.87341833114624, 8.225289344787598, 8.577159881591797, 8.929031372070312, 9.280900955200195, 9.632771492004395, 9.98464298248291, 10.33651351928711, 10.688384056091309, 11.040255546569824, 11.392126083374023, 11.743997573852539, 12.095868110656738, 12.447738647460938, 12.799610137939453, 13.151480674743652, 13.503351211547852, 13.855222702026367, 14.207093238830566, 14.558963775634766, 14.910835266113281]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 8.0, 9.0, 15.0, 17.0, 18.0, 25.0, 37.0, 51.0, 66.0, 86.0, 77.0, 103.0, 98.0, 79.0, 74.0, 66.0, 50.0, 38.0, 21.0, 20.0, 10.0, 6.0, 6.0, 8.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.232107162475586, -6.0413594245910645, -5.850611686706543, -5.6598639488220215, -5.4691162109375, -5.2783684730529785, -5.087620735168457, -4.8968729972839355, -4.706125259399414, -4.515377521514893, -4.324629783630371, -4.13388204574585, -3.943134307861328, -3.7523865699768066, -3.561638832092285, -3.3708910942077637, -3.180143356323242, -2.9893956184387207, -2.798647880554199, -2.6079001426696777, -2.4171524047851562, -2.2264046669006348, -2.0356569290161133, -1.8449091911315918, -1.6541614532470703, -1.4634137153625488, -1.2726659774780273, -1.0819182395935059, -0.8911705017089844, -0.7004227638244629, -0.5096750259399414, -0.3189272880554199, -0.12818002700805664, 0.06256771087646484, 0.25331544876098633, 0.4440631866455078, 0.6348109245300293, 0.8255586624145508, 1.0163064002990723, 1.2070541381835938, 1.3978018760681152, 1.5885496139526367, 1.7792973518371582, 1.9700450897216797, 2.160792827606201, 2.3515405654907227, 2.542288303375244, 2.7330360412597656, 2.923783779144287, 3.1145315170288086, 3.30527925491333, 3.4960269927978516, 3.686774730682373, 3.8775224685668945, 4.068270206451416, 4.2590179443359375, 4.449765682220459, 4.6405134201049805, 4.831261157989502, 5.022008895874023, 5.212756633758545, 5.403504371643066, 5.594252109527588, 5.784999847412109, 5.975747585296631]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 5.0, 14.0, 15.0, 23.0, 22.0, 68.0, 82.0, 136.0, 250.0, 393.0, 837.0, 1676.0, 3677.0, 8558.0, 22374.0, 62300.0, 173289.0, 343815.0, 264897.0, 104686.0, 37200.0, 13769.0, 5452.0, 2409.0, 1199.0, 599.0, 306.0, 197.0, 107.0, 80.0, 43.0, 22.0, 19.0, 7.0, 11.0, 5.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.640625, -1.58355712890625, -1.5264892578125, -1.46942138671875, -1.412353515625, -1.35528564453125, -1.2982177734375, -1.24114990234375, -1.18408203125, -1.12701416015625, -1.0699462890625, -1.01287841796875, -0.955810546875, -0.89874267578125, -0.8416748046875, -0.78460693359375, -0.7275390625, -0.67047119140625, -0.6134033203125, -0.55633544921875, -0.499267578125, -0.44219970703125, -0.3851318359375, -0.32806396484375, -0.27099609375, -0.21392822265625, -0.1568603515625, -0.09979248046875, -0.042724609375, 0.01434326171875, 0.0714111328125, 0.12847900390625, 0.185546875, 0.24261474609375, 0.2996826171875, 0.35675048828125, 0.413818359375, 0.47088623046875, 0.5279541015625, 0.58502197265625, 0.64208984375, 0.69915771484375, 0.7562255859375, 0.81329345703125, 0.870361328125, 0.92742919921875, 0.9844970703125, 1.04156494140625, 1.0986328125, 1.15570068359375, 1.2127685546875, 1.26983642578125, 1.326904296875, 1.38397216796875, 1.4410400390625, 1.49810791015625, 1.55517578125, 1.61224365234375, 1.6693115234375, 1.72637939453125, 1.783447265625, 1.84051513671875, 1.8975830078125, 1.95465087890625, 2.01171875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 14.0, 10.0, 21.0, 22.0, 17.0, 30.0, 33.0, 49.0, 67.0, 56.0, 82.0, 81.0, 74.0, 73.0, 83.0, 57.0, 58.0, 33.0, 36.0, 22.0, 16.0, 20.0, 10.0, 5.0, 7.0, 5.0, 1.0, 4.0, 2.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1201171875, -1.085174560546875, -1.05023193359375, -1.015289306640625, -0.9803466796875, -0.945404052734375, -0.91046142578125, -0.875518798828125, -0.840576171875, -0.805633544921875, -0.77069091796875, -0.735748291015625, -0.7008056640625, -0.665863037109375, -0.63092041015625, -0.595977783203125, -0.56103515625, -0.526092529296875, -0.49114990234375, -0.456207275390625, -0.4212646484375, -0.386322021484375, -0.35137939453125, -0.316436767578125, -0.281494140625, -0.246551513671875, -0.21160888671875, -0.176666259765625, -0.1417236328125, -0.106781005859375, -0.07183837890625, -0.036895751953125, -0.001953125, 0.032989501953125, 0.06793212890625, 0.102874755859375, 0.1378173828125, 0.172760009765625, 0.20770263671875, 0.242645263671875, 0.277587890625, 0.312530517578125, 0.34747314453125, 0.382415771484375, 0.4173583984375, 0.452301025390625, 0.48724365234375, 0.522186279296875, 0.55712890625, 0.592071533203125, 0.62701416015625, 0.661956787109375, 0.6968994140625, 0.731842041015625, 0.76678466796875, 0.801727294921875, 0.836669921875, 0.871612548828125, 0.90655517578125, 0.941497802734375, 0.9764404296875, 1.011383056640625, 1.04632568359375, 1.081268310546875, 1.1162109375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 9.0, 17.0, 19.0, 38.0, 35.0, 80.0, 127.0, 205.0, 361.0, 753.0, 1628.0, 4797.0, 26692.0, 495410.0, 483969.0, 26391.0, 4729.0, 1655.0, 711.0, 394.0, 210.0, 126.0, 62.0, 34.0, 31.0, 24.0, 10.0, 8.0, 7.0, 3.0, 2.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.20703125, -5.0623779296875, -4.917724609375, -4.7730712890625, -4.62841796875, -4.4837646484375, -4.339111328125, -4.1944580078125, -4.0498046875, -3.9051513671875, -3.760498046875, -3.6158447265625, -3.47119140625, -3.3265380859375, -3.181884765625, -3.0372314453125, -2.892578125, -2.7479248046875, -2.603271484375, -2.4586181640625, -2.31396484375, -2.1693115234375, -2.024658203125, -1.8800048828125, -1.7353515625, -1.5906982421875, -1.446044921875, -1.3013916015625, -1.15673828125, -1.0120849609375, -0.867431640625, -0.7227783203125, -0.578125, -0.4334716796875, -0.288818359375, -0.1441650390625, 0.00048828125, 0.1451416015625, 0.289794921875, 0.4344482421875, 0.5791015625, 0.7237548828125, 0.868408203125, 1.0130615234375, 1.15771484375, 1.3023681640625, 1.447021484375, 1.5916748046875, 1.736328125, 1.8809814453125, 2.025634765625, 2.1702880859375, 2.31494140625, 2.4595947265625, 2.604248046875, 2.7489013671875, 2.8935546875, 3.0382080078125, 3.182861328125, 3.3275146484375, 3.47216796875, 3.6168212890625, 3.761474609375, 3.9061279296875, 4.05078125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 9.0, 3.0, 5.0, 8.0, 18.0, 24.0, 33.0, 47.0, 72.0, 77.0, 101.0, 86.0, 97.0, 95.0, 83.0, 65.0, 58.0, 37.0, 28.0, 16.0, 17.0, 11.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9609375, -4.7655029296875, -4.570068359375, -4.3746337890625, -4.17919921875, -3.9837646484375, -3.788330078125, -3.5928955078125, -3.3974609375, -3.2020263671875, -3.006591796875, -2.8111572265625, -2.61572265625, -2.4202880859375, -2.224853515625, -2.0294189453125, -1.833984375, -1.6385498046875, -1.443115234375, -1.2476806640625, -1.05224609375, -0.8568115234375, -0.661376953125, -0.4659423828125, -0.2705078125, -0.0750732421875, 0.120361328125, 0.3157958984375, 0.51123046875, 0.7066650390625, 0.902099609375, 1.0975341796875, 1.29296875, 1.4884033203125, 1.683837890625, 1.8792724609375, 2.07470703125, 2.2701416015625, 2.465576171875, 2.6610107421875, 2.8564453125, 3.0518798828125, 3.247314453125, 3.4427490234375, 3.63818359375, 3.8336181640625, 4.029052734375, 4.2244873046875, 4.419921875, 4.6153564453125, 4.810791015625, 5.0062255859375, 5.20166015625, 5.3970947265625, 5.592529296875, 5.7879638671875, 5.9833984375, 6.1788330078125, 6.374267578125, 6.5697021484375, 6.76513671875, 6.9605712890625, 7.156005859375, 7.3514404296875, 7.546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 1.0, 8.0, 9.0, 8.0, 22.0, 23.0, 37.0, 54.0, 149.0, 280.0, 811.0, 3745.0, 56106.0, 913943.0, 67662.0, 4180.0, 891.0, 313.0, 121.0, 67.0, 47.0, 19.0, 12.0, 18.0, 5.0, 8.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.947265625, -1.878997802734375, -1.81072998046875, -1.742462158203125, -1.6741943359375, -1.605926513671875, -1.53765869140625, -1.469390869140625, -1.401123046875, -1.332855224609375, -1.26458740234375, -1.196319580078125, -1.1280517578125, -1.059783935546875, -0.99151611328125, -0.923248291015625, -0.85498046875, -0.786712646484375, -0.71844482421875, -0.650177001953125, -0.5819091796875, -0.513641357421875, -0.44537353515625, -0.377105712890625, -0.308837890625, -0.240570068359375, -0.17230224609375, -0.104034423828125, -0.0357666015625, 0.032501220703125, 0.10076904296875, 0.169036865234375, 0.2373046875, 0.305572509765625, 0.37384033203125, 0.442108154296875, 0.5103759765625, 0.578643798828125, 0.64691162109375, 0.715179443359375, 0.783447265625, 0.851715087890625, 0.91998291015625, 0.988250732421875, 1.0565185546875, 1.124786376953125, 1.19305419921875, 1.261322021484375, 1.32958984375, 1.397857666015625, 1.46612548828125, 1.534393310546875, 1.6026611328125, 1.670928955078125, 1.73919677734375, 1.807464599609375, 1.875732421875, 1.944000244140625, 2.01226806640625, 2.080535888671875, 2.1488037109375, 2.217071533203125, 2.28533935546875, 2.353607177734375, 2.421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 11.0, 15.0, 12.0, 10.0, 25.0, 30.0, 39.0, 36.0, 46.0, 77.0, 83.0, 96.0, 94.0, 77.0, 67.0, 58.0, 43.0, 43.0, 27.0, 20.0, 19.0, 12.0, 12.0, 9.0, 9.0, 6.0, 6.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0002117156982421875, -0.00020596943795681, -0.0002002231776714325, -0.000194476917386055, -0.0001887306571006775, -0.0001829843968153, -0.00017723813652992249, -0.00017149187624454498, -0.00016574561595916748, -0.00015999935567378998, -0.00015425309538841248, -0.00014850683510303497, -0.00014276057481765747, -0.00013701431453227997, -0.00013126805424690247, -0.00012552179396152496, -0.00011977553367614746, -0.00011402927339076996, -0.00010828301310539246, -0.00010253675282001495, -9.679049253463745e-05, -9.104423224925995e-05, -8.529797196388245e-05, -7.955171167850494e-05, -7.380545139312744e-05, -6.805919110774994e-05, -6.231293082237244e-05, -5.6566670536994934e-05, -5.082041025161743e-05, -4.507414996623993e-05, -3.932788968086243e-05, -3.3581629395484924e-05, -2.7835369110107422e-05, -2.208910882472992e-05, -1.6342848539352417e-05, -1.0596588253974915e-05, -4.850327968597412e-06, 8.959323167800903e-07, 6.642192602157593e-06, 1.2388452887535095e-05, 1.8134713172912598e-05, 2.38809734582901e-05, 2.9627233743667603e-05, 3.5373494029045105e-05, 4.111975431442261e-05, 4.686601459980011e-05, 5.261227488517761e-05, 5.8358535170555115e-05, 6.410479545593262e-05, 6.985105574131012e-05, 7.559731602668762e-05, 8.134357631206512e-05, 8.708983659744263e-05, 9.283609688282013e-05, 9.858235716819763e-05, 0.00010432861745357513, 0.00011007487773895264, 0.00011582113802433014, 0.00012156739830970764, 0.00012731365859508514, 0.00013305991888046265, 0.00013880617916584015, 0.00014455243945121765, 0.00015029869973659515, 0.00015604496002197266]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 9.0, 0.0, 4.0, 9.0, 16.0, 13.0, 33.0, 43.0, 82.0, 124.0, 223.0, 497.0, 1094.0, 3360.0, 14695.0, 176689.0, 760497.0, 77903.0, 9183.0, 2359.0, 902.0, 367.0, 170.0, 116.0, 64.0, 37.0, 24.0, 13.0, 12.0, 4.0, 8.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.28515625, -1.239837646484375, -1.19451904296875, -1.149200439453125, -1.1038818359375, -1.058563232421875, -1.01324462890625, -0.967926025390625, -0.922607421875, -0.877288818359375, -0.83197021484375, -0.786651611328125, -0.7413330078125, -0.696014404296875, -0.65069580078125, -0.605377197265625, -0.56005859375, -0.514739990234375, -0.46942138671875, -0.424102783203125, -0.3787841796875, -0.333465576171875, -0.28814697265625, -0.242828369140625, -0.197509765625, -0.152191162109375, -0.10687255859375, -0.061553955078125, -0.0162353515625, 0.029083251953125, 0.07440185546875, 0.119720458984375, 0.1650390625, 0.210357666015625, 0.25567626953125, 0.300994873046875, 0.3463134765625, 0.391632080078125, 0.43695068359375, 0.482269287109375, 0.527587890625, 0.572906494140625, 0.61822509765625, 0.663543701171875, 0.7088623046875, 0.754180908203125, 0.79949951171875, 0.844818115234375, 0.89013671875, 0.935455322265625, 0.98077392578125, 1.026092529296875, 1.0714111328125, 1.116729736328125, 1.16204833984375, 1.207366943359375, 1.252685546875, 1.298004150390625, 1.34332275390625, 1.388641357421875, 1.4339599609375, 1.479278564453125, 1.52459716796875, 1.569915771484375, 1.615234375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 18.0, 19.0, 32.0, 47.0, 56.0, 84.0, 93.0, 121.0, 128.0, 107.0, 85.0, 71.0, 47.0, 25.0, 20.0, 11.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.57421875, -1.5253143310546875, -1.476409912109375, -1.4275054931640625, -1.37860107421875, -1.3296966552734375, -1.280792236328125, -1.2318878173828125, -1.1829833984375, -1.1340789794921875, -1.085174560546875, -1.0362701416015625, -0.98736572265625, -0.9384613037109375, -0.889556884765625, -0.8406524658203125, -0.791748046875, -0.7428436279296875, -0.693939208984375, -0.6450347900390625, -0.59613037109375, -0.5472259521484375, -0.498321533203125, -0.4494171142578125, -0.4005126953125, -0.3516082763671875, -0.302703857421875, -0.2537994384765625, -0.20489501953125, -0.1559906005859375, -0.107086181640625, -0.0581817626953125, -0.00927734375, 0.0396270751953125, 0.088531494140625, 0.1374359130859375, 0.18634033203125, 0.2352447509765625, 0.284149169921875, 0.3330535888671875, 0.3819580078125, 0.4308624267578125, 0.479766845703125, 0.5286712646484375, 0.57757568359375, 0.6264801025390625, 0.675384521484375, 0.7242889404296875, 0.773193359375, 0.8220977783203125, 0.871002197265625, 0.9199066162109375, 0.96881103515625, 1.0177154541015625, 1.066619873046875, 1.1155242919921875, 1.1644287109375, 1.2133331298828125, 1.262237548828125, 1.3111419677734375, 1.36004638671875, 1.4089508056640625, 1.457855224609375, 1.5067596435546875, 1.5556640625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 6.0, 8.0, 6.0, 20.0, 16.0, 61.0, 88.0, 96.0, 157.0, 150.0, 150.0, 82.0, 68.0, 42.0, 25.0, 13.0, 8.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.493077278137207, -12.710075378417969, -11.927074432373047, -11.144072532653809, -10.36107063293457, -9.578068733215332, -8.795066833496094, -8.012065887451172, -7.229063987731934, -6.446062088012695, -5.663060665130615, -4.880059242248535, -4.097057342529297, -3.3140556812286377, -2.5310540199279785, -1.7480525970458984, -0.9650506973266602, -0.18204903602600098, 0.6009526252746582, 1.3839542865753174, 2.1669559478759766, 2.9499576091766357, 3.732959270477295, 4.515960693359375, 5.298962593078613, 6.081964492797852, 6.864965915679932, 7.647967338562012, 8.43096923828125, 9.213971138000488, 9.996973037719727, 10.779973983764648, 11.562976837158203, 12.345978736877441, 13.12898063659668, 13.911981582641602, 14.69498348236084, 15.477985382080078, 16.260986328125, 17.043987274169922, 17.826990127563477, 18.6099910736084, 19.392993927001953, 20.175994873046875, 20.958995819091797, 21.74199867248535, 22.524999618530273, 23.308002471923828, 24.09100341796875, 24.874004364013672, 25.657007217407227, 26.44000816345215, 27.223011016845703, 28.006011962890625, 28.789012908935547, 29.57201385498047, 30.355016708374023, 31.138017654418945, 31.9210205078125, 32.70402145385742, 33.487022399902344, 34.270023345947266, 35.05302810668945, 35.836029052734375, 36.6190299987793]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 7.0, 7.0, 7.0, 17.0, 9.0, 14.0, 17.0, 15.0, 23.0, 28.0, 22.0, 35.0, 38.0, 52.0, 48.0, 56.0, 57.0, 47.0, 61.0, 51.0, 53.0, 35.0, 44.0, 40.0, 33.0, 28.0, 20.0, 22.0, 16.0, 20.0, 15.0, 15.0, 6.0, 8.0, 6.0, 10.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-19.971073150634766, -19.428203582763672, -18.885332107543945, -18.34246253967285, -17.799591064453125, -17.25672149658203, -16.713850021362305, -16.17098045349121, -15.6281099319458, -15.08523941040039, -14.54236888885498, -13.99949836730957, -13.456628799438477, -12.91375732421875, -12.370887756347656, -11.828017234802246, -11.285146713256836, -10.742276191711426, -10.199405670166016, -9.656535148620605, -9.113664627075195, -8.570795059204102, -8.027924537658691, -7.485054016113281, -6.942183494567871, -6.399312973022461, -5.856442451477051, -5.313572406768799, -4.770701885223389, -4.2278313636779785, -3.6849610805511475, -3.1420907974243164, -2.59921932220459, -2.0563488006591797, -1.5134785175323486, -0.970608115196228, -0.4277377128601074, 0.11513280868530273, 0.6580030918121338, 1.2008733749389648, 1.743743896484375, 2.286614418029785, 2.829484701156616, 3.3723549842834473, 3.9152255058288574, 4.458096027374268, 5.0009660720825195, 5.54383659362793, 6.08670711517334, 6.62957763671875, 7.17244815826416, 7.715318202972412, 8.258188247680664, 8.80105972290039, 9.343929290771484, 9.886799812316895, 10.429670333862305, 10.972540855407715, 11.515411376953125, 12.058281898498535, 12.601152420043945, 13.144021987915039, 13.68689250946045, 14.22976303100586, 14.77263355255127]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 9.0, 13.0, 20.0, 28.0, 45.0, 40.0, 76.0, 96.0, 171.0, 225.0, 385.0, 549.0, 958.0, 1603.0, 3143.0, 6553.0, 16224.0, 52841.0, 381845.0, 3438502.0, 224179.0, 41242.0, 13433.0, 5646.0, 2698.0, 1412.0, 843.0, 514.0, 321.0, 202.0, 138.0, 86.0, 74.0, 46.0, 29.0, 27.0, 20.0, 10.0, 8.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6015625, -1.547088623046875, -1.49261474609375, -1.438140869140625, -1.3836669921875, -1.329193115234375, -1.27471923828125, -1.220245361328125, -1.165771484375, -1.111297607421875, -1.05682373046875, -1.002349853515625, -0.9478759765625, -0.893402099609375, -0.83892822265625, -0.784454345703125, -0.72998046875, -0.675506591796875, -0.62103271484375, -0.566558837890625, -0.5120849609375, -0.457611083984375, -0.40313720703125, -0.348663330078125, -0.294189453125, -0.239715576171875, -0.18524169921875, -0.130767822265625, -0.0762939453125, -0.021820068359375, 0.03265380859375, 0.087127685546875, 0.1416015625, 0.196075439453125, 0.25054931640625, 0.305023193359375, 0.3594970703125, 0.413970947265625, 0.46844482421875, 0.522918701171875, 0.577392578125, 0.631866455078125, 0.68634033203125, 0.740814208984375, 0.7952880859375, 0.849761962890625, 0.90423583984375, 0.958709716796875, 1.01318359375, 1.067657470703125, 1.12213134765625, 1.176605224609375, 1.2310791015625, 1.285552978515625, 1.34002685546875, 1.394500732421875, 1.448974609375, 1.503448486328125, 1.55792236328125, 1.612396240234375, 1.6668701171875, 1.721343994140625, 1.77581787109375, 1.830291748046875, 1.884765625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 7.0, 11.0, 21.0, 25.0, 33.0, 36.0, 51.0, 60.0, 55.0, 89.0, 94.0, 92.0, 80.0, 70.0, 48.0, 48.0, 38.0, 40.0, 28.0, 25.0, 16.0, 12.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.458984375, -1.425994873046875, -1.39300537109375, -1.360015869140625, -1.3270263671875, -1.294036865234375, -1.26104736328125, -1.228057861328125, -1.195068359375, -1.162078857421875, -1.12908935546875, -1.096099853515625, -1.0631103515625, -1.030120849609375, -0.99713134765625, -0.964141845703125, -0.93115234375, -0.898162841796875, -0.86517333984375, -0.832183837890625, -0.7991943359375, -0.766204833984375, -0.73321533203125, -0.700225830078125, -0.667236328125, -0.634246826171875, -0.60125732421875, -0.568267822265625, -0.5352783203125, -0.502288818359375, -0.46929931640625, -0.436309814453125, -0.4033203125, -0.370330810546875, -0.33734130859375, -0.304351806640625, -0.2713623046875, -0.238372802734375, -0.20538330078125, -0.172393798828125, -0.139404296875, -0.106414794921875, -0.07342529296875, -0.040435791015625, -0.0074462890625, 0.025543212890625, 0.05853271484375, 0.091522216796875, 0.12451171875, 0.157501220703125, 0.19049072265625, 0.223480224609375, 0.2564697265625, 0.289459228515625, 0.32244873046875, 0.355438232421875, 0.388427734375, 0.421417236328125, 0.45440673828125, 0.487396240234375, 0.5203857421875, 0.553375244140625, 0.58636474609375, 0.619354248046875, 0.65234375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 7.0, 11.0, 15.0, 18.0, 26.0, 47.0, 77.0, 177.0, 422.0, 1103.0, 4306.0, 24159.0, 313242.0, 3743988.0, 91562.0, 11545.0, 2374.0, 644.0, 261.0, 127.0, 56.0, 32.0, 22.0, 21.0, 11.0, 11.0, 10.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.068359375, -2.96710205078125, -2.8658447265625, -2.76458740234375, -2.663330078125, -2.56207275390625, -2.4608154296875, -2.35955810546875, -2.25830078125, -2.15704345703125, -2.0557861328125, -1.95452880859375, -1.853271484375, -1.75201416015625, -1.6507568359375, -1.54949951171875, -1.4482421875, -1.34698486328125, -1.2457275390625, -1.14447021484375, -1.043212890625, -0.94195556640625, -0.8406982421875, -0.73944091796875, -0.63818359375, -0.53692626953125, -0.4356689453125, -0.33441162109375, -0.233154296875, -0.13189697265625, -0.0306396484375, 0.07061767578125, 0.171875, 0.27313232421875, 0.3743896484375, 0.47564697265625, 0.576904296875, 0.67816162109375, 0.7794189453125, 0.88067626953125, 0.98193359375, 1.08319091796875, 1.1844482421875, 1.28570556640625, 1.386962890625, 1.48822021484375, 1.5894775390625, 1.69073486328125, 1.7919921875, 1.89324951171875, 1.9945068359375, 2.09576416015625, 2.197021484375, 2.29827880859375, 2.3995361328125, 2.50079345703125, 2.60205078125, 2.70330810546875, 2.8045654296875, 2.90582275390625, 3.007080078125, 3.10833740234375, 3.2095947265625, 3.31085205078125, 3.412109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 12.0, 12.0, 14.0, 27.0, 31.0, 66.0, 90.0, 182.0, 461.0, 1615.0, 944.0, 291.0, 126.0, 67.0, 46.0, 23.0, 15.0, 16.0, 6.0, 4.0, 6.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.486328125, -3.396331787109375, -3.30633544921875, -3.216339111328125, -3.1263427734375, -3.036346435546875, -2.94635009765625, -2.856353759765625, -2.766357421875, -2.676361083984375, -2.58636474609375, -2.496368408203125, -2.4063720703125, -2.316375732421875, -2.22637939453125, -2.136383056640625, -2.04638671875, -1.956390380859375, -1.86639404296875, -1.776397705078125, -1.6864013671875, -1.596405029296875, -1.50640869140625, -1.416412353515625, -1.326416015625, -1.236419677734375, -1.14642333984375, -1.056427001953125, -0.9664306640625, -0.876434326171875, -0.78643798828125, -0.696441650390625, -0.6064453125, -0.516448974609375, -0.42645263671875, -0.336456298828125, -0.2464599609375, -0.156463623046875, -0.06646728515625, 0.023529052734375, 0.113525390625, 0.203521728515625, 0.29351806640625, 0.383514404296875, 0.4735107421875, 0.563507080078125, 0.65350341796875, 0.743499755859375, 0.83349609375, 0.923492431640625, 1.01348876953125, 1.103485107421875, 1.1934814453125, 1.283477783203125, 1.37347412109375, 1.463470458984375, 1.553466796875, 1.643463134765625, 1.73345947265625, 1.823455810546875, 1.9134521484375, 2.003448486328125, 2.09344482421875, 2.183441162109375, 2.2734375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 12.0, 15.0, 35.0, 62.0, 118.0, 170.0, 202.0, 147.0, 96.0, 67.0, 35.0, 12.0, 10.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.216615676879883, -22.61217498779297, -22.007732391357422, -21.403291702270508, -20.798851013183594, -20.194408416748047, -19.589967727661133, -18.98552703857422, -18.381084442138672, -17.776643753051758, -17.17220115661621, -16.567760467529297, -15.963318824768066, -15.358877182006836, -14.754436492919922, -14.149994850158691, -13.545553207397461, -12.94111156463623, -12.336669921875, -11.732229232788086, -11.127787590026855, -10.523345947265625, -9.918905258178711, -9.31446361541748, -8.71002197265625, -8.10558032989502, -7.501139163970947, -6.896697998046875, -6.2922563552856445, -5.687814712524414, -5.083373546600342, -4.4789323806762695, -3.8744897842407227, -3.2700483798980713, -2.66560697555542, -2.0611655712127686, -1.4567241668701172, -0.8522827625274658, -0.24784135818481445, 0.3565998077392578, 0.9610414505004883, 1.5654828548431396, 2.169924259185791, 2.7743656635284424, 3.3788070678710938, 3.983248472213745, 4.5876898765563965, 5.192131042480469, 5.796572685241699, 6.40101432800293, 7.005455493927002, 7.609896659851074, 8.214338302612305, 8.818779945373535, 9.423221588134766, 10.02766227722168, 10.63210391998291, 11.23654556274414, 11.840986251831055, 12.445427894592285, 13.049869537353516, 13.654311180114746, 14.258752822875977, 14.86319351196289, 15.467635154724121]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 2.0, 13.0, 7.0, 10.0, 25.0, 32.0, 21.0, 39.0, 41.0, 49.0, 48.0, 37.0, 57.0, 65.0, 68.0, 57.0, 59.0, 51.0, 44.0, 38.0, 38.0, 38.0, 33.0, 25.0, 19.0, 15.0, 15.0, 15.0, 8.0, 8.0, 7.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.658726692199707, -8.326745986938477, -7.994765758514404, -7.662785053253174, -7.330804824829102, -6.998824119567871, -6.666843414306641, -6.33486270904541, -6.002882480621338, -5.670901775360107, -5.338921546936035, -5.006940841674805, -4.674960136413574, -4.342979907989502, -4.0109992027282715, -3.67901873588562, -3.3470382690429688, -3.0150578022003174, -2.683077335357666, -2.3510966300964355, -2.019116163253784, -1.6871356964111328, -1.355155110359192, -1.023174524307251, -0.6911940574645996, -0.35921353101730347, -0.027233004570007324, 0.3047475218772888, 0.636728048324585, 0.9687085151672363, 1.3006891012191772, 1.6326696872711182, 1.964651107788086, 2.2966315746307373, 2.6286120414733887, 2.960592746734619, 3.2925732135772705, 3.624553680419922, 3.9565343856811523, 4.288515090942383, 4.620495319366455, 4.9524760246276855, 5.284456253051758, 5.616436958312988, 5.948417663574219, 6.280397891998291, 6.6123785972595215, 6.944358825683594, 7.276339530944824, 7.608320236206055, 7.940300464630127, 8.2722806930542, 8.60426139831543, 8.93624210357666, 9.26822280883789, 9.600203514099121, 9.932184219360352, 10.264164924621582, 10.596145629882812, 10.928125381469727, 11.260106086730957, 11.592086791992188, 11.924067497253418, 12.256048202514648, 12.588027954101562]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 9.0, 6.0, 8.0, 19.0, 24.0, 32.0, 50.0, 70.0, 119.0, 173.0, 261.0, 517.0, 832.0, 1553.0, 3109.0, 6451.0, 14397.0, 31671.0, 74086.0, 168985.0, 304422.0, 241089.0, 112237.0, 48518.0, 21053.0, 9507.0, 4425.0, 2195.0, 1169.0, 629.0, 338.0, 210.0, 147.0, 76.0, 56.0, 42.0, 28.0, 14.0, 13.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.341796875, -1.29815673828125, -1.2545166015625, -1.21087646484375, -1.167236328125, -1.12359619140625, -1.0799560546875, -1.03631591796875, -0.99267578125, -0.94903564453125, -0.9053955078125, -0.86175537109375, -0.818115234375, -0.77447509765625, -0.7308349609375, -0.68719482421875, -0.6435546875, -0.59991455078125, -0.5562744140625, -0.51263427734375, -0.468994140625, -0.42535400390625, -0.3817138671875, -0.33807373046875, -0.29443359375, -0.25079345703125, -0.2071533203125, -0.16351318359375, -0.119873046875, -0.07623291015625, -0.0325927734375, 0.01104736328125, 0.0546875, 0.09832763671875, 0.1419677734375, 0.18560791015625, 0.229248046875, 0.27288818359375, 0.3165283203125, 0.36016845703125, 0.40380859375, 0.44744873046875, 0.4910888671875, 0.53472900390625, 0.578369140625, 0.62200927734375, 0.6656494140625, 0.70928955078125, 0.7529296875, 0.79656982421875, 0.8402099609375, 0.88385009765625, 0.927490234375, 0.97113037109375, 1.0147705078125, 1.05841064453125, 1.10205078125, 1.14569091796875, 1.1893310546875, 1.23297119140625, 1.276611328125, 1.32025146484375, 1.3638916015625, 1.40753173828125, 1.451171875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 7.0, 6.0, 7.0, 11.0, 9.0, 13.0, 10.0, 29.0, 16.0, 35.0, 28.0, 28.0, 44.0, 56.0, 68.0, 48.0, 58.0, 62.0, 50.0, 49.0, 34.0, 53.0, 32.0, 41.0, 31.0, 32.0, 33.0, 26.0, 21.0, 16.0, 10.0, 11.0, 9.0, 10.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69091796875, -0.6677703857421875, -0.644622802734375, -0.6214752197265625, -0.59832763671875, -0.5751800537109375, -0.552032470703125, -0.5288848876953125, -0.5057373046875, -0.4825897216796875, -0.459442138671875, -0.4362945556640625, -0.41314697265625, -0.3899993896484375, -0.366851806640625, -0.3437042236328125, -0.320556640625, -0.2974090576171875, -0.274261474609375, -0.2511138916015625, -0.22796630859375, -0.2048187255859375, -0.181671142578125, -0.1585235595703125, -0.1353759765625, -0.1122283935546875, -0.089080810546875, -0.0659332275390625, -0.04278564453125, -0.0196380615234375, 0.003509521484375, 0.0266571044921875, 0.0498046875, 0.0729522705078125, 0.096099853515625, 0.1192474365234375, 0.14239501953125, 0.1655426025390625, 0.188690185546875, 0.2118377685546875, 0.2349853515625, 0.2581329345703125, 0.281280517578125, 0.3044281005859375, 0.32757568359375, 0.3507232666015625, 0.373870849609375, 0.3970184326171875, 0.420166015625, 0.4433135986328125, 0.466461181640625, 0.4896087646484375, 0.51275634765625, 0.5359039306640625, 0.559051513671875, 0.5821990966796875, 0.6053466796875, 0.6284942626953125, 0.651641845703125, 0.6747894287109375, 0.69793701171875, 0.7210845947265625, 0.744232177734375, 0.7673797607421875, 0.79052734375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 5.0, 6.0, 6.0, 9.0, 19.0, 13.0, 22.0, 47.0, 64.0, 65.0, 126.0, 172.0, 277.0, 543.0, 918.0, 1874.0, 4862.0, 20427.0, 177775.0, 719470.0, 100769.0, 13769.0, 3823.0, 1513.0, 776.0, 426.0, 273.0, 172.0, 105.0, 64.0, 54.0, 41.0, 20.0, 18.0, 14.0, 7.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.40234375, -3.3004150390625, -3.198486328125, -3.0965576171875, -2.99462890625, -2.8927001953125, -2.790771484375, -2.6888427734375, -2.5869140625, -2.4849853515625, -2.383056640625, -2.2811279296875, -2.17919921875, -2.0772705078125, -1.975341796875, -1.8734130859375, -1.771484375, -1.6695556640625, -1.567626953125, -1.4656982421875, -1.36376953125, -1.2618408203125, -1.159912109375, -1.0579833984375, -0.9560546875, -0.8541259765625, -0.752197265625, -0.6502685546875, -0.54833984375, -0.4464111328125, -0.344482421875, -0.2425537109375, -0.140625, -0.0386962890625, 0.063232421875, 0.1651611328125, 0.26708984375, 0.3690185546875, 0.470947265625, 0.5728759765625, 0.6748046875, 0.7767333984375, 0.878662109375, 0.9805908203125, 1.08251953125, 1.1844482421875, 1.286376953125, 1.3883056640625, 1.490234375, 1.5921630859375, 1.694091796875, 1.7960205078125, 1.89794921875, 1.9998779296875, 2.101806640625, 2.2037353515625, 2.3056640625, 2.4075927734375, 2.509521484375, 2.6114501953125, 2.71337890625, 2.8153076171875, 2.917236328125, 3.0191650390625, 3.12109375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 8.0, 5.0, 12.0, 10.0, 21.0, 9.0, 18.0, 21.0, 22.0, 33.0, 26.0, 28.0, 21.0, 33.0, 34.0, 34.0, 50.0, 48.0, 43.0, 43.0, 51.0, 48.0, 49.0, 36.0, 48.0, 33.0, 32.0, 26.0, 25.0, 23.0, 18.0, 13.0, 15.0, 19.0, 10.0, 8.0, 6.0, 1.0, 1.0, 5.0, 4.0, 2.0, 7.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.395294189453125, -2.30621337890625, -2.217132568359375, -2.1280517578125, -2.038970947265625, -1.94989013671875, -1.860809326171875, -1.771728515625, -1.682647705078125, -1.59356689453125, -1.504486083984375, -1.4154052734375, -1.326324462890625, -1.23724365234375, -1.148162841796875, -1.05908203125, -0.970001220703125, -0.88092041015625, -0.791839599609375, -0.7027587890625, -0.613677978515625, -0.52459716796875, -0.435516357421875, -0.346435546875, -0.257354736328125, -0.16827392578125, -0.079193115234375, 0.0098876953125, 0.098968505859375, 0.18804931640625, 0.277130126953125, 0.3662109375, 0.455291748046875, 0.54437255859375, 0.633453369140625, 0.7225341796875, 0.811614990234375, 0.90069580078125, 0.989776611328125, 1.078857421875, 1.167938232421875, 1.25701904296875, 1.346099853515625, 1.4351806640625, 1.524261474609375, 1.61334228515625, 1.702423095703125, 1.79150390625, 1.880584716796875, 1.96966552734375, 2.058746337890625, 2.1478271484375, 2.236907958984375, 2.32598876953125, 2.415069580078125, 2.504150390625, 2.593231201171875, 2.68231201171875, 2.771392822265625, 2.8604736328125, 2.949554443359375, 3.03863525390625, 3.127716064453125, 3.216796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 2.0, 14.0, 11.0, 17.0, 30.0, 49.0, 74.0, 113.0, 170.0, 272.0, 558.0, 1235.0, 3172.0, 11951.0, 80550.0, 772863.0, 152236.0, 17895.0, 4224.0, 1483.0, 715.0, 362.0, 200.0, 118.0, 64.0, 45.0, 35.0, 16.0, 22.0, 12.0, 11.0, 11.0, 4.0, 6.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.6689453125, -1.6245880126953125, -1.580230712890625, -1.5358734130859375, -1.49151611328125, -1.4471588134765625, -1.402801513671875, -1.3584442138671875, -1.3140869140625, -1.2697296142578125, -1.225372314453125, -1.1810150146484375, -1.13665771484375, -1.0923004150390625, -1.047943115234375, -1.0035858154296875, -0.959228515625, -0.9148712158203125, -0.870513916015625, -0.8261566162109375, -0.78179931640625, -0.7374420166015625, -0.693084716796875, -0.6487274169921875, -0.6043701171875, -0.5600128173828125, -0.515655517578125, -0.4712982177734375, -0.42694091796875, -0.3825836181640625, -0.338226318359375, -0.2938690185546875, -0.24951171875, -0.2051544189453125, -0.160797119140625, -0.1164398193359375, -0.07208251953125, -0.0277252197265625, 0.016632080078125, 0.0609893798828125, 0.1053466796875, 0.1497039794921875, 0.194061279296875, 0.2384185791015625, 0.28277587890625, 0.3271331787109375, 0.371490478515625, 0.4158477783203125, 0.460205078125, 0.5045623779296875, 0.548919677734375, 0.5932769775390625, 0.63763427734375, 0.6819915771484375, 0.726348876953125, 0.7707061767578125, 0.8150634765625, 0.8594207763671875, 0.903778076171875, 0.9481353759765625, 0.99249267578125, 1.0368499755859375, 1.081207275390625, 1.1255645751953125, 1.169921875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 10.0, 9.0, 10.0, 13.0, 16.0, 13.0, 24.0, 36.0, 29.0, 46.0, 47.0, 74.0, 69.0, 102.0, 85.0, 89.0, 65.0, 37.0, 38.0, 30.0, 28.0, 24.0, 22.0, 11.0, 10.0, 13.0, 5.0, 6.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015103816986083984, -0.00014526955783367157, -0.0001395009458065033, -0.00013373233377933502, -0.00012796372175216675, -0.00012219510972499847, -0.0001164264976978302, -0.00011065788567066193, -0.00010488927364349365, -9.912066161632538e-05, -9.33520495891571e-05, -8.758343756198883e-05, -8.181482553482056e-05, -7.604621350765228e-05, -7.027760148048401e-05, -6.450898945331573e-05, -5.874037742614746e-05, -5.297176539897919e-05, -4.720315337181091e-05, -4.143454134464264e-05, -3.5665929317474365e-05, -2.989731729030609e-05, -2.4128705263137817e-05, -1.8360093235969543e-05, -1.259148120880127e-05, -6.822869181632996e-06, -1.0542571544647217e-06, 4.714354872703552e-06, 1.0482966899871826e-05, 1.62515789270401e-05, 2.2020190954208374e-05, 2.7788802981376648e-05, 3.355741500854492e-05, 3.9326027035713196e-05, 4.509463906288147e-05, 5.0863251090049744e-05, 5.663186311721802e-05, 6.240047514438629e-05, 6.816908717155457e-05, 7.393769919872284e-05, 7.970631122589111e-05, 8.547492325305939e-05, 9.124353528022766e-05, 9.701214730739594e-05, 0.00010278075933456421, 0.00010854937136173248, 0.00011431798338890076, 0.00012008659541606903, 0.0001258552074432373, 0.00013162381947040558, 0.00013739243149757385, 0.00014316104352474213, 0.0001489296555519104, 0.00015469826757907867, 0.00016046687960624695, 0.00016623549163341522, 0.0001720041036605835, 0.00017777271568775177, 0.00018354132771492004, 0.00018930993974208832, 0.0001950785517692566, 0.00020084716379642487, 0.00020661577582359314, 0.00021238438785076141, 0.0002181529998779297]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 4.0, 9.0, 27.0, 24.0, 48.0, 74.0, 88.0, 187.0, 326.0, 746.0, 1652.0, 5338.0, 29599.0, 409100.0, 557193.0, 34714.0, 5974.0, 1790.0, 786.0, 380.0, 213.0, 108.0, 63.0, 34.0, 22.0, 18.0, 11.0, 5.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2329254150390625, -1.185577392578125, -1.1382293701171875, -1.09088134765625, -1.0435333251953125, -0.996185302734375, -0.9488372802734375, -0.9014892578125, -0.8541412353515625, -0.806793212890625, -0.7594451904296875, -0.71209716796875, -0.6647491455078125, -0.617401123046875, -0.5700531005859375, -0.522705078125, -0.4753570556640625, -0.428009033203125, -0.3806610107421875, -0.33331298828125, -0.2859649658203125, -0.238616943359375, -0.1912689208984375, -0.1439208984375, -0.0965728759765625, -0.049224853515625, -0.0018768310546875, 0.04547119140625, 0.0928192138671875, 0.140167236328125, 0.1875152587890625, 0.23486328125, 0.2822113037109375, 0.329559326171875, 0.3769073486328125, 0.42425537109375, 0.4716033935546875, 0.518951416015625, 0.5662994384765625, 0.6136474609375, 0.6609954833984375, 0.708343505859375, 0.7556915283203125, 0.80303955078125, 0.8503875732421875, 0.897735595703125, 0.9450836181640625, 0.992431640625, 1.0397796630859375, 1.087127685546875, 1.1344757080078125, 1.18182373046875, 1.2291717529296875, 1.276519775390625, 1.3238677978515625, 1.3712158203125, 1.4185638427734375, 1.465911865234375, 1.5132598876953125, 1.56060791015625, 1.6079559326171875, 1.655303955078125, 1.7026519775390625, 1.75]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 6.0, 5.0, 7.0, 13.0, 16.0, 19.0, 22.0, 42.0, 41.0, 54.0, 81.0, 80.0, 108.0, 104.0, 74.0, 72.0, 62.0, 42.0, 25.0, 19.0, 25.0, 21.0, 14.0, 8.0, 7.0, 9.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.62109375, -1.5816268920898438, -1.5421600341796875, -1.5026931762695312, -1.463226318359375, -1.4237594604492188, -1.3842926025390625, -1.3448257446289062, -1.30535888671875, -1.2658920288085938, -1.2264251708984375, -1.1869583129882812, -1.147491455078125, -1.1080245971679688, -1.0685577392578125, -1.0290908813476562, -0.9896240234375, -0.9501571655273438, -0.9106903076171875, -0.8712234497070312, -0.831756591796875, -0.7922897338867188, -0.7528228759765625, -0.7133560180664062, -0.67388916015625, -0.6344223022460938, -0.5949554443359375, -0.5554885864257812, -0.516021728515625, -0.47655487060546875, -0.4370880126953125, -0.39762115478515625, -0.358154296875, -0.31868743896484375, -0.2792205810546875, -0.23975372314453125, -0.200286865234375, -0.16082000732421875, -0.1213531494140625, -0.08188629150390625, -0.04241943359375, -0.00295257568359375, 0.0365142822265625, 0.07598114013671875, 0.115447998046875, 0.15491485595703125, 0.1943817138671875, 0.23384857177734375, 0.2733154296875, 0.31278228759765625, 0.3522491455078125, 0.39171600341796875, 0.431182861328125, 0.47064971923828125, 0.5101165771484375, 0.5495834350585938, 0.58905029296875, 0.6285171508789062, 0.6679840087890625, 0.7074508666992188, 0.746917724609375, 0.7863845825195312, 0.8258514404296875, 0.8653182983398438, 0.90478515625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 18.0, 56.0, 137.0, 323.0, 264.0, 134.0, 33.0, 20.0, 9.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.43658447265625, -13.213057518005371, -11.989530563354492, -10.766002655029297, -9.542476654052734, -8.318948745727539, -7.09542179107666, -5.871894836425781, -4.648367881774902, -3.4248409271240234, -2.2013137340545654, -0.9777865409851074, 0.24574041366577148, 1.4692673683166504, 2.6927947998046875, 3.9163217544555664, 5.139848709106445, 6.363375663757324, 7.586902618408203, 8.810430526733398, 10.033956527709961, 11.257484436035156, 12.481011390686035, 13.704538345336914, 14.928065299987793, 16.151592254638672, 17.375120162963867, 18.59864616394043, 19.822174072265625, 21.045700073242188, 22.269227981567383, 23.492755889892578, 24.71628189086914, 25.939809799194336, 27.1633358001709, 28.386863708496094, 29.610389709472656, 30.83391761779785, 32.05744552612305, 33.28097152709961, 34.50449752807617, 35.728023529052734, 36.95155334472656, 38.175079345703125, 39.39860534667969, 40.62213134765625, 41.84566116333008, 43.06918716430664, 44.29271697998047, 45.51624298095703, 46.73977279663086, 47.96329879760742, 49.186824798583984, 50.41035079956055, 51.633880615234375, 52.85740661621094, 54.0809326171875, 55.30445861816406, 56.52798843383789, 57.75151443481445, 58.975040435791016, 60.19856643676758, 61.422096252441406, 62.64562225341797, 63.86914825439453]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 6.0, 4.0, 7.0, 11.0, 8.0, 11.0, 21.0, 46.0, 39.0, 33.0, 53.0, 65.0, 69.0, 80.0, 89.0, 71.0, 58.0, 46.0, 38.0, 37.0, 46.0, 34.0, 22.0, 24.0, 16.0, 14.0, 13.0, 11.0, 6.0, 5.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.751739501953125, -11.231823921203613, -10.711908340454102, -10.19199275970459, -9.672077178955078, -9.152161598205566, -8.632246017456055, -8.112329483032227, -7.592414379119873, -7.072498798370361, -6.55258321762085, -6.03266716003418, -5.512751579284668, -4.992835998535156, -4.4729204177856445, -3.953004837036133, -3.433089256286621, -2.9131736755371094, -2.3932580947875977, -1.8733422756195068, -1.3534266948699951, -0.8335111141204834, -0.3135952949523926, 0.20632028579711914, 0.7262358665466309, 1.2461514472961426, 1.7660671472549438, 2.285982847213745, 2.805898427963257, 3.3258140087127686, 3.8457298278808594, 4.365645408630371, 4.885560989379883, 5.4054765701293945, 5.925392150878906, 6.445307731628418, 6.96522331237793, 7.485138893127441, 8.005054473876953, 8.524971008300781, 9.044885635375977, 9.564801216125488, 10.084716796875, 10.604632377624512, 11.124547958374023, 11.644463539123535, 12.164379119873047, 12.684295654296875, 13.204211235046387, 13.724126815795898, 14.24404239654541, 14.763957977294922, 15.283873558044434, 15.803789138793945, 16.323705673217773, 16.84362030029297, 17.363536834716797, 17.883453369140625, 18.40336799621582, 18.92328453063965, 19.443199157714844, 19.963115692138672, 20.483030319213867, 21.002946853637695, 21.52286148071289]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 12.0, 15.0, 11.0, 16.0, 19.0, 19.0, 47.0, 38.0, 66.0, 83.0, 116.0, 151.0, 283.0, 678.0, 2367.0, 11775.0, 127311.0, 3897709.0, 137602.0, 11780.0, 2342.0, 784.0, 344.0, 205.0, 104.0, 84.0, 70.0, 53.0, 37.0, 37.0, 22.0, 19.0, 23.0, 11.0, 11.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.927734375, -2.831787109375, -2.73583984375, -2.639892578125, -2.5439453125, -2.447998046875, -2.35205078125, -2.256103515625, -2.16015625, -2.064208984375, -1.96826171875, -1.872314453125, -1.7763671875, -1.680419921875, -1.58447265625, -1.488525390625, -1.392578125, -1.296630859375, -1.20068359375, -1.104736328125, -1.0087890625, -0.912841796875, -0.81689453125, -0.720947265625, -0.625, -0.529052734375, -0.43310546875, -0.337158203125, -0.2412109375, -0.145263671875, -0.04931640625, 0.046630859375, 0.142578125, 0.238525390625, 0.33447265625, 0.430419921875, 0.5263671875, 0.622314453125, 0.71826171875, 0.814208984375, 0.91015625, 1.006103515625, 1.10205078125, 1.197998046875, 1.2939453125, 1.389892578125, 1.48583984375, 1.581787109375, 1.677734375, 1.773681640625, 1.86962890625, 1.965576171875, 2.0615234375, 2.157470703125, 2.25341796875, 2.349365234375, 2.4453125, 2.541259765625, 2.63720703125, 2.733154296875, 2.8291015625, 2.925048828125, 3.02099609375, 3.116943359375, 3.212890625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 13.0, 27.0, 44.0, 44.0, 70.0, 99.0, 108.0, 111.0, 117.0, 88.0, 85.0, 66.0, 51.0, 33.0, 17.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83251953125, -0.7859725952148438, -0.7394256591796875, -0.6928787231445312, -0.646331787109375, -0.5997848510742188, -0.5532379150390625, -0.5066909790039062, -0.46014404296875, -0.41359710693359375, -0.3670501708984375, -0.32050323486328125, -0.273956298828125, -0.22740936279296875, -0.1808624267578125, -0.13431549072265625, -0.0877685546875, -0.04122161865234375, 0.0053253173828125, 0.05187225341796875, 0.098419189453125, 0.14496612548828125, 0.1915130615234375, 0.23805999755859375, 0.28460693359375, 0.33115386962890625, 0.3777008056640625, 0.42424774169921875, 0.470794677734375, 0.5173416137695312, 0.5638885498046875, 0.6104354858398438, 0.656982421875, 0.7035293579101562, 0.7500762939453125, 0.7966232299804688, 0.843170166015625, 0.8897171020507812, 0.9362640380859375, 0.9828109741210938, 1.02935791015625, 1.0759048461914062, 1.1224517822265625, 1.1689987182617188, 1.215545654296875, 1.2620925903320312, 1.3086395263671875, 1.3551864624023438, 1.4017333984375, 1.4482803344726562, 1.4948272705078125, 1.5413742065429688, 1.587921142578125, 1.6344680786132812, 1.6810150146484375, 1.7275619506835938, 1.77410888671875, 1.8206558227539062, 1.8672027587890625, 1.9137496948242188, 1.960296630859375, 2.0068435668945312, 2.0533905029296875, 2.0999374389648438, 2.146484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 7.0, 7.0, 7.0, 11.0, 14.0, 22.0, 45.0, 96.0, 196.0, 478.0, 1216.0, 3835.0, 12734.0, 54186.0, 584974.0, 3351725.0, 150708.0, 24559.0, 6208.0, 1979.0, 753.0, 279.0, 116.0, 61.0, 33.0, 14.0, 8.0, 7.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.39453125, -2.3266448974609375, -2.258758544921875, -2.1908721923828125, -2.12298583984375, -2.0550994873046875, -1.987213134765625, -1.9193267822265625, -1.8514404296875, -1.7835540771484375, -1.715667724609375, -1.6477813720703125, -1.57989501953125, -1.5120086669921875, -1.444122314453125, -1.3762359619140625, -1.308349609375, -1.2404632568359375, -1.172576904296875, -1.1046905517578125, -1.03680419921875, -0.9689178466796875, -0.901031494140625, -0.8331451416015625, -0.7652587890625, -0.6973724365234375, -0.629486083984375, -0.5615997314453125, -0.49371337890625, -0.4258270263671875, -0.357940673828125, -0.2900543212890625, -0.22216796875, -0.1542816162109375, -0.086395263671875, -0.0185089111328125, 0.04937744140625, 0.1172637939453125, 0.185150146484375, 0.2530364990234375, 0.3209228515625, 0.3888092041015625, 0.456695556640625, 0.5245819091796875, 0.59246826171875, 0.6603546142578125, 0.728240966796875, 0.7961273193359375, 0.864013671875, 0.9319000244140625, 0.999786376953125, 1.0676727294921875, 1.13555908203125, 1.2034454345703125, 1.271331787109375, 1.3392181396484375, 1.4071044921875, 1.4749908447265625, 1.542877197265625, 1.6107635498046875, 1.67864990234375, 1.7465362548828125, 1.814422607421875, 1.8823089599609375, 1.9501953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 6.0, 8.0, 11.0, 22.0, 30.0, 32.0, 44.0, 69.0, 114.0, 191.0, 357.0, 753.0, 1146.0, 631.0, 287.0, 129.0, 94.0, 35.0, 34.0, 13.0, 17.0, 10.0, 6.0, 9.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.328125, -2.2656402587890625, -2.203155517578125, -2.1406707763671875, -2.07818603515625, -2.0157012939453125, -1.953216552734375, -1.8907318115234375, -1.8282470703125, -1.7657623291015625, -1.703277587890625, -1.6407928466796875, -1.57830810546875, -1.5158233642578125, -1.453338623046875, -1.3908538818359375, -1.328369140625, -1.2658843994140625, -1.203399658203125, -1.1409149169921875, -1.07843017578125, -1.0159454345703125, -0.953460693359375, -0.8909759521484375, -0.8284912109375, -0.7660064697265625, -0.703521728515625, -0.6410369873046875, -0.57855224609375, -0.5160675048828125, -0.453582763671875, -0.3910980224609375, -0.32861328125, -0.2661285400390625, -0.203643798828125, -0.1411590576171875, -0.07867431640625, -0.0161895751953125, 0.046295166015625, 0.1087799072265625, 0.1712646484375, 0.2337493896484375, 0.296234130859375, 0.3587188720703125, 0.42120361328125, 0.4836883544921875, 0.546173095703125, 0.6086578369140625, 0.671142578125, 0.7336273193359375, 0.796112060546875, 0.8585968017578125, 0.92108154296875, 0.9835662841796875, 1.046051025390625, 1.1085357666015625, 1.1710205078125, 1.2335052490234375, 1.295989990234375, 1.3584747314453125, 1.42095947265625, 1.4834442138671875, 1.545928955078125, 1.6084136962890625, 1.6708984375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 13.0, 17.0, 47.0, 192.0, 378.0, 262.0, 68.0, 9.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.10574722290039, -25.055419921875, -24.00509262084961, -22.95476531982422, -21.904438018798828, -20.854110717773438, -19.80378532409668, -18.75345802307129, -17.7031307220459, -16.652803421020508, -15.602476119995117, -14.552149772644043, -13.501822471618652, -12.451495170593262, -11.401168823242188, -10.350841522216797, -9.300514221191406, -8.250186920166016, -7.199860095977783, -6.149533271789551, -5.09920597076416, -4.0488786697387695, -2.998551845550537, -1.9482250213623047, -0.8978977203369141, 0.15242934226989746, 1.202756404876709, 2.2530834674835205, 3.303410530090332, 4.353737831115723, 5.404064655303955, 6.4543914794921875, 7.504722595214844, 8.555049896240234, 9.605377197265625, 10.6557035446167, 11.70603084564209, 12.75635814666748, 13.806684494018555, 14.857011795043945, 15.907339096069336, 16.957666397094727, 18.007993698120117, 19.058320999145508, 20.108646392822266, 21.158973693847656, 22.209300994873047, 23.259628295898438, 24.309955596923828, 25.36028289794922, 26.41061019897461, 27.4609375, 28.51126480102539, 29.56159210205078, 30.61191749572754, 31.66224479675293, 32.71257019042969, 33.76289749145508, 34.81322479248047, 35.86355209350586, 36.91387939453125, 37.96420669555664, 39.01453399658203, 40.064857482910156, 41.11518859863281]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 8.0, 18.0, 24.0, 25.0, 32.0, 23.0, 35.0, 42.0, 37.0, 42.0, 49.0, 42.0, 63.0, 54.0, 57.0, 64.0, 46.0, 41.0, 45.0, 42.0, 34.0, 27.0, 27.0, 24.0, 14.0, 16.0, 12.0, 8.0, 11.0, 3.0, 8.0, 4.0, 4.0, 0.0, 3.0], "bins": [-10.711135864257812, -10.457696914672852, -10.204257011413574, -9.950818061828613, -9.697378158569336, -9.443939208984375, -9.190499305725098, -8.937060356140137, -8.68362045288086, -8.430181503295898, -8.176741600036621, -7.923302173614502, -7.669862747192383, -7.416423797607422, -7.162984371185303, -6.909544944763184, -6.656105995178223, -6.4026665687561035, -6.149227142333984, -5.895787715911865, -5.642348289489746, -5.388909339904785, -5.135469913482666, -4.882030487060547, -4.628591060638428, -4.375151634216309, -4.1217122077941895, -3.8682730197906494, -3.6148335933685303, -3.361394166946411, -3.107954978942871, -2.854515552520752, -2.601077079772949, -2.34763765335083, -2.094198226928711, -1.840759038925171, -1.5873196125030518, -1.3338801860809326, -1.080440878868103, -0.8270015716552734, -0.5735621452331543, -0.32012277841567993, -0.06668341159820557, 0.1867559552192688, 0.44019532203674316, 0.6936347484588623, 0.9470740556716919, 1.2005133628845215, 1.4539527893066406, 1.7073922157287598, 1.9608315229415894, 2.214270830154419, 2.467710256576538, 2.7211496829986572, 2.9745888710021973, 3.2280282974243164, 3.4814677238464355, 3.7349071502685547, 3.988346576690674, 4.241786003112793, 4.495224952697754, 4.748664855957031, 5.002103805541992, 5.255543231964111, 5.5089826583862305]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 5.0, 5.0, 13.0, 13.0, 9.0, 35.0, 47.0, 61.0, 106.0, 172.0, 288.0, 445.0, 816.0, 1507.0, 2882.0, 5551.0, 11118.0, 23821.0, 53453.0, 127223.0, 285567.0, 294750.0, 134754.0, 56726.0, 25182.0, 11806.0, 5649.0, 2898.0, 1573.0, 898.0, 443.0, 296.0, 180.0, 99.0, 59.0, 37.0, 26.0, 17.0, 12.0, 10.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.134765625, -1.0942840576171875, -1.053802490234375, -1.0133209228515625, -0.97283935546875, -0.9323577880859375, -0.891876220703125, -0.8513946533203125, -0.8109130859375, -0.7704315185546875, -0.729949951171875, -0.6894683837890625, -0.64898681640625, -0.6085052490234375, -0.568023681640625, -0.5275421142578125, -0.487060546875, -0.4465789794921875, -0.406097412109375, -0.3656158447265625, -0.32513427734375, -0.2846527099609375, -0.244171142578125, -0.2036895751953125, -0.1632080078125, -0.1227264404296875, -0.082244873046875, -0.0417633056640625, -0.00128173828125, 0.0391998291015625, 0.079681396484375, 0.1201629638671875, 0.16064453125, 0.2011260986328125, 0.241607666015625, 0.2820892333984375, 0.32257080078125, 0.3630523681640625, 0.403533935546875, 0.4440155029296875, 0.4844970703125, 0.5249786376953125, 0.565460205078125, 0.6059417724609375, 0.64642333984375, 0.6869049072265625, 0.727386474609375, 0.7678680419921875, 0.808349609375, 0.8488311767578125, 0.889312744140625, 0.9297943115234375, 0.97027587890625, 1.0107574462890625, 1.051239013671875, 1.0917205810546875, 1.1322021484375, 1.1726837158203125, 1.213165283203125, 1.2536468505859375, 1.29412841796875, 1.3346099853515625, 1.375091552734375, 1.4155731201171875, 1.4560546875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 8.0, 3.0, 5.0, 5.0, 9.0, 19.0, 25.0, 19.0, 31.0, 33.0, 42.0, 40.0, 40.0, 44.0, 50.0, 59.0, 51.0, 56.0, 47.0, 56.0, 46.0, 55.0, 41.0, 41.0, 30.0, 29.0, 33.0, 23.0, 11.0, 11.0, 9.0, 8.0, 9.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.658203125, -0.6350555419921875, -0.611907958984375, -0.5887603759765625, -0.56561279296875, -0.5424652099609375, -0.519317626953125, -0.4961700439453125, -0.4730224609375, -0.4498748779296875, -0.426727294921875, -0.4035797119140625, -0.38043212890625, -0.3572845458984375, -0.334136962890625, -0.3109893798828125, -0.287841796875, -0.2646942138671875, -0.241546630859375, -0.2183990478515625, -0.19525146484375, -0.1721038818359375, -0.148956298828125, -0.1258087158203125, -0.1026611328125, -0.0795135498046875, -0.056365966796875, -0.0332183837890625, -0.01007080078125, 0.0130767822265625, 0.036224365234375, 0.0593719482421875, 0.08251953125, 0.1056671142578125, 0.128814697265625, 0.1519622802734375, 0.17510986328125, 0.1982574462890625, 0.221405029296875, 0.2445526123046875, 0.2677001953125, 0.2908477783203125, 0.313995361328125, 0.3371429443359375, 0.36029052734375, 0.3834381103515625, 0.406585693359375, 0.4297332763671875, 0.452880859375, 0.4760284423828125, 0.499176025390625, 0.5223236083984375, 0.54547119140625, 0.5686187744140625, 0.591766357421875, 0.6149139404296875, 0.6380615234375, 0.6612091064453125, 0.684356689453125, 0.7075042724609375, 0.73065185546875, 0.7537994384765625, 0.776947021484375, 0.8000946044921875, 0.8232421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 6.0, 10.0, 4.0, 10.0, 13.0, 24.0, 17.0, 38.0, 44.0, 62.0, 74.0, 137.0, 173.0, 250.0, 415.0, 619.0, 1048.0, 2073.0, 4542.0, 12419.0, 40258.0, 154658.0, 550894.0, 203435.0, 50745.0, 15429.0, 5493.0, 2410.0, 1250.0, 662.0, 448.0, 270.0, 184.0, 121.0, 100.0, 55.0, 34.0, 30.0, 21.0, 22.0, 16.0, 11.0, 5.0, 4.0, 6.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.8623046875, -1.8033599853515625, -1.744415283203125, -1.6854705810546875, -1.62652587890625, -1.5675811767578125, -1.508636474609375, -1.4496917724609375, -1.3907470703125, -1.3318023681640625, -1.272857666015625, -1.2139129638671875, -1.15496826171875, -1.0960235595703125, -1.037078857421875, -0.9781341552734375, -0.919189453125, -0.8602447509765625, -0.801300048828125, -0.7423553466796875, -0.68341064453125, -0.6244659423828125, -0.565521240234375, -0.5065765380859375, -0.4476318359375, -0.3886871337890625, -0.329742431640625, -0.2707977294921875, -0.21185302734375, -0.1529083251953125, -0.093963623046875, -0.0350189208984375, 0.02392578125, 0.0828704833984375, 0.141815185546875, 0.2007598876953125, 0.25970458984375, 0.3186492919921875, 0.377593994140625, 0.4365386962890625, 0.4954833984375, 0.5544281005859375, 0.613372802734375, 0.6723175048828125, 0.73126220703125, 0.7902069091796875, 0.849151611328125, 0.9080963134765625, 0.967041015625, 1.0259857177734375, 1.084930419921875, 1.1438751220703125, 1.20281982421875, 1.2617645263671875, 1.320709228515625, 1.3796539306640625, 1.4385986328125, 1.4975433349609375, 1.556488037109375, 1.6154327392578125, 1.67437744140625, 1.7333221435546875, 1.792266845703125, 1.8512115478515625, 1.91015625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 2.0, 6.0, 8.0, 3.0, 11.0, 11.0, 16.0, 18.0, 14.0, 20.0, 22.0, 27.0, 37.0, 37.0, 33.0, 33.0, 28.0, 24.0, 41.0, 45.0, 34.0, 43.0, 43.0, 35.0, 39.0, 34.0, 30.0, 34.0, 38.0, 24.0, 29.0, 19.0, 24.0, 23.0, 14.0, 20.0, 11.0, 11.0, 10.0, 5.0, 16.0, 7.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.0234375, -1.95928955078125, -1.8951416015625, -1.83099365234375, -1.766845703125, -1.70269775390625, -1.6385498046875, -1.57440185546875, -1.51025390625, -1.44610595703125, -1.3819580078125, -1.31781005859375, -1.253662109375, -1.18951416015625, -1.1253662109375, -1.06121826171875, -0.9970703125, -0.93292236328125, -0.8687744140625, -0.80462646484375, -0.740478515625, -0.67633056640625, -0.6121826171875, -0.54803466796875, -0.48388671875, -0.41973876953125, -0.3555908203125, -0.29144287109375, -0.227294921875, -0.16314697265625, -0.0989990234375, -0.03485107421875, 0.029296875, 0.09344482421875, 0.1575927734375, 0.22174072265625, 0.285888671875, 0.35003662109375, 0.4141845703125, 0.47833251953125, 0.54248046875, 0.60662841796875, 0.6707763671875, 0.73492431640625, 0.799072265625, 0.86322021484375, 0.9273681640625, 0.99151611328125, 1.0556640625, 1.11981201171875, 1.1839599609375, 1.24810791015625, 1.312255859375, 1.37640380859375, 1.4405517578125, 1.50469970703125, 1.56884765625, 1.63299560546875, 1.6971435546875, 1.76129150390625, 1.825439453125, 1.88958740234375, 1.9537353515625, 2.01788330078125, 2.08203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 12.0, 15.0, 17.0, 27.0, 36.0, 49.0, 84.0, 157.0, 336.0, 775.0, 2115.0, 9312.0, 91134.0, 817017.0, 112861.0, 10738.0, 2321.0, 772.0, 344.0, 155.0, 96.0, 55.0, 38.0, 29.0, 17.0, 11.0, 9.0, 9.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.408203125, -1.358856201171875, -1.30950927734375, -1.260162353515625, -1.2108154296875, -1.161468505859375, -1.11212158203125, -1.062774658203125, -1.013427734375, -0.964080810546875, -0.91473388671875, -0.865386962890625, -0.8160400390625, -0.766693115234375, -0.71734619140625, -0.667999267578125, -0.61865234375, -0.569305419921875, -0.51995849609375, -0.470611572265625, -0.4212646484375, -0.371917724609375, -0.32257080078125, -0.273223876953125, -0.223876953125, -0.174530029296875, -0.12518310546875, -0.075836181640625, -0.0264892578125, 0.022857666015625, 0.07220458984375, 0.121551513671875, 0.1708984375, 0.220245361328125, 0.26959228515625, 0.318939208984375, 0.3682861328125, 0.417633056640625, 0.46697998046875, 0.516326904296875, 0.565673828125, 0.615020751953125, 0.66436767578125, 0.713714599609375, 0.7630615234375, 0.812408447265625, 0.86175537109375, 0.911102294921875, 0.96044921875, 1.009796142578125, 1.05914306640625, 1.108489990234375, 1.1578369140625, 1.207183837890625, 1.25653076171875, 1.305877685546875, 1.355224609375, 1.404571533203125, 1.45391845703125, 1.503265380859375, 1.5526123046875, 1.601959228515625, 1.65130615234375, 1.700653076171875, 1.75]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 8.0, 6.0, 13.0, 26.0, 46.0, 92.0, 194.0, 238.0, 191.0, 87.0, 42.0, 23.0, 11.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000377655029296875, -0.00036153942346572876, -0.0003454238176345825, -0.0003293082118034363, -0.00031319260597229004, -0.0002970770001411438, -0.00028096139430999756, -0.0002648457884788513, -0.0002487301826477051, -0.00023261457681655884, -0.0002164989709854126, -0.00020038336515426636, -0.00018426775932312012, -0.00016815215349197388, -0.00015203654766082764, -0.0001359209418296814, -0.00011980533599853516, -0.00010368973016738892, -8.757412433624268e-05, -7.145851850509644e-05, -5.5342912673950195e-05, -3.9227306842803955e-05, -2.3111701011657715e-05, -6.996095180511475e-06, 9.119510650634766e-06, 2.5235116481781006e-05, 4.1350722312927246e-05, 5.7466328144073486e-05, 7.358193397521973e-05, 8.969753980636597e-05, 0.00010581314563751221, 0.00012192875146865845, 0.0001380443572998047, 0.00015415996313095093, 0.00017027556896209717, 0.0001863911747932434, 0.00020250678062438965, 0.0002186223864555359, 0.00023473799228668213, 0.00025085359811782837, 0.0002669692039489746, 0.00028308480978012085, 0.0002992004156112671, 0.00031531602144241333, 0.00033143162727355957, 0.0003475472331047058, 0.00036366283893585205, 0.0003797784447669983, 0.00039589405059814453, 0.00041200965642929077, 0.000428125262260437, 0.00044424086809158325, 0.0004603564739227295, 0.00047647207975387573, 0.000492587685585022, 0.0005087032914161682, 0.0005248188972473145, 0.0005409345030784607, 0.0005570501089096069, 0.0005731657147407532, 0.0005892813205718994, 0.0006053969264030457, 0.0006215125322341919, 0.0006376281380653381, 0.0006537437438964844]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 5.0, 8.0, 12.0, 27.0, 25.0, 39.0, 59.0, 87.0, 114.0, 206.0, 332.0, 606.0, 1262.0, 2951.0, 8537.0, 35387.0, 229789.0, 630006.0, 109721.0, 19550.0, 5557.0, 2104.0, 926.0, 445.0, 277.0, 152.0, 101.0, 71.0, 56.0, 44.0, 26.0, 16.0, 9.0, 15.0, 7.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.99267578125, -0.9628753662109375, -0.933074951171875, -0.9032745361328125, -0.87347412109375, -0.8436737060546875, -0.813873291015625, -0.7840728759765625, -0.7542724609375, -0.7244720458984375, -0.694671630859375, -0.6648712158203125, -0.63507080078125, -0.6052703857421875, -0.575469970703125, -0.5456695556640625, -0.515869140625, -0.4860687255859375, -0.456268310546875, -0.4264678955078125, -0.39666748046875, -0.3668670654296875, -0.337066650390625, -0.3072662353515625, -0.2774658203125, -0.2476654052734375, -0.217864990234375, -0.1880645751953125, -0.15826416015625, -0.1284637451171875, -0.098663330078125, -0.0688629150390625, -0.0390625, -0.0092620849609375, 0.020538330078125, 0.0503387451171875, 0.08013916015625, 0.1099395751953125, 0.139739990234375, 0.1695404052734375, 0.1993408203125, 0.2291412353515625, 0.258941650390625, 0.2887420654296875, 0.31854248046875, 0.3483428955078125, 0.378143310546875, 0.4079437255859375, 0.437744140625, 0.4675445556640625, 0.497344970703125, 0.5271453857421875, 0.55694580078125, 0.5867462158203125, 0.616546630859375, 0.6463470458984375, 0.6761474609375, 0.7059478759765625, 0.735748291015625, 0.7655487060546875, 0.79534912109375, 0.8251495361328125, 0.854949951171875, 0.8847503662109375, 0.91455078125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 6.0, 3.0, 8.0, 14.0, 11.0, 18.0, 13.0, 25.0, 32.0, 32.0, 40.0, 50.0, 52.0, 58.0, 70.0, 64.0, 85.0, 65.0, 64.0, 44.0, 40.0, 37.0, 27.0, 27.0, 23.0, 14.0, 13.0, 11.0, 9.0, 8.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5595703125, -0.5370025634765625, -0.514434814453125, -0.4918670654296875, -0.46929931640625, -0.4467315673828125, -0.424163818359375, -0.4015960693359375, -0.3790283203125, -0.3564605712890625, -0.333892822265625, -0.3113250732421875, -0.28875732421875, -0.2661895751953125, -0.243621826171875, -0.2210540771484375, -0.198486328125, -0.1759185791015625, -0.153350830078125, -0.1307830810546875, -0.10821533203125, -0.0856475830078125, -0.063079833984375, -0.0405120849609375, -0.0179443359375, 0.0046234130859375, 0.027191162109375, 0.0497589111328125, 0.07232666015625, 0.0948944091796875, 0.117462158203125, 0.1400299072265625, 0.16259765625, 0.1851654052734375, 0.207733154296875, 0.2303009033203125, 0.25286865234375, 0.2754364013671875, 0.298004150390625, 0.3205718994140625, 0.3431396484375, 0.3657073974609375, 0.388275146484375, 0.4108428955078125, 0.43341064453125, 0.4559783935546875, 0.478546142578125, 0.5011138916015625, 0.523681640625, 0.5462493896484375, 0.568817138671875, 0.5913848876953125, 0.61395263671875, 0.6365203857421875, 0.659088134765625, 0.6816558837890625, 0.7042236328125, 0.7267913818359375, 0.749359130859375, 0.7719268798828125, 0.79449462890625, 0.8170623779296875, 0.839630126953125, 0.8621978759765625, 0.884765625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 8.0, 21.0, 51.0, 129.0, 244.0, 279.0, 137.0, 67.0, 31.0, 12.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.25227165222168, -27.34659767150879, -26.4409236907959, -25.535247802734375, -24.629573822021484, -23.723899841308594, -22.818225860595703, -21.912551879882812, -21.006877899169922, -20.10120391845703, -19.19552993774414, -18.28985595703125, -17.384180068969727, -16.478506088256836, -15.572832107543945, -14.667158126831055, -13.761483192443848, -12.855809211730957, -11.95013427734375, -11.04446029663086, -10.138786315917969, -9.233112335205078, -8.327437400817871, -7.4217634201049805, -6.516088962554932, -5.610414505004883, -4.704740524291992, -3.7990660667419434, -2.8933918476104736, -1.987717628479004, -1.082043170928955, -0.17636919021606445, 0.7293052673339844, 1.634979486465454, 2.540653705596924, 3.4463281631469727, 4.352002143859863, 5.257676601409912, 6.163351058959961, 7.069025039672852, 7.9746994972229, 8.88037395477295, 9.78604793548584, 10.691722869873047, 11.597396850585938, 12.503070831298828, 13.408744812011719, 14.31441879272461, 15.220093727111816, 16.125768661499023, 17.031442642211914, 17.937116622924805, 18.842790603637695, 19.748464584350586, 20.65414047241211, 21.559814453125, 22.46548843383789, 23.37116241455078, 24.276836395263672, 25.182510375976562, 26.088186264038086, 26.993860244750977, 27.899534225463867, 28.805208206176758, 29.71088218688965]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 7.0, 7.0, 4.0, 6.0, 9.0, 17.0, 11.0, 10.0, 14.0, 25.0, 20.0, 29.0, 29.0, 32.0, 38.0, 35.0, 41.0, 51.0, 70.0, 61.0, 57.0, 55.0, 48.0, 47.0, 38.0, 38.0, 40.0, 25.0, 32.0, 20.0, 15.0, 13.0, 8.0, 12.0, 10.0, 9.0, 7.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.498224258422852, -12.157544136047363, -11.816864967346191, -11.476184844970703, -11.135505676269531, -10.794825553894043, -10.454146385192871, -10.113466262817383, -9.772787094116211, -9.432106971740723, -9.09142780303955, -8.750747680664062, -8.41006851196289, -8.069388389587402, -7.7287092208862305, -7.388029098510742, -7.047349452972412, -6.706669807434082, -6.365990161895752, -6.025310516357422, -5.684630870819092, -5.343951225280762, -5.003271102905273, -4.662591934204102, -4.321911811828613, -3.981232166290283, -3.640552520751953, -3.299872875213623, -2.959193229675293, -2.618513584136963, -2.2778337001800537, -1.9371540546417236, -1.5964746475219727, -1.2557950019836426, -0.9151152968406677, -0.5744355916976929, -0.2337559461593628, 0.10692369937896729, 0.4476034641265869, 0.788283109664917, 1.128962755203247, 1.4696424007415771, 1.8103220462799072, 2.1510019302368164, 2.4916815757751465, 2.8323612213134766, 3.1730408668518066, 3.5137205123901367, 3.854400157928467, 4.195079803466797, 4.535759449005127, 4.876439094543457, 5.217118740081787, 5.557798385620117, 5.8984785079956055, 6.239157676696777, 6.579837799072266, 6.920517444610596, 7.261197090148926, 7.601876735687256, 7.942556381225586, 8.283236503601074, 8.623915672302246, 8.964595794677734, 9.305274963378906]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 5.0, 4.0, 8.0, 6.0, 7.0, 15.0, 36.0, 31.0, 47.0, 82.0, 128.0, 258.0, 556.0, 1492.0, 4192.0, 13673.0, 53873.0, 323976.0, 2676048.0, 972448.0, 111423.0, 24484.0, 7242.0, 2403.0, 955.0, 406.0, 202.0, 113.0, 58.0, 29.0, 24.0, 14.0, 18.0, 6.0, 7.0, 8.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7373046875, -1.6956710815429688, -1.6540374755859375, -1.6124038696289062, -1.570770263671875, -1.5291366577148438, -1.4875030517578125, -1.4458694458007812, -1.40423583984375, -1.3626022338867188, -1.3209686279296875, -1.2793350219726562, -1.237701416015625, -1.1960678100585938, -1.1544342041015625, -1.1128005981445312, -1.0711669921875, -1.0295333862304688, -0.9878997802734375, -0.9462661743164062, -0.904632568359375, -0.8629989624023438, -0.8213653564453125, -0.7797317504882812, -0.73809814453125, -0.6964645385742188, -0.6548309326171875, -0.6131973266601562, -0.571563720703125, -0.5299301147460938, -0.4882965087890625, -0.44666290283203125, -0.405029296875, -0.36339569091796875, -0.3217620849609375, -0.28012847900390625, -0.238494873046875, -0.19686126708984375, -0.1552276611328125, -0.11359405517578125, -0.07196044921875, -0.03032684326171875, 0.0113067626953125, 0.05294036865234375, 0.094573974609375, 0.13620758056640625, 0.1778411865234375, 0.21947479248046875, 0.2611083984375, 0.30274200439453125, 0.3443756103515625, 0.38600921630859375, 0.427642822265625, 0.46927642822265625, 0.5109100341796875, 0.5525436401367188, 0.59417724609375, 0.6358108520507812, 0.6774444580078125, 0.7190780639648438, 0.760711669921875, 0.8023452758789062, 0.8439788818359375, 0.8856124877929688, 0.92724609375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 8.0, 5.0, 11.0, 7.0, 17.0, 21.0, 17.0, 24.0, 41.0, 30.0, 52.0, 43.0, 40.0, 60.0, 55.0, 56.0, 69.0, 45.0, 48.0, 54.0, 42.0, 35.0, 36.0, 34.0, 30.0, 23.0, 24.0, 23.0, 12.0, 11.0, 10.0, 10.0, 5.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73681640625, -0.7147216796875, -0.692626953125, -0.6705322265625, -0.6484375, -0.6263427734375, -0.604248046875, -0.5821533203125, -0.56005859375, -0.5379638671875, -0.515869140625, -0.4937744140625, -0.4716796875, -0.4495849609375, -0.427490234375, -0.4053955078125, -0.38330078125, -0.3612060546875, -0.339111328125, -0.3170166015625, -0.294921875, -0.2728271484375, -0.250732421875, -0.2286376953125, -0.20654296875, -0.1844482421875, -0.162353515625, -0.1402587890625, -0.1181640625, -0.0960693359375, -0.073974609375, -0.0518798828125, -0.02978515625, -0.0076904296875, 0.014404296875, 0.0364990234375, 0.05859375, 0.0806884765625, 0.102783203125, 0.1248779296875, 0.14697265625, 0.1690673828125, 0.191162109375, 0.2132568359375, 0.2353515625, 0.2574462890625, 0.279541015625, 0.3016357421875, 0.32373046875, 0.3458251953125, 0.367919921875, 0.3900146484375, 0.412109375, 0.4342041015625, 0.456298828125, 0.4783935546875, 0.50048828125, 0.5225830078125, 0.544677734375, 0.5667724609375, 0.5888671875, 0.6109619140625, 0.633056640625, 0.6551513671875, 0.67724609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 2.0, 12.0, 19.0, 23.0, 30.0, 40.0, 85.0, 194.0, 444.0, 1163.0, 3794.0, 17310.0, 131148.0, 2880317.0, 1076710.0, 67455.0, 11192.0, 2654.0, 906.0, 375.0, 154.0, 103.0, 54.0, 26.0, 17.0, 21.0, 16.0, 6.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.662109375, -2.5935821533203125, -2.525054931640625, -2.4565277099609375, -2.38800048828125, -2.3194732666015625, -2.250946044921875, -2.1824188232421875, -2.1138916015625, -2.0453643798828125, -1.976837158203125, -1.9083099365234375, -1.83978271484375, -1.7712554931640625, -1.702728271484375, -1.6342010498046875, -1.565673828125, -1.4971466064453125, -1.428619384765625, -1.3600921630859375, -1.29156494140625, -1.2230377197265625, -1.154510498046875, -1.0859832763671875, -1.0174560546875, -0.9489288330078125, -0.880401611328125, -0.8118743896484375, -0.74334716796875, -0.6748199462890625, -0.606292724609375, -0.5377655029296875, -0.46923828125, -0.4007110595703125, -0.332183837890625, -0.2636566162109375, -0.19512939453125, -0.1266021728515625, -0.058074951171875, 0.0104522705078125, 0.0789794921875, 0.1475067138671875, 0.216033935546875, 0.2845611572265625, 0.35308837890625, 0.4216156005859375, 0.490142822265625, 0.5586700439453125, 0.627197265625, 0.6957244873046875, 0.764251708984375, 0.8327789306640625, 0.90130615234375, 0.9698333740234375, 1.038360595703125, 1.1068878173828125, 1.1754150390625, 1.2439422607421875, 1.312469482421875, 1.3809967041015625, 1.44952392578125, 1.5180511474609375, 1.586578369140625, 1.6551055908203125, 1.7236328125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 7.0, 8.0, 12.0, 19.0, 25.0, 38.0, 50.0, 63.0, 80.0, 130.0, 173.0, 342.0, 495.0, 729.0, 666.0, 412.0, 255.0, 155.0, 119.0, 70.0, 54.0, 33.0, 36.0, 26.0, 15.0, 16.0, 12.0, 7.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5400390625, -1.4846649169921875, -1.429290771484375, -1.3739166259765625, -1.31854248046875, -1.2631683349609375, -1.207794189453125, -1.1524200439453125, -1.0970458984375, -1.0416717529296875, -0.986297607421875, -0.9309234619140625, -0.87554931640625, -0.8201751708984375, -0.764801025390625, -0.7094268798828125, -0.654052734375, -0.5986785888671875, -0.543304443359375, -0.4879302978515625, -0.43255615234375, -0.3771820068359375, -0.321807861328125, -0.2664337158203125, -0.2110595703125, -0.1556854248046875, -0.100311279296875, -0.0449371337890625, 0.01043701171875, 0.0658111572265625, 0.121185302734375, 0.1765594482421875, 0.23193359375, 0.2873077392578125, 0.342681884765625, 0.3980560302734375, 0.45343017578125, 0.5088043212890625, 0.564178466796875, 0.6195526123046875, 0.6749267578125, 0.7303009033203125, 0.785675048828125, 0.8410491943359375, 0.89642333984375, 0.9517974853515625, 1.007171630859375, 1.0625457763671875, 1.117919921875, 1.1732940673828125, 1.228668212890625, 1.2840423583984375, 1.33941650390625, 1.3947906494140625, 1.450164794921875, 1.5055389404296875, 1.5609130859375, 1.6162872314453125, 1.671661376953125, 1.7270355224609375, 1.78240966796875, 1.8377838134765625, 1.893157958984375, 1.9485321044921875, 2.00390625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 6.0, 10.0, 29.0, 81.0, 255.0, 330.0, 201.0, 64.0, 20.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.90439224243164, -53.773372650146484, -52.64234924316406, -51.511329650878906, -50.380306243896484, -49.24928665161133, -48.118263244628906, -46.98724365234375, -45.856224060058594, -44.72520446777344, -43.594181060791016, -42.46316146850586, -41.33213806152344, -40.20111846923828, -39.07009506225586, -37.9390754699707, -36.80805206298828, -35.677032470703125, -34.5460090637207, -33.41498947143555, -32.283966064453125, -31.15294647216797, -30.02192497253418, -28.89090347290039, -27.7598819732666, -26.628860473632812, -25.497838973999023, -24.366817474365234, -23.235797882080078, -22.104774475097656, -20.9737548828125, -19.84273338317871, -18.711713790893555, -17.580692291259766, -16.449670791625977, -15.318650245666504, -14.187628746032715, -13.056607246398926, -11.925586700439453, -10.794565200805664, -9.663543701171875, -8.532522201538086, -7.401501178741455, -6.270480155944824, -5.139458656311035, -4.008437156677246, -2.8774161338806152, -1.7463951110839844, -0.6153736114501953, 0.5156476497650146, 1.6466689109802246, 2.7776901721954346, 3.9087114334106445, 5.039732933044434, 6.1707539558410645, 7.301774978637695, 8.432796478271484, 9.563817977905273, 10.694839477539062, 11.825860023498535, 12.956881523132324, 14.087903022766113, 15.218923568725586, 16.349945068359375, 17.480966567993164]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 1.0, 6.0, 9.0, 8.0, 15.0, 12.0, 15.0, 20.0, 24.0, 25.0, 23.0, 27.0, 30.0, 31.0, 45.0, 44.0, 50.0, 51.0, 39.0, 54.0, 27.0, 46.0, 40.0, 45.0, 39.0, 30.0, 44.0, 21.0, 25.0, 20.0, 20.0, 23.0, 12.0, 12.0, 9.0, 12.0, 6.0, 11.0, 2.0, 7.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-8.35908031463623, -8.098928451538086, -7.838776111602783, -7.578624248504639, -7.318471908569336, -7.058320045471191, -6.798168182373047, -6.538016319274902, -6.2778639793396, -6.017712116241455, -5.757559776306152, -5.497407913208008, -5.237256050109863, -4.9771037101745605, -4.716951847076416, -4.456799507141113, -4.196647644042969, -3.936495542526245, -3.6763434410095215, -3.416191577911377, -3.1560394763946533, -2.8958873748779297, -2.635735511779785, -2.3755834102630615, -2.115431308746338, -1.8552792072296143, -1.5951272249221802, -1.334975242614746, -1.0748231410980225, -0.8146710395812988, -0.5545190572738647, -0.29436707496643066, -0.03421592712402344, 0.22593611478805542, 0.4860881567001343, 0.7462401986122131, 1.006392240524292, 1.2665443420410156, 1.5266963243484497, 1.7868483066558838, 2.0470004081726074, 2.307152509689331, 2.5673046112060547, 2.827456474304199, 3.087608575820923, 3.3477606773376465, 3.607912540435791, 3.8680646419525146, 4.128216743469238, 4.388368606567383, 4.6485209465026855, 4.90867280960083, 5.168825149536133, 5.428977012634277, 5.689128875732422, 5.949280738830566, 6.209433078765869, 6.469584941864014, 6.729737281799316, 6.989889144897461, 7.2500410079956055, 7.510193347930908, 7.770345211029053, 8.030497550964355, 8.2906494140625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 7.0, 8.0, 12.0, 15.0, 16.0, 49.0, 78.0, 125.0, 239.0, 431.0, 927.0, 2036.0, 4847.0, 12062.0, 31841.0, 82588.0, 203607.0, 344478.0, 218392.0, 89557.0, 34546.0, 13095.0, 5298.0, 2217.0, 1003.0, 478.0, 269.0, 137.0, 77.0, 51.0, 23.0, 18.0, 15.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1513671875, -1.106292724609375, -1.06121826171875, -1.016143798828125, -0.9710693359375, -0.925994873046875, -0.88092041015625, -0.835845947265625, -0.790771484375, -0.745697021484375, -0.70062255859375, -0.655548095703125, -0.6104736328125, -0.565399169921875, -0.52032470703125, -0.475250244140625, -0.43017578125, -0.385101318359375, -0.34002685546875, -0.294952392578125, -0.2498779296875, -0.204803466796875, -0.15972900390625, -0.114654541015625, -0.069580078125, -0.024505615234375, 0.02056884765625, 0.065643310546875, 0.1107177734375, 0.155792236328125, 0.20086669921875, 0.245941162109375, 0.291015625, 0.336090087890625, 0.38116455078125, 0.426239013671875, 0.4713134765625, 0.516387939453125, 0.56146240234375, 0.606536865234375, 0.651611328125, 0.696685791015625, 0.74176025390625, 0.786834716796875, 0.8319091796875, 0.876983642578125, 0.92205810546875, 0.967132568359375, 1.01220703125, 1.057281494140625, 1.10235595703125, 1.147430419921875, 1.1925048828125, 1.237579345703125, 1.28265380859375, 1.327728271484375, 1.372802734375, 1.417877197265625, 1.46295166015625, 1.508026123046875, 1.5531005859375, 1.598175048828125, 1.64324951171875, 1.688323974609375, 1.7333984375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 4.0, 5.0, 7.0, 13.0, 8.0, 7.0, 13.0, 10.0, 16.0, 17.0, 17.0, 28.0, 29.0, 27.0, 33.0, 29.0, 30.0, 28.0, 29.0, 23.0, 36.0, 34.0, 49.0, 43.0, 46.0, 42.0, 32.0, 33.0, 38.0, 29.0, 31.0, 31.0, 28.0, 22.0, 20.0, 16.0, 18.0, 17.0, 13.0, 5.0, 6.0, 5.0, 8.0, 6.0, 4.0, 9.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.515625, -0.4998435974121094, -0.48406219482421875, -0.4682807922363281, -0.4524993896484375, -0.4367179870605469, -0.42093658447265625, -0.4051551818847656, -0.389373779296875, -0.3735923767089844, -0.35781097412109375, -0.3420295715332031, -0.3262481689453125, -0.3104667663574219, -0.29468536376953125, -0.2789039611816406, -0.26312255859375, -0.24734115600585938, -0.23155975341796875, -0.21577835083007812, -0.1999969482421875, -0.18421554565429688, -0.16843414306640625, -0.15265274047851562, -0.136871337890625, -0.12108993530273438, -0.10530853271484375, -0.08952713012695312, -0.0737457275390625, -0.057964324951171875, -0.04218292236328125, -0.026401519775390625, -0.0106201171875, 0.005161285400390625, 0.02094268798828125, 0.036724090576171875, 0.0525054931640625, 0.06828689575195312, 0.08406829833984375, 0.09984970092773438, 0.115631103515625, 0.13141250610351562, 0.14719390869140625, 0.16297531127929688, 0.1787567138671875, 0.19453811645507812, 0.21031951904296875, 0.22610092163085938, 0.24188232421875, 0.2576637268066406, 0.27344512939453125, 0.2892265319824219, 0.3050079345703125, 0.3207893371582031, 0.33657073974609375, 0.3523521423339844, 0.368133544921875, 0.3839149475097656, 0.39969635009765625, 0.4154777526855469, 0.4312591552734375, 0.4470405578613281, 0.46282196044921875, 0.4786033630371094, 0.494384765625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 1.0, 5.0, 12.0, 7.0, 13.0, 11.0, 24.0, 36.0, 39.0, 57.0, 68.0, 105.0, 166.0, 230.0, 348.0, 526.0, 732.0, 1217.0, 2170.0, 4676.0, 14292.0, 65677.0, 391515.0, 472778.0, 68178.0, 14930.0, 4936.0, 2194.0, 1222.0, 755.0, 484.0, 379.0, 219.0, 153.0, 134.0, 77.0, 59.0, 42.0, 28.0, 22.0, 16.0, 9.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0], "bins": [-2.689453125, -2.616790771484375, -2.54412841796875, -2.471466064453125, -2.3988037109375, -2.326141357421875, -2.25347900390625, -2.180816650390625, -2.108154296875, -2.035491943359375, -1.96282958984375, -1.890167236328125, -1.8175048828125, -1.744842529296875, -1.67218017578125, -1.599517822265625, -1.52685546875, -1.454193115234375, -1.38153076171875, -1.308868408203125, -1.2362060546875, -1.163543701171875, -1.09088134765625, -1.018218994140625, -0.945556640625, -0.872894287109375, -0.80023193359375, -0.727569580078125, -0.6549072265625, -0.582244873046875, -0.50958251953125, -0.436920166015625, -0.3642578125, -0.291595458984375, -0.21893310546875, -0.146270751953125, -0.0736083984375, -0.000946044921875, 0.07171630859375, 0.144378662109375, 0.217041015625, 0.289703369140625, 0.36236572265625, 0.435028076171875, 0.5076904296875, 0.580352783203125, 0.65301513671875, 0.725677490234375, 0.79833984375, 0.871002197265625, 0.94366455078125, 1.016326904296875, 1.0889892578125, 1.161651611328125, 1.23431396484375, 1.306976318359375, 1.379638671875, 1.452301025390625, 1.52496337890625, 1.597625732421875, 1.6702880859375, 1.742950439453125, 1.81561279296875, 1.888275146484375, 1.9609375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 7.0, 7.0, 9.0, 17.0, 9.0, 29.0, 33.0, 28.0, 38.0, 34.0, 29.0, 51.0, 41.0, 52.0, 55.0, 63.0, 69.0, 51.0, 56.0, 44.0, 51.0, 37.0, 45.0, 25.0, 21.0, 19.0, 21.0, 10.0, 11.0, 10.0, 5.0, 8.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.7890625, -3.689208984375, -3.58935546875, -3.489501953125, -3.3896484375, -3.289794921875, -3.18994140625, -3.090087890625, -2.990234375, -2.890380859375, -2.79052734375, -2.690673828125, -2.5908203125, -2.490966796875, -2.39111328125, -2.291259765625, -2.19140625, -2.091552734375, -1.99169921875, -1.891845703125, -1.7919921875, -1.692138671875, -1.59228515625, -1.492431640625, -1.392578125, -1.292724609375, -1.19287109375, -1.093017578125, -0.9931640625, -0.893310546875, -0.79345703125, -0.693603515625, -0.59375, -0.493896484375, -0.39404296875, -0.294189453125, -0.1943359375, -0.094482421875, 0.00537109375, 0.105224609375, 0.205078125, 0.304931640625, 0.40478515625, 0.504638671875, 0.6044921875, 0.704345703125, 0.80419921875, 0.904052734375, 1.00390625, 1.103759765625, 1.20361328125, 1.303466796875, 1.4033203125, 1.503173828125, 1.60302734375, 1.702880859375, 1.802734375, 1.902587890625, 2.00244140625, 2.102294921875, 2.2021484375, 2.302001953125, 2.40185546875, 2.501708984375, 2.6015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 7.0, 11.0, 19.0, 16.0, 33.0, 29.0, 38.0, 76.0, 135.0, 235.0, 524.0, 1445.0, 5552.0, 42367.0, 720266.0, 252519.0, 20027.0, 3400.0, 973.0, 374.0, 178.0, 100.0, 63.0, 54.0, 27.0, 21.0, 18.0, 15.0, 6.0, 2.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3046875, -1.263702392578125, -1.22271728515625, -1.181732177734375, -1.1407470703125, -1.099761962890625, -1.05877685546875, -1.017791748046875, -0.976806640625, -0.935821533203125, -0.89483642578125, -0.853851318359375, -0.8128662109375, -0.771881103515625, -0.73089599609375, -0.689910888671875, -0.64892578125, -0.607940673828125, -0.56695556640625, -0.525970458984375, -0.4849853515625, -0.444000244140625, -0.40301513671875, -0.362030029296875, -0.321044921875, -0.280059814453125, -0.23907470703125, -0.198089599609375, -0.1571044921875, -0.116119384765625, -0.07513427734375, -0.034149169921875, 0.0068359375, 0.047821044921875, 0.08880615234375, 0.129791259765625, 0.1707763671875, 0.211761474609375, 0.25274658203125, 0.293731689453125, 0.334716796875, 0.375701904296875, 0.41668701171875, 0.457672119140625, 0.4986572265625, 0.539642333984375, 0.58062744140625, 0.621612548828125, 0.66259765625, 0.703582763671875, 0.74456787109375, 0.785552978515625, 0.8265380859375, 0.867523193359375, 0.90850830078125, 0.949493408203125, 0.990478515625, 1.031463623046875, 1.07244873046875, 1.113433837890625, 1.1544189453125, 1.195404052734375, 1.23638916015625, 1.277374267578125, 1.318359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 8.0, 7.0, 8.0, 14.0, 7.0, 14.0, 16.0, 18.0, 23.0, 25.0, 39.0, 35.0, 53.0, 75.0, 93.0, 105.0, 101.0, 66.0, 62.0, 45.0, 34.0, 31.0, 21.0, 14.0, 11.0, 9.0, 9.0, 13.0, 7.0, 6.0, 3.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023496150970458984, -0.0002283584326505661, -0.00022175535559654236, -0.00021515227854251862, -0.00020854920148849487, -0.00020194612443447113, -0.0001953430473804474, -0.00018873997032642365, -0.0001821368932723999, -0.00017553381621837616, -0.00016893073916435242, -0.00016232766211032867, -0.00015572458505630493, -0.0001491215080022812, -0.00014251843094825745, -0.0001359153538942337, -0.00012931227684020996, -0.00012270919978618622, -0.00011610612273216248, -0.00010950304567813873, -0.00010289996862411499, -9.629689157009125e-05, -8.96938145160675e-05, -8.309073746204376e-05, -7.648766040802002e-05, -6.988458335399628e-05, -6.328150629997253e-05, -5.667842924594879e-05, -5.007535219192505e-05, -4.3472275137901306e-05, -3.6869198083877563e-05, -3.026612102985382e-05, -2.3663043975830078e-05, -1.7059966921806335e-05, -1.0456889867782593e-05, -3.85381281375885e-06, 2.7492642402648926e-06, 9.352341294288635e-06, 1.5955418348312378e-05, 2.255849540233612e-05, 2.9161572456359863e-05, 3.5764649510383606e-05, 4.236772656440735e-05, 4.897080361843109e-05, 5.5573880672454834e-05, 6.217695772647858e-05, 6.878003478050232e-05, 7.538311183452606e-05, 8.19861888885498e-05, 8.858926594257355e-05, 9.519234299659729e-05, 0.00010179542005062103, 0.00010839849710464478, 0.00011500157415866852, 0.00012160465121269226, 0.000128207728266716, 0.00013481080532073975, 0.0001414138823747635, 0.00014801695942878723, 0.00015462003648281097, 0.00016122311353683472, 0.00016782619059085846, 0.0001744292676448822, 0.00018103234469890594, 0.0001876354217529297]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 5.0, 5.0, 6.0, 9.0, 11.0, 16.0, 18.0, 27.0, 56.0, 114.0, 167.0, 353.0, 786.0, 2018.0, 7340.0, 61731.0, 859465.0, 102354.0, 9918.0, 2437.0, 890.0, 371.0, 188.0, 103.0, 54.0, 40.0, 23.0, 15.0, 14.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3154296875, -1.2694091796875, -1.223388671875, -1.1773681640625, -1.13134765625, -1.0853271484375, -1.039306640625, -0.9932861328125, -0.947265625, -0.9012451171875, -0.855224609375, -0.8092041015625, -0.76318359375, -0.7171630859375, -0.671142578125, -0.6251220703125, -0.5791015625, -0.5330810546875, -0.487060546875, -0.4410400390625, -0.39501953125, -0.3489990234375, -0.302978515625, -0.2569580078125, -0.2109375, -0.1649169921875, -0.118896484375, -0.0728759765625, -0.02685546875, 0.0191650390625, 0.065185546875, 0.1112060546875, 0.1572265625, 0.2032470703125, 0.249267578125, 0.2952880859375, 0.34130859375, 0.3873291015625, 0.433349609375, 0.4793701171875, 0.525390625, 0.5714111328125, 0.617431640625, 0.6634521484375, 0.70947265625, 0.7554931640625, 0.801513671875, 0.8475341796875, 0.8935546875, 0.9395751953125, 0.985595703125, 1.0316162109375, 1.07763671875, 1.1236572265625, 1.169677734375, 1.2156982421875, 1.26171875, 1.3077392578125, 1.353759765625, 1.3997802734375, 1.44580078125, 1.4918212890625, 1.537841796875, 1.5838623046875, 1.6298828125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 0.0, 5.0, 2.0, 6.0, 5.0, 4.0, 8.0, 9.0, 12.0, 14.0, 10.0, 26.0, 22.0, 18.0, 44.0, 44.0, 62.0, 60.0, 64.0, 78.0, 77.0, 65.0, 69.0, 53.0, 50.0, 36.0, 20.0, 29.0, 24.0, 20.0, 16.0, 12.0, 7.0, 6.0, 3.0, 3.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60107421875, -0.578155517578125, -0.55523681640625, -0.532318115234375, -0.5093994140625, -0.486480712890625, -0.46356201171875, -0.440643310546875, -0.417724609375, -0.394805908203125, -0.37188720703125, -0.348968505859375, -0.3260498046875, -0.303131103515625, -0.28021240234375, -0.257293701171875, -0.234375, -0.211456298828125, -0.18853759765625, -0.165618896484375, -0.1427001953125, -0.119781494140625, -0.09686279296875, -0.073944091796875, -0.051025390625, -0.028106689453125, -0.00518798828125, 0.017730712890625, 0.0406494140625, 0.063568115234375, 0.08648681640625, 0.109405517578125, 0.13232421875, 0.155242919921875, 0.17816162109375, 0.201080322265625, 0.2239990234375, 0.246917724609375, 0.26983642578125, 0.292755126953125, 0.315673828125, 0.338592529296875, 0.36151123046875, 0.384429931640625, 0.4073486328125, 0.430267333984375, 0.45318603515625, 0.476104736328125, 0.4990234375, 0.521942138671875, 0.54486083984375, 0.567779541015625, 0.5906982421875, 0.613616943359375, 0.63653564453125, 0.659454345703125, 0.682373046875, 0.705291748046875, 0.72821044921875, 0.751129150390625, 0.7740478515625, 0.796966552734375, 0.81988525390625, 0.842803955078125, 0.86572265625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 11.0, 26.0, 63.0, 113.0, 180.0, 270.0, 154.0, 87.0, 41.0, 15.0, 9.0, 6.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.599945068359375, -23.90130043029785, -23.202655792236328, -22.504009246826172, -21.80536460876465, -21.106719970703125, -20.4080753326416, -19.709430694580078, -19.010784149169922, -18.3121395111084, -17.613494873046875, -16.91484832763672, -16.216203689575195, -15.517559051513672, -14.818914413452148, -14.120268821716309, -13.421624183654785, -12.722979545593262, -12.024333953857422, -11.325689315795898, -10.627043724060059, -9.928399085998535, -9.229753494262695, -8.531108856201172, -7.83246374130249, -7.133818626403809, -6.435173511505127, -5.736528396606445, -5.037883758544922, -4.339238166809082, -3.6405935287475586, -2.941948413848877, -2.2433032989501953, -1.5446581840515137, -0.8460131883621216, -0.1473681926727295, 0.5512769222259521, 1.2499220371246338, 1.9485669136047363, 2.647212028503418, 3.3458571434020996, 4.044502258300781, 4.743147373199463, 5.4417924880981445, 6.140437126159668, 6.839082717895508, 7.537727355957031, 8.236371994018555, 8.935017585754395, 9.633662223815918, 10.332307815551758, 11.030952453613281, 11.729598045349121, 12.428242683410645, 13.126888275146484, 13.825532913208008, 14.524177551269531, 15.222822189331055, 15.921467781066895, 16.620113372802734, 17.318758010864258, 18.01740264892578, 18.716047286987305, 19.414691925048828, 20.113338470458984]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 6.0, 13.0, 14.0, 9.0, 18.0, 16.0, 26.0, 30.0, 41.0, 50.0, 60.0, 73.0, 99.0, 117.0, 91.0, 74.0, 55.0, 57.0, 30.0, 35.0, 23.0, 23.0, 14.0, 13.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.525236129760742, -9.979242324829102, -9.433248519897461, -8.88725471496582, -8.341261863708496, -7.7952680587768555, -7.249274253845215, -6.703280448913574, -6.157287120819092, -5.611293315887451, -5.065299987792969, -4.519306182861328, -3.9733126163482666, -3.427319049835205, -2.8813252449035645, -2.335331678390503, -1.7893381118774414, -1.2433445453643799, -0.6973508596420288, -0.15135717391967773, 0.3946363925933838, 0.9406299591064453, 1.486623764038086, 2.0326173305511475, 2.578610897064209, 3.1246044635772705, 3.670598030090332, 4.216591835021973, 4.762585639953613, 5.308578968048096, 5.854572772979736, 6.400566101074219, 6.946559906005859, 7.4925537109375, 8.03854751586914, 8.584541320800781, 9.130534172058105, 9.676527976989746, 10.222521781921387, 10.768515586853027, 11.314508438110352, 11.860502243041992, 12.406496047973633, 12.952489852905273, 13.498482704162598, 14.044476509094238, 14.590470314025879, 15.13646411895752, 15.68245792388916, 16.228450775146484, 16.774444580078125, 17.320438385009766, 17.866432189941406, 18.412425994873047, 18.958419799804688, 19.504413604736328, 20.05040740966797, 20.59640121459961, 21.14239501953125, 21.68838882446289, 22.23438262939453, 22.780376434326172, 23.326370239257812, 23.87236213684082, 24.41835594177246]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 15.0, 55.0, 257.0, 1042.0, 4667.0, 46949.0, 2914864.0, 1198761.0, 24539.0, 2457.0, 436.0, 117.0, 45.0, 20.0, 14.0, 14.0, 8.0, 3.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.623046875, -3.5423431396484375, -3.461639404296875, -3.3809356689453125, -3.30023193359375, -3.2195281982421875, -3.138824462890625, -3.0581207275390625, -2.9774169921875, -2.8967132568359375, -2.816009521484375, -2.7353057861328125, -2.65460205078125, -2.5738983154296875, -2.493194580078125, -2.4124908447265625, -2.331787109375, -2.2510833740234375, -2.170379638671875, -2.0896759033203125, -2.00897216796875, -1.9282684326171875, -1.847564697265625, -1.7668609619140625, -1.6861572265625, -1.6054534912109375, -1.524749755859375, -1.4440460205078125, -1.36334228515625, -1.2826385498046875, -1.201934814453125, -1.1212310791015625, -1.04052734375, -0.9598236083984375, -0.879119873046875, -0.7984161376953125, -0.71771240234375, -0.6370086669921875, -0.556304931640625, -0.4756011962890625, -0.3948974609375, -0.3141937255859375, -0.233489990234375, -0.1527862548828125, -0.07208251953125, 0.0086212158203125, 0.089324951171875, 0.1700286865234375, 0.250732421875, 0.3314361572265625, 0.412139892578125, 0.4928436279296875, 0.57354736328125, 0.6542510986328125, 0.734954833984375, 0.8156585693359375, 0.8963623046875, 0.9770660400390625, 1.057769775390625, 1.1384735107421875, 1.21917724609375, 1.2998809814453125, 1.380584716796875, 1.4612884521484375, 1.5419921875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 15.0, 29.0, 64.0, 83.0, 118.0, 155.0, 181.0, 145.0, 99.0, 68.0, 32.0, 17.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7421875, -0.675811767578125, -0.60943603515625, -0.543060302734375, -0.4766845703125, -0.410308837890625, -0.34393310546875, -0.277557373046875, -0.211181640625, -0.144805908203125, -0.07843017578125, -0.012054443359375, 0.0543212890625, 0.120697021484375, 0.18707275390625, 0.253448486328125, 0.31982421875, 0.386199951171875, 0.45257568359375, 0.518951416015625, 0.5853271484375, 0.651702880859375, 0.71807861328125, 0.784454345703125, 0.850830078125, 0.917205810546875, 0.98358154296875, 1.049957275390625, 1.1163330078125, 1.182708740234375, 1.24908447265625, 1.315460205078125, 1.3818359375, 1.448211669921875, 1.51458740234375, 1.580963134765625, 1.6473388671875, 1.713714599609375, 1.78009033203125, 1.846466064453125, 1.912841796875, 1.979217529296875, 2.04559326171875, 2.111968994140625, 2.1783447265625, 2.244720458984375, 2.31109619140625, 2.377471923828125, 2.44384765625, 2.510223388671875, 2.57659912109375, 2.642974853515625, 2.7093505859375, 2.775726318359375, 2.84210205078125, 2.908477783203125, 2.974853515625, 3.041229248046875, 3.10760498046875, 3.173980712890625, 3.2403564453125, 3.306732177734375, 3.37310791015625, 3.439483642578125, 3.505859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 8.0, 20.0, 48.0, 102.0, 174.0, 487.0, 1607.0, 7692.0, 73917.0, 3426148.0, 653429.0, 25689.0, 3623.0, 870.0, 269.0, 97.0, 48.0, 21.0, 14.0, 8.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.078125, -3.98907470703125, -3.9000244140625, -3.81097412109375, -3.721923828125, -3.63287353515625, -3.5438232421875, -3.45477294921875, -3.36572265625, -3.27667236328125, -3.1876220703125, -3.09857177734375, -3.009521484375, -2.92047119140625, -2.8314208984375, -2.74237060546875, -2.6533203125, -2.56427001953125, -2.4752197265625, -2.38616943359375, -2.297119140625, -2.20806884765625, -2.1190185546875, -2.02996826171875, -1.94091796875, -1.85186767578125, -1.7628173828125, -1.67376708984375, -1.584716796875, -1.49566650390625, -1.4066162109375, -1.31756591796875, -1.228515625, -1.13946533203125, -1.0504150390625, -0.96136474609375, -0.872314453125, -0.78326416015625, -0.6942138671875, -0.60516357421875, -0.51611328125, -0.42706298828125, -0.3380126953125, -0.24896240234375, -0.159912109375, -0.07086181640625, 0.0181884765625, 0.10723876953125, 0.1962890625, 0.28533935546875, 0.3743896484375, 0.46343994140625, 0.552490234375, 0.64154052734375, 0.7305908203125, 0.81964111328125, 0.90869140625, 0.99774169921875, 1.0867919921875, 1.17584228515625, 1.264892578125, 1.35394287109375, 1.4429931640625, 1.53204345703125, 1.62109375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 7.0, 7.0, 9.0, 12.0, 12.0, 10.0, 21.0, 21.0, 27.0, 41.0, 55.0, 97.0, 126.0, 217.0, 397.0, 595.0, 732.0, 627.0, 386.0, 231.0, 133.0, 82.0, 55.0, 49.0, 25.0, 25.0, 20.0, 15.0, 6.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7431640625, -1.6910247802734375, -1.638885498046875, -1.5867462158203125, -1.53460693359375, -1.4824676513671875, -1.430328369140625, -1.3781890869140625, -1.3260498046875, -1.2739105224609375, -1.221771240234375, -1.1696319580078125, -1.11749267578125, -1.0653533935546875, -1.013214111328125, -0.9610748291015625, -0.908935546875, -0.8567962646484375, -0.804656982421875, -0.7525177001953125, -0.70037841796875, -0.6482391357421875, -0.596099853515625, -0.5439605712890625, -0.4918212890625, -0.4396820068359375, -0.387542724609375, -0.3354034423828125, -0.28326416015625, -0.2311248779296875, -0.178985595703125, -0.1268463134765625, -0.07470703125, -0.0225677490234375, 0.029571533203125, 0.0817108154296875, 0.13385009765625, 0.1859893798828125, 0.238128662109375, 0.2902679443359375, 0.3424072265625, 0.3945465087890625, 0.446685791015625, 0.4988250732421875, 0.55096435546875, 0.6031036376953125, 0.655242919921875, 0.7073822021484375, 0.759521484375, 0.8116607666015625, 0.863800048828125, 0.9159393310546875, 0.96807861328125, 1.0202178955078125, 1.072357177734375, 1.1244964599609375, 1.1766357421875, 1.2287750244140625, 1.280914306640625, 1.3330535888671875, 1.38519287109375, 1.4373321533203125, 1.489471435546875, 1.5416107177734375, 1.59375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 7.0, 13.0, 16.0, 53.0, 111.0, 170.0, 193.0, 175.0, 122.0, 63.0, 23.0, 25.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.957542419433594, -14.393253326416016, -13.828963279724121, -13.264674186706543, -12.700385093688965, -12.13609504699707, -11.571805953979492, -11.007516860961914, -10.443227767944336, -9.878938674926758, -9.314648628234863, -8.750359535217285, -8.186070442199707, -7.621780872344971, -7.057491302490234, -6.493202209472656, -5.928912162780762, -5.364622592926025, -4.800333499908447, -4.236043930053711, -3.6717545986175537, -3.1074652671813965, -2.54317569732666, -1.978886365890503, -1.4145970344543457, -0.8503076434135437, -0.2860182523727417, 0.2782711982727051, 0.8425605297088623, 1.4068498611450195, 1.9711394309997559, 2.535428762435913, 3.0997180938720703, 3.6640074253082275, 4.228296756744385, 4.792586326599121, 5.356875419616699, 5.9211649894714355, 6.485454559326172, 7.04974365234375, 7.614033222198486, 8.178322792053223, 8.7426118850708, 9.306901931762695, 9.871191024780273, 10.435480117797852, 10.99976921081543, 11.564059257507324, 12.128348350524902, 12.69263744354248, 13.256927490234375, 13.821216583251953, 14.385505676269531, 14.94979476928711, 15.514084815979004, 16.0783748626709, 16.642663955688477, 17.206953048706055, 17.771242141723633, 18.335533142089844, 18.899822235107422, 19.464111328125, 20.028400421142578, 20.592689514160156, 21.156978607177734]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 5.0, 8.0, 14.0, 10.0, 11.0, 22.0, 33.0, 40.0, 61.0, 56.0, 85.0, 71.0, 79.0, 82.0, 65.0, 72.0, 57.0, 62.0, 45.0, 29.0, 26.0, 20.0, 18.0, 7.0, 10.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.44374656677246, -16.060718536376953, -15.677689552307129, -15.294661521911621, -14.911632537841797, -14.528604507446289, -14.145576477050781, -13.762548446655273, -13.37951946258545, -12.996491432189941, -12.613462448120117, -12.23043441772461, -11.847406387329102, -11.464377403259277, -11.08134937286377, -10.698320388793945, -10.315292358398438, -9.93226432800293, -9.549235343933105, -9.166207313537598, -8.783178329467773, -8.400150299072266, -8.017122268676758, -7.634093761444092, -7.251065254211426, -6.86803674697876, -6.485008239746094, -6.101980209350586, -5.71895170211792, -5.335923194885254, -4.952895164489746, -4.56986665725708, -4.186838150024414, -3.803809642791748, -3.420781373977661, -3.037753105163574, -2.654724597930908, -2.271696090698242, -1.8886678218841553, -1.5056395530700684, -1.1226110458374023, -0.7395826578140259, -0.3565542697906494, 0.02647411823272705, 0.4095025062561035, 0.79253089427948, 1.1755592823028564, 1.5585875511169434, 1.9416160583496094, 2.3246445655822754, 2.7076728343963623, 3.090701103210449, 3.4737296104431152, 3.8567581176757812, 4.239786148071289, 4.622814655303955, 5.005843162536621, 5.388871669769287, 5.771900177001953, 6.154928207397461, 6.537956714630127, 6.920985221862793, 7.304013252258301, 7.687041759490967, 8.070070266723633]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 8.0, 11.0, 19.0, 23.0, 42.0, 74.0, 118.0, 205.0, 378.0, 718.0, 1452.0, 2901.0, 7281.0, 18523.0, 53303.0, 164197.0, 408276.0, 260752.0, 83273.0, 28320.0, 10423.0, 4313.0, 1918.0, 911.0, 474.0, 264.0, 147.0, 88.0, 53.0, 30.0, 21.0, 12.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.419921875, -1.370452880859375, -1.32098388671875, -1.271514892578125, -1.2220458984375, -1.172576904296875, -1.12310791015625, -1.073638916015625, -1.024169921875, -0.974700927734375, -0.92523193359375, -0.875762939453125, -0.8262939453125, -0.776824951171875, -0.72735595703125, -0.677886962890625, -0.62841796875, -0.578948974609375, -0.52947998046875, -0.480010986328125, -0.4305419921875, -0.381072998046875, -0.33160400390625, -0.282135009765625, -0.232666015625, -0.183197021484375, -0.13372802734375, -0.084259033203125, -0.0347900390625, 0.014678955078125, 0.06414794921875, 0.113616943359375, 0.1630859375, 0.212554931640625, 0.26202392578125, 0.311492919921875, 0.3609619140625, 0.410430908203125, 0.45989990234375, 0.509368896484375, 0.558837890625, 0.608306884765625, 0.65777587890625, 0.707244873046875, 0.7567138671875, 0.806182861328125, 0.85565185546875, 0.905120849609375, 0.95458984375, 1.004058837890625, 1.05352783203125, 1.102996826171875, 1.1524658203125, 1.201934814453125, 1.25140380859375, 1.300872802734375, 1.350341796875, 1.399810791015625, 1.44927978515625, 1.498748779296875, 1.5482177734375, 1.597686767578125, 1.64715576171875, 1.696624755859375, 1.74609375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 11.0, 15.0, 29.0, 30.0, 45.0, 58.0, 58.0, 70.0, 80.0, 82.0, 89.0, 87.0, 68.0, 71.0, 49.0, 29.0, 39.0, 29.0, 18.0, 17.0, 14.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56298828125, -0.5282058715820312, -0.4934234619140625, -0.45864105224609375, -0.423858642578125, -0.38907623291015625, -0.3542938232421875, -0.31951141357421875, -0.28472900390625, -0.24994659423828125, -0.2151641845703125, -0.18038177490234375, -0.145599365234375, -0.11081695556640625, -0.0760345458984375, -0.04125213623046875, -0.0064697265625, 0.02831268310546875, 0.0630950927734375, 0.09787750244140625, 0.132659912109375, 0.16744232177734375, 0.2022247314453125, 0.23700714111328125, 0.27178955078125, 0.30657196044921875, 0.3413543701171875, 0.37613677978515625, 0.410919189453125, 0.44570159912109375, 0.4804840087890625, 0.5152664184570312, 0.550048828125, 0.5848312377929688, 0.6196136474609375, 0.6543960571289062, 0.689178466796875, 0.7239608764648438, 0.7587432861328125, 0.7935256958007812, 0.82830810546875, 0.8630905151367188, 0.8978729248046875, 0.9326553344726562, 0.967437744140625, 1.0022201538085938, 1.0370025634765625, 1.0717849731445312, 1.1065673828125, 1.1413497924804688, 1.1761322021484375, 1.2109146118164062, 1.245697021484375, 1.2804794311523438, 1.3152618408203125, 1.3500442504882812, 1.38482666015625, 1.4196090698242188, 1.4543914794921875, 1.4891738891601562, 1.523956298828125, 1.5587387084960938, 1.5935211181640625, 1.6283035278320312, 1.6630859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 6.0, 7.0, 7.0, 18.0, 19.0, 21.0, 25.0, 33.0, 60.0, 76.0, 135.0, 167.0, 294.0, 454.0, 716.0, 1255.0, 2922.0, 8322.0, 38360.0, 280128.0, 625771.0, 69217.0, 12745.0, 3829.0, 1613.0, 886.0, 491.0, 325.0, 199.0, 140.0, 101.0, 54.0, 41.0, 38.0, 26.0, 14.0, 10.0, 7.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.376953125, -2.29254150390625, -2.2081298828125, -2.12371826171875, -2.039306640625, -1.95489501953125, -1.8704833984375, -1.78607177734375, -1.70166015625, -1.61724853515625, -1.5328369140625, -1.44842529296875, -1.364013671875, -1.27960205078125, -1.1951904296875, -1.11077880859375, -1.0263671875, -0.94195556640625, -0.8575439453125, -0.77313232421875, -0.688720703125, -0.60430908203125, -0.5198974609375, -0.43548583984375, -0.35107421875, -0.26666259765625, -0.1822509765625, -0.09783935546875, -0.013427734375, 0.07098388671875, 0.1553955078125, 0.23980712890625, 0.32421875, 0.40863037109375, 0.4930419921875, 0.57745361328125, 0.661865234375, 0.74627685546875, 0.8306884765625, 0.91510009765625, 0.99951171875, 1.08392333984375, 1.1683349609375, 1.25274658203125, 1.337158203125, 1.42156982421875, 1.5059814453125, 1.59039306640625, 1.6748046875, 1.75921630859375, 1.8436279296875, 1.92803955078125, 2.012451171875, 2.09686279296875, 2.1812744140625, 2.26568603515625, 2.35009765625, 2.43450927734375, 2.5189208984375, 2.60333251953125, 2.687744140625, 2.77215576171875, 2.8565673828125, 2.94097900390625, 3.025390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 11.0, 11.0, 21.0, 18.0, 27.0, 22.0, 46.0, 34.0, 47.0, 49.0, 50.0, 68.0, 56.0, 76.0, 70.0, 65.0, 58.0, 49.0, 42.0, 36.0, 30.0, 23.0, 20.0, 24.0, 14.0, 8.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.14373779296875, -3.0355224609375, -2.92730712890625, -2.819091796875, -2.71087646484375, -2.6026611328125, -2.49444580078125, -2.38623046875, -2.27801513671875, -2.1697998046875, -2.06158447265625, -1.953369140625, -1.84515380859375, -1.7369384765625, -1.62872314453125, -1.5205078125, -1.41229248046875, -1.3040771484375, -1.19586181640625, -1.087646484375, -0.97943115234375, -0.8712158203125, -0.76300048828125, -0.65478515625, -0.54656982421875, -0.4383544921875, -0.33013916015625, -0.221923828125, -0.11370849609375, -0.0054931640625, 0.10272216796875, 0.2109375, 0.31915283203125, 0.4273681640625, 0.53558349609375, 0.643798828125, 0.75201416015625, 0.8602294921875, 0.96844482421875, 1.07666015625, 1.18487548828125, 1.2930908203125, 1.40130615234375, 1.509521484375, 1.61773681640625, 1.7259521484375, 1.83416748046875, 1.9423828125, 2.05059814453125, 2.1588134765625, 2.26702880859375, 2.375244140625, 2.48345947265625, 2.5916748046875, 2.69989013671875, 2.80810546875, 2.91632080078125, 3.0245361328125, 3.13275146484375, 3.240966796875, 3.34918212890625, 3.4573974609375, 3.56561279296875, 3.673828125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 6.0, 9.0, 15.0, 10.0, 14.0, 20.0, 33.0, 47.0, 53.0, 97.0, 121.0, 190.0, 301.0, 586.0, 1281.0, 3112.0, 9623.0, 38005.0, 218747.0, 645597.0, 99831.0, 20830.0, 5848.0, 2073.0, 945.0, 445.0, 239.0, 137.0, 97.0, 54.0, 51.0, 31.0, 24.0, 17.0, 14.0, 15.0, 13.0, 8.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.81591796875, -0.794036865234375, -0.77215576171875, -0.750274658203125, -0.7283935546875, -0.706512451171875, -0.68463134765625, -0.662750244140625, -0.640869140625, -0.618988037109375, -0.59710693359375, -0.575225830078125, -0.5533447265625, -0.531463623046875, -0.50958251953125, -0.487701416015625, -0.4658203125, -0.443939208984375, -0.42205810546875, -0.400177001953125, -0.3782958984375, -0.356414794921875, -0.33453369140625, -0.312652587890625, -0.290771484375, -0.268890380859375, -0.24700927734375, -0.225128173828125, -0.2032470703125, -0.181365966796875, -0.15948486328125, -0.137603759765625, -0.11572265625, -0.093841552734375, -0.07196044921875, -0.050079345703125, -0.0281982421875, -0.006317138671875, 0.01556396484375, 0.037445068359375, 0.059326171875, 0.081207275390625, 0.10308837890625, 0.124969482421875, 0.1468505859375, 0.168731689453125, 0.19061279296875, 0.212493896484375, 0.234375, 0.256256103515625, 0.27813720703125, 0.300018310546875, 0.3218994140625, 0.343780517578125, 0.36566162109375, 0.387542724609375, 0.409423828125, 0.431304931640625, 0.45318603515625, 0.475067138671875, 0.4969482421875, 0.518829345703125, 0.54071044921875, 0.562591552734375, 0.58447265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 6.0, 3.0, 3.0, 5.0, 4.0, 8.0, 11.0, 20.0, 21.0, 23.0, 28.0, 38.0, 34.0, 59.0, 97.0, 118.0, 104.0, 109.0, 68.0, 61.0, 42.0, 31.0, 14.0, 15.0, 12.0, 13.0, 10.0, 8.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001690387725830078, -0.0001623295247554779, -0.000155620276927948, -0.0001489110291004181, -0.00014220178127288818, -0.00013549253344535828, -0.00012878328561782837, -0.00012207403779029846, -0.00011536478996276855, -0.00010865554213523865, -0.00010194629430770874, -9.523704648017883e-05, -8.852779865264893e-05, -8.181855082511902e-05, -7.510930299758911e-05, -6.84000551700592e-05, -6.16908073425293e-05, -5.498155951499939e-05, -4.827231168746948e-05, -4.1563063859939575e-05, -3.485381603240967e-05, -2.814456820487976e-05, -2.1435320377349854e-05, -1.4726072549819946e-05, -8.016824722290039e-06, -1.3075768947601318e-06, 5.401670932769775e-06, 1.2110918760299683e-05, 1.882016658782959e-05, 2.5529414415359497e-05, 3.2238662242889404e-05, 3.894791007041931e-05, 4.565715789794922e-05, 5.2366405725479126e-05, 5.907565355300903e-05, 6.578490138053894e-05, 7.249414920806885e-05, 7.920339703559875e-05, 8.591264486312866e-05, 9.262189269065857e-05, 9.933114051818848e-05, 0.00010604038834571838, 0.00011274963617324829, 0.0001194588840007782, 0.0001261681318283081, 0.000132877379655838, 0.00013958662748336792, 0.00014629587531089783, 0.00015300512313842773, 0.00015971437096595764, 0.00016642361879348755, 0.00017313286662101746, 0.00017984211444854736, 0.00018655136227607727, 0.00019326061010360718, 0.00019996985793113708, 0.000206679105758667, 0.0002133883535861969, 0.0002200976014137268, 0.00022680684924125671, 0.00023351609706878662, 0.00024022534489631653, 0.00024693459272384644, 0.00025364384055137634, 0.00026035308837890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 10.0, 10.0, 14.0, 18.0, 24.0, 31.0, 38.0, 50.0, 79.0, 114.0, 162.0, 262.0, 385.0, 634.0, 1290.0, 2538.0, 5771.0, 17482.0, 71620.0, 500067.0, 354282.0, 65996.0, 16461.0, 5707.0, 2487.0, 1156.0, 651.0, 382.0, 257.0, 182.0, 97.0, 69.0, 50.0, 54.0, 28.0, 17.0, 15.0, 13.0, 15.0, 7.0, 7.0, 7.0, 2.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.58251953125, -0.5637130737304688, -0.5449066162109375, -0.5261001586914062, -0.507293701171875, -0.48848724365234375, -0.4696807861328125, -0.45087432861328125, -0.43206787109375, -0.41326141357421875, -0.3944549560546875, -0.37564849853515625, -0.356842041015625, -0.33803558349609375, -0.3192291259765625, -0.30042266845703125, -0.2816162109375, -0.26280975341796875, -0.2440032958984375, -0.22519683837890625, -0.206390380859375, -0.18758392333984375, -0.1687774658203125, -0.14997100830078125, -0.13116455078125, -0.11235809326171875, -0.0935516357421875, -0.07474517822265625, -0.055938720703125, -0.03713226318359375, -0.0183258056640625, 0.00048065185546875, 0.019287109375, 0.03809356689453125, 0.0569000244140625, 0.07570648193359375, 0.094512939453125, 0.11331939697265625, 0.1321258544921875, 0.15093231201171875, 0.16973876953125, 0.18854522705078125, 0.2073516845703125, 0.22615814208984375, 0.244964599609375, 0.26377105712890625, 0.2825775146484375, 0.30138397216796875, 0.3201904296875, 0.33899688720703125, 0.3578033447265625, 0.37660980224609375, 0.395416259765625, 0.41422271728515625, 0.4330291748046875, 0.45183563232421875, 0.47064208984375, 0.48944854736328125, 0.5082550048828125, 0.5270614624023438, 0.545867919921875, 0.5646743774414062, 0.5834808349609375, 0.6022872924804688, 0.62109375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 9.0, 4.0, 15.0, 12.0, 19.0, 25.0, 19.0, 35.0, 45.0, 58.0, 57.0, 90.0, 73.0, 91.0, 86.0, 85.0, 49.0, 49.0, 33.0, 31.0, 37.0, 23.0, 10.0, 12.0, 9.0, 6.0, 5.0, 0.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60498046875, -0.5829315185546875, -0.560882568359375, -0.5388336181640625, -0.51678466796875, -0.4947357177734375, -0.472686767578125, -0.4506378173828125, -0.4285888671875, -0.4065399169921875, -0.384490966796875, -0.3624420166015625, -0.34039306640625, -0.3183441162109375, -0.296295166015625, -0.2742462158203125, -0.252197265625, -0.2301483154296875, -0.208099365234375, -0.1860504150390625, -0.16400146484375, -0.1419525146484375, -0.119903564453125, -0.0978546142578125, -0.0758056640625, -0.0537567138671875, -0.031707763671875, -0.0096588134765625, 0.01239013671875, 0.0344390869140625, 0.056488037109375, 0.0785369873046875, 0.1005859375, 0.1226348876953125, 0.144683837890625, 0.1667327880859375, 0.18878173828125, 0.2108306884765625, 0.232879638671875, 0.2549285888671875, 0.2769775390625, 0.2990264892578125, 0.321075439453125, 0.3431243896484375, 0.36517333984375, 0.3872222900390625, 0.409271240234375, 0.4313201904296875, 0.453369140625, 0.4754180908203125, 0.497467041015625, 0.5195159912109375, 0.54156494140625, 0.5636138916015625, 0.585662841796875, 0.6077117919921875, 0.6297607421875, 0.6518096923828125, 0.673858642578125, 0.6959075927734375, 0.71795654296875, 0.7400054931640625, 0.762054443359375, 0.7841033935546875, 0.80615234375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 16.0, 23.0, 46.0, 74.0, 151.0, 277.0, 181.0, 122.0, 43.0, 22.0, 10.0, 8.0, 4.0, 5.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.37348747253418, -19.767303466796875, -19.161121368408203, -18.5549373626709, -17.948753356933594, -17.342571258544922, -16.736387252807617, -16.130203247070312, -15.524020195007324, -14.917837142944336, -14.311653137207031, -13.705470085144043, -13.099287033081055, -12.49310302734375, -11.886919975280762, -11.280736923217773, -10.674552917480469, -10.06836986541748, -9.462185859680176, -8.856002807617188, -8.249818801879883, -7.6436357498168945, -7.037452697753906, -6.43126916885376, -5.825085639953613, -5.218902111053467, -4.61271858215332, -4.006535530090332, -3.4003520011901855, -2.794168472290039, -2.1879851818084717, -1.5818018913269043, -0.9756202697753906, -0.3694368600845337, 0.23674654960632324, 0.8429299592971802, 1.449113368988037, 2.0552968978881836, 2.661480188369751, 3.2676634788513184, 3.873847007751465, 4.480030536651611, 5.086214065551758, 5.692397117614746, 6.298580646514893, 6.904764175415039, 7.510947227478027, 8.117130279541016, 8.72331428527832, 9.329497337341309, 9.935681343078613, 10.541864395141602, 11.148048400878906, 11.754231452941895, 12.360414505004883, 12.966598510742188, 13.572781562805176, 14.178964614868164, 14.785148620605469, 15.391331672668457, 15.997514724731445, 16.60369873046875, 17.209882736206055, 17.816064834594727, 18.42224884033203]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 10.0, 12.0, 8.0, 22.0, 18.0, 25.0, 28.0, 31.0, 36.0, 33.0, 54.0, 62.0, 77.0, 92.0, 83.0, 70.0, 50.0, 49.0, 44.0, 29.0, 21.0, 27.0, 22.0, 15.0, 26.0, 16.0, 12.0, 6.0, 5.0, 3.0, 6.0, 3.0, 5.0], "bins": [-17.341094970703125, -16.954734802246094, -16.568374633789062, -16.1820125579834, -15.795652389526367, -15.409292221069336, -15.022931098937988, -14.63656997680664, -14.25020980834961, -13.863849639892578, -13.47748851776123, -13.091127395629883, -12.704767227172852, -12.31840705871582, -11.932045936584473, -11.545684814453125, -11.159324645996094, -10.772964477539062, -10.386603355407715, -10.000242233276367, -9.613882064819336, -9.227521896362305, -8.841160774230957, -8.45479965209961, -8.068439483642578, -7.682078838348389, -7.295718193054199, -6.90935754776001, -6.52299690246582, -6.136636257171631, -5.750275611877441, -5.363914966583252, -4.9775543212890625, -4.591193675994873, -4.204833030700684, -3.818472385406494, -3.4321117401123047, -3.0457510948181152, -2.659390449523926, -2.2730298042297363, -1.8866691589355469, -1.5003085136413574, -1.113947868347168, -0.7275872230529785, -0.34122657775878906, 0.04513406753540039, 0.43149471282958984, 0.8178553581237793, 1.2042160034179688, 1.5905766487121582, 1.9769372940063477, 2.363297939300537, 2.7496585845947266, 3.136019229888916, 3.5223798751831055, 3.908740520477295, 4.295101165771484, 4.681461811065674, 5.067822456359863, 5.454183101654053, 5.840543746948242, 6.226904392242432, 6.613265037536621, 6.9996256828308105, 7.385986328125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 9.0, 19.0, 29.0, 57.0, 102.0, 189.0, 392.0, 861.0, 2279.0, 7320.0, 30377.0, 260644.0, 3068399.0, 748603.0, 57948.0, 11458.0, 3393.0, 1216.0, 511.0, 225.0, 115.0, 61.0, 30.0, 23.0, 8.0, 8.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.654296875, -1.6155319213867188, -1.5767669677734375, -1.5380020141601562, -1.499237060546875, -1.4604721069335938, -1.4217071533203125, -1.3829421997070312, -1.34417724609375, -1.3054122924804688, -1.2666473388671875, -1.2278823852539062, -1.189117431640625, -1.1503524780273438, -1.1115875244140625, -1.0728225708007812, -1.0340576171875, -0.9952926635742188, -0.9565277099609375, -0.9177627563476562, -0.878997802734375, -0.8402328491210938, -0.8014678955078125, -0.7627029418945312, -0.72393798828125, -0.6851730346679688, -0.6464080810546875, -0.6076431274414062, -0.568878173828125, -0.5301132202148438, -0.4913482666015625, -0.45258331298828125, -0.413818359375, -0.37505340576171875, -0.3362884521484375, -0.29752349853515625, -0.258758544921875, -0.21999359130859375, -0.1812286376953125, -0.14246368408203125, -0.10369873046875, -0.06493377685546875, -0.0261688232421875, 0.01259613037109375, 0.051361083984375, 0.09012603759765625, 0.1288909912109375, 0.16765594482421875, 0.2064208984375, 0.24518585205078125, 0.2839508056640625, 0.32271575927734375, 0.361480712890625, 0.40024566650390625, 0.4390106201171875, 0.47777557373046875, 0.51654052734375, 0.5553054809570312, 0.5940704345703125, 0.6328353881835938, 0.671600341796875, 0.7103652954101562, 0.7491302490234375, 0.7878952026367188, 0.82666015625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 6.0, 8.0, 6.0, 8.0, 10.0, 18.0, 13.0, 20.0, 23.0, 18.0, 26.0, 21.0, 34.0, 45.0, 33.0, 42.0, 41.0, 49.0, 45.0, 40.0, 55.0, 37.0, 52.0, 31.0, 42.0, 41.0, 29.0, 36.0, 31.0, 12.0, 19.0, 17.0, 19.0, 19.0, 14.0, 8.0, 7.0, 7.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5634765625, -0.546112060546875, -0.52874755859375, -0.511383056640625, -0.4940185546875, -0.476654052734375, -0.45928955078125, -0.441925048828125, -0.424560546875, -0.407196044921875, -0.38983154296875, -0.372467041015625, -0.3551025390625, -0.337738037109375, -0.32037353515625, -0.303009033203125, -0.28564453125, -0.268280029296875, -0.25091552734375, -0.233551025390625, -0.2161865234375, -0.198822021484375, -0.18145751953125, -0.164093017578125, -0.146728515625, -0.129364013671875, -0.11199951171875, -0.094635009765625, -0.0772705078125, -0.059906005859375, -0.04254150390625, -0.025177001953125, -0.0078125, 0.009552001953125, 0.02691650390625, 0.044281005859375, 0.0616455078125, 0.079010009765625, 0.09637451171875, 0.113739013671875, 0.131103515625, 0.148468017578125, 0.16583251953125, 0.183197021484375, 0.2005615234375, 0.217926025390625, 0.23529052734375, 0.252655029296875, 0.27001953125, 0.287384033203125, 0.30474853515625, 0.322113037109375, 0.3394775390625, 0.356842041015625, 0.37420654296875, 0.391571044921875, 0.408935546875, 0.426300048828125, 0.44366455078125, 0.461029052734375, 0.4783935546875, 0.495758056640625, 0.51312255859375, 0.530487060546875, 0.5478515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 9.0, 12.0, 22.0, 32.0, 46.0, 64.0, 137.0, 227.0, 442.0, 1129.0, 3310.0, 16194.0, 193549.0, 3803599.0, 158031.0, 13113.0, 2586.0, 870.0, 370.0, 202.0, 106.0, 67.0, 51.0, 31.0, 26.0, 14.0, 8.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-2.880859375, -2.8078765869140625, -2.734893798828125, -2.6619110107421875, -2.58892822265625, -2.5159454345703125, -2.442962646484375, -2.3699798583984375, -2.2969970703125, -2.2240142822265625, -2.151031494140625, -2.0780487060546875, -2.00506591796875, -1.9320831298828125, -1.859100341796875, -1.7861175537109375, -1.713134765625, -1.6401519775390625, -1.567169189453125, -1.4941864013671875, -1.42120361328125, -1.3482208251953125, -1.275238037109375, -1.2022552490234375, -1.1292724609375, -1.0562896728515625, -0.983306884765625, -0.9103240966796875, -0.83734130859375, -0.7643585205078125, -0.691375732421875, -0.6183929443359375, -0.54541015625, -0.4724273681640625, -0.399444580078125, -0.3264617919921875, -0.25347900390625, -0.1804962158203125, -0.107513427734375, -0.0345306396484375, 0.0384521484375, 0.1114349365234375, 0.184417724609375, 0.2574005126953125, 0.33038330078125, 0.4033660888671875, 0.476348876953125, 0.5493316650390625, 0.622314453125, 0.6952972412109375, 0.768280029296875, 0.8412628173828125, 0.91424560546875, 0.9872283935546875, 1.060211181640625, 1.1331939697265625, 1.2061767578125, 1.2791595458984375, 1.352142333984375, 1.4251251220703125, 1.49810791015625, 1.5710906982421875, 1.644073486328125, 1.7170562744140625, 1.7900390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 8.0, 13.0, 12.0, 14.0, 12.0, 24.0, 39.0, 40.0, 50.0, 98.0, 160.0, 272.0, 532.0, 835.0, 789.0, 492.0, 271.0, 135.0, 97.0, 54.0, 38.0, 23.0, 16.0, 17.0, 10.0, 10.0, 2.0, 0.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5224609375, -1.473175048828125, -1.42388916015625, -1.374603271484375, -1.3253173828125, -1.276031494140625, -1.22674560546875, -1.177459716796875, -1.128173828125, -1.078887939453125, -1.02960205078125, -0.980316162109375, -0.9310302734375, -0.881744384765625, -0.83245849609375, -0.783172607421875, -0.73388671875, -0.684600830078125, -0.63531494140625, -0.586029052734375, -0.5367431640625, -0.487457275390625, -0.43817138671875, -0.388885498046875, -0.339599609375, -0.290313720703125, -0.24102783203125, -0.191741943359375, -0.1424560546875, -0.093170166015625, -0.04388427734375, 0.005401611328125, 0.0546875, 0.103973388671875, 0.15325927734375, 0.202545166015625, 0.2518310546875, 0.301116943359375, 0.35040283203125, 0.399688720703125, 0.448974609375, 0.498260498046875, 0.54754638671875, 0.596832275390625, 0.6461181640625, 0.695404052734375, 0.74468994140625, 0.793975830078125, 0.84326171875, 0.892547607421875, 0.94183349609375, 0.991119384765625, 1.0404052734375, 1.089691162109375, 1.13897705078125, 1.188262939453125, 1.237548828125, 1.286834716796875, 1.33612060546875, 1.385406494140625, 1.4346923828125, 1.483978271484375, 1.53326416015625, 1.582550048828125, 1.6318359375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 5.0, 14.0, 40.0, 82.0, 140.0, 212.0, 206.0, 155.0, 75.0, 26.0, 12.0, 4.0, 7.0, 1.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.668704986572266, -20.125930786132812, -19.58315658569336, -19.040382385253906, -18.497608184814453, -17.954833984375, -17.412059783935547, -16.869287490844727, -16.326513290405273, -15.78373908996582, -15.240964889526367, -14.698190689086914, -14.155417442321777, -13.612643241882324, -13.069869041442871, -12.527094841003418, -11.984320640563965, -11.441546440124512, -10.898772239685059, -10.355998992919922, -9.813224792480469, -9.270450592041016, -8.727676391601562, -8.18490219116211, -7.6421284675598145, -7.099354267120361, -6.556580543518066, -6.013806343078613, -5.47103214263916, -4.928258419036865, -4.385484218597412, -3.842710256576538, -3.2999353408813477, -2.7571613788604736, -2.2143874168395996, -1.6716132164001465, -1.1288392543792725, -0.5860652923583984, -0.04329109191894531, 0.4994828701019287, 1.0422568321228027, 1.5850307941436768, 2.127804756164551, 2.670578956604004, 3.213352918624878, 3.756126880645752, 4.298901081085205, 4.8416748046875, 5.384449005126953, 5.927223205566406, 6.469996929168701, 7.012771129608154, 7.555544853210449, 8.098319053649902, 8.641093254089355, 9.183867454528809, 9.726640701293945, 10.269414901733398, 10.812189102172852, 11.354963302612305, 11.897736549377441, 12.440510749816895, 12.983284950256348, 13.5260591506958, 14.068833351135254]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 5.0, 5.0, 11.0, 12.0, 15.0, 11.0, 21.0, 18.0, 24.0, 27.0, 20.0, 25.0, 43.0, 51.0, 39.0, 38.0, 58.0, 37.0, 58.0, 58.0, 43.0, 35.0, 43.0, 43.0, 39.0, 30.0, 31.0, 20.0, 26.0, 21.0, 23.0, 18.0, 5.0, 10.0, 10.0, 6.0, 6.0, 4.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-6.182754039764404, -5.995802879333496, -5.80885124206543, -5.6219000816345215, -5.434948921203613, -5.247997283935547, -5.061046123504639, -4.8740949630737305, -4.687143325805664, -4.500192165374756, -4.3132405281066895, -4.126289367675781, -3.939337968826294, -3.7523865699768066, -3.5654354095458984, -3.378484010696411, -3.191532850265503, -3.0045814514160156, -2.8176302909851074, -2.63067889213562, -2.443727493286133, -2.2567763328552246, -2.0698249340057373, -1.88287353515625, -1.6959222555160522, -1.5089709758758545, -1.3220195770263672, -1.1350682973861694, -0.9481169581413269, -0.7611656188964844, -0.5742143392562866, -0.3872629404067993, -0.20031166076660156, -0.013360336422920227, 0.1735909879207611, 0.36054229736328125, 0.5474936366081238, 0.7344449758529663, 0.9213962554931641, 1.1083476543426514, 1.2952989339828491, 1.4822502136230469, 1.6692016124725342, 1.856152892112732, 2.0431041717529297, 2.230055570602417, 2.4170069694519043, 2.6039581298828125, 2.7909095287323, 2.977860927581787, 3.1648120880126953, 3.3517634868621826, 3.53871488571167, 3.725666046142578, 3.9126174449920654, 4.099568843841553, 4.286520004272461, 4.473471164703369, 4.6604228019714355, 4.847373962402344, 5.034325122833252, 5.221276760101318, 5.408227920532227, 5.595179557800293, 5.782130718231201]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 8.0, 7.0, 11.0, 14.0, 21.0, 29.0, 36.0, 54.0, 86.0, 135.0, 214.0, 368.0, 592.0, 1016.0, 1940.0, 3553.0, 7141.0, 14957.0, 31964.0, 71876.0, 153282.0, 260911.0, 245957.0, 136652.0, 62580.0, 28179.0, 13134.0, 6379.0, 3248.0, 1785.0, 937.0, 563.0, 350.0, 213.0, 117.0, 72.0, 56.0, 31.0, 21.0, 13.0, 12.0, 8.0, 7.0, 6.0, 1.0, 3.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.84375, -0.8164596557617188, -0.7891693115234375, -0.7618789672851562, -0.734588623046875, -0.7072982788085938, -0.6800079345703125, -0.6527175903320312, -0.62542724609375, -0.5981369018554688, -0.5708465576171875, -0.5435562133789062, -0.516265869140625, -0.48897552490234375, -0.4616851806640625, -0.43439483642578125, -0.4071044921875, -0.37981414794921875, -0.3525238037109375, -0.32523345947265625, -0.297943115234375, -0.27065277099609375, -0.2433624267578125, -0.21607208251953125, -0.18878173828125, -0.16149139404296875, -0.1342010498046875, -0.10691070556640625, -0.079620361328125, -0.05233001708984375, -0.0250396728515625, 0.00225067138671875, 0.029541015625, 0.05683135986328125, 0.0841217041015625, 0.11141204833984375, 0.138702392578125, 0.16599273681640625, 0.1932830810546875, 0.22057342529296875, 0.24786376953125, 0.27515411376953125, 0.3024444580078125, 0.32973480224609375, 0.357025146484375, 0.38431549072265625, 0.4116058349609375, 0.43889617919921875, 0.4661865234375, 0.49347686767578125, 0.5207672119140625, 0.5480575561523438, 0.575347900390625, 0.6026382446289062, 0.6299285888671875, 0.6572189331054688, 0.68450927734375, 0.7117996215820312, 0.7390899658203125, 0.7663803100585938, 0.793670654296875, 0.8209609985351562, 0.8482513427734375, 0.8755416870117188, 0.90283203125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 6.0, 6.0, 11.0, 8.0, 4.0, 13.0, 16.0, 15.0, 14.0, 18.0, 25.0, 17.0, 29.0, 28.0, 29.0, 31.0, 36.0, 36.0, 37.0, 37.0, 39.0, 40.0, 42.0, 39.0, 34.0, 36.0, 41.0, 35.0, 30.0, 36.0, 29.0, 21.0, 27.0, 22.0, 26.0, 16.0, 11.0, 9.0, 12.0, 13.0, 7.0, 4.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50390625, -0.48802947998046875, -0.4721527099609375, -0.45627593994140625, -0.440399169921875, -0.42452239990234375, -0.4086456298828125, -0.39276885986328125, -0.37689208984375, -0.36101531982421875, -0.3451385498046875, -0.32926177978515625, -0.313385009765625, -0.29750823974609375, -0.2816314697265625, -0.26575469970703125, -0.2498779296875, -0.23400115966796875, -0.2181243896484375, -0.20224761962890625, -0.186370849609375, -0.17049407958984375, -0.1546173095703125, -0.13874053955078125, -0.12286376953125, -0.10698699951171875, -0.0911102294921875, -0.07523345947265625, -0.059356689453125, -0.04347991943359375, -0.0276031494140625, -0.01172637939453125, 0.004150390625, 0.02002716064453125, 0.0359039306640625, 0.05178070068359375, 0.067657470703125, 0.08353424072265625, 0.0994110107421875, 0.11528778076171875, 0.13116455078125, 0.14704132080078125, 0.1629180908203125, 0.17879486083984375, 0.194671630859375, 0.21054840087890625, 0.2264251708984375, 0.24230194091796875, 0.2581787109375, 0.27405548095703125, 0.2899322509765625, 0.30580902099609375, 0.321685791015625, 0.33756256103515625, 0.3534393310546875, 0.36931610107421875, 0.38519287109375, 0.40106964111328125, 0.4169464111328125, 0.43282318115234375, 0.448699951171875, 0.46457672119140625, 0.4804534912109375, 0.49633026123046875, 0.51220703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 4.0, 6.0, 8.0, 8.0, 13.0, 15.0, 26.0, 29.0, 49.0, 60.0, 68.0, 143.0, 254.0, 390.0, 712.0, 1400.0, 3386.0, 8985.0, 30838.0, 133240.0, 576979.0, 219317.0, 50567.0, 13230.0, 4678.0, 1975.0, 964.0, 473.0, 244.0, 152.0, 87.0, 73.0, 38.0, 45.0, 25.0, 16.0, 8.0, 14.0, 5.0, 8.0, 2.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5634765625, -1.5141143798828125, -1.464752197265625, -1.4153900146484375, -1.36602783203125, -1.3166656494140625, -1.267303466796875, -1.2179412841796875, -1.1685791015625, -1.1192169189453125, -1.069854736328125, -1.0204925537109375, -0.97113037109375, -0.9217681884765625, -0.872406005859375, -0.8230438232421875, -0.773681640625, -0.7243194580078125, -0.674957275390625, -0.6255950927734375, -0.57623291015625, -0.5268707275390625, -0.477508544921875, -0.4281463623046875, -0.3787841796875, -0.3294219970703125, -0.280059814453125, -0.2306976318359375, -0.18133544921875, -0.1319732666015625, -0.082611083984375, -0.0332489013671875, 0.01611328125, 0.0654754638671875, 0.114837646484375, 0.1641998291015625, 0.21356201171875, 0.2629241943359375, 0.312286376953125, 0.3616485595703125, 0.4110107421875, 0.4603729248046875, 0.509735107421875, 0.5590972900390625, 0.60845947265625, 0.6578216552734375, 0.707183837890625, 0.7565460205078125, 0.805908203125, 0.8552703857421875, 0.904632568359375, 0.9539947509765625, 1.00335693359375, 1.0527191162109375, 1.102081298828125, 1.1514434814453125, 1.2008056640625, 1.2501678466796875, 1.299530029296875, 1.3488922119140625, 1.39825439453125, 1.4476165771484375, 1.496978759765625, 1.5463409423828125, 1.595703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 8.0, 11.0, 13.0, 8.0, 24.0, 22.0, 34.0, 39.0, 36.0, 40.0, 28.0, 58.0, 56.0, 50.0, 61.0, 51.0, 53.0, 51.0, 57.0, 38.0, 47.0, 30.0, 35.0, 29.0, 22.0, 21.0, 12.0, 19.0, 10.0, 5.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.818359375, -2.7443695068359375, -2.670379638671875, -2.5963897705078125, -2.52239990234375, -2.4484100341796875, -2.374420166015625, -2.3004302978515625, -2.2264404296875, -2.1524505615234375, -2.078460693359375, -2.0044708251953125, -1.93048095703125, -1.8564910888671875, -1.782501220703125, -1.7085113525390625, -1.634521484375, -1.5605316162109375, -1.486541748046875, -1.4125518798828125, -1.33856201171875, -1.2645721435546875, -1.190582275390625, -1.1165924072265625, -1.0426025390625, -0.9686126708984375, -0.894622802734375, -0.8206329345703125, -0.74664306640625, -0.6726531982421875, -0.598663330078125, -0.5246734619140625, -0.45068359375, -0.3766937255859375, -0.302703857421875, -0.2287139892578125, -0.15472412109375, -0.0807342529296875, -0.006744384765625, 0.0672454833984375, 0.1412353515625, 0.2152252197265625, 0.289215087890625, 0.3632049560546875, 0.43719482421875, 0.5111846923828125, 0.585174560546875, 0.6591644287109375, 0.733154296875, 0.8071441650390625, 0.881134033203125, 0.9551239013671875, 1.02911376953125, 1.1031036376953125, 1.177093505859375, 1.2510833740234375, 1.3250732421875, 1.3990631103515625, 1.473052978515625, 1.5470428466796875, 1.62103271484375, 1.6950225830078125, 1.769012451171875, 1.8430023193359375, 1.9169921875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 5.0, 13.0, 12.0, 29.0, 34.0, 72.0, 105.0, 170.0, 360.0, 728.0, 1881.0, 5074.0, 16057.0, 56837.0, 214863.0, 568301.0, 132209.0, 35339.0, 10410.0, 3527.0, 1307.0, 604.0, 257.0, 127.0, 85.0, 52.0, 31.0, 28.0, 12.0, 8.0, 2.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37353515625, -0.3587799072265625, -0.344024658203125, -0.3292694091796875, -0.31451416015625, -0.2997589111328125, -0.285003662109375, -0.2702484130859375, -0.2554931640625, -0.2407379150390625, -0.225982666015625, -0.2112274169921875, -0.19647216796875, -0.1817169189453125, -0.166961669921875, -0.1522064208984375, -0.137451171875, -0.1226959228515625, -0.107940673828125, -0.0931854248046875, -0.07843017578125, -0.0636749267578125, -0.048919677734375, -0.0341644287109375, -0.0194091796875, -0.0046539306640625, 0.010101318359375, 0.0248565673828125, 0.03961181640625, 0.0543670654296875, 0.069122314453125, 0.0838775634765625, 0.0986328125, 0.1133880615234375, 0.128143310546875, 0.1428985595703125, 0.15765380859375, 0.1724090576171875, 0.187164306640625, 0.2019195556640625, 0.2166748046875, 0.2314300537109375, 0.246185302734375, 0.2609405517578125, 0.27569580078125, 0.2904510498046875, 0.305206298828125, 0.3199615478515625, 0.334716796875, 0.3494720458984375, 0.364227294921875, 0.3789825439453125, 0.39373779296875, 0.4084930419921875, 0.423248291015625, 0.4380035400390625, 0.4527587890625, 0.4675140380859375, 0.482269287109375, 0.4970245361328125, 0.51177978515625, 0.5265350341796875, 0.541290283203125, 0.5560455322265625, 0.57080078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 10.0, 9.0, 6.0, 18.0, 10.0, 28.0, 25.0, 48.0, 61.0, 67.0, 97.0, 142.0, 130.0, 90.0, 64.0, 46.0, 41.0, 32.0, 31.0, 12.0, 12.0, 11.0, 4.0, 9.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015664100646972656, -0.00015059113502502441, -0.00014454126358032227, -0.00013849139213562012, -0.00013244152069091797, -0.00012639164924621582, -0.00012034177780151367, -0.00011429190635681152, -0.00010824203491210938, -0.00010219216346740723, -9.614229202270508e-05, -9.009242057800293e-05, -8.404254913330078e-05, -7.799267768859863e-05, -7.194280624389648e-05, -6.589293479919434e-05, -5.984306335449219e-05, -5.379319190979004e-05, -4.774332046508789e-05, -4.169344902038574e-05, -3.5643577575683594e-05, -2.9593706130981445e-05, -2.3543834686279297e-05, -1.749396324157715e-05, -1.1444091796875e-05, -5.3942203521728516e-06, 6.556510925292969e-07, 6.705522537231445e-06, 1.2755393981933594e-05, 1.8805265426635742e-05, 2.485513687133789e-05, 3.090500831604004e-05, 3.695487976074219e-05, 4.3004751205444336e-05, 4.9054622650146484e-05, 5.510449409484863e-05, 6.115436553955078e-05, 6.720423698425293e-05, 7.325410842895508e-05, 7.930397987365723e-05, 8.535385131835938e-05, 9.140372276306152e-05, 9.745359420776367e-05, 0.00010350346565246582, 0.00010955333709716797, 0.00011560320854187012, 0.00012165307998657227, 0.00012770295143127441, 0.00013375282287597656, 0.0001398026943206787, 0.00014585256576538086, 0.000151902437210083, 0.00015795230865478516, 0.0001640021800994873, 0.00017005205154418945, 0.0001761019229888916, 0.00018215179443359375, 0.0001882016658782959, 0.00019425153732299805, 0.0002003014087677002, 0.00020635128021240234, 0.0002124011516571045, 0.00021845102310180664, 0.0002245008945465088, 0.00023055076599121094]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 3.0, 7.0, 27.0, 30.0, 55.0, 109.0, 217.0, 493.0, 1225.0, 3978.0, 16274.0, 89280.0, 606463.0, 270414.0, 46605.0, 9223.0, 2588.0, 853.0, 369.0, 140.0, 85.0, 40.0, 24.0, 14.0, 12.0, 2.0, 5.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.634765625, -0.6148147583007812, -0.5948638916015625, -0.5749130249023438, -0.554962158203125, -0.5350112915039062, -0.5150604248046875, -0.49510955810546875, -0.47515869140625, -0.45520782470703125, -0.4352569580078125, -0.41530609130859375, -0.395355224609375, -0.37540435791015625, -0.3554534912109375, -0.33550262451171875, -0.3155517578125, -0.29560089111328125, -0.2756500244140625, -0.25569915771484375, -0.235748291015625, -0.21579742431640625, -0.1958465576171875, -0.17589569091796875, -0.15594482421875, -0.13599395751953125, -0.1160430908203125, -0.09609222412109375, -0.076141357421875, -0.05619049072265625, -0.0362396240234375, -0.01628875732421875, 0.003662109375, 0.02361297607421875, 0.0435638427734375, 0.06351470947265625, 0.083465576171875, 0.10341644287109375, 0.1233673095703125, 0.14331817626953125, 0.16326904296875, 0.18321990966796875, 0.2031707763671875, 0.22312164306640625, 0.243072509765625, 0.26302337646484375, 0.2829742431640625, 0.30292510986328125, 0.3228759765625, 0.34282684326171875, 0.3627777099609375, 0.38272857666015625, 0.402679443359375, 0.42263031005859375, 0.4425811767578125, 0.46253204345703125, 0.48248291015625, 0.5024337768554688, 0.5223846435546875, 0.5423355102539062, 0.562286376953125, 0.5822372436523438, 0.6021881103515625, 0.6221389770507812, 0.64208984375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 0.0, 5.0, 4.0, 9.0, 5.0, 9.0, 14.0, 24.0, 25.0, 42.0, 62.0, 73.0, 92.0, 67.0, 107.0, 96.0, 81.0, 72.0, 58.0, 35.0, 42.0, 25.0, 17.0, 13.0, 11.0, 7.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59326171875, -0.572479248046875, -0.55169677734375, -0.530914306640625, -0.5101318359375, -0.489349365234375, -0.46856689453125, -0.447784423828125, -0.427001953125, -0.406219482421875, -0.38543701171875, -0.364654541015625, -0.3438720703125, -0.323089599609375, -0.30230712890625, -0.281524658203125, -0.2607421875, -0.239959716796875, -0.21917724609375, -0.198394775390625, -0.1776123046875, -0.156829833984375, -0.13604736328125, -0.115264892578125, -0.094482421875, -0.073699951171875, -0.05291748046875, -0.032135009765625, -0.0113525390625, 0.009429931640625, 0.03021240234375, 0.050994873046875, 0.07177734375, 0.092559814453125, 0.11334228515625, 0.134124755859375, 0.1549072265625, 0.175689697265625, 0.19647216796875, 0.217254638671875, 0.238037109375, 0.258819580078125, 0.27960205078125, 0.300384521484375, 0.3211669921875, 0.341949462890625, 0.36273193359375, 0.383514404296875, 0.404296875, 0.425079345703125, 0.44586181640625, 0.466644287109375, 0.4874267578125, 0.508209228515625, 0.52899169921875, 0.549774169921875, 0.570556640625, 0.591339111328125, 0.61212158203125, 0.632904052734375, 0.6536865234375, 0.674468994140625, 0.69525146484375, 0.716033935546875, 0.73681640625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 8.0, 13.0, 18.0, 50.0, 97.0, 147.0, 239.0, 165.0, 106.0, 63.0, 38.0, 20.0, 12.0, 6.0, 1.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.703070640563965, -13.25552749633789, -12.8079833984375, -12.360440254211426, -11.912897109985352, -11.465353012084961, -11.017809867858887, -10.570266723632812, -10.122723579406738, -9.675180435180664, -9.227636337280273, -8.7800931930542, -8.332550048828125, -7.885006427764893, -7.43746280670166, -6.989919662475586, -6.5423760414123535, -6.094832420349121, -5.647289276123047, -5.1997456550598145, -4.75220251083374, -4.304658889770508, -3.8571155071258545, -3.409572124481201, -2.962028741836548, -2.5144853591918945, -2.066941976547241, -1.6193984746932983, -1.171855092048645, -0.7243115901947021, -0.27676820755004883, 0.1707751750946045, 0.6183185577392578, 1.0658619403839111, 1.5134053230285645, 1.9609488248825073, 2.408492088317871, 2.8560357093811035, 3.303579092025757, 3.75112247467041, 4.198665618896484, 4.646209239959717, 5.093752384185791, 5.541296005249023, 5.988839149475098, 6.43638277053833, 6.8839263916015625, 7.331469535827637, 7.779013156890869, 8.226556777954102, 8.674099922180176, 9.12164306640625, 9.56918716430664, 10.016730308532715, 10.464273452758789, 10.91181755065918, 11.359360694885254, 11.806903839111328, 12.254447937011719, 12.701991081237793, 13.149534225463867, 13.597078323364258, 14.044621467590332, 14.492164611816406, 14.93970775604248]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 4.0, 3.0, 2.0, 5.0, 5.0, 9.0, 8.0, 7.0, 14.0, 13.0, 14.0, 13.0, 19.0, 24.0, 26.0, 36.0, 32.0, 31.0, 55.0, 72.0, 78.0, 78.0, 82.0, 50.0, 48.0, 33.0, 44.0, 21.0, 24.0, 30.0, 20.0, 19.0, 13.0, 10.0, 19.0, 10.0, 11.0, 6.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.953629493713379, -8.69128704071045, -8.428945541381836, -8.166603088378906, -7.904261112213135, -7.641919136047363, -7.379577159881592, -7.11723518371582, -6.854892730712891, -6.592550754547119, -6.330208778381348, -6.067866325378418, -5.8055243492126465, -5.543182373046875, -5.2808403968811035, -5.018498420715332, -4.7561564445495605, -4.493814468383789, -4.231472492218018, -3.969130277633667, -3.7067880630493164, -3.444446086883545, -3.1821041107177734, -2.919762134552002, -2.6574199199676514, -2.39507794380188, -2.1327357292175293, -1.8703937530517578, -1.6080516576766968, -1.3457095623016357, -1.0833675861358643, -0.8210254907608032, -0.5586833953857422, -0.29634132981300354, -0.03399926424026489, 0.22834277153015137, 0.4906848669052124, 0.7530269622802734, 1.015368938446045, 1.277711033821106, 1.540053129196167, 1.802395224571228, 2.064737319946289, 2.3270792961120605, 2.589421272277832, 2.8517634868621826, 3.114105463027954, 3.3764476776123047, 3.638789653778076, 3.9011316299438477, 4.163473606109619, 4.425815582275391, 4.68815803527832, 4.950500011444092, 5.212841987609863, 5.475183963775635, 5.737525939941406, 5.999867916107178, 6.262209892272949, 6.524552345275879, 6.78689432144165, 7.049236297607422, 7.311578273773193, 7.573920249938965, 7.8362627029418945]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 16.0, 14.0, 35.0, 57.0, 86.0, 181.0, 370.0, 720.0, 1741.0, 4141.0, 13256.0, 59743.0, 595464.0, 2961386.0, 485799.0, 52620.0, 11966.0, 3843.0, 1536.0, 659.0, 298.0, 151.0, 81.0, 52.0, 35.0, 12.0, 7.0, 6.0, 4.0, 1.0, 1.0], "bins": [-1.546875, -1.513580322265625, -1.48028564453125, -1.446990966796875, -1.4136962890625, -1.380401611328125, -1.34710693359375, -1.313812255859375, -1.280517578125, -1.247222900390625, -1.21392822265625, -1.180633544921875, -1.1473388671875, -1.114044189453125, -1.08074951171875, -1.047454833984375, -1.01416015625, -0.980865478515625, -0.94757080078125, -0.914276123046875, -0.8809814453125, -0.847686767578125, -0.81439208984375, -0.781097412109375, -0.747802734375, -0.714508056640625, -0.68121337890625, -0.647918701171875, -0.6146240234375, -0.581329345703125, -0.54803466796875, -0.514739990234375, -0.4814453125, -0.448150634765625, -0.41485595703125, -0.381561279296875, -0.3482666015625, -0.314971923828125, -0.28167724609375, -0.248382568359375, -0.215087890625, -0.181793212890625, -0.14849853515625, -0.115203857421875, -0.0819091796875, -0.048614501953125, -0.01531982421875, 0.017974853515625, 0.05126953125, 0.084564208984375, 0.11785888671875, 0.151153564453125, 0.1844482421875, 0.217742919921875, 0.25103759765625, 0.284332275390625, 0.317626953125, 0.350921630859375, 0.38421630859375, 0.417510986328125, 0.4508056640625, 0.484100341796875, 0.51739501953125, 0.550689697265625, 0.583984375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 7.0, 4.0, 11.0, 3.0, 6.0, 13.0, 8.0, 9.0, 17.0, 20.0, 16.0, 27.0, 36.0, 35.0, 26.0, 34.0, 33.0, 41.0, 40.0, 54.0, 53.0, 54.0, 49.0, 49.0, 44.0, 50.0, 37.0, 26.0, 30.0, 22.0, 28.0, 35.0, 18.0, 14.0, 13.0, 8.0, 6.0, 8.0, 4.0, 7.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.58837890625, -0.5704193115234375, -0.552459716796875, -0.5345001220703125, -0.51654052734375, -0.4985809326171875, -0.480621337890625, -0.4626617431640625, -0.4447021484375, -0.4267425537109375, -0.408782958984375, -0.3908233642578125, -0.37286376953125, -0.3549041748046875, -0.336944580078125, -0.3189849853515625, -0.301025390625, -0.2830657958984375, -0.265106201171875, -0.2471466064453125, -0.22918701171875, -0.2112274169921875, -0.193267822265625, -0.1753082275390625, -0.1573486328125, -0.1393890380859375, -0.121429443359375, -0.1034698486328125, -0.08551025390625, -0.0675506591796875, -0.049591064453125, -0.0316314697265625, -0.013671875, 0.0042877197265625, 0.022247314453125, 0.0402069091796875, 0.05816650390625, 0.0761260986328125, 0.094085693359375, 0.1120452880859375, 0.1300048828125, 0.1479644775390625, 0.165924072265625, 0.1838836669921875, 0.20184326171875, 0.2198028564453125, 0.237762451171875, 0.2557220458984375, 0.273681640625, 0.2916412353515625, 0.309600830078125, 0.3275604248046875, 0.34552001953125, 0.3634796142578125, 0.381439208984375, 0.3993988037109375, 0.4173583984375, 0.4353179931640625, 0.453277587890625, 0.4712371826171875, 0.48919677734375, 0.5071563720703125, 0.525115966796875, 0.5430755615234375, 0.56103515625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 8.0, 6.0, 14.0, 19.0, 31.0, 77.0, 227.0, 685.0, 3127.0, 36685.0, 3689478.0, 450783.0, 10972.0, 1487.0, 408.0, 152.0, 46.0, 37.0, 15.0, 7.0, 9.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.919921875, -2.82806396484375, -2.7362060546875, -2.64434814453125, -2.552490234375, -2.46063232421875, -2.3687744140625, -2.27691650390625, -2.18505859375, -2.09320068359375, -2.0013427734375, -1.90948486328125, -1.817626953125, -1.72576904296875, -1.6339111328125, -1.54205322265625, -1.4501953125, -1.35833740234375, -1.2664794921875, -1.17462158203125, -1.082763671875, -0.99090576171875, -0.8990478515625, -0.80718994140625, -0.71533203125, -0.62347412109375, -0.5316162109375, -0.43975830078125, -0.347900390625, -0.25604248046875, -0.1641845703125, -0.07232666015625, 0.01953125, 0.11138916015625, 0.2032470703125, 0.29510498046875, 0.386962890625, 0.47882080078125, 0.5706787109375, 0.66253662109375, 0.75439453125, 0.84625244140625, 0.9381103515625, 1.02996826171875, 1.121826171875, 1.21368408203125, 1.3055419921875, 1.39739990234375, 1.4892578125, 1.58111572265625, 1.6729736328125, 1.76483154296875, 1.856689453125, 1.94854736328125, 2.0404052734375, 2.13226318359375, 2.22412109375, 2.31597900390625, 2.4078369140625, 2.49969482421875, 2.591552734375, 2.68341064453125, 2.7752685546875, 2.86712646484375, 2.958984375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 9.0, 3.0, 15.0, 15.0, 18.0, 27.0, 63.0, 112.0, 174.0, 316.0, 677.0, 1021.0, 759.0, 386.0, 202.0, 117.0, 59.0, 37.0, 20.0, 13.0, 9.0, 7.0, 5.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7509765625, -1.695556640625, -1.64013671875, -1.584716796875, -1.529296875, -1.473876953125, -1.41845703125, -1.363037109375, -1.3076171875, -1.252197265625, -1.19677734375, -1.141357421875, -1.0859375, -1.030517578125, -0.97509765625, -0.919677734375, -0.8642578125, -0.808837890625, -0.75341796875, -0.697998046875, -0.642578125, -0.587158203125, -0.53173828125, -0.476318359375, -0.4208984375, -0.365478515625, -0.31005859375, -0.254638671875, -0.19921875, -0.143798828125, -0.08837890625, -0.032958984375, 0.0224609375, 0.077880859375, 0.13330078125, 0.188720703125, 0.244140625, 0.299560546875, 0.35498046875, 0.410400390625, 0.4658203125, 0.521240234375, 0.57666015625, 0.632080078125, 0.6875, 0.742919921875, 0.79833984375, 0.853759765625, 0.9091796875, 0.964599609375, 1.02001953125, 1.075439453125, 1.130859375, 1.186279296875, 1.24169921875, 1.297119140625, 1.3525390625, 1.407958984375, 1.46337890625, 1.518798828125, 1.57421875, 1.629638671875, 1.68505859375, 1.740478515625, 1.7958984375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 9.0, 18.0, 52.0, 98.0, 219.0, 271.0, 184.0, 82.0, 40.0, 10.0, 9.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.194992065429688, -19.655071258544922, -19.115150451660156, -18.575227737426758, -18.035306930541992, -17.495386123657227, -16.955463409423828, -16.415542602539062, -15.875621795654297, -15.335700988769531, -14.79577922821045, -14.255857467651367, -13.715936660766602, -13.176015853881836, -12.636094093322754, -12.096172332763672, -11.556251525878906, -11.01633071899414, -10.476408958435059, -9.936487197875977, -9.396566390991211, -8.856645584106445, -8.316723823547363, -7.7768025398254395, -7.236881256103516, -6.696959972381592, -6.157038688659668, -5.617117404937744, -5.07719612121582, -4.5372748374938965, -3.9973535537719727, -3.457432270050049, -2.917510986328125, -2.377589702606201, -1.8376684188842773, -1.2977471351623535, -0.7578258514404297, -0.21790456771850586, 0.32201671600341797, 0.8619379997253418, 1.4018592834472656, 1.9417805671691895, 2.4817018508911133, 3.021623134613037, 3.561544418334961, 4.101465702056885, 4.641386985778809, 5.181308269500732, 5.721229553222656, 6.26115083694458, 6.801072120666504, 7.340993404388428, 7.880914688110352, 8.420835494995117, 8.9607572555542, 9.500679016113281, 10.040599822998047, 10.580520629882812, 11.120442390441895, 11.660364151000977, 12.200284957885742, 12.740205764770508, 13.28012752532959, 13.820049285888672, 14.359970092773438]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 9.0, 7.0, 9.0, 12.0, 18.0, 18.0, 9.0, 19.0, 24.0, 25.0, 26.0, 37.0, 34.0, 39.0, 37.0, 48.0, 49.0, 48.0, 54.0, 57.0, 59.0, 39.0, 40.0, 35.0, 28.0, 44.0, 23.0, 25.0, 22.0, 18.0, 16.0, 14.0, 17.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.991859436035156, -5.827316761016846, -5.662774085998535, -5.498231887817383, -5.333689212799072, -5.169146537780762, -5.004603862762451, -4.840061187744141, -4.675518989562988, -4.510976314544678, -4.346433639526367, -4.181891441345215, -4.017348766326904, -3.8528060913085938, -3.688263416290283, -3.5237207412719727, -3.359178066253662, -3.1946353912353516, -3.03009295463562, -2.8655502796173096, -2.701007843017578, -2.5364651679992676, -2.371922492980957, -2.2073798179626465, -2.042837381362915, -1.878294825553894, -1.713752269744873, -1.5492095947265625, -1.3846670389175415, -1.2201244831085205, -1.05558180809021, -0.891039252281189, -0.7264962196350098, -0.5619536638259888, -0.397411048412323, -0.23286846280097961, -0.06832587718963623, 0.09621667861938477, 0.26075929403305054, 0.4253019094467163, 0.5898444652557373, 0.7543870210647583, 0.9189296364784241, 1.0834722518920898, 1.2480148077011108, 1.4125573635101318, 1.5771000385284424, 1.7416425943374634, 1.9061851501464844, 2.070727825164795, 2.2352702617645264, 2.399812936782837, 2.5643553733825684, 2.728898048400879, 2.8934407234191895, 3.0579833984375, 3.2225258350372314, 3.387068510055542, 3.5516109466552734, 3.716153621673584, 3.8806962966918945, 4.045238494873047, 4.209781169891357, 4.374323844909668, 4.5388665199279785]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 11.0, 7.0, 21.0, 28.0, 22.0, 44.0, 63.0, 104.0, 145.0, 228.0, 396.0, 653.0, 1017.0, 1898.0, 3415.0, 6542.0, 13640.0, 29302.0, 63128.0, 141338.0, 269096.0, 263878.0, 136480.0, 61584.0, 28057.0, 13164.0, 6389.0, 3436.0, 1805.0, 1008.0, 630.0, 352.0, 243.0, 141.0, 91.0, 74.0, 48.0, 29.0, 13.0, 6.0, 11.0, 6.0, 8.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.86767578125, -0.8435592651367188, -0.8194427490234375, -0.7953262329101562, -0.771209716796875, -0.7470932006835938, -0.7229766845703125, -0.6988601684570312, -0.67474365234375, -0.6506271362304688, -0.6265106201171875, -0.6023941040039062, -0.578277587890625, -0.5541610717773438, -0.5300445556640625, -0.5059280395507812, -0.4818115234375, -0.45769500732421875, -0.4335784912109375, -0.40946197509765625, -0.385345458984375, -0.36122894287109375, -0.3371124267578125, -0.31299591064453125, -0.28887939453125, -0.26476287841796875, -0.2406463623046875, -0.21652984619140625, -0.192413330078125, -0.16829681396484375, -0.1441802978515625, -0.12006378173828125, -0.095947265625, -0.07183074951171875, -0.0477142333984375, -0.02359771728515625, 0.000518798828125, 0.02463531494140625, 0.0487518310546875, 0.07286834716796875, 0.09698486328125, 0.12110137939453125, 0.1452178955078125, 0.16933441162109375, 0.193450927734375, 0.21756744384765625, 0.2416839599609375, 0.26580047607421875, 0.2899169921875, 0.31403350830078125, 0.3381500244140625, 0.36226654052734375, 0.386383056640625, 0.41049957275390625, 0.4346160888671875, 0.45873260498046875, 0.48284912109375, 0.5069656372070312, 0.5310821533203125, 0.5551986694335938, 0.579315185546875, 0.6034317016601562, 0.6275482177734375, 0.6516647338867188, 0.67578125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 5.0, 7.0, 9.0, 6.0, 8.0, 13.0, 13.0, 21.0, 20.0, 20.0, 26.0, 33.0, 34.0, 25.0, 32.0, 31.0, 36.0, 35.0, 38.0, 33.0, 44.0, 54.0, 46.0, 48.0, 34.0, 35.0, 29.0, 38.0, 33.0, 31.0, 20.0, 28.0, 17.0, 14.0, 11.0, 15.0, 11.0, 7.0, 5.0, 9.0, 6.0, 7.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.5849609375, -0.5680007934570312, -0.5510406494140625, -0.5340805053710938, -0.517120361328125, -0.5001602172851562, -0.4832000732421875, -0.46623992919921875, -0.44927978515625, -0.43231964111328125, -0.4153594970703125, -0.39839935302734375, -0.381439208984375, -0.36447906494140625, -0.3475189208984375, -0.33055877685546875, -0.3135986328125, -0.29663848876953125, -0.2796783447265625, -0.26271820068359375, -0.245758056640625, -0.22879791259765625, -0.2118377685546875, -0.19487762451171875, -0.17791748046875, -0.16095733642578125, -0.1439971923828125, -0.12703704833984375, -0.110076904296875, -0.09311676025390625, -0.0761566162109375, -0.05919647216796875, -0.042236328125, -0.02527618408203125, -0.0083160400390625, 0.00864410400390625, 0.025604248046875, 0.04256439208984375, 0.0595245361328125, 0.07648468017578125, 0.09344482421875, 0.11040496826171875, 0.1273651123046875, 0.14432525634765625, 0.161285400390625, 0.17824554443359375, 0.1952056884765625, 0.21216583251953125, 0.2291259765625, 0.24608612060546875, 0.2630462646484375, 0.28000640869140625, 0.296966552734375, 0.31392669677734375, 0.3308868408203125, 0.34784698486328125, 0.36480712890625, 0.38176727294921875, 0.3987274169921875, 0.41568756103515625, 0.432647705078125, 0.44960784912109375, 0.4665679931640625, 0.48352813720703125, 0.50048828125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 5.0, 10.0, 9.0, 8.0, 12.0, 26.0, 34.0, 44.0, 65.0, 83.0, 133.0, 180.0, 302.0, 498.0, 985.0, 2467.0, 7771.0, 35268.0, 207488.0, 664104.0, 101764.0, 18863.0, 4787.0, 1703.0, 742.0, 383.0, 257.0, 183.0, 93.0, 104.0, 45.0, 42.0, 17.0, 22.0, 18.0, 8.0, 10.0, 11.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4775390625, -1.4253387451171875, -1.373138427734375, -1.3209381103515625, -1.26873779296875, -1.2165374755859375, -1.164337158203125, -1.1121368408203125, -1.0599365234375, -1.0077362060546875, -0.955535888671875, -0.9033355712890625, -0.85113525390625, -0.7989349365234375, -0.746734619140625, -0.6945343017578125, -0.642333984375, -0.5901336669921875, -0.537933349609375, -0.4857330322265625, -0.43353271484375, -0.3813323974609375, -0.329132080078125, -0.2769317626953125, -0.2247314453125, -0.1725311279296875, -0.120330810546875, -0.0681304931640625, -0.01593017578125, 0.0362701416015625, 0.088470458984375, 0.1406707763671875, 0.19287109375, 0.2450714111328125, 0.297271728515625, 0.3494720458984375, 0.40167236328125, 0.4538726806640625, 0.506072998046875, 0.5582733154296875, 0.6104736328125, 0.6626739501953125, 0.714874267578125, 0.7670745849609375, 0.81927490234375, 0.8714752197265625, 0.923675537109375, 0.9758758544921875, 1.028076171875, 1.0802764892578125, 1.132476806640625, 1.1846771240234375, 1.23687744140625, 1.2890777587890625, 1.341278076171875, 1.3934783935546875, 1.4456787109375, 1.4978790283203125, 1.550079345703125, 1.6022796630859375, 1.65447998046875, 1.7066802978515625, 1.758880615234375, 1.8110809326171875, 1.86328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 8.0, 9.0, 11.0, 13.0, 19.0, 23.0, 25.0, 34.0, 42.0, 44.0, 39.0, 38.0, 52.0, 42.0, 51.0, 70.0, 63.0, 59.0, 45.0, 45.0, 42.0, 40.0, 30.0, 21.0, 19.0, 14.0, 13.0, 21.0, 12.0, 7.0, 6.0, 10.0, 7.0, 3.0, 6.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.630859375, -2.5587310791015625, -2.486602783203125, -2.4144744873046875, -2.34234619140625, -2.2702178955078125, -2.198089599609375, -2.1259613037109375, -2.0538330078125, -1.9817047119140625, -1.909576416015625, -1.8374481201171875, -1.76531982421875, -1.6931915283203125, -1.621063232421875, -1.5489349365234375, -1.476806640625, -1.4046783447265625, -1.332550048828125, -1.2604217529296875, -1.18829345703125, -1.1161651611328125, -1.044036865234375, -0.9719085693359375, -0.8997802734375, -0.8276519775390625, -0.755523681640625, -0.6833953857421875, -0.61126708984375, -0.5391387939453125, -0.467010498046875, -0.3948822021484375, -0.32275390625, -0.2506256103515625, -0.178497314453125, -0.1063690185546875, -0.03424072265625, 0.0378875732421875, 0.110015869140625, 0.1821441650390625, 0.2542724609375, 0.3264007568359375, 0.398529052734375, 0.4706573486328125, 0.54278564453125, 0.6149139404296875, 0.687042236328125, 0.7591705322265625, 0.831298828125, 0.9034271240234375, 0.975555419921875, 1.0476837158203125, 1.11981201171875, 1.1919403076171875, 1.264068603515625, 1.3361968994140625, 1.4083251953125, 1.4804534912109375, 1.552581787109375, 1.6247100830078125, 1.69683837890625, 1.7689666748046875, 1.841094970703125, 1.9132232666015625, 1.9853515625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 8.0, 6.0, 9.0, 9.0, 14.0, 13.0, 35.0, 42.0, 68.0, 80.0, 149.0, 241.0, 430.0, 875.0, 1965.0, 5243.0, 16186.0, 57625.0, 307185.0, 563682.0, 66498.0, 18060.0, 5878.0, 2128.0, 954.0, 481.0, 265.0, 153.0, 90.0, 53.0, 43.0, 30.0, 13.0, 15.0, 8.0, 7.0, 4.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472412109375, -0.457672119140625, -0.44293212890625, -0.428192138671875, -0.4134521484375, -0.398712158203125, -0.38397216796875, -0.369232177734375, -0.3544921875, -0.339752197265625, -0.32501220703125, -0.310272216796875, -0.2955322265625, -0.280792236328125, -0.26605224609375, -0.251312255859375, -0.236572265625, -0.221832275390625, -0.20709228515625, -0.192352294921875, -0.1776123046875, -0.162872314453125, -0.14813232421875, -0.133392333984375, -0.11865234375, -0.103912353515625, -0.08917236328125, -0.074432373046875, -0.0596923828125, -0.044952392578125, -0.03021240234375, -0.015472412109375, -0.000732421875, 0.014007568359375, 0.02874755859375, 0.043487548828125, 0.0582275390625, 0.072967529296875, 0.08770751953125, 0.102447509765625, 0.1171875, 0.131927490234375, 0.14666748046875, 0.161407470703125, 0.1761474609375, 0.190887451171875, 0.20562744140625, 0.220367431640625, 0.235107421875, 0.249847412109375, 0.26458740234375, 0.279327392578125, 0.2940673828125, 0.308807373046875, 0.32354736328125, 0.338287353515625, 0.35302734375, 0.367767333984375, 0.38250732421875, 0.397247314453125, 0.4119873046875, 0.426727294921875, 0.44146728515625, 0.456207275390625, 0.470947265625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 1.0, 5.0, 9.0, 7.0, 10.0, 8.0, 20.0, 22.0, 29.0, 25.0, 33.0, 47.0, 67.0, 69.0, 107.0, 107.0, 112.0, 81.0, 57.0, 37.0, 37.0, 21.0, 20.0, 16.0, 7.0, 11.0, 3.0, 4.0, 6.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00013256072998046875, -0.00012819841504096985, -0.00012383610010147095, -0.00011947378516197205, -0.00011511147022247314, -0.00011074915528297424, -0.00010638684034347534, -0.00010202452540397644, -9.766221046447754e-05, -9.329989552497864e-05, -8.893758058547974e-05, -8.457526564598083e-05, -8.021295070648193e-05, -7.585063576698303e-05, -7.148832082748413e-05, -6.712600588798523e-05, -6.276369094848633e-05, -5.840137600898743e-05, -5.4039061069488525e-05, -4.9676746129989624e-05, -4.531443119049072e-05, -4.095211625099182e-05, -3.658980131149292e-05, -3.222748637199402e-05, -2.7865171432495117e-05, -2.3502856492996216e-05, -1.9140541553497314e-05, -1.4778226613998413e-05, -1.0415911674499512e-05, -6.05359673500061e-06, -1.691281795501709e-06, 2.6710331439971924e-06, 7.033348083496094e-06, 1.1395663022994995e-05, 1.5757977962493896e-05, 2.0120292901992798e-05, 2.44826078414917e-05, 2.88449227809906e-05, 3.32072377204895e-05, 3.75695526599884e-05, 4.1931867599487305e-05, 4.6294182538986206e-05, 5.065649747848511e-05, 5.501881241798401e-05, 5.938112735748291e-05, 6.374344229698181e-05, 6.810575723648071e-05, 7.246807217597961e-05, 7.683038711547852e-05, 8.119270205497742e-05, 8.555501699447632e-05, 8.991733193397522e-05, 9.427964687347412e-05, 9.864196181297302e-05, 0.00010300427675247192, 0.00010736659169197083, 0.00011172890663146973, 0.00011609122157096863, 0.00012045353651046753, 0.00012481585144996643, 0.00012917816638946533, 0.00013354048132896423, 0.00013790279626846313, 0.00014226511120796204, 0.00014662742614746094]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 14.0, 8.0, 21.0, 25.0, 38.0, 72.0, 142.0, 310.0, 601.0, 1451.0, 3829.0, 13245.0, 61697.0, 647738.0, 265193.0, 40036.0, 9191.0, 2835.0, 1073.0, 529.0, 239.0, 116.0, 47.0, 37.0, 24.0, 13.0, 17.0, 7.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.63720703125, -0.6183929443359375, -0.599578857421875, -0.5807647705078125, -0.56195068359375, -0.5431365966796875, -0.524322509765625, -0.5055084228515625, -0.4866943359375, -0.4678802490234375, -0.449066162109375, -0.4302520751953125, -0.41143798828125, -0.3926239013671875, -0.373809814453125, -0.3549957275390625, -0.336181640625, -0.3173675537109375, -0.298553466796875, -0.2797393798828125, -0.26092529296875, -0.2421112060546875, -0.223297119140625, -0.2044830322265625, -0.1856689453125, -0.1668548583984375, -0.148040771484375, -0.1292266845703125, -0.11041259765625, -0.0915985107421875, -0.072784423828125, -0.0539703369140625, -0.03515625, -0.0163421630859375, 0.002471923828125, 0.0212860107421875, 0.04010009765625, 0.0589141845703125, 0.077728271484375, 0.0965423583984375, 0.1153564453125, 0.1341705322265625, 0.152984619140625, 0.1717987060546875, 0.19061279296875, 0.2094268798828125, 0.228240966796875, 0.2470550537109375, 0.265869140625, 0.2846832275390625, 0.303497314453125, 0.3223114013671875, 0.34112548828125, 0.3599395751953125, 0.378753662109375, 0.3975677490234375, 0.4163818359375, 0.4351959228515625, 0.454010009765625, 0.4728240966796875, 0.49163818359375, 0.5104522705078125, 0.529266357421875, 0.5480804443359375, 0.56689453125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 6.0, 0.0, 3.0, 9.0, 19.0, 23.0, 21.0, 39.0, 69.0, 68.0, 80.0, 120.0, 103.0, 82.0, 91.0, 57.0, 54.0, 46.0, 27.0, 26.0, 12.0, 10.0, 7.0, 8.0, 2.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56494140625, -0.5475692749023438, -0.5301971435546875, -0.5128250122070312, -0.495452880859375, -0.47808074951171875, -0.4607086181640625, -0.44333648681640625, -0.42596435546875, -0.40859222412109375, -0.3912200927734375, -0.37384796142578125, -0.356475830078125, -0.33910369873046875, -0.3217315673828125, -0.30435943603515625, -0.2869873046875, -0.26961517333984375, -0.2522430419921875, -0.23487091064453125, -0.217498779296875, -0.20012664794921875, -0.1827545166015625, -0.16538238525390625, -0.14801025390625, -0.13063812255859375, -0.1132659912109375, -0.09589385986328125, -0.078521728515625, -0.06114959716796875, -0.0437774658203125, -0.02640533447265625, -0.009033203125, 0.00833892822265625, 0.0257110595703125, 0.04308319091796875, 0.060455322265625, 0.07782745361328125, 0.0951995849609375, 0.11257171630859375, 0.12994384765625, 0.14731597900390625, 0.1646881103515625, 0.18206024169921875, 0.199432373046875, 0.21680450439453125, 0.2341766357421875, 0.25154876708984375, 0.2689208984375, 0.28629302978515625, 0.3036651611328125, 0.32103729248046875, 0.338409423828125, 0.35578155517578125, 0.3731536865234375, 0.39052581787109375, 0.40789794921875, 0.42527008056640625, 0.4426422119140625, 0.46001434326171875, 0.477386474609375, 0.49475860595703125, 0.5121307373046875, 0.5295028686523438, 0.546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 20.0, 36.0, 60.0, 84.0, 244.0, 245.0, 129.0, 73.0, 40.0, 20.0, 19.0, 9.0, 12.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.146360397338867, -7.738837718963623, -7.331315040588379, -6.923792362213135, -6.516269683837891, -6.108746528625488, -5.701224327087402, -5.293701171875, -4.886178970336914, -4.47865629196167, -4.071133613586426, -3.6636109352111816, -3.2560882568359375, -2.8485653400421143, -2.44104266166687, -2.033519983291626, -1.6259970664978027, -1.2184743881225586, -0.8109516501426697, -0.40342891216278076, 0.004093766212463379, 0.41161656379699707, 0.8191392421722412, 1.2266619205474854, 1.6341845989227295, 2.0417072772979736, 2.4492299556732178, 2.856752872467041, 3.264275550842285, 3.6717982292175293, 4.079320907592773, 4.486843585968018, 4.894366264343262, 5.301888942718506, 5.70941162109375, 6.116934299468994, 6.524456977844238, 6.931980133056641, 7.339502334594727, 7.747025489807129, 8.154547691345215, 8.562070846557617, 8.969593048095703, 9.377116203308105, 9.784638404846191, 10.192161560058594, 10.59968376159668, 11.007206916809082, 11.414730072021484, 11.822253227233887, 12.229775428771973, 12.637298583984375, 13.044820785522461, 13.452343940734863, 13.85986614227295, 14.267389297485352, 14.674911499023438, 15.08243465423584, 15.489956855773926, 15.897480010986328, 16.305002212524414, 16.7125244140625, 17.12004852294922, 17.527570724487305, 17.93509292602539]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 1.0, 7.0, 8.0, 9.0, 17.0, 12.0, 13.0, 9.0, 24.0, 17.0, 27.0, 26.0, 20.0, 32.0, 33.0, 39.0, 56.0, 112.0, 102.0, 75.0, 51.0, 36.0, 38.0, 38.0, 31.0, 24.0, 29.0, 18.0, 19.0, 11.0, 16.0, 12.0, 15.0, 11.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.032028198242188, -8.775113105773926, -8.518198013305664, -8.261282920837402, -8.00436782836914, -7.747452735900879, -7.490537643432617, -7.2336225509643555, -6.976707458496094, -6.719792366027832, -6.46287727355957, -6.205962181091309, -5.949047088623047, -5.692131996154785, -5.435216903686523, -5.178301811218262, -4.921386241912842, -4.66447114944458, -4.407556056976318, -4.150640964508057, -3.893725872039795, -3.636810779571533, -3.3798954486846924, -3.1229803562164307, -2.866065263748169, -2.6091501712799072, -2.3522350788116455, -2.0953197479248047, -1.8384047746658325, -1.5814896821975708, -1.3245744705200195, -1.0676593780517578, -0.8107442855834961, -0.5538291931152344, -0.2969140410423279, -0.03999888896942139, 0.21691620349884033, 0.47383129596710205, 0.7307465076446533, 0.987661600112915, 1.2445766925811768, 1.5014917850494385, 1.7584068775177002, 2.015322208404541, 2.2722373008728027, 2.5291523933410645, 2.786067485809326, 3.042982578277588, 3.2998976707458496, 3.5568127632141113, 3.813727855682373, 4.070642948150635, 4.3275580406188965, 4.584473133087158, 4.841388702392578, 5.09830379486084, 5.355218887329102, 5.612133979797363, 5.869049072265625, 6.125964164733887, 6.382879257202148, 6.63979434967041, 6.896709442138672, 7.153624534606934, 7.410539627075195]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 10.0, 8.0, 29.0, 43.0, 69.0, 112.0, 196.0, 412.0, 765.0, 1795.0, 4235.0, 11848.0, 42340.0, 220783.0, 1457748.0, 2023795.0, 345597.0, 59522.0, 15405.0, 5392.0, 2144.0, 965.0, 484.0, 256.0, 127.0, 86.0, 54.0, 29.0, 12.0, 9.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0], "bins": [-1.1240234375, -1.0979537963867188, -1.0718841552734375, -1.0458145141601562, -1.019744873046875, -0.9936752319335938, -0.9676055908203125, -0.9415359497070312, -0.91546630859375, -0.8893966674804688, -0.8633270263671875, -0.8372573852539062, -0.811187744140625, -0.7851181030273438, -0.7590484619140625, -0.7329788208007812, -0.7069091796875, -0.6808395385742188, -0.6547698974609375, -0.6287002563476562, -0.602630615234375, -0.5765609741210938, -0.5504913330078125, -0.5244216918945312, -0.49835205078125, -0.47228240966796875, -0.4462127685546875, -0.42014312744140625, -0.394073486328125, -0.36800384521484375, -0.3419342041015625, -0.31586456298828125, -0.289794921875, -0.26372528076171875, -0.2376556396484375, -0.21158599853515625, -0.185516357421875, -0.15944671630859375, -0.1333770751953125, -0.10730743408203125, -0.08123779296875, -0.05516815185546875, -0.0290985107421875, -0.00302886962890625, 0.023040771484375, 0.04911041259765625, 0.0751800537109375, 0.10124969482421875, 0.1273193359375, 0.15338897705078125, 0.1794586181640625, 0.20552825927734375, 0.231597900390625, 0.25766754150390625, 0.2837371826171875, 0.30980682373046875, 0.33587646484375, 0.36194610595703125, 0.3880157470703125, 0.41408538818359375, 0.440155029296875, 0.46622467041015625, 0.4922943115234375, 0.5183639526367188, 0.54443359375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 4.0, 2.0, 5.0, 5.0, 7.0, 16.0, 12.0, 16.0, 23.0, 25.0, 27.0, 20.0, 38.0, 30.0, 30.0, 40.0, 35.0, 35.0, 45.0, 35.0, 44.0, 46.0, 45.0, 48.0, 50.0, 43.0, 32.0, 34.0, 36.0, 29.0, 24.0, 19.0, 20.0, 18.0, 10.0, 10.0, 11.0, 6.0, 8.0, 6.0, 6.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.57373046875, -0.5561599731445312, -0.5385894775390625, -0.5210189819335938, -0.503448486328125, -0.48587799072265625, -0.4683074951171875, -0.45073699951171875, -0.43316650390625, -0.41559600830078125, -0.3980255126953125, -0.38045501708984375, -0.362884521484375, -0.34531402587890625, -0.3277435302734375, -0.31017303466796875, -0.2926025390625, -0.27503204345703125, -0.2574615478515625, -0.23989105224609375, -0.222320556640625, -0.20475006103515625, -0.1871795654296875, -0.16960906982421875, -0.15203857421875, -0.13446807861328125, -0.1168975830078125, -0.09932708740234375, -0.081756591796875, -0.06418609619140625, -0.0466156005859375, -0.02904510498046875, -0.011474609375, 0.00609588623046875, 0.0236663818359375, 0.04123687744140625, 0.058807373046875, 0.07637786865234375, 0.0939483642578125, 0.11151885986328125, 0.12908935546875, 0.14665985107421875, 0.1642303466796875, 0.18180084228515625, 0.199371337890625, 0.21694183349609375, 0.2345123291015625, 0.25208282470703125, 0.2696533203125, 0.28722381591796875, 0.3047943115234375, 0.32236480712890625, 0.339935302734375, 0.35750579833984375, 0.3750762939453125, 0.39264678955078125, 0.41021728515625, 0.42778778076171875, 0.4453582763671875, 0.46292877197265625, 0.480499267578125, 0.49806976318359375, 0.5156402587890625, 0.5332107543945312, 0.55078125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 8.0, 4.0, 10.0, 8.0, 19.0, 27.0, 31.0, 38.0, 75.0, 101.0, 185.0, 358.0, 737.0, 1818.0, 6261.0, 31972.0, 340834.0, 3442645.0, 329319.0, 30881.0, 5870.0, 1645.0, 664.0, 293.0, 161.0, 90.0, 67.0, 47.0, 25.0, 23.0, 19.0, 9.0, 11.0, 9.0, 6.0, 2.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.580078125, -1.534271240234375, -1.48846435546875, -1.442657470703125, -1.3968505859375, -1.351043701171875, -1.30523681640625, -1.259429931640625, -1.213623046875, -1.167816162109375, -1.12200927734375, -1.076202392578125, -1.0303955078125, -0.984588623046875, -0.93878173828125, -0.892974853515625, -0.84716796875, -0.801361083984375, -0.75555419921875, -0.709747314453125, -0.6639404296875, -0.618133544921875, -0.57232666015625, -0.526519775390625, -0.480712890625, -0.434906005859375, -0.38909912109375, -0.343292236328125, -0.2974853515625, -0.251678466796875, -0.20587158203125, -0.160064697265625, -0.1142578125, -0.068450927734375, -0.02264404296875, 0.023162841796875, 0.0689697265625, 0.114776611328125, 0.16058349609375, 0.206390380859375, 0.252197265625, 0.298004150390625, 0.34381103515625, 0.389617919921875, 0.4354248046875, 0.481231689453125, 0.52703857421875, 0.572845458984375, 0.61865234375, 0.664459228515625, 0.71026611328125, 0.756072998046875, 0.8018798828125, 0.847686767578125, 0.89349365234375, 0.939300537109375, 0.985107421875, 1.030914306640625, 1.07672119140625, 1.122528076171875, 1.1683349609375, 1.214141845703125, 1.25994873046875, 1.305755615234375, 1.3515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 3.0, 6.0, 10.0, 14.0, 14.0, 18.0, 32.0, 41.0, 45.0, 91.0, 166.0, 242.0, 395.0, 596.0, 763.0, 619.0, 360.0, 248.0, 152.0, 76.0, 63.0, 37.0, 25.0, 10.0, 16.0, 13.0, 9.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.51953125, -1.47412109375, -1.4287109375, -1.38330078125, -1.337890625, -1.29248046875, -1.2470703125, -1.20166015625, -1.15625, -1.11083984375, -1.0654296875, -1.02001953125, -0.974609375, -0.92919921875, -0.8837890625, -0.83837890625, -0.79296875, -0.74755859375, -0.7021484375, -0.65673828125, -0.611328125, -0.56591796875, -0.5205078125, -0.47509765625, -0.4296875, -0.38427734375, -0.3388671875, -0.29345703125, -0.248046875, -0.20263671875, -0.1572265625, -0.11181640625, -0.06640625, -0.02099609375, 0.0244140625, 0.06982421875, 0.115234375, 0.16064453125, 0.2060546875, 0.25146484375, 0.296875, 0.34228515625, 0.3876953125, 0.43310546875, 0.478515625, 0.52392578125, 0.5693359375, 0.61474609375, 0.66015625, 0.70556640625, 0.7509765625, 0.79638671875, 0.841796875, 0.88720703125, 0.9326171875, 0.97802734375, 1.0234375, 1.06884765625, 1.1142578125, 1.15966796875, 1.205078125, 1.25048828125, 1.2958984375, 1.34130859375, 1.38671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 17.0, 29.0, 58.0, 163.0, 210.0, 218.0, 143.0, 87.0, 29.0, 14.0, 9.0, 8.0, 1.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.287250518798828, -14.811155319213867, -14.335061073303223, -13.858966827392578, -13.382871627807617, -12.906776428222656, -12.430682182312012, -11.954587936401367, -11.478492736816406, -11.002397537231445, -10.5263032913208, -10.050209045410156, -9.574113845825195, -9.098018646240234, -8.62192440032959, -8.145830154418945, -7.669734954833984, -7.193640232086182, -6.717545509338379, -6.241450786590576, -5.765356063842773, -5.289261341094971, -4.813166618347168, -4.337071895599365, -3.8609771728515625, -3.3848824501037598, -2.908787727355957, -2.4326930046081543, -1.9565982818603516, -1.4805035591125488, -1.004408836364746, -0.5283141136169434, -0.05221843719482422, 0.4238762855529785, 0.8999710083007812, 1.376065731048584, 1.8521604537963867, 2.3282551765441895, 2.804349899291992, 3.280444622039795, 3.7565393447875977, 4.2326340675354, 4.708728790283203, 5.184823513031006, 5.660918235778809, 6.137012958526611, 6.613107681274414, 7.089202404022217, 7.5652971267700195, 8.041391372680664, 8.517486572265625, 8.993581771850586, 9.46967601776123, 9.945770263671875, 10.421865463256836, 10.897960662841797, 11.374054908752441, 11.850149154663086, 12.326244354248047, 12.802339553833008, 13.278433799743652, 13.754528045654297, 14.230623245239258, 14.706718444824219, 15.182812690734863]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 5.0, 3.0, 10.0, 5.0, 9.0, 8.0, 12.0, 4.0, 12.0, 18.0, 17.0, 21.0, 14.0, 30.0, 35.0, 35.0, 38.0, 40.0, 41.0, 38.0, 32.0, 36.0, 34.0, 42.0, 43.0, 40.0, 34.0, 35.0, 36.0, 41.0, 36.0, 27.0, 26.0, 17.0, 16.0, 19.0, 13.0, 11.0, 12.0, 9.0, 10.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.812309741973877, -4.6557722091674805, -4.499234676361084, -4.342697620391846, -4.186160087585449, -4.029622554779053, -3.8730850219726562, -3.7165474891662598, -3.5600101947784424, -3.403472661972046, -3.2469353675842285, -3.090397834777832, -2.9338603019714355, -2.777323007583618, -2.6207854747772217, -2.4642481803894043, -2.307710647583008, -2.1511731147766113, -1.994635820388794, -1.8380982875823975, -1.6815608739852905, -1.5250234603881836, -1.368485927581787, -1.2119485139846802, -1.0554111003875732, -0.8988736867904663, -0.7423362135887146, -0.5857987403869629, -0.42926132678985596, -0.272723913192749, -0.11618643999099731, 0.040351033210754395, 0.19688892364501953, 0.35342636704444885, 0.5099638104438782, 0.6665012836456299, 0.8230386972427368, 0.9795761108398438, 1.1361136436462402, 1.2926510572433472, 1.449188470840454, 1.605725884437561, 1.762263298034668, 1.9188008308410645, 2.075338363647461, 2.2318756580352783, 2.388413190841675, 2.544950485229492, 2.7014880180358887, 2.858025550842285, 3.0145628452301025, 3.171100378036499, 3.3276376724243164, 3.484175205230713, 3.6407127380371094, 3.797250270843506, 3.9537875652313232, 4.110324859619141, 4.266862392425537, 4.423399925231934, 4.57993745803833, 4.736474990844727, 4.893012046813965, 5.049549579620361, 5.206087112426758]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 8.0, 6.0, 10.0, 11.0, 19.0, 22.0, 30.0, 35.0, 57.0, 79.0, 120.0, 207.0, 326.0, 525.0, 844.0, 1446.0, 2432.0, 4237.0, 7397.0, 13395.0, 25705.0, 50767.0, 106179.0, 224537.0, 289985.0, 163552.0, 76136.0, 37023.0, 19400.0, 10117.0, 5731.0, 3317.0, 1934.0, 1073.0, 659.0, 432.0, 258.0, 191.0, 108.0, 80.0, 59.0, 38.0, 25.0, 13.0, 7.0, 10.0, 8.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7568359375, -0.730072021484375, -0.70330810546875, -0.676544189453125, -0.6497802734375, -0.623016357421875, -0.59625244140625, -0.569488525390625, -0.542724609375, -0.515960693359375, -0.48919677734375, -0.462432861328125, -0.4356689453125, -0.408905029296875, -0.38214111328125, -0.355377197265625, -0.32861328125, -0.301849365234375, -0.27508544921875, -0.248321533203125, -0.2215576171875, -0.194793701171875, -0.16802978515625, -0.141265869140625, -0.114501953125, -0.087738037109375, -0.06097412109375, -0.034210205078125, -0.0074462890625, 0.019317626953125, 0.04608154296875, 0.072845458984375, 0.099609375, 0.126373291015625, 0.15313720703125, 0.179901123046875, 0.2066650390625, 0.233428955078125, 0.26019287109375, 0.286956787109375, 0.313720703125, 0.340484619140625, 0.36724853515625, 0.394012451171875, 0.4207763671875, 0.447540283203125, 0.47430419921875, 0.501068115234375, 0.52783203125, 0.554595947265625, 0.58135986328125, 0.608123779296875, 0.6348876953125, 0.661651611328125, 0.68841552734375, 0.715179443359375, 0.741943359375, 0.768707275390625, 0.79547119140625, 0.822235107421875, 0.8489990234375, 0.875762939453125, 0.90252685546875, 0.929290771484375, 0.9560546875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 4.0, 2.0, 6.0, 2.0, 7.0, 11.0, 7.0, 13.0, 15.0, 19.0, 16.0, 17.0, 23.0, 28.0, 22.0, 23.0, 36.0, 32.0, 28.0, 33.0, 42.0, 35.0, 56.0, 45.0, 45.0, 42.0, 45.0, 36.0, 38.0, 41.0, 29.0, 34.0, 19.0, 25.0, 14.0, 15.0, 13.0, 21.0, 11.0, 10.0, 6.0, 7.0, 10.0, 4.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.58837890625, -0.5712203979492188, -0.5540618896484375, -0.5369033813476562, -0.519744873046875, -0.5025863647460938, -0.4854278564453125, -0.46826934814453125, -0.45111083984375, -0.43395233154296875, -0.4167938232421875, -0.39963531494140625, -0.382476806640625, -0.36531829833984375, -0.3481597900390625, -0.33100128173828125, -0.3138427734375, -0.29668426513671875, -0.2795257568359375, -0.26236724853515625, -0.245208740234375, -0.22805023193359375, -0.2108917236328125, -0.19373321533203125, -0.17657470703125, -0.15941619873046875, -0.1422576904296875, -0.12509918212890625, -0.107940673828125, -0.09078216552734375, -0.0736236572265625, -0.05646514892578125, -0.039306640625, -0.02214813232421875, -0.0049896240234375, 0.01216888427734375, 0.029327392578125, 0.04648590087890625, 0.0636444091796875, 0.08080291748046875, 0.09796142578125, 0.11511993408203125, 0.1322784423828125, 0.14943695068359375, 0.166595458984375, 0.18375396728515625, 0.2009124755859375, 0.21807098388671875, 0.2352294921875, 0.25238800048828125, 0.2695465087890625, 0.28670501708984375, 0.303863525390625, 0.32102203369140625, 0.3381805419921875, 0.35533905029296875, 0.37249755859375, 0.38965606689453125, 0.4068145751953125, 0.42397308349609375, 0.441131591796875, 0.45829010009765625, 0.4754486083984375, 0.49260711669921875, 0.509765625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 9.0, 6.0, 5.0, 10.0, 20.0, 26.0, 22.0, 51.0, 60.0, 73.0, 116.0, 168.0, 255.0, 374.0, 543.0, 1116.0, 2200.0, 5934.0, 22111.0, 128637.0, 746062.0, 110814.0, 19456.0, 5431.0, 2113.0, 1129.0, 597.0, 398.0, 242.0, 178.0, 128.0, 78.0, 49.0, 34.0, 33.0, 29.0, 12.0, 11.0, 8.0, 5.0, 4.0, 6.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.583984375, -1.52630615234375, -1.4686279296875, -1.41094970703125, -1.353271484375, -1.29559326171875, -1.2379150390625, -1.18023681640625, -1.12255859375, -1.06488037109375, -1.0072021484375, -0.94952392578125, -0.891845703125, -0.83416748046875, -0.7764892578125, -0.71881103515625, -0.6611328125, -0.60345458984375, -0.5457763671875, -0.48809814453125, -0.430419921875, -0.37274169921875, -0.3150634765625, -0.25738525390625, -0.19970703125, -0.14202880859375, -0.0843505859375, -0.02667236328125, 0.031005859375, 0.08868408203125, 0.1463623046875, 0.20404052734375, 0.26171875, 0.31939697265625, 0.3770751953125, 0.43475341796875, 0.492431640625, 0.55010986328125, 0.6077880859375, 0.66546630859375, 0.72314453125, 0.78082275390625, 0.8385009765625, 0.89617919921875, 0.953857421875, 1.01153564453125, 1.0692138671875, 1.12689208984375, 1.1845703125, 1.24224853515625, 1.2999267578125, 1.35760498046875, 1.415283203125, 1.47296142578125, 1.5306396484375, 1.58831787109375, 1.64599609375, 1.70367431640625, 1.7613525390625, 1.81903076171875, 1.876708984375, 1.93438720703125, 1.9920654296875, 2.04974365234375, 2.107421875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 6.0, 11.0, 5.0, 5.0, 8.0, 15.0, 13.0, 12.0, 20.0, 32.0, 40.0, 27.0, 36.0, 49.0, 44.0, 56.0, 58.0, 61.0, 49.0, 42.0, 56.0, 49.0, 39.0, 41.0, 31.0, 29.0, 30.0, 18.0, 17.0, 14.0, 17.0, 7.0, 18.0, 6.0, 7.0, 8.0, 6.0, 4.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0], "bins": [-2.5859375, -2.5176544189453125, -2.449371337890625, -2.3810882568359375, -2.31280517578125, -2.2445220947265625, -2.176239013671875, -2.1079559326171875, -2.0396728515625, -1.9713897705078125, -1.903106689453125, -1.8348236083984375, -1.76654052734375, -1.6982574462890625, -1.629974365234375, -1.5616912841796875, -1.493408203125, -1.4251251220703125, -1.356842041015625, -1.2885589599609375, -1.22027587890625, -1.1519927978515625, -1.083709716796875, -1.0154266357421875, -0.9471435546875, -0.8788604736328125, -0.810577392578125, -0.7422943115234375, -0.67401123046875, -0.6057281494140625, -0.537445068359375, -0.4691619873046875, -0.40087890625, -0.3325958251953125, -0.264312744140625, -0.1960296630859375, -0.12774658203125, -0.0594635009765625, 0.008819580078125, 0.0771026611328125, 0.1453857421875, 0.2136688232421875, 0.281951904296875, 0.3502349853515625, 0.41851806640625, 0.4868011474609375, 0.555084228515625, 0.6233673095703125, 0.691650390625, 0.7599334716796875, 0.828216552734375, 0.8964996337890625, 0.96478271484375, 1.0330657958984375, 1.101348876953125, 1.1696319580078125, 1.2379150390625, 1.3061981201171875, 1.374481201171875, 1.4427642822265625, 1.51104736328125, 1.5793304443359375, 1.647613525390625, 1.7158966064453125, 1.7841796875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 11.0, 9.0, 12.0, 19.0, 26.0, 32.0, 54.0, 70.0, 128.0, 187.0, 339.0, 515.0, 1033.0, 2182.0, 5526.0, 18674.0, 91503.0, 772014.0, 121673.0, 22895.0, 6420.0, 2491.0, 1168.0, 566.0, 327.0, 219.0, 149.0, 87.0, 69.0, 39.0, 39.0, 22.0, 19.0, 10.0, 6.0, 6.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.576690673828125, -0.55718994140625, -0.537689208984375, -0.5181884765625, -0.498687744140625, -0.47918701171875, -0.459686279296875, -0.440185546875, -0.420684814453125, -0.40118408203125, -0.381683349609375, -0.3621826171875, -0.342681884765625, -0.32318115234375, -0.303680419921875, -0.2841796875, -0.264678955078125, -0.24517822265625, -0.225677490234375, -0.2061767578125, -0.186676025390625, -0.16717529296875, -0.147674560546875, -0.128173828125, -0.108673095703125, -0.08917236328125, -0.069671630859375, -0.0501708984375, -0.030670166015625, -0.01116943359375, 0.008331298828125, 0.02783203125, 0.047332763671875, 0.06683349609375, 0.086334228515625, 0.1058349609375, 0.125335693359375, 0.14483642578125, 0.164337158203125, 0.183837890625, 0.203338623046875, 0.22283935546875, 0.242340087890625, 0.2618408203125, 0.281341552734375, 0.30084228515625, 0.320343017578125, 0.33984375, 0.359344482421875, 0.37884521484375, 0.398345947265625, 0.4178466796875, 0.437347412109375, 0.45684814453125, 0.476348876953125, 0.495849609375, 0.515350341796875, 0.53485107421875, 0.554351806640625, 0.5738525390625, 0.593353271484375, 0.61285400390625, 0.632354736328125, 0.65185546875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 7.0, 4.0, 9.0, 10.0, 7.0, 11.0, 14.0, 18.0, 26.0, 30.0, 29.0, 60.0, 90.0, 109.0, 113.0, 93.0, 88.0, 77.0, 42.0, 29.0, 28.0, 20.0, 12.0, 15.0, 8.0, 12.0, 6.0, 4.0, 3.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014257431030273438, -0.00013723596930503845, -0.00013189762830734253, -0.0001265592873096466, -0.00012122094631195068, -0.00011588260531425476, -0.00011054426431655884, -0.00010520592331886292, -9.986758232116699e-05, -9.452924132347107e-05, -8.919090032577515e-05, -8.385255932807922e-05, -7.85142183303833e-05, -7.317587733268738e-05, -6.783753633499146e-05, -6.249919533729553e-05, -5.716085433959961e-05, -5.1822513341903687e-05, -4.6484172344207764e-05, -4.114583134651184e-05, -3.580749034881592e-05, -3.0469149351119995e-05, -2.5130808353424072e-05, -1.979246735572815e-05, -1.4454126358032227e-05, -9.115785360336304e-06, -3.777444362640381e-06, 1.560896635055542e-06, 6.899237632751465e-06, 1.2237578630447388e-05, 1.757591962814331e-05, 2.2914260625839233e-05, 2.8252601623535156e-05, 3.359094262123108e-05, 3.8929283618927e-05, 4.4267624616622925e-05, 4.960596561431885e-05, 5.494430661201477e-05, 6.028264760971069e-05, 6.562098860740662e-05, 7.095932960510254e-05, 7.629767060279846e-05, 8.163601160049438e-05, 8.697435259819031e-05, 9.231269359588623e-05, 9.765103459358215e-05, 0.00010298937559127808, 0.000108327716588974, 0.00011366605758666992, 0.00011900439858436584, 0.00012434273958206177, 0.0001296810805797577, 0.0001350194215774536, 0.00014035776257514954, 0.00014569610357284546, 0.00015103444457054138, 0.0001563727855682373, 0.00016171112656593323, 0.00016704946756362915, 0.00017238780856132507, 0.000177726149559021, 0.00018306449055671692, 0.00018840283155441284, 0.00019374117255210876, 0.0001990795135498047]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 10.0, 13.0, 13.0, 18.0, 12.0, 53.0, 78.0, 124.0, 250.0, 411.0, 858.0, 2253.0, 7268.0, 31518.0, 227059.0, 705129.0, 56793.0, 11078.0, 3169.0, 1217.0, 536.0, 291.0, 158.0, 89.0, 56.0, 27.0, 21.0, 19.0, 10.0, 9.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61767578125, -0.5978546142578125, -0.578033447265625, -0.5582122802734375, -0.53839111328125, -0.5185699462890625, -0.498748779296875, -0.4789276123046875, -0.4591064453125, -0.4392852783203125, -0.419464111328125, -0.3996429443359375, -0.37982177734375, -0.3600006103515625, -0.340179443359375, -0.3203582763671875, -0.300537109375, -0.2807159423828125, -0.260894775390625, -0.2410736083984375, -0.22125244140625, -0.2014312744140625, -0.181610107421875, -0.1617889404296875, -0.1419677734375, -0.1221466064453125, -0.102325439453125, -0.0825042724609375, -0.06268310546875, -0.0428619384765625, -0.023040771484375, -0.0032196044921875, 0.0166015625, 0.0364227294921875, 0.056243896484375, 0.0760650634765625, 0.09588623046875, 0.1157073974609375, 0.135528564453125, 0.1553497314453125, 0.1751708984375, 0.1949920654296875, 0.214813232421875, 0.2346343994140625, 0.25445556640625, 0.2742767333984375, 0.294097900390625, 0.3139190673828125, 0.333740234375, 0.3535614013671875, 0.373382568359375, 0.3932037353515625, 0.41302490234375, 0.4328460693359375, 0.452667236328125, 0.4724884033203125, 0.4923095703125, 0.5121307373046875, 0.531951904296875, 0.5517730712890625, 0.57159423828125, 0.5914154052734375, 0.611236572265625, 0.6310577392578125, 0.65087890625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 8.0, 1.0, 8.0, 12.0, 7.0, 10.0, 16.0, 21.0, 14.0, 17.0, 21.0, 22.0, 21.0, 35.0, 26.0, 39.0, 47.0, 72.0, 58.0, 77.0, 68.0, 58.0, 46.0, 36.0, 31.0, 29.0, 22.0, 18.0, 32.0, 18.0, 19.0, 17.0, 5.0, 10.0, 17.0, 7.0, 8.0, 6.0, 2.0, 3.0, 4.0, 1.0, 7.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26416015625, -0.2541007995605469, -0.24404144287109375, -0.23398208618164062, -0.2239227294921875, -0.21386337280273438, -0.20380401611328125, -0.19374465942382812, -0.183685302734375, -0.17362594604492188, -0.16356658935546875, -0.15350723266601562, -0.1434478759765625, -0.13338851928710938, -0.12332916259765625, -0.11326980590820312, -0.10321044921875, -0.09315109252929688, -0.08309173583984375, -0.07303237915039062, -0.0629730224609375, -0.052913665771484375, -0.04285430908203125, -0.032794952392578125, -0.022735595703125, -0.012676239013671875, -0.00261688232421875, 0.007442474365234375, 0.0175018310546875, 0.027561187744140625, 0.03762054443359375, 0.047679901123046875, 0.0577392578125, 0.06779861450195312, 0.07785797119140625, 0.08791732788085938, 0.0979766845703125, 0.10803604125976562, 0.11809539794921875, 0.12815475463867188, 0.138214111328125, 0.14827346801757812, 0.15833282470703125, 0.16839218139648438, 0.1784515380859375, 0.18851089477539062, 0.19857025146484375, 0.20862960815429688, 0.21868896484375, 0.22874832153320312, 0.23880767822265625, 0.24886703491210938, 0.2589263916015625, 0.2689857482910156, 0.27904510498046875, 0.2891044616699219, 0.299163818359375, 0.3092231750488281, 0.31928253173828125, 0.3293418884277344, 0.3394012451171875, 0.3494606018066406, 0.35951995849609375, 0.3695793151855469, 0.379638671875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 8.0, 25.0, 49.0, 167.0, 456.0, 142.0, 71.0, 39.0, 19.0, 11.0, 6.0, 7.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.847379684448242, -9.04951286315918, -8.2516450881958, -7.453778266906738, -6.655910968780518, -5.858043670654297, -5.060176849365234, -4.262309551239014, -3.464442253112793, -2.6665749549865723, -1.8687078952789307, -1.070840835571289, -0.27297353744506836, 0.5248937606811523, 1.3227605819702148, 2.1206278800964355, 2.9184951782226562, 3.716362476348877, 4.514229774475098, 5.31209659576416, 6.109963893890381, 6.907831192016602, 7.705698013305664, 8.503564834594727, 9.301432609558105, 10.099299430847168, 10.897167205810547, 11.69503402709961, 12.492900848388672, 13.29076862335205, 14.088635444641113, 14.886503219604492, 15.684368133544922, 16.482234954833984, 17.280101776123047, 18.07796859741211, 18.875837326049805, 19.673704147338867, 20.47157096862793, 21.269437789916992, 22.067306518554688, 22.86517333984375, 23.663040161132812, 24.460906982421875, 25.25877571105957, 26.056642532348633, 26.854509353637695, 27.652376174926758, 28.45024299621582, 29.248109817504883, 30.045976638793945, 30.84384536743164, 31.641712188720703, 32.439579010009766, 33.23744583129883, 34.03531265258789, 34.83317947387695, 35.631046295166016, 36.42891311645508, 37.22677993774414, 38.0246467590332, 38.82251739501953, 39.620384216308594, 40.418251037597656, 41.21611785888672]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 10.0, 4.0, 5.0, 9.0, 5.0, 11.0, 9.0, 19.0, 12.0, 15.0, 15.0, 18.0, 11.0, 23.0, 21.0, 16.0, 27.0, 27.0, 45.0, 63.0, 120.0, 132.0, 66.0, 32.0, 26.0, 39.0, 21.0, 23.0, 17.0, 30.0, 16.0, 15.0, 13.0, 12.0, 14.0, 14.0, 5.0, 7.0, 6.0, 4.0, 5.0, 3.0, 5.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.11758804321289, -7.879914283752441, -7.64224100112915, -7.404567241668701, -7.16689395904541, -6.929220199584961, -6.691546440124512, -6.453873157501221, -6.2161993980407715, -5.978525638580322, -5.740852355957031, -5.503178596496582, -5.265505313873291, -5.027831554412842, -4.790158271789551, -4.552484512329102, -4.314810752868652, -4.077136993408203, -3.839463710784912, -3.601789951324463, -3.3641164302825928, -3.1264429092407227, -2.8887693881988525, -2.6510958671569824, -2.4134225845336914, -2.1757490634918213, -1.9380754232406616, -1.7004019021987915, -1.4627282619476318, -1.2250547409057617, -0.9873812198638916, -0.7497075796127319, -0.5120339393615723, -0.2743603587150574, -0.03668680787086487, 0.20098674297332764, 0.43866032361984253, 0.6763339042663574, 0.9140074253082275, 1.1516810655593872, 1.3893545866012573, 1.6270281076431274, 1.864701747894287, 2.1023752689361572, 2.3400487899780273, 2.5777225494384766, 2.8153958320617676, 3.053069591522217, 3.290743112564087, 3.528416633605957, 3.766090154647827, 4.003763675689697, 4.2414374351501465, 4.4791107177734375, 4.716784477233887, 4.954458236694336, 5.192131519317627, 5.429805278778076, 5.667478561401367, 5.905152320861816, 6.142825603485107, 6.380499362945557, 6.618172645568848, 6.855846405029297, 7.093520164489746]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 10.0, 4.0, 6.0, 15.0, 19.0, 30.0, 38.0, 68.0, 123.0, 179.0, 311.0, 570.0, 1064.0, 2163.0, 5158.0, 14676.0, 52826.0, 259936.0, 1266269.0, 1936595.0, 516528.0, 98933.0, 24204.0, 8143.0, 3213.0, 1432.0, 744.0, 404.0, 237.0, 156.0, 92.0, 51.0, 41.0, 21.0, 10.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1025390625, -1.0703048706054688, -1.0380706787109375, -1.0058364868164062, -0.973602294921875, -0.9413681030273438, -0.9091339111328125, -0.8768997192382812, -0.84466552734375, -0.8124313354492188, -0.7801971435546875, -0.7479629516601562, -0.715728759765625, -0.6834945678710938, -0.6512603759765625, -0.6190261840820312, -0.5867919921875, -0.5545578002929688, -0.5223236083984375, -0.49008941650390625, -0.457855224609375, -0.42562103271484375, -0.3933868408203125, -0.36115264892578125, -0.32891845703125, -0.29668426513671875, -0.2644500732421875, -0.23221588134765625, -0.199981689453125, -0.16774749755859375, -0.1355133056640625, -0.10327911376953125, -0.071044921875, -0.03881072998046875, -0.0065765380859375, 0.02565765380859375, 0.057891845703125, 0.09012603759765625, 0.1223602294921875, 0.15459442138671875, 0.18682861328125, 0.21906280517578125, 0.2512969970703125, 0.28353118896484375, 0.315765380859375, 0.34799957275390625, 0.3802337646484375, 0.41246795654296875, 0.4447021484375, 0.47693634033203125, 0.5091705322265625, 0.5414047241210938, 0.573638916015625, 0.6058731079101562, 0.6381072998046875, 0.6703414916992188, 0.70257568359375, 0.7348098754882812, 0.7670440673828125, 0.7992782592773438, 0.831512451171875, 0.8637466430664062, 0.8959808349609375, 0.9282150268554688, 0.96044921875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 0.0, 3.0, 4.0, 3.0, 10.0, 12.0, 11.0, 10.0, 13.0, 20.0, 15.0, 18.0, 30.0, 26.0, 28.0, 30.0, 38.0, 33.0, 32.0, 53.0, 48.0, 44.0, 44.0, 44.0, 44.0, 53.0, 35.0, 41.0, 32.0, 29.0, 31.0, 18.0, 27.0, 23.0, 18.0, 15.0, 16.0, 14.0, 8.0, 9.0, 5.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.5313034057617188, -0.5137786865234375, -0.49625396728515625, -0.478729248046875, -0.46120452880859375, -0.4436798095703125, -0.42615509033203125, -0.40863037109375, -0.39110565185546875, -0.3735809326171875, -0.35605621337890625, -0.338531494140625, -0.32100677490234375, -0.3034820556640625, -0.28595733642578125, -0.2684326171875, -0.25090789794921875, -0.2333831787109375, -0.21585845947265625, -0.198333740234375, -0.18080902099609375, -0.1632843017578125, -0.14575958251953125, -0.12823486328125, -0.11071014404296875, -0.0931854248046875, -0.07566070556640625, -0.058135986328125, -0.04061126708984375, -0.0230865478515625, -0.00556182861328125, 0.011962890625, 0.02948760986328125, 0.0470123291015625, 0.06453704833984375, 0.082061767578125, 0.09958648681640625, 0.1171112060546875, 0.13463592529296875, 0.15216064453125, 0.16968536376953125, 0.1872100830078125, 0.20473480224609375, 0.222259521484375, 0.23978424072265625, 0.2573089599609375, 0.27483367919921875, 0.2923583984375, 0.30988311767578125, 0.3274078369140625, 0.34493255615234375, 0.362457275390625, 0.37998199462890625, 0.3975067138671875, 0.41503143310546875, 0.43255615234375, 0.45008087158203125, 0.4676055908203125, 0.48513031005859375, 0.502655029296875, 0.5201797485351562, 0.5377044677734375, 0.5552291870117188, 0.57275390625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 5.0, 12.0, 11.0, 21.0, 17.0, 46.0, 100.0, 233.0, 441.0, 1193.0, 4743.0, 141935.0, 4020870.0, 20856.0, 2339.0, 782.0, 298.0, 176.0, 81.0, 48.0, 25.0, 19.0, 12.0, 5.0, 4.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.55078125, -4.38409423828125, -4.2174072265625, -4.05072021484375, -3.884033203125, -3.71734619140625, -3.5506591796875, -3.38397216796875, -3.21728515625, -3.05059814453125, -2.8839111328125, -2.71722412109375, -2.550537109375, -2.38385009765625, -2.2171630859375, -2.05047607421875, -1.8837890625, -1.71710205078125, -1.5504150390625, -1.38372802734375, -1.217041015625, -1.05035400390625, -0.8836669921875, -0.71697998046875, -0.55029296875, -0.38360595703125, -0.2169189453125, -0.05023193359375, 0.116455078125, 0.28314208984375, 0.4498291015625, 0.61651611328125, 0.783203125, 0.94989013671875, 1.1165771484375, 1.28326416015625, 1.449951171875, 1.61663818359375, 1.7833251953125, 1.95001220703125, 2.11669921875, 2.28338623046875, 2.4500732421875, 2.61676025390625, 2.783447265625, 2.95013427734375, 3.1168212890625, 3.28350830078125, 3.4501953125, 3.61688232421875, 3.7835693359375, 3.95025634765625, 4.116943359375, 4.28363037109375, 4.4503173828125, 4.61700439453125, 4.78369140625, 4.95037841796875, 5.1170654296875, 5.28375244140625, 5.450439453125, 5.61712646484375, 5.7838134765625, 5.95050048828125, 6.1171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 13.0, 23.0, 35.0, 81.0, 145.0, 275.0, 554.0, 1086.0, 922.0, 480.0, 238.0, 113.0, 44.0, 29.0, 13.0, 10.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8671875, -3.74578857421875, -3.6243896484375, -3.50299072265625, -3.381591796875, -3.26019287109375, -3.1387939453125, -3.01739501953125, -2.89599609375, -2.77459716796875, -2.6531982421875, -2.53179931640625, -2.410400390625, -2.28900146484375, -2.1676025390625, -2.04620361328125, -1.9248046875, -1.80340576171875, -1.6820068359375, -1.56060791015625, -1.439208984375, -1.31781005859375, -1.1964111328125, -1.07501220703125, -0.95361328125, -0.83221435546875, -0.7108154296875, -0.58941650390625, -0.468017578125, -0.34661865234375, -0.2252197265625, -0.10382080078125, 0.017578125, 0.13897705078125, 0.2603759765625, 0.38177490234375, 0.503173828125, 0.62457275390625, 0.7459716796875, 0.86737060546875, 0.98876953125, 1.11016845703125, 1.2315673828125, 1.35296630859375, 1.474365234375, 1.59576416015625, 1.7171630859375, 1.83856201171875, 1.9599609375, 2.08135986328125, 2.2027587890625, 2.32415771484375, 2.445556640625, 2.56695556640625, 2.6883544921875, 2.80975341796875, 2.93115234375, 3.05255126953125, 3.1739501953125, 3.29534912109375, 3.416748046875, 3.53814697265625, 3.6595458984375, 3.78094482421875, 3.90234375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 12.0, 21.0, 68.0, 128.0, 238.0, 250.0, 144.0, 57.0, 33.0, 21.0, 11.0, 7.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.005016326904297, -23.92644691467285, -22.847877502441406, -21.76930809020996, -20.690738677978516, -19.612171173095703, -18.533601760864258, -17.455032348632812, -16.376462936401367, -15.297893524169922, -14.219324111938477, -13.140755653381348, -12.062186241149902, -10.983616828918457, -9.905048370361328, -8.826478958129883, -7.7479095458984375, -6.669340133666992, -5.590771198272705, -4.512202262878418, -3.4336328506469727, -2.3550634384155273, -1.2764945030212402, -0.19792556762695312, 0.8806438446044922, 1.9592130184173584, 3.0377821922302246, 4.116351127624512, 5.194920539855957, 6.273489952087402, 7.3520588874816895, 8.430627822875977, 9.509193420410156, 10.587762832641602, 11.666332244873047, 12.744900703430176, 13.823470115661621, 14.902039527893066, 15.980607986450195, 17.05917739868164, 18.137746810913086, 19.21631622314453, 20.294885635375977, 21.373455047607422, 22.452022552490234, 23.530593872070312, 24.609161376953125, 25.68773078918457, 26.766300201416016, 27.84486961364746, 28.923439025878906, 30.00200843811035, 31.080577850341797, 32.15914535522461, 33.23771667480469, 34.3162841796875, 35.39485168457031, 36.473419189453125, 37.5519905090332, 38.630558013916016, 39.709129333496094, 40.787696838378906, 41.866268157958984, 42.9448356628418, 44.023406982421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 4.0, 8.0, 6.0, 12.0, 17.0, 17.0, 19.0, 29.0, 28.0, 31.0, 48.0, 57.0, 68.0, 70.0, 91.0, 102.0, 84.0, 48.0, 44.0, 54.0, 28.0, 30.0, 25.0, 18.0, 18.0, 11.0, 10.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.929338455200195, -15.431610107421875, -14.933880805969238, -14.436152458190918, -13.938424110412598, -13.440694808959961, -12.94296646118164, -12.44523811340332, -11.947508811950684, -11.449780464172363, -10.952051162719727, -10.454322814941406, -9.956594467163086, -9.45886516571045, -8.961136817932129, -8.463407516479492, -7.96567964553833, -7.467950820922852, -6.970222473144531, -6.472493648529053, -5.974764823913574, -5.477036476135254, -4.979307651519775, -4.481578826904297, -3.9838502407073975, -3.486121654510498, -2.9883928298950195, -2.49066424369812, -1.9929355382919312, -1.4952068328857422, -0.9974782466888428, -0.49974942207336426, -0.0020208358764648438, 0.49570783972740173, 0.9934365153312683, 1.4911651611328125, 1.9888938665390015, 2.4866225719451904, 2.98435115814209, 3.4820799827575684, 3.9798085689544678, 4.477537155151367, 4.975265979766846, 5.472994804382324, 5.9707231521606445, 6.468451976776123, 6.966180801391602, 7.463909149169922, 7.9616379737854, 8.459366798400879, 8.9570951461792, 9.454824447631836, 9.952552795410156, 10.450281143188477, 10.948009490966797, 11.445738792419434, 11.943467140197754, 12.441195487976074, 12.938924789428711, 13.436653137207031, 13.934381484985352, 14.432110786437988, 14.929839134216309, 15.427568435668945, 15.925296783447266]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 6.0, 8.0, 14.0, 13.0, 31.0, 52.0, 67.0, 138.0, 239.0, 438.0, 842.0, 1913.0, 4453.0, 11916.0, 39216.0, 167780.0, 618235.0, 148905.0, 35546.0, 10922.0, 4190.0, 1790.0, 845.0, 422.0, 224.0, 121.0, 97.0, 36.0, 25.0, 20.0, 17.0, 9.0, 12.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6240234375, -1.5806732177734375, -1.537322998046875, -1.4939727783203125, -1.45062255859375, -1.4072723388671875, -1.363922119140625, -1.3205718994140625, -1.2772216796875, -1.2338714599609375, -1.190521240234375, -1.1471710205078125, -1.10382080078125, -1.0604705810546875, -1.017120361328125, -0.9737701416015625, -0.930419921875, -0.8870697021484375, -0.843719482421875, -0.8003692626953125, -0.75701904296875, -0.7136688232421875, -0.670318603515625, -0.6269683837890625, -0.5836181640625, -0.5402679443359375, -0.496917724609375, -0.4535675048828125, -0.41021728515625, -0.3668670654296875, -0.323516845703125, -0.2801666259765625, -0.23681640625, -0.1934661865234375, -0.150115966796875, -0.1067657470703125, -0.06341552734375, -0.0200653076171875, 0.023284912109375, 0.0666351318359375, 0.1099853515625, 0.1533355712890625, 0.196685791015625, 0.2400360107421875, 0.28338623046875, 0.3267364501953125, 0.370086669921875, 0.4134368896484375, 0.456787109375, 0.5001373291015625, 0.543487548828125, 0.5868377685546875, 0.63018798828125, 0.6735382080078125, 0.716888427734375, 0.7602386474609375, 0.8035888671875, 0.8469390869140625, 0.890289306640625, 0.9336395263671875, 0.97698974609375, 1.0203399658203125, 1.063690185546875, 1.1070404052734375, 1.150390625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 9.0, 10.0, 15.0, 7.0, 23.0, 18.0, 25.0, 28.0, 29.0, 55.0, 58.0, 41.0, 58.0, 61.0, 52.0, 62.0, 54.0, 50.0, 56.0, 47.0, 39.0, 34.0, 23.0, 29.0, 23.0, 13.0, 12.0, 11.0, 11.0, 9.0, 6.0, 6.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.93310546875, -0.9070281982421875, -0.880950927734375, -0.8548736572265625, -0.82879638671875, -0.8027191162109375, -0.776641845703125, -0.7505645751953125, -0.7244873046875, -0.6984100341796875, -0.672332763671875, -0.6462554931640625, -0.62017822265625, -0.5941009521484375, -0.568023681640625, -0.5419464111328125, -0.515869140625, -0.4897918701171875, -0.463714599609375, -0.4376373291015625, -0.41156005859375, -0.3854827880859375, -0.359405517578125, -0.3333282470703125, -0.3072509765625, -0.2811737060546875, -0.255096435546875, -0.2290191650390625, -0.20294189453125, -0.1768646240234375, -0.150787353515625, -0.1247100830078125, -0.0986328125, -0.0725555419921875, -0.046478271484375, -0.0204010009765625, 0.00567626953125, 0.0317535400390625, 0.057830810546875, 0.0839080810546875, 0.1099853515625, 0.1360626220703125, 0.162139892578125, 0.1882171630859375, 0.21429443359375, 0.2403717041015625, 0.266448974609375, 0.2925262451171875, 0.318603515625, 0.3446807861328125, 0.370758056640625, 0.3968353271484375, 0.42291259765625, 0.4489898681640625, 0.475067138671875, 0.5011444091796875, 0.5272216796875, 0.5532989501953125, 0.579376220703125, 0.6054534912109375, 0.63153076171875, 0.6576080322265625, 0.683685302734375, 0.7097625732421875, 0.73583984375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 9.0, 7.0, 8.0, 18.0, 17.0, 25.0, 35.0, 45.0, 71.0, 114.0, 187.0, 337.0, 631.0, 1538.0, 5789.0, 42898.0, 898877.0, 84894.0, 9184.0, 2057.0, 795.0, 388.0, 219.0, 139.0, 78.0, 59.0, 33.0, 28.0, 18.0, 15.0, 13.0, 7.0, 7.0, 6.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5947265625, -1.5299835205078125, -1.465240478515625, -1.4004974365234375, -1.33575439453125, -1.2710113525390625, -1.206268310546875, -1.1415252685546875, -1.0767822265625, -1.0120391845703125, -0.947296142578125, -0.8825531005859375, -0.81781005859375, -0.7530670166015625, -0.688323974609375, -0.6235809326171875, -0.558837890625, -0.4940948486328125, -0.429351806640625, -0.3646087646484375, -0.29986572265625, -0.2351226806640625, -0.170379638671875, -0.1056365966796875, -0.0408935546875, 0.0238494873046875, 0.088592529296875, 0.1533355712890625, 0.21807861328125, 0.2828216552734375, 0.347564697265625, 0.4123077392578125, 0.47705078125, 0.5417938232421875, 0.606536865234375, 0.6712799072265625, 0.73602294921875, 0.8007659912109375, 0.865509033203125, 0.9302520751953125, 0.9949951171875, 1.0597381591796875, 1.124481201171875, 1.1892242431640625, 1.25396728515625, 1.3187103271484375, 1.383453369140625, 1.4481964111328125, 1.512939453125, 1.5776824951171875, 1.642425537109375, 1.7071685791015625, 1.77191162109375, 1.8366546630859375, 1.901397705078125, 1.9661407470703125, 2.0308837890625, 2.0956268310546875, 2.160369873046875, 2.2251129150390625, 2.28985595703125, 2.3545989990234375, 2.419342041015625, 2.4840850830078125, 2.548828125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 2.0, 7.0, 6.0, 9.0, 10.0, 8.0, 22.0, 21.0, 23.0, 19.0, 39.0, 47.0, 49.0, 66.0, 76.0, 98.0, 96.0, 77.0, 75.0, 55.0, 40.0, 30.0, 21.0, 18.0, 15.0, 18.0, 14.0, 9.0, 11.0, 4.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.953125, -2.8343505859375, -2.715576171875, -2.5968017578125, -2.47802734375, -2.3592529296875, -2.240478515625, -2.1217041015625, -2.0029296875, -1.8841552734375, -1.765380859375, -1.6466064453125, -1.52783203125, -1.4090576171875, -1.290283203125, -1.1715087890625, -1.052734375, -0.9339599609375, -0.815185546875, -0.6964111328125, -0.57763671875, -0.4588623046875, -0.340087890625, -0.2213134765625, -0.1025390625, 0.0162353515625, 0.135009765625, 0.2537841796875, 0.37255859375, 0.4913330078125, 0.610107421875, 0.7288818359375, 0.84765625, 0.9664306640625, 1.085205078125, 1.2039794921875, 1.32275390625, 1.4415283203125, 1.560302734375, 1.6790771484375, 1.7978515625, 1.9166259765625, 2.035400390625, 2.1541748046875, 2.27294921875, 2.3917236328125, 2.510498046875, 2.6292724609375, 2.748046875, 2.8668212890625, 2.985595703125, 3.1043701171875, 3.22314453125, 3.3419189453125, 3.460693359375, 3.5794677734375, 3.6982421875, 3.8170166015625, 3.935791015625, 4.0545654296875, 4.17333984375, 4.2921142578125, 4.410888671875, 4.5296630859375, 4.6484375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 5.0, 5.0, 13.0, 13.0, 13.0, 18.0, 35.0, 42.0, 63.0, 112.0, 215.0, 335.0, 810.0, 2301.0, 7831.0, 40920.0, 879908.0, 96580.0, 13659.0, 3448.0, 1137.0, 482.0, 234.0, 135.0, 84.0, 46.0, 27.0, 24.0, 16.0, 14.0, 11.0, 2.0, 4.0, 0.0, 2.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.431396484375, -0.4193077087402344, -0.40721893310546875, -0.3951301574707031, -0.3830413818359375, -0.3709526062011719, -0.35886383056640625, -0.3467750549316406, -0.334686279296875, -0.3225975036621094, -0.31050872802734375, -0.2984199523925781, -0.2863311767578125, -0.2742424011230469, -0.26215362548828125, -0.2500648498535156, -0.23797607421875, -0.22588729858398438, -0.21379852294921875, -0.20170974731445312, -0.1896209716796875, -0.17753219604492188, -0.16544342041015625, -0.15335464477539062, -0.141265869140625, -0.12917709350585938, -0.11708831787109375, -0.10499954223632812, -0.0929107666015625, -0.08082199096679688, -0.06873321533203125, -0.056644439697265625, -0.0445556640625, -0.032466888427734375, -0.02037811279296875, -0.008289337158203125, 0.0037994384765625, 0.015888214111328125, 0.02797698974609375, 0.040065765380859375, 0.052154541015625, 0.06424331665039062, 0.07633209228515625, 0.08842086791992188, 0.1005096435546875, 0.11259841918945312, 0.12468719482421875, 0.13677597045898438, 0.14886474609375, 0.16095352172851562, 0.17304229736328125, 0.18513107299804688, 0.1972198486328125, 0.20930862426757812, 0.22139739990234375, 0.23348617553710938, 0.245574951171875, 0.2576637268066406, 0.26975250244140625, 0.2818412780761719, 0.2939300537109375, 0.3060188293457031, 0.31810760498046875, 0.3301963806152344, 0.34228515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 2.0, 9.0, 8.0, 12.0, 13.0, 22.0, 17.0, 25.0, 29.0, 38.0, 56.0, 95.0, 103.0, 117.0, 114.0, 79.0, 55.0, 40.0, 27.0, 25.0, 21.0, 10.0, 13.0, 4.0, 5.0, 9.0, 2.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.0001055002212524414, -0.00010260380804538727, -9.970739483833313e-05, -9.681098163127899e-05, -9.391456842422485e-05, -9.101815521717072e-05, -8.812174201011658e-05, -8.522532880306244e-05, -8.23289155960083e-05, -7.943250238895416e-05, -7.653608918190002e-05, -7.363967597484589e-05, -7.074326276779175e-05, -6.784684956073761e-05, -6.495043635368347e-05, -6.205402314662933e-05, -5.9157609939575195e-05, -5.626119673252106e-05, -5.336478352546692e-05, -5.046837031841278e-05, -4.757195711135864e-05, -4.4675543904304504e-05, -4.1779130697250366e-05, -3.888271749019623e-05, -3.598630428314209e-05, -3.308989107608795e-05, -3.0193477869033813e-05, -2.7297064661979675e-05, -2.4400651454925537e-05, -2.15042382478714e-05, -1.860782504081726e-05, -1.5711411833763123e-05, -1.2814998626708984e-05, -9.918585419654846e-06, -7.022172212600708e-06, -4.12575900554657e-06, -1.2293457984924316e-06, 1.6670674085617065e-06, 4.563480615615845e-06, 7.459893822669983e-06, 1.0356307029724121e-05, 1.325272023677826e-05, 1.6149133443832397e-05, 1.9045546650886536e-05, 2.1941959857940674e-05, 2.4838373064994812e-05, 2.773478627204895e-05, 3.063119947910309e-05, 3.3527612686157227e-05, 3.6424025893211365e-05, 3.93204391002655e-05, 4.221685230731964e-05, 4.511326551437378e-05, 4.800967872142792e-05, 5.0906091928482056e-05, 5.3802505135536194e-05, 5.669891834259033e-05, 5.959533154964447e-05, 6.249174475669861e-05, 6.538815796375275e-05, 6.828457117080688e-05, 7.118098437786102e-05, 7.407739758491516e-05, 7.69738107919693e-05, 7.987022399902344e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 12.0, 8.0, 17.0, 17.0, 32.0, 34.0, 72.0, 103.0, 233.0, 429.0, 844.0, 1846.0, 4766.0, 15544.0, 69960.0, 835197.0, 91254.0, 18443.0, 5662.0, 2156.0, 922.0, 446.0, 214.0, 128.0, 70.0, 46.0, 31.0, 23.0, 13.0, 8.0, 5.0, 6.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.330078125, -0.3217353820800781, -0.31339263916015625, -0.3050498962402344, -0.2967071533203125, -0.2883644104003906, -0.28002166748046875, -0.2716789245605469, -0.263336181640625, -0.2549934387207031, -0.24665069580078125, -0.23830795288085938, -0.2299652099609375, -0.22162246704101562, -0.21327972412109375, -0.20493698120117188, -0.19659423828125, -0.18825149536132812, -0.17990875244140625, -0.17156600952148438, -0.1632232666015625, -0.15488052368164062, -0.14653778076171875, -0.13819503784179688, -0.129852294921875, -0.12150955200195312, -0.11316680908203125, -0.10482406616210938, -0.0964813232421875, -0.08813858032226562, -0.07979583740234375, -0.07145309448242188, -0.0631103515625, -0.054767608642578125, -0.04642486572265625, -0.038082122802734375, -0.0297393798828125, -0.021396636962890625, -0.01305389404296875, -0.004711151123046875, 0.003631591796875, 0.011974334716796875, 0.02031707763671875, 0.028659820556640625, 0.0370025634765625, 0.045345306396484375, 0.05368804931640625, 0.062030792236328125, 0.07037353515625, 0.07871627807617188, 0.08705902099609375, 0.09540176391601562, 0.1037445068359375, 0.11208724975585938, 0.12042999267578125, 0.12877273559570312, 0.137115478515625, 0.14545822143554688, 0.15380096435546875, 0.16214370727539062, 0.1704864501953125, 0.17882919311523438, 0.18717193603515625, 0.19551467895507812, 0.203857421875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 10.0, 4.0, 8.0, 7.0, 9.0, 5.0, 16.0, 13.0, 29.0, 20.0, 29.0, 31.0, 44.0, 62.0, 70.0, 74.0, 76.0, 65.0, 65.0, 62.0, 52.0, 53.0, 38.0, 23.0, 23.0, 22.0, 11.0, 12.0, 7.0, 5.0, 10.0, 7.0, 2.0, 4.0, 4.0, 6.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.232421875, -0.22484970092773438, -0.21727752685546875, -0.20970535278320312, -0.2021331787109375, -0.19456100463867188, -0.18698883056640625, -0.17941665649414062, -0.171844482421875, -0.16427230834960938, -0.15670013427734375, -0.14912796020507812, -0.1415557861328125, -0.13398361206054688, -0.12641143798828125, -0.11883926391601562, -0.11126708984375, -0.10369491577148438, -0.09612274169921875, -0.08855056762695312, -0.0809783935546875, -0.07340621948242188, -0.06583404541015625, -0.058261871337890625, -0.050689697265625, -0.043117523193359375, -0.03554534912109375, -0.027973175048828125, -0.0204010009765625, -0.012828826904296875, -0.00525665283203125, 0.002315521240234375, 0.0098876953125, 0.017459869384765625, 0.02503204345703125, 0.032604217529296875, 0.0401763916015625, 0.047748565673828125, 0.05532073974609375, 0.06289291381835938, 0.070465087890625, 0.07803726196289062, 0.08560943603515625, 0.09318161010742188, 0.1007537841796875, 0.10832595825195312, 0.11589813232421875, 0.12347030639648438, 0.13104248046875, 0.13861465454101562, 0.14618682861328125, 0.15375900268554688, 0.1613311767578125, 0.16890335083007812, 0.17647552490234375, 0.18404769897460938, 0.191619873046875, 0.19919204711914062, 0.20676422119140625, 0.21433639526367188, 0.2219085693359375, 0.22948074340820312, 0.23705291748046875, 0.24462509155273438, 0.252197265625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 7.0, 14.0, 32.0, 76.0, 325.0, 383.0, 87.0, 42.0, 23.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.62642478942871, -23.036149978637695, -22.44587516784668, -21.855600357055664, -21.26532745361328, -20.675052642822266, -20.08477783203125, -19.494503021240234, -18.90422821044922, -18.313953399658203, -17.723678588867188, -17.133403778076172, -16.543128967285156, -15.952855110168457, -15.362581253051758, -14.772306442260742, -14.182031631469727, -13.591756820678711, -13.001482009887695, -12.411208152770996, -11.82093334197998, -11.230658531188965, -10.640384674072266, -10.05010986328125, -9.459835052490234, -8.869560241699219, -8.279285430908203, -7.689011573791504, -7.098736763000488, -6.508461952209473, -5.918187618255615, -5.327913284301758, -4.737639427185059, -4.147364616394043, -3.5570902824401855, -2.966815710067749, -2.3765411376953125, -1.786266565322876, -1.1959919929504395, -0.605717658996582, -0.015442848205566406, 0.5748317241668701, 1.1651062965393066, 1.7553808689117432, 2.3456554412841797, 2.935930013656616, 3.5262045860290527, 4.11647891998291, 4.706753730773926, 5.297028541564941, 5.887302875518799, 6.477577209472656, 7.067852020263672, 7.6581268310546875, 8.248401641845703, 8.838675498962402, 9.428950309753418, 10.019225120544434, 10.609498977661133, 11.199773788452148, 11.790048599243164, 12.38032341003418, 12.970598220825195, 13.560872077941895, 14.15114688873291]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 4.0, 2.0, 7.0, 7.0, 7.0, 6.0, 9.0, 16.0, 14.0, 16.0, 17.0, 18.0, 16.0, 19.0, 27.0, 29.0, 37.0, 127.0, 213.0, 170.0, 46.0, 25.0, 27.0, 15.0, 22.0, 21.0, 11.0, 12.0, 15.0, 8.0, 9.0, 5.0, 11.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.838184356689453, -8.559163093566895, -8.280141830444336, -8.001120567321777, -7.722099781036377, -7.443078517913818, -7.164057731628418, -6.885036468505859, -6.606015205383301, -6.326993942260742, -6.047972679138184, -5.768951892852783, -5.489930629730225, -5.210909366607666, -4.931888580322266, -4.652867317199707, -4.373846054077148, -4.09482479095459, -3.8158037662506104, -3.536782741546631, -3.2577614784240723, -2.9787402153015137, -2.699719190597534, -2.4206981658935547, -2.141676902770996, -1.862655758857727, -1.583634614944458, -1.304613471031189, -1.02559232711792, -0.7465711832046509, -0.46755003929138184, -0.1885288953781128, 0.09049224853515625, 0.3695133924484253, 0.6485345363616943, 0.9275556802749634, 1.2065768241882324, 1.4855979681015015, 1.7646191120147705, 2.04364013671875, 2.3226613998413086, 2.601682662963867, 2.8807036876678467, 3.159724712371826, 3.4387459754943848, 3.7177672386169434, 3.996788263320923, 4.275809288024902, 4.554830551147461, 4.8338518142700195, 5.112873077392578, 5.3918938636779785, 5.670915126800537, 5.949936389923096, 6.228957176208496, 6.507978439331055, 6.786999702453613, 7.066020965576172, 7.3450422286987305, 7.624063014984131, 7.9030842781066895, 8.18210506439209, 8.461126327514648, 8.740147590637207, 9.019168853759766]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 6.0, 4.0, 6.0, 13.0, 7.0, 12.0, 10.0, 17.0, 20.0, 23.0, 19.0, 35.0, 15.0, 41.0, 55.0, 162.0, 222.0, 80.0, 32.0, 25.0, 26.0, 32.0, 19.0, 14.0, 23.0, 16.0, 15.0, 6.0, 11.0, 4.0, 5.0, 6.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6826171875, -0.6606674194335938, -0.6387176513671875, -0.6167678833007812, -0.594818115234375, -0.5728683471679688, -0.5509185791015625, -0.5289688110351562, -0.50701904296875, -0.48506927490234375, -0.4631195068359375, -0.44116973876953125, -0.419219970703125, -0.39727020263671875, -0.3753204345703125, -0.35337066650390625, -0.3314208984375, -0.30947113037109375, -0.2875213623046875, -0.26557159423828125, -0.243621826171875, -0.22167205810546875, -0.1997222900390625, -0.17777252197265625, -0.15582275390625, -0.13387298583984375, -0.1119232177734375, -0.08997344970703125, -0.068023681640625, -0.04607391357421875, -0.0241241455078125, -0.00217437744140625, 0.019775390625, 0.04172515869140625, 0.0636749267578125, 0.08562469482421875, 0.107574462890625, 0.12952423095703125, 0.1514739990234375, 0.17342376708984375, 0.19537353515625, 0.21732330322265625, 0.2392730712890625, 0.26122283935546875, 0.283172607421875, 0.30512237548828125, 0.3270721435546875, 0.34902191162109375, 0.3709716796875, 0.39292144775390625, 0.4148712158203125, 0.43682098388671875, 0.458770751953125, 0.48072052001953125, 0.5026702880859375, 0.5246200561523438, 0.54656982421875, 0.5685195922851562, 0.5904693603515625, 0.6124191284179688, 0.634368896484375, 0.6563186645507812, 0.6782684326171875, 0.7002182006835938, 0.72216796875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 1.0, 3.0, 1.0, 1.0, 7.0, 8.0, 12.0, 8.0, 12.0, 18.0, 17.0, 18.0, 57.0, 68.0, 103.0, 192.0, 373.0, 799.0, 2397.0, 9712.0, 8288435.0, 77246.0, 6049.0, 1673.0, 612.0, 303.0, 151.0, 97.0, 61.0, 35.0, 33.0, 17.0, 13.0, 8.0, 8.0, 6.0, 5.0, 14.0, 8.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0], "bins": [-6.545567989349365, -6.340040683746338, -6.134513854980469, -5.928986549377441, -5.723459243774414, -5.517932415008545, -5.312405109405518, -5.106878280639648, -4.901350975036621, -4.695823669433594, -4.490296840667725, -4.284769535064697, -4.079242706298828, -3.873715400695801, -3.6681880950927734, -3.462661027908325, -3.257133960723877, -3.0516068935394287, -2.8460798263549805, -2.640552520751953, -2.435025453567505, -2.2294983863830566, -2.0239710807800293, -1.818444013595581, -1.6129169464111328, -1.4073898792266846, -1.2018626928329468, -0.9963355660438538, -0.7908084392547607, -0.5852813720703125, -0.3797541856765747, -0.17422699928283691, 0.03130054473876953, 0.23682767152786255, 0.44235479831695557, 0.6478819251060486, 0.8534090518951416, 1.0589361190795898, 1.2644633054733276, 1.4699904918670654, 1.6755175590515137, 1.881044626235962, 2.08657169342041, 2.2920989990234375, 2.4976260662078857, 2.703153133392334, 2.9086804389953613, 3.1142075061798096, 3.319734573364258, 3.525261640548706, 3.7307887077331543, 3.9363160133361816, 4.141842842102051, 4.347370147705078, 4.5528974533081055, 4.758424758911133, 4.963951587677002, 5.169478893280029, 5.375005722045898, 5.580533027648926, 5.786060333251953, 5.991587162017822, 6.19711446762085, 6.402641296386719, 6.608168601989746]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 4.0, 4.0, 1.0, 7.0, 3.0, 2.0, 5.0, 2.0, 4.0, 7.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 6.0, 3.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.11011028289795, -7.809652328491211, -7.509194374084473, -7.208736419677734, -6.908278465270996, -6.607820510864258, -6.307363033294678, -6.0069050788879395, -5.706447124481201, -5.405989170074463, -5.105531215667725, -4.805073261260986, -4.504615783691406, -4.204157829284668, -3.9036998748779297, -3.6032419204711914, -3.302783966064453, -3.002326011657715, -2.7018680572509766, -2.4014103412628174, -2.100952386856079, -1.8004944324493408, -1.500036597251892, -1.1995787620544434, -0.8991208076477051, -0.5986629128456116, -0.29820501804351807, 0.0022528767585754395, 0.30271077156066895, 0.6031687259674072, 0.903626561164856, 1.2040843963623047, 1.5045413970947266, 1.8049993515014648, 2.105457305908203, 2.4059150218963623, 2.7063729763031006, 3.006830930709839, 3.307288646697998, 3.6077466011047363, 3.9082045555114746, 4.208662509918213, 4.509120464324951, 4.8095784187316895, 5.1100358963012695, 5.410493850708008, 5.710951805114746, 6.011409759521484, 6.311867713928223, 6.612325668334961, 6.912783622741699, 7.2132415771484375, 7.513699531555176, 7.814157485961914, 8.114615440368652, 8.41507339477539, 8.715530395507812, 9.01598834991455, 9.316446304321289, 9.616904258728027, 9.917362213134766, 10.217820167541504, 10.518278121948242, 10.818735122680664, 11.119194030761719]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 7.0, 11.0, 15.0, 16.0, 17.0, 26.0, 40.0, 57.0, 61.0, 88.0, 149.0, 226.0, 315.0, 564.0, 1189.0, 2517.0, 5919.0, 14978.0, 38231.0, 100967.0, 183434.0, 107136.0, 40611.0, 15714.0, 6474.0, 2715.0, 1197.0, 609.0, 340.0, 217.0, 132.0, 80.0, 53.0, 51.0, 30.0, 27.0, 13.0, 5.0, 10.0, 7.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.5390625, -5.378662109375, -5.21826171875, -5.057861328125, -4.8974609375, -4.737060546875, -4.57666015625, -4.416259765625, -4.255859375, -4.095458984375, -3.93505859375, -3.774658203125, -3.6142578125, -3.453857421875, -3.29345703125, -3.133056640625, -2.97265625, -2.812255859375, -2.65185546875, -2.491455078125, -2.3310546875, -2.170654296875, -2.01025390625, -1.849853515625, -1.689453125, -1.529052734375, -1.36865234375, -1.208251953125, -1.0478515625, -0.887451171875, -0.72705078125, -0.566650390625, -0.40625, -0.245849609375, -0.08544921875, 0.074951171875, 0.2353515625, 0.395751953125, 0.55615234375, 0.716552734375, 0.876953125, 1.037353515625, 1.19775390625, 1.358154296875, 1.5185546875, 1.678955078125, 1.83935546875, 1.999755859375, 2.16015625, 2.320556640625, 2.48095703125, 2.641357421875, 2.8017578125, 2.962158203125, 3.12255859375, 3.282958984375, 3.443359375, 3.603759765625, 3.76416015625, 3.924560546875, 4.0849609375, 4.245361328125, 4.40576171875, 4.566162109375, 4.7265625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 10.0, 10.0, 5.0, 10.0, 16.0, 17.0, 15.0, 26.0, 30.0, 39.0, 46.0, 41.0, 63.0, 75.0, 66.0, 76.0, 70.0, 77.0, 52.0, 44.0, 41.0, 32.0, 23.0, 23.0, 18.0, 21.0, 17.0, 10.0, 5.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.96533203125, -0.9388046264648438, -0.9122772216796875, -0.8857498168945312, -0.859222412109375, -0.8326950073242188, -0.8061676025390625, -0.7796401977539062, -0.75311279296875, -0.7265853881835938, -0.7000579833984375, -0.6735305786132812, -0.647003173828125, -0.6204757690429688, -0.5939483642578125, -0.5674209594726562, -0.5408935546875, -0.5143661499023438, -0.4878387451171875, -0.46131134033203125, -0.434783935546875, -0.40825653076171875, -0.3817291259765625, -0.35520172119140625, -0.32867431640625, -0.30214691162109375, -0.2756195068359375, -0.24909210205078125, -0.222564697265625, -0.19603729248046875, -0.1695098876953125, -0.14298248291015625, -0.116455078125, -0.08992767333984375, -0.0634002685546875, -0.03687286376953125, -0.010345458984375, 0.01618194580078125, 0.0427093505859375, 0.06923675537109375, 0.09576416015625, 0.12229156494140625, 0.1488189697265625, 0.17534637451171875, 0.201873779296875, 0.22840118408203125, 0.2549285888671875, 0.28145599365234375, 0.3079833984375, 0.33451080322265625, 0.3610382080078125, 0.38756561279296875, 0.414093017578125, 0.44062042236328125, 0.4671478271484375, 0.49367523193359375, 0.52020263671875, 0.5467300415039062, 0.5732574462890625, 0.5997848510742188, 0.626312255859375, 0.6528396606445312, 0.6793670654296875, 0.7058944702148438, 0.732421875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 10.0, 5.0, 6.0, 9.0, 9.0, 26.0, 40.0, 65.0, 83.0, 101.0, 66.0, 33.0, 14.0, 11.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2566556930542, -8.99672794342041, -8.736799240112305, -8.476871490478516, -8.216943740844727, -7.957015514373779, -7.697087287902832, -7.437159538269043, -7.177231311798096, -6.917303085327148, -6.657375335693359, -6.397447109222412, -6.137518882751465, -5.877591133117676, -5.6176629066467285, -5.357734680175781, -5.097806930541992, -4.837878704071045, -4.577950954437256, -4.318022727966309, -4.0580949783325195, -3.7981667518615723, -3.538238525390625, -3.278310537338257, -3.0183825492858887, -2.7584545612335205, -2.4985265731811523, -2.238598346710205, -1.978670358657837, -1.7187423706054688, -1.458814263343811, -1.1988861560821533, -0.9389572143554688, -0.6790291666984558, -0.41910111904144287, -0.15917307138442993, 0.10075497627258301, 0.36068296432495117, 0.6206110715866089, 0.8805391788482666, 1.1404671669006348, 1.400395154953003, 1.6603232622146606, 1.9202513694763184, 2.1801793575286865, 2.4401073455810547, 2.700035572052002, 2.95996356010437, 3.2198915481567383, 3.4798195362091064, 3.7397475242614746, 3.999675750732422, 4.259603500366211, 4.519531726837158, 4.7794599533081055, 5.0393877029418945, 5.299315929412842, 5.559244155883789, 5.819171905517578, 6.079100131988525, 6.339028358459473, 6.598956108093262, 6.858884334564209, 7.118812561035156, 7.378740310668945]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 10.0, 24.0, 34.0, 92.0, 118.0, 85.0, 35.0, 4.0, 9.0, 7.0, 11.0, 5.0, 3.0, 3.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.105400562286377, -4.955692768096924, -4.805984973907471, -4.656276702880859, -4.506568908691406, -4.356861114501953, -4.2071533203125, -4.057445526123047, -3.9077374935150146, -3.7580296993255615, -3.6083216667175293, -3.458613872528076, -3.308906078338623, -3.159198045730591, -3.0094902515411377, -2.8597822189331055, -2.7100744247436523, -2.560366630554199, -2.410658597946167, -2.260950803756714, -2.1112427711486816, -1.9615349769592285, -1.8118271827697754, -1.6621192693710327, -1.51241135597229, -1.3627034425735474, -1.2129955291748047, -1.0632877349853516, -0.9135798215866089, -0.7638719081878662, -0.6141640543937683, -0.4644562005996704, -0.31474876403808594, -0.16504088044166565, -0.015332996845245361, 0.13437488675117493, 0.2840827703475952, 0.4337906837463379, 0.5834985375404358, 0.7332063913345337, 0.8829143047332764, 1.032622218132019, 1.1823301315307617, 1.3320379257202148, 1.4817458391189575, 1.6314537525177002, 1.7811615467071533, 1.930869460105896, 2.0805773735046387, 2.230285167694092, 2.379993200302124, 2.529700994491577, 2.6794090270996094, 2.8291168212890625, 2.9788246154785156, 3.1285324096679688, 3.278240442276001, 3.427948236465454, 3.5776562690734863, 3.7273640632629395, 3.8770718574523926, 4.026780128479004, 4.176487922668457, 4.32619571685791, 4.475903511047363]}, "eval/loss": 5.307173728942871, "eval/wer": 0.9908171360571202, "eval/runtime": 583.899, "eval/samples_per_second": 4.525, "eval/steps_per_second": 0.567} \ No newline at end of file +{"train/loss": 3.2607, "train/learning_rate": 1.8429334916864606e-05, "train/epoch": 8.41, "train/global_step": 7500, "_runtime": 44177, "_timestamp": 1646991416, "_step": 7504, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 7.0, 7.0, 7.0, 9.0, 11.0, 12.0, 13.0, 14.0, 28.0, 22.0, 33.0, 32.0, 28.0, 32.0, 38.0, 39.0, 34.0, 41.0, 38.0, 44.0, 43.0, 46.0, 35.0, 50.0, 39.0, 38.0, 38.0, 39.0, 24.0, 21.0, 26.0, 17.0, 15.0, 16.0, 9.0, 14.0, 8.0, 11.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.254911422729492, -16.86276626586914, -16.47062110900879, -16.078475952148438, -15.686330795288086, -15.294185638427734, -14.902040481567383, -14.509895324707031, -14.11775016784668, -13.725605010986328, -13.333459854125977, -12.941314697265625, -12.549169540405273, -12.157024383544922, -11.76487922668457, -11.372734069824219, -10.980588912963867, -10.588443756103516, -10.196298599243164, -9.804153442382812, -9.412008285522461, -9.01986312866211, -8.627717971801758, -8.235572814941406, -7.843428611755371, -7.4512834548950195, -7.059138298034668, -6.666993141174316, -6.274847984313965, -5.882702827453613, -5.490557670593262, -5.09841251373291, -4.7062668800354, -4.314121723175049, -3.9219765663146973, -3.5298314094543457, -3.137686252593994, -2.7455410957336426, -2.35339617729187, -1.9612510204315186, -1.569105863571167, -1.1769607067108154, -0.7848156094551086, -0.39267051219940186, -0.000525355339050293, 0.39161980152130127, 0.7837648391723633, 1.1759099960327148, 1.5680551528930664, 1.960200309753418, 2.3523454666137695, 2.744490623474121, 3.1366357803344727, 3.528780937194824, 3.9209258556365967, 4.313071250915527, 4.705216407775879, 5.0973615646362305, 5.489506721496582, 5.881651878356934, 6.273797035217285, 6.665942192077637, 7.058087348937988, 7.45023250579834, 7.842377185821533]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 6.0, 7.0, 9.0, 17.0, 14.0, 9.0, 19.0, 23.0, 16.0, 25.0, 20.0, 29.0, 34.0, 32.0, 36.0, 34.0, 41.0, 35.0, 33.0, 39.0, 48.0, 33.0, 32.0, 39.0, 42.0, 28.0, 39.0, 30.0, 22.0, 23.0, 26.0, 18.0, 20.0, 15.0, 19.0, 16.0, 8.0, 16.0, 13.0, 9.0, 9.0, 3.0, 3.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.805580139160156, -14.359040260314941, -13.912500381469727, -13.465961456298828, -13.019421577453613, -12.572881698608398, -12.126341819763184, -11.679801940917969, -11.23326301574707, -10.786723136901855, -10.34018325805664, -9.893644332885742, -9.447104454040527, -9.000564575195312, -8.554024696350098, -8.107484817504883, -7.660945415496826, -7.214405536651611, -6.767866134643555, -6.32132625579834, -5.874786853790283, -5.428246974945068, -4.981707572937012, -4.535167694091797, -4.088627815246582, -3.6420881748199463, -3.1955485343933105, -2.7490086555480957, -2.302469253540039, -1.8559293746948242, -1.4093897342681885, -0.9628500938415527, -0.5163106918334961, -0.06977102160453796, 0.37676864862442017, 0.8233083486557007, 1.2698479890823364, 1.7163877487182617, 2.1629273891448975, 2.609467029571533, 3.056006669998169, 3.5025463104248047, 3.9490859508514404, 4.395625591278076, 4.842165470123291, 5.288704872131348, 5.7352447509765625, 6.181784629821777, 6.628324031829834, 7.074863910675049, 7.5214033126831055, 7.96794319152832, 8.414483070373535, 8.86102294921875, 9.307561874389648, 9.754101753234863, 10.200641632080078, 10.647181510925293, 11.093721389770508, 11.540260314941406, 11.986800193786621, 12.433340072631836, 12.87987995147705, 13.326419830322266, 13.772958755493164]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 10.0, 16.0, 42.0, 59.0, 100.0, 223.0, 393.0, 696.0, 1183.0, 2063.0, 3569.0, 6141.0, 10123.0, 16824.0, 27323.0, 43788.0, 68626.0, 104268.0, 152374.0, 212584.0, 283299.0, 353208.0, 411612.0, 443020.0, 439161.0, 400287.0, 339023.0, 267308.0, 199873.0, 140187.0, 97015.0, 63800.0, 40785.0, 25528.0, 15856.0, 9787.0, 5837.0, 3487.0, 2042.0, 1183.0, 663.0, 409.0, 226.0, 120.0, 69.0, 40.0, 26.0, 13.0, 13.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.2109375, -11.850830078125, -11.49072265625, -11.130615234375, -10.7705078125, -10.410400390625, -10.05029296875, -9.690185546875, -9.330078125, -8.969970703125, -8.60986328125, -8.249755859375, -7.8896484375, -7.529541015625, -7.16943359375, -6.809326171875, -6.44921875, -6.089111328125, -5.72900390625, -5.368896484375, -5.0087890625, -4.648681640625, -4.28857421875, -3.928466796875, -3.568359375, -3.208251953125, -2.84814453125, -2.488037109375, -2.1279296875, -1.767822265625, -1.40771484375, -1.047607421875, -0.6875, -0.327392578125, 0.03271484375, 0.392822265625, 0.7529296875, 1.113037109375, 1.47314453125, 1.833251953125, 2.193359375, 2.553466796875, 2.91357421875, 3.273681640625, 3.6337890625, 3.993896484375, 4.35400390625, 4.714111328125, 5.07421875, 5.434326171875, 5.79443359375, 6.154541015625, 6.5146484375, 6.874755859375, 7.23486328125, 7.594970703125, 7.955078125, 8.315185546875, 8.67529296875, 9.035400390625, 9.3955078125, 9.755615234375, 10.11572265625, 10.475830078125, 10.8359375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 6.0, 2.0, 4.0, 4.0, 6.0, 9.0, 14.0, 13.0, 11.0, 24.0, 22.0, 28.0, 22.0, 27.0, 25.0, 36.0, 21.0, 35.0, 35.0, 45.0, 35.0, 30.0, 42.0, 44.0, 29.0, 28.0, 32.0, 33.0, 38.0, 42.0, 19.0, 28.0, 17.0, 29.0, 19.0, 20.0, 19.0, 13.0, 22.0, 10.0, 9.0, 15.0, 11.0, 7.0, 6.0, 5.0, 5.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-12.09375, -11.7308349609375, -11.367919921875, -11.0050048828125, -10.64208984375, -10.2791748046875, -9.916259765625, -9.5533447265625, -9.1904296875, -8.8275146484375, -8.464599609375, -8.1016845703125, -7.73876953125, -7.3758544921875, -7.012939453125, -6.6500244140625, -6.287109375, -5.9241943359375, -5.561279296875, -5.1983642578125, -4.83544921875, -4.4725341796875, -4.109619140625, -3.7467041015625, -3.3837890625, -3.0208740234375, -2.657958984375, -2.2950439453125, -1.93212890625, -1.5692138671875, -1.206298828125, -0.8433837890625, -0.48046875, -0.1175537109375, 0.245361328125, 0.6082763671875, 0.97119140625, 1.3341064453125, 1.697021484375, 2.0599365234375, 2.4228515625, 2.7857666015625, 3.148681640625, 3.5115966796875, 3.87451171875, 4.2374267578125, 4.600341796875, 4.9632568359375, 5.326171875, 5.6890869140625, 6.052001953125, 6.4149169921875, 6.77783203125, 7.1407470703125, 7.503662109375, 7.8665771484375, 8.2294921875, 8.5924072265625, 8.955322265625, 9.3182373046875, 9.68115234375, 10.0440673828125, 10.406982421875, 10.7698974609375, 11.1328125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 4.0, 8.0, 13.0, 33.0, 53.0, 79.0, 157.0, 264.0, 524.0, 947.0, 1673.0, 2978.0, 5076.0, 8819.0, 14937.0, 24682.0, 39491.0, 61853.0, 93678.0, 135445.0, 189347.0, 248826.0, 311837.0, 365434.0, 404651.0, 416190.0, 403465.0, 360874.0, 305242.0, 242713.0, 181805.0, 130563.0, 89286.0, 58844.0, 37881.0, 23448.0, 13999.0, 8115.0, 4836.0, 2728.0, 1515.0, 873.0, 488.0, 274.0, 155.0, 82.0, 48.0, 28.0, 16.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.03125, -11.6715087890625, -11.311767578125, -10.9520263671875, -10.59228515625, -10.2325439453125, -9.872802734375, -9.5130615234375, -9.1533203125, -8.7935791015625, -8.433837890625, -8.0740966796875, -7.71435546875, -7.3546142578125, -6.994873046875, -6.6351318359375, -6.275390625, -5.9156494140625, -5.555908203125, -5.1961669921875, -4.83642578125, -4.4766845703125, -4.116943359375, -3.7572021484375, -3.3974609375, -3.0377197265625, -2.677978515625, -2.3182373046875, -1.95849609375, -1.5987548828125, -1.239013671875, -0.8792724609375, -0.51953125, -0.1597900390625, 0.199951171875, 0.5596923828125, 0.91943359375, 1.2791748046875, 1.638916015625, 1.9986572265625, 2.3583984375, 2.7181396484375, 3.077880859375, 3.4376220703125, 3.79736328125, 4.1571044921875, 4.516845703125, 4.8765869140625, 5.236328125, 5.5960693359375, 5.955810546875, 6.3155517578125, 6.67529296875, 7.0350341796875, 7.394775390625, 7.7545166015625, 8.1142578125, 8.4739990234375, 8.833740234375, 9.1934814453125, 9.55322265625, 9.9129638671875, 10.272705078125, 10.6324462890625, 10.9921875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 4.0, 10.0, 17.0, 20.0, 9.0, 18.0, 33.0, 32.0, 49.0, 49.0, 50.0, 74.0, 88.0, 116.0, 111.0, 121.0, 149.0, 144.0, 169.0, 185.0, 209.0, 186.0, 205.0, 208.0, 208.0, 207.0, 198.0, 179.0, 155.0, 162.0, 132.0, 101.0, 80.0, 83.0, 68.0, 59.0, 46.0, 30.0, 18.0, 21.0, 23.0, 15.0, 11.0, 4.0, 8.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.6953125, -6.4876708984375, -6.280029296875, -6.0723876953125, -5.86474609375, -5.6571044921875, -5.449462890625, -5.2418212890625, -5.0341796875, -4.8265380859375, -4.618896484375, -4.4112548828125, -4.20361328125, -3.9959716796875, -3.788330078125, -3.5806884765625, -3.373046875, -3.1654052734375, -2.957763671875, -2.7501220703125, -2.54248046875, -2.3348388671875, -2.127197265625, -1.9195556640625, -1.7119140625, -1.5042724609375, -1.296630859375, -1.0889892578125, -0.88134765625, -0.6737060546875, -0.466064453125, -0.2584228515625, -0.05078125, 0.1568603515625, 0.364501953125, 0.5721435546875, 0.77978515625, 0.9874267578125, 1.195068359375, 1.4027099609375, 1.6103515625, 1.8179931640625, 2.025634765625, 2.2332763671875, 2.44091796875, 2.6485595703125, 2.856201171875, 3.0638427734375, 3.271484375, 3.4791259765625, 3.686767578125, 3.8944091796875, 4.10205078125, 4.3096923828125, 4.517333984375, 4.7249755859375, 4.9326171875, 5.1402587890625, 5.347900390625, 5.5555419921875, 5.76318359375, 5.9708251953125, 6.178466796875, 6.3861083984375, 6.59375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 5.0, 8.0, 6.0, 10.0, 12.0, 12.0, 12.0, 14.0, 21.0, 27.0, 26.0, 27.0, 30.0, 26.0, 35.0, 32.0, 52.0, 44.0, 45.0, 28.0, 45.0, 45.0, 50.0, 47.0, 37.0, 44.0, 37.0, 25.0, 32.0, 26.0, 20.0, 22.0, 7.0, 19.0, 17.0, 13.0, 12.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.535197257995605, -14.042600631713867, -13.550004959106445, -13.057408332824707, -12.564811706542969, -12.07221508026123, -11.579618453979492, -11.08702278137207, -10.594426155090332, -10.101829528808594, -9.609233856201172, -9.116637229919434, -8.624040603637695, -8.131443977355957, -7.638847827911377, -7.146251678466797, -6.653655052185059, -6.16105842590332, -5.66846227645874, -5.17586612701416, -4.683269500732422, -4.190672874450684, -3.6980767250061035, -3.2054803371429443, -2.712883949279785, -2.220287561416626, -1.7276911735534668, -1.2350947856903076, -0.7424983978271484, -0.24990200996398926, 0.24269437789916992, 0.7352907657623291, 1.2278881072998047, 1.7204844951629639, 2.213080883026123, 2.7056772708892822, 3.1982736587524414, 3.6908700466156006, 4.18346643447876, 4.67606258392334, 5.168659210205078, 5.661255836486816, 6.1538519859313965, 6.646448135375977, 7.139044761657715, 7.631641387939453, 8.124237060546875, 8.616833686828613, 9.109430313110352, 9.60202693939209, 10.094623565673828, 10.58721923828125, 11.079815864562988, 11.572412490844727, 12.065008163452148, 12.557604789733887, 13.050201416015625, 13.542798042297363, 14.035394668579102, 14.527990341186523, 15.020586967468262, 15.51318359375, 16.005779266357422, 16.498376846313477, 16.9909725189209]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 7.0, 6.0, 8.0, 13.0, 12.0, 10.0, 9.0, 17.0, 18.0, 18.0, 20.0, 20.0, 29.0, 29.0, 32.0, 24.0, 24.0, 30.0, 32.0, 38.0, 35.0, 35.0, 38.0, 32.0, 43.0, 28.0, 36.0, 27.0, 35.0, 20.0, 29.0, 25.0, 26.0, 21.0, 30.0, 22.0, 18.0, 18.0, 13.0, 13.0, 10.0, 11.0, 11.0, 8.0, 6.0, 6.0, 4.0, 2.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0], "bins": [-16.54274559020996, -16.04191017150879, -15.541075706481934, -15.040241241455078, -14.539405822753906, -14.03857135772705, -13.537736892700195, -13.036901473999023, -12.536067008972168, -12.035232543945312, -11.53439712524414, -11.033562660217285, -10.53272819519043, -10.031892776489258, -9.531058311462402, -9.030223846435547, -8.529388427734375, -8.02855396270752, -7.527718544006348, -7.026884078979492, -6.5260491371154785, -6.025214195251465, -5.524379730224609, -5.023544788360596, -4.522709846496582, -4.021874904632568, -3.521040201187134, -3.020205497741699, -2.5193705558776855, -2.018535614013672, -1.5177009105682373, -1.0168662071228027, -0.5160312652587891, -0.015196442604064941, 0.4856383800506592, 0.9864732027053833, 1.4873080253601074, 1.988142967224121, 2.4889776706695557, 2.9898123741149902, 3.490647315979004, 3.9914822578430176, 4.492317199707031, 4.993151664733887, 5.4939866065979, 5.994821548461914, 6.4956560134887695, 6.996490955352783, 7.497325897216797, 7.9981608390808105, 8.498995780944824, 8.99983024597168, 9.500665664672852, 10.001500129699707, 10.502334594726562, 11.003170013427734, 11.50400447845459, 12.004838943481445, 12.505674362182617, 13.006508827209473, 13.507343292236328, 14.0081787109375, 14.509013175964355, 15.009847640991211, 15.510683059692383]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 7.0, 9.0, 15.0, 13.0, 18.0, 38.0, 50.0, 52.0, 78.0, 128.0, 200.0, 269.0, 410.0, 638.0, 1074.0, 1580.0, 2467.0, 4077.0, 7199.0, 12401.0, 22537.0, 42377.0, 79991.0, 145070.0, 219320.0, 210387.0, 135248.0, 74510.0, 38917.0, 20601.0, 11618.0, 6508.0, 4084.0, 2399.0, 1519.0, 934.0, 604.0, 411.0, 238.0, 172.0, 136.0, 71.0, 60.0, 43.0, 30.0, 14.0, 16.0, 9.0, 5.0, 6.0, 1.0, 4.0, 2.0, 1.0, 2.0], "bins": [-9.7890625, -9.5006103515625, -9.212158203125, -8.9237060546875, -8.63525390625, -8.3468017578125, -8.058349609375, -7.7698974609375, -7.4814453125, -7.1929931640625, -6.904541015625, -6.6160888671875, -6.32763671875, -6.0391845703125, -5.750732421875, -5.4622802734375, -5.173828125, -4.8853759765625, -4.596923828125, -4.3084716796875, -4.02001953125, -3.7315673828125, -3.443115234375, -3.1546630859375, -2.8662109375, -2.5777587890625, -2.289306640625, -2.0008544921875, -1.71240234375, -1.4239501953125, -1.135498046875, -0.8470458984375, -0.55859375, -0.2701416015625, 0.018310546875, 0.3067626953125, 0.59521484375, 0.8836669921875, 1.172119140625, 1.4605712890625, 1.7490234375, 2.0374755859375, 2.325927734375, 2.6143798828125, 2.90283203125, 3.1912841796875, 3.479736328125, 3.7681884765625, 4.056640625, 4.3450927734375, 4.633544921875, 4.9219970703125, 5.21044921875, 5.4989013671875, 5.787353515625, 6.0758056640625, 6.3642578125, 6.6527099609375, 6.941162109375, 7.2296142578125, 7.51806640625, 7.8065185546875, 8.094970703125, 8.3834228515625, 8.671875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 8.0, 12.0, 14.0, 10.0, 9.0, 17.0, 15.0, 20.0, 19.0, 23.0, 29.0, 25.0, 33.0, 23.0, 26.0, 29.0, 38.0, 32.0, 34.0, 35.0, 41.0, 33.0, 38.0, 32.0, 35.0, 26.0, 37.0, 24.0, 23.0, 27.0, 25.0, 23.0, 31.0, 21.0, 11.0, 24.0, 14.0, 14.0, 8.0, 8.0, 12.0, 9.0, 6.0, 6.0, 4.0, 1.0, 7.0, 1.0, 3.0, 4.0, 1.0, 2.0], "bins": [-16.59375, -16.0946044921875, -15.595458984375, -15.0963134765625, -14.59716796875, -14.0980224609375, -13.598876953125, -13.0997314453125, -12.6005859375, -12.1014404296875, -11.602294921875, -11.1031494140625, -10.60400390625, -10.1048583984375, -9.605712890625, -9.1065673828125, -8.607421875, -8.1082763671875, -7.609130859375, -7.1099853515625, -6.61083984375, -6.1116943359375, -5.612548828125, -5.1134033203125, -4.6142578125, -4.1151123046875, -3.615966796875, -3.1168212890625, -2.61767578125, -2.1185302734375, -1.619384765625, -1.1202392578125, -0.62109375, -0.1219482421875, 0.377197265625, 0.8763427734375, 1.37548828125, 1.8746337890625, 2.373779296875, 2.8729248046875, 3.3720703125, 3.8712158203125, 4.370361328125, 4.8695068359375, 5.36865234375, 5.8677978515625, 6.366943359375, 6.8660888671875, 7.365234375, 7.8643798828125, 8.363525390625, 8.8626708984375, 9.36181640625, 9.8609619140625, 10.360107421875, 10.8592529296875, 11.3583984375, 11.8575439453125, 12.356689453125, 12.8558349609375, 13.35498046875, 13.8541259765625, 14.353271484375, 14.8524169921875, 15.3515625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 6.0, 6.0, 14.0, 16.0, 19.0, 22.0, 28.0, 40.0, 72.0, 71.0, 111.0, 183.0, 289.0, 420.0, 670.0, 1194.0, 2257.0, 4695.0, 11472.0, 37253.0, 181611.0, 580848.0, 170639.0, 35571.0, 11212.0, 4598.0, 2186.0, 1187.0, 639.0, 369.0, 277.0, 150.0, 116.0, 83.0, 59.0, 38.0, 30.0, 37.0, 15.0, 15.0, 6.0, 6.0, 4.0, 7.0, 4.0, 1.0, 2.0, 0.0, 3.0], "bins": [-20.0, -19.4517822265625, -18.903564453125, -18.3553466796875, -17.80712890625, -17.2589111328125, -16.710693359375, -16.1624755859375, -15.6142578125, -15.0660400390625, -14.517822265625, -13.9696044921875, -13.42138671875, -12.8731689453125, -12.324951171875, -11.7767333984375, -11.228515625, -10.6802978515625, -10.132080078125, -9.5838623046875, -9.03564453125, -8.4874267578125, -7.939208984375, -7.3909912109375, -6.8427734375, -6.2945556640625, -5.746337890625, -5.1981201171875, -4.64990234375, -4.1016845703125, -3.553466796875, -3.0052490234375, -2.45703125, -1.9088134765625, -1.360595703125, -0.8123779296875, -0.26416015625, 0.2840576171875, 0.832275390625, 1.3804931640625, 1.9287109375, 2.4769287109375, 3.025146484375, 3.5733642578125, 4.12158203125, 4.6697998046875, 5.218017578125, 5.7662353515625, 6.314453125, 6.8626708984375, 7.410888671875, 7.9591064453125, 8.50732421875, 9.0555419921875, 9.603759765625, 10.1519775390625, 10.7001953125, 11.2484130859375, 11.796630859375, 12.3448486328125, 12.89306640625, 13.4412841796875, 13.989501953125, 14.5377197265625, 15.0859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 8.0, 4.0, 7.0, 6.0, 10.0, 8.0, 9.0, 11.0, 17.0, 10.0, 13.0, 12.0, 22.0, 18.0, 23.0, 23.0, 25.0, 35.0, 23.0, 31.0, 36.0, 33.0, 40.0, 28.0, 38.0, 44.0, 35.0, 30.0, 31.0, 36.0, 30.0, 30.0, 22.0, 22.0, 31.0, 18.0, 20.0, 15.0, 18.0, 21.0, 17.0, 15.0, 12.0, 11.0, 16.0, 12.0, 3.0, 3.0, 10.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-10.4375, -10.100341796875, -9.76318359375, -9.426025390625, -9.0888671875, -8.751708984375, -8.41455078125, -8.077392578125, -7.740234375, -7.403076171875, -7.06591796875, -6.728759765625, -6.3916015625, -6.054443359375, -5.71728515625, -5.380126953125, -5.04296875, -4.705810546875, -4.36865234375, -4.031494140625, -3.6943359375, -3.357177734375, -3.02001953125, -2.682861328125, -2.345703125, -2.008544921875, -1.67138671875, -1.334228515625, -0.9970703125, -0.659912109375, -0.32275390625, 0.014404296875, 0.3515625, 0.688720703125, 1.02587890625, 1.363037109375, 1.7001953125, 2.037353515625, 2.37451171875, 2.711669921875, 3.048828125, 3.385986328125, 3.72314453125, 4.060302734375, 4.3974609375, 4.734619140625, 5.07177734375, 5.408935546875, 5.74609375, 6.083251953125, 6.42041015625, 6.757568359375, 7.0947265625, 7.431884765625, 7.76904296875, 8.106201171875, 8.443359375, 8.780517578125, 9.11767578125, 9.454833984375, 9.7919921875, 10.129150390625, 10.46630859375, 10.803466796875, 11.140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 9.0, 6.0, 10.0, 4.0, 11.0, 26.0, 26.0, 36.0, 52.0, 72.0, 97.0, 144.0, 229.0, 347.0, 583.0, 875.0, 1691.0, 3193.0, 7176.0, 22831.0, 261852.0, 691011.0, 39716.0, 9680.0, 3986.0, 1947.0, 1092.0, 638.0, 406.0, 265.0, 171.0, 98.0, 99.0, 52.0, 38.0, 32.0, 15.0, 13.0, 7.0, 8.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.25, -22.588623046875, -21.92724609375, -21.265869140625, -20.6044921875, -19.943115234375, -19.28173828125, -18.620361328125, -17.958984375, -17.297607421875, -16.63623046875, -15.974853515625, -15.3134765625, -14.652099609375, -13.99072265625, -13.329345703125, -12.66796875, -12.006591796875, -11.34521484375, -10.683837890625, -10.0224609375, -9.361083984375, -8.69970703125, -8.038330078125, -7.376953125, -6.715576171875, -6.05419921875, -5.392822265625, -4.7314453125, -4.070068359375, -3.40869140625, -2.747314453125, -2.0859375, -1.424560546875, -0.76318359375, -0.101806640625, 0.5595703125, 1.220947265625, 1.88232421875, 2.543701171875, 3.205078125, 3.866455078125, 4.52783203125, 5.189208984375, 5.8505859375, 6.511962890625, 7.17333984375, 7.834716796875, 8.49609375, 9.157470703125, 9.81884765625, 10.480224609375, 11.1416015625, 11.802978515625, 12.46435546875, 13.125732421875, 13.787109375, 14.448486328125, 15.10986328125, 15.771240234375, 16.4326171875, 17.093994140625, 17.75537109375, 18.416748046875, 19.078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 4.0, 12.0, 10.0, 27.0, 48.0, 86.0, 168.0, 201.0, 167.0, 123.0, 40.0, 34.0, 18.0, 8.0, 8.0, 3.0, 5.0, 3.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000995635986328125, -0.0009631365537643433, -0.0009306371212005615, -0.0008981376886367798, -0.000865638256072998, -0.0008331388235092163, -0.0008006393909454346, -0.0007681399583816528, -0.0007356405258178711, -0.0007031410932540894, -0.0006706416606903076, -0.0006381422281265259, -0.0006056427955627441, -0.0005731433629989624, -0.0005406439304351807, -0.0005081444978713989, -0.0004756450653076172, -0.00044314563274383545, -0.0004106462001800537, -0.00037814676761627197, -0.00034564733505249023, -0.0003131479024887085, -0.00028064846992492676, -0.000248149037361145, -0.00021564960479736328, -0.00018315017223358154, -0.0001506507396697998, -0.00011815130710601807, -8.565187454223633e-05, -5.315244197845459e-05, -2.065300941467285e-05, 1.1846423149108887e-05, 4.4345855712890625e-05, 7.684528827667236e-05, 0.0001093447208404541, 0.00014184415340423584, 0.00017434358596801758, 0.00020684301853179932, 0.00023934245109558105, 0.0002718418836593628, 0.00030434131622314453, 0.00033684074878692627, 0.000369340181350708, 0.00040183961391448975, 0.0004343390464782715, 0.0004668384790420532, 0.000499337911605835, 0.0005318373441696167, 0.0005643367767333984, 0.0005968362092971802, 0.0006293356418609619, 0.0006618350744247437, 0.0006943345069885254, 0.0007268339395523071, 0.0007593333721160889, 0.0007918328046798706, 0.0008243322372436523, 0.0008568316698074341, 0.0008893311023712158, 0.0009218305349349976, 0.0009543299674987793, 0.000986829400062561, 0.0010193288326263428, 0.0010518282651901245, 0.0010843276977539062]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 9.0, 8.0, 14.0, 16.0, 22.0, 31.0, 45.0, 71.0, 81.0, 115.0, 167.0, 218.0, 373.0, 502.0, 818.0, 1324.0, 2186.0, 4026.0, 8295.0, 21131.0, 79353.0, 384830.0, 414247.0, 88957.0, 22440.0, 8819.0, 4297.0, 2243.0, 1398.0, 834.0, 492.0, 356.0, 246.0, 174.0, 106.0, 86.0, 70.0, 48.0, 30.0, 26.0, 10.0, 17.0, 7.0, 4.0, 7.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-20.265625, -19.670166015625, -19.07470703125, -18.479248046875, -17.8837890625, -17.288330078125, -16.69287109375, -16.097412109375, -15.501953125, -14.906494140625, -14.31103515625, -13.715576171875, -13.1201171875, -12.524658203125, -11.92919921875, -11.333740234375, -10.73828125, -10.142822265625, -9.54736328125, -8.951904296875, -8.3564453125, -7.760986328125, -7.16552734375, -6.570068359375, -5.974609375, -5.379150390625, -4.78369140625, -4.188232421875, -3.5927734375, -2.997314453125, -2.40185546875, -1.806396484375, -1.2109375, -0.615478515625, -0.02001953125, 0.575439453125, 1.1708984375, 1.766357421875, 2.36181640625, 2.957275390625, 3.552734375, 4.148193359375, 4.74365234375, 5.339111328125, 5.9345703125, 6.530029296875, 7.12548828125, 7.720947265625, 8.31640625, 8.911865234375, 9.50732421875, 10.102783203125, 10.6982421875, 11.293701171875, 11.88916015625, 12.484619140625, 13.080078125, 13.675537109375, 14.27099609375, 14.866455078125, 15.4619140625, 16.057373046875, 16.65283203125, 17.248291015625, 17.84375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 5.0, 10.0, 11.0, 14.0, 22.0, 33.0, 65.0, 60.0, 89.0, 77.0, 100.0, 92.0, 83.0, 78.0, 52.0, 38.0, 47.0, 42.0, 24.0, 12.0, 10.0, 4.0, 9.0, 5.0, 3.0, 0.0, 0.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.853515625, -3.716033935546875, -3.57855224609375, -3.441070556640625, -3.3035888671875, -3.166107177734375, -3.02862548828125, -2.891143798828125, -2.753662109375, -2.616180419921875, -2.47869873046875, -2.341217041015625, -2.2037353515625, -2.066253662109375, -1.92877197265625, -1.791290283203125, -1.65380859375, -1.516326904296875, -1.37884521484375, -1.241363525390625, -1.1038818359375, -0.966400146484375, -0.82891845703125, -0.691436767578125, -0.553955078125, -0.416473388671875, -0.27899169921875, -0.141510009765625, -0.0040283203125, 0.133453369140625, 0.27093505859375, 0.408416748046875, 0.5458984375, 0.683380126953125, 0.82086181640625, 0.958343505859375, 1.0958251953125, 1.233306884765625, 1.37078857421875, 1.508270263671875, 1.645751953125, 1.783233642578125, 1.92071533203125, 2.058197021484375, 2.1956787109375, 2.333160400390625, 2.47064208984375, 2.608123779296875, 2.74560546875, 2.883087158203125, 3.02056884765625, 3.158050537109375, 3.2955322265625, 3.433013916015625, 3.57049560546875, 3.707977294921875, 3.845458984375, 3.982940673828125, 4.12042236328125, 4.257904052734375, 4.3953857421875, 4.532867431640625, 4.67034912109375, 4.807830810546875, 4.9453125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 6.0, 11.0, 9.0, 12.0, 8.0, 19.0, 20.0, 18.0, 31.0, 24.0, 30.0, 26.0, 46.0, 32.0, 24.0, 48.0, 36.0, 35.0, 52.0, 51.0, 43.0, 44.0, 43.0, 39.0, 48.0, 33.0, 20.0, 26.0, 25.0, 20.0, 18.0, 10.0, 15.0, 14.0, 15.0, 11.0, 9.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.332239151000977, -13.833210945129395, -13.334181785583496, -12.835153579711914, -12.336125373840332, -11.83709716796875, -11.338068008422852, -10.83903980255127, -10.340011596679688, -9.840983390808105, -9.341954231262207, -8.842926025390625, -8.343897819519043, -7.844869136810303, -7.3458404541015625, -6.8468122482299805, -6.34778356552124, -5.8487548828125, -5.349726676940918, -4.850697994232178, -4.351669788360596, -3.8526411056518555, -3.3536126613616943, -2.854584217071533, -2.355555772781372, -1.856527328491211, -1.3574988842010498, -0.8584703207015991, -0.359441876411438, 0.1395866870880127, 0.6386151313781738, 1.137643575668335, 1.636672019958496, 2.1357004642486572, 2.6347289085388184, 3.1337575912475586, 3.6327857971191406, 4.131814479827881, 4.630843162536621, 5.129871368408203, 5.628899574279785, 6.127928256988525, 6.626956462860107, 7.125985145568848, 7.62501335144043, 8.124042510986328, 8.62307071685791, 9.122098922729492, 9.62112808227539, 10.120156288146973, 10.619185447692871, 11.118213653564453, 11.617241859436035, 12.116270065307617, 12.615299224853516, 13.114327430725098, 13.61335563659668, 14.112383842468262, 14.61141300201416, 15.110441207885742, 15.609469413757324, 16.108497619628906, 16.607526779174805, 17.106555938720703, 17.60558319091797]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 8.0, 12.0, 13.0, 8.0, 17.0, 9.0, 13.0, 15.0, 18.0, 24.0, 22.0, 24.0, 36.0, 29.0, 25.0, 32.0, 33.0, 29.0, 24.0, 31.0, 41.0, 32.0, 35.0, 42.0, 34.0, 20.0, 32.0, 30.0, 34.0, 26.0, 12.0, 25.0, 30.0, 22.0, 27.0, 21.0, 15.0, 16.0, 13.0, 12.0, 15.0, 8.0, 7.0, 6.0, 6.0, 4.0, 5.0, 2.0, 5.0, 4.0, 0.0, 4.0, 0.0, 2.0], "bins": [-16.49007225036621, -15.979050636291504, -15.46802806854248, -14.957006454467773, -14.445984840393066, -13.93496322631836, -13.423940658569336, -12.912919044494629, -12.401897430419922, -11.890875816345215, -11.379853248596191, -10.868831634521484, -10.357810020446777, -9.84678840637207, -9.335765838623047, -8.82474422454834, -8.313721656799316, -7.802699565887451, -7.291677951812744, -6.780655860900879, -6.269634246826172, -5.758612155914307, -5.247590065002441, -4.736568450927734, -4.225546360015869, -3.714524507522583, -3.203502655029297, -2.6924805641174316, -2.1814587116241455, -1.6704368591308594, -1.1594147682189941, -0.648392915725708, -0.13737106323242188, 0.37365084886550903, 0.8846727609634399, 1.3956947326660156, 1.9067165851593018, 2.417738437652588, 2.928760528564453, 3.4397823810577393, 3.9508042335510254, 4.461826324462891, 4.972847938537598, 5.483870029449463, 5.994892120361328, 6.505913734436035, 7.0169358253479, 7.527957916259766, 8.038979530334473, 8.55000114440918, 9.061023712158203, 9.57204532623291, 10.083066940307617, 10.59408950805664, 11.105111122131348, 11.616132736206055, 12.127155303955078, 12.638176918029785, 13.149199485778809, 13.660221099853516, 14.171242713928223, 14.68226432800293, 15.193286895751953, 15.70430850982666, 16.215330123901367]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 4.0, 14.0, 23.0, 43.0, 59.0, 87.0, 143.0, 223.0, 336.0, 494.0, 744.0, 1182.0, 1720.0, 2519.0, 3746.0, 5408.0, 7471.0, 10649.0, 14310.0, 19300.0, 25787.0, 33064.0, 41395.0, 49880.0, 58735.0, 66540.0, 72980.0, 77878.0, 78255.0, 76297.0, 71709.0, 65292.0, 56526.0, 47875.0, 39175.0, 31225.0, 23904.0, 18195.0, 13379.0, 9742.0, 7009.0, 4864.0, 3438.0, 2360.0, 1565.0, 1066.0, 710.0, 432.0, 313.0, 207.0, 127.0, 72.0, 33.0, 27.0, 17.0, 7.0, 10.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.09375, -8.803955078125, -8.51416015625, -8.224365234375, -7.9345703125, -7.644775390625, -7.35498046875, -7.065185546875, -6.775390625, -6.485595703125, -6.19580078125, -5.906005859375, -5.6162109375, -5.326416015625, -5.03662109375, -4.746826171875, -4.45703125, -4.167236328125, -3.87744140625, -3.587646484375, -3.2978515625, -3.008056640625, -2.71826171875, -2.428466796875, -2.138671875, -1.848876953125, -1.55908203125, -1.269287109375, -0.9794921875, -0.689697265625, -0.39990234375, -0.110107421875, 0.1796875, 0.469482421875, 0.75927734375, 1.049072265625, 1.3388671875, 1.628662109375, 1.91845703125, 2.208251953125, 2.498046875, 2.787841796875, 3.07763671875, 3.367431640625, 3.6572265625, 3.947021484375, 4.23681640625, 4.526611328125, 4.81640625, 5.106201171875, 5.39599609375, 5.685791015625, 5.9755859375, 6.265380859375, 6.55517578125, 6.844970703125, 7.134765625, 7.424560546875, 7.71435546875, 8.004150390625, 8.2939453125, 8.583740234375, 8.87353515625, 9.163330078125, 9.453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 3.0, 4.0, 10.0, 12.0, 11.0, 11.0, 13.0, 12.0, 12.0, 16.0, 21.0, 21.0, 26.0, 23.0, 40.0, 23.0, 27.0, 39.0, 25.0, 28.0, 27.0, 37.0, 35.0, 33.0, 32.0, 44.0, 29.0, 22.0, 33.0, 30.0, 35.0, 23.0, 12.0, 31.0, 28.0, 18.0, 27.0, 25.0, 10.0, 16.0, 12.0, 13.0, 15.0, 6.0, 8.0, 6.0, 6.0, 2.0, 6.0, 3.0, 4.0, 4.0, 0.0, 4.0, 0.0, 2.0], "bins": [-16.15625, -15.65234375, -15.1484375, -14.64453125, -14.140625, -13.63671875, -13.1328125, -12.62890625, -12.125, -11.62109375, -11.1171875, -10.61328125, -10.109375, -9.60546875, -9.1015625, -8.59765625, -8.09375, -7.58984375, -7.0859375, -6.58203125, -6.078125, -5.57421875, -5.0703125, -4.56640625, -4.0625, -3.55859375, -3.0546875, -2.55078125, -2.046875, -1.54296875, -1.0390625, -0.53515625, -0.03125, 0.47265625, 0.9765625, 1.48046875, 1.984375, 2.48828125, 2.9921875, 3.49609375, 4.0, 4.50390625, 5.0078125, 5.51171875, 6.015625, 6.51953125, 7.0234375, 7.52734375, 8.03125, 8.53515625, 9.0390625, 9.54296875, 10.046875, 10.55078125, 11.0546875, 11.55859375, 12.0625, 12.56640625, 13.0703125, 13.57421875, 14.078125, 14.58203125, 15.0859375, 15.58984375, 16.09375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 8.0, 19.0, 22.0, 28.0, 65.0, 88.0, 150.0, 198.0, 345.0, 505.0, 713.0, 1195.0, 1767.0, 2708.0, 4057.0, 6352.0, 9258.0, 13982.0, 19858.0, 28730.0, 40123.0, 53113.0, 67367.0, 81310.0, 92579.0, 99245.0, 98957.0, 92847.0, 81286.0, 67524.0, 53112.0, 40236.0, 28939.0, 20355.0, 13831.0, 9471.0, 6298.0, 4060.0, 2734.0, 1743.0, 1175.0, 800.0, 493.0, 324.0, 188.0, 147.0, 84.0, 39.0, 49.0, 29.0, 11.0, 18.0, 9.0, 5.0, 2.0, 4.0], "bins": [-13.96875, -13.5579833984375, -13.147216796875, -12.7364501953125, -12.32568359375, -11.9149169921875, -11.504150390625, -11.0933837890625, -10.6826171875, -10.2718505859375, -9.861083984375, -9.4503173828125, -9.03955078125, -8.6287841796875, -8.218017578125, -7.8072509765625, -7.396484375, -6.9857177734375, -6.574951171875, -6.1641845703125, -5.75341796875, -5.3426513671875, -4.931884765625, -4.5211181640625, -4.1103515625, -3.6995849609375, -3.288818359375, -2.8780517578125, -2.46728515625, -2.0565185546875, -1.645751953125, -1.2349853515625, -0.82421875, -0.4134521484375, -0.002685546875, 0.4080810546875, 0.81884765625, 1.2296142578125, 1.640380859375, 2.0511474609375, 2.4619140625, 2.8726806640625, 3.283447265625, 3.6942138671875, 4.10498046875, 4.5157470703125, 4.926513671875, 5.3372802734375, 5.748046875, 6.1588134765625, 6.569580078125, 6.9803466796875, 7.39111328125, 7.8018798828125, 8.212646484375, 8.6234130859375, 9.0341796875, 9.4449462890625, 9.855712890625, 10.2664794921875, 10.67724609375, 11.0880126953125, 11.498779296875, 11.9095458984375, 12.3203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 6.0, 4.0, 12.0, 14.0, 15.0, 11.0, 18.0, 20.0, 18.0, 33.0, 27.0, 22.0, 41.0, 33.0, 37.0, 42.0, 37.0, 38.0, 34.0, 48.0, 29.0, 41.0, 30.0, 44.0, 39.0, 27.0, 37.0, 42.0, 25.0, 23.0, 20.0, 18.0, 20.0, 18.0, 11.0, 12.0, 14.0, 8.0, 4.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-14.3984375, -13.9503173828125, -13.502197265625, -13.0540771484375, -12.60595703125, -12.1578369140625, -11.709716796875, -11.2615966796875, -10.8134765625, -10.3653564453125, -9.917236328125, -9.4691162109375, -9.02099609375, -8.5728759765625, -8.124755859375, -7.6766357421875, -7.228515625, -6.7803955078125, -6.332275390625, -5.8841552734375, -5.43603515625, -4.9879150390625, -4.539794921875, -4.0916748046875, -3.6435546875, -3.1954345703125, -2.747314453125, -2.2991943359375, -1.85107421875, -1.4029541015625, -0.954833984375, -0.5067138671875, -0.05859375, 0.3895263671875, 0.837646484375, 1.2857666015625, 1.73388671875, 2.1820068359375, 2.630126953125, 3.0782470703125, 3.5263671875, 3.9744873046875, 4.422607421875, 4.8707275390625, 5.31884765625, 5.7669677734375, 6.215087890625, 6.6632080078125, 7.111328125, 7.5594482421875, 8.007568359375, 8.4556884765625, 8.90380859375, 9.3519287109375, 9.800048828125, 10.2481689453125, 10.6962890625, 11.1444091796875, 11.592529296875, 12.0406494140625, 12.48876953125, 12.9368896484375, 13.385009765625, 13.8331298828125, 14.28125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 10.0, 16.0, 26.0, 30.0, 52.0, 87.0, 113.0, 179.0, 250.0, 449.0, 566.0, 949.0, 1354.0, 1997.0, 3136.0, 4785.0, 6816.0, 10473.0, 16263.0, 23960.0, 35128.0, 49664.0, 67878.0, 86519.0, 102946.0, 112893.0, 112050.0, 102609.0, 85785.0, 67478.0, 49373.0, 34441.0, 23681.0, 15624.0, 10444.0, 6917.0, 4544.0, 2982.0, 2011.0, 1355.0, 898.0, 611.0, 391.0, 268.0, 204.0, 106.0, 70.0, 56.0, 41.0, 26.0, 22.0, 13.0, 3.0, 3.0, 4.0, 4.0, 1.0], "bins": [-5.58203125, -5.41278076171875, -5.2435302734375, -5.07427978515625, -4.905029296875, -4.73577880859375, -4.5665283203125, -4.39727783203125, -4.22802734375, -4.05877685546875, -3.8895263671875, -3.72027587890625, -3.551025390625, -3.38177490234375, -3.2125244140625, -3.04327392578125, -2.8740234375, -2.70477294921875, -2.5355224609375, -2.36627197265625, -2.197021484375, -2.02777099609375, -1.8585205078125, -1.68927001953125, -1.52001953125, -1.35076904296875, -1.1815185546875, -1.01226806640625, -0.843017578125, -0.67376708984375, -0.5045166015625, -0.33526611328125, -0.166015625, 0.00323486328125, 0.1724853515625, 0.34173583984375, 0.510986328125, 0.68023681640625, 0.8494873046875, 1.01873779296875, 1.18798828125, 1.35723876953125, 1.5264892578125, 1.69573974609375, 1.864990234375, 2.03424072265625, 2.2034912109375, 2.37274169921875, 2.5419921875, 2.71124267578125, 2.8804931640625, 3.04974365234375, 3.218994140625, 3.38824462890625, 3.5574951171875, 3.72674560546875, 3.89599609375, 4.06524658203125, 4.2344970703125, 4.40374755859375, 4.572998046875, 4.74224853515625, 4.9114990234375, 5.08074951171875, 5.25]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 5.0, 13.0, 6.0, 10.0, 19.0, 15.0, 26.0, 32.0, 22.0, 31.0, 37.0, 44.0, 50.0, 59.0, 34.0, 57.0, 37.0, 49.0, 46.0, 44.0, 52.0, 62.0, 29.0, 30.0, 36.0, 27.0, 26.0, 14.0, 12.0, 9.0, 13.0, 12.0, 10.0, 9.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008134841918945312, -0.0007901489734649658, -0.0007668137550354004, -0.000743478536605835, -0.0007201433181762695, -0.0006968080997467041, -0.0006734728813171387, -0.0006501376628875732, -0.0006268024444580078, -0.0006034672260284424, -0.000580132007598877, -0.0005567967891693115, -0.0005334615707397461, -0.0005101263523101807, -0.00048679113388061523, -0.0004634559154510498, -0.0004401206970214844, -0.00041678547859191895, -0.0003934502601623535, -0.0003701150417327881, -0.00034677982330322266, -0.0003234446048736572, -0.0003001093864440918, -0.00027677416801452637, -0.00025343894958496094, -0.0002301037311553955, -0.00020676851272583008, -0.00018343329429626465, -0.00016009807586669922, -0.0001367628574371338, -0.00011342763900756836, -9.009242057800293e-05, -6.67572021484375e-05, -4.342198371887207e-05, -2.008676528930664e-05, 3.248453140258789e-06, 2.658367156982422e-05, 4.991888999938965e-05, 7.325410842895508e-05, 9.658932685852051e-05, 0.00011992454528808594, 0.00014325976371765137, 0.0001665949821472168, 0.00018993020057678223, 0.00021326541900634766, 0.00023660063743591309, 0.0002599358558654785, 0.00028327107429504395, 0.0003066062927246094, 0.0003299415111541748, 0.00035327672958374023, 0.00037661194801330566, 0.0003999471664428711, 0.0004232823848724365, 0.00044661760330200195, 0.0004699528217315674, 0.0004932880401611328, 0.0005166232585906982, 0.0005399584770202637, 0.0005632936954498291, 0.0005866289138793945, 0.00060996413230896, 0.0006332993507385254, 0.0006566345691680908, 0.0006799697875976562]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 6.0, 11.0, 5.0, 12.0, 16.0, 26.0, 46.0, 64.0, 95.0, 151.0, 216.0, 342.0, 604.0, 903.0, 1488.0, 2337.0, 3831.0, 5966.0, 9586.0, 14674.0, 22503.0, 33168.0, 47745.0, 64366.0, 81965.0, 97544.0, 108317.0, 110405.0, 103889.0, 90140.0, 73598.0, 55581.0, 40185.0, 27796.0, 18549.0, 11909.0, 7558.0, 4761.0, 3022.0, 1871.0, 1225.0, 750.0, 440.0, 301.0, 193.0, 144.0, 96.0, 59.0, 34.0, 31.0, 15.0, 13.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-4.6015625, -4.454345703125, -4.30712890625, -4.159912109375, -4.0126953125, -3.865478515625, -3.71826171875, -3.571044921875, -3.423828125, -3.276611328125, -3.12939453125, -2.982177734375, -2.8349609375, -2.687744140625, -2.54052734375, -2.393310546875, -2.24609375, -2.098876953125, -1.95166015625, -1.804443359375, -1.6572265625, -1.510009765625, -1.36279296875, -1.215576171875, -1.068359375, -0.921142578125, -0.77392578125, -0.626708984375, -0.4794921875, -0.332275390625, -0.18505859375, -0.037841796875, 0.109375, 0.256591796875, 0.40380859375, 0.551025390625, 0.6982421875, 0.845458984375, 0.99267578125, 1.139892578125, 1.287109375, 1.434326171875, 1.58154296875, 1.728759765625, 1.8759765625, 2.023193359375, 2.17041015625, 2.317626953125, 2.46484375, 2.612060546875, 2.75927734375, 2.906494140625, 3.0537109375, 3.200927734375, 3.34814453125, 3.495361328125, 3.642578125, 3.789794921875, 3.93701171875, 4.084228515625, 4.2314453125, 4.378662109375, 4.52587890625, 4.673095703125, 4.8203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 4.0, 7.0, 12.0, 12.0, 14.0, 16.0, 29.0, 22.0, 29.0, 39.0, 38.0, 56.0, 53.0, 55.0, 52.0, 54.0, 66.0, 65.0, 49.0, 45.0, 46.0, 43.0, 33.0, 26.0, 26.0, 26.0, 17.0, 15.0, 9.0, 12.0, 9.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.193359375, -3.097198486328125, -3.00103759765625, -2.904876708984375, -2.8087158203125, -2.712554931640625, -2.61639404296875, -2.520233154296875, -2.424072265625, -2.327911376953125, -2.23175048828125, -2.135589599609375, -2.0394287109375, -1.943267822265625, -1.84710693359375, -1.750946044921875, -1.65478515625, -1.558624267578125, -1.46246337890625, -1.366302490234375, -1.2701416015625, -1.173980712890625, -1.07781982421875, -0.981658935546875, -0.885498046875, -0.789337158203125, -0.69317626953125, -0.597015380859375, -0.5008544921875, -0.404693603515625, -0.30853271484375, -0.212371826171875, -0.1162109375, -0.020050048828125, 0.07611083984375, 0.172271728515625, 0.2684326171875, 0.364593505859375, 0.46075439453125, 0.556915283203125, 0.653076171875, 0.749237060546875, 0.84539794921875, 0.941558837890625, 1.0377197265625, 1.133880615234375, 1.23004150390625, 1.326202392578125, 1.42236328125, 1.518524169921875, 1.61468505859375, 1.710845947265625, 1.8070068359375, 1.903167724609375, 1.99932861328125, 2.095489501953125, 2.191650390625, 2.287811279296875, 2.38397216796875, 2.480133056640625, 2.5762939453125, 2.672454833984375, 2.76861572265625, 2.864776611328125, 2.9609375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 8.0, 12.0, 5.0, 11.0, 13.0, 10.0, 17.0, 14.0, 13.0, 23.0, 35.0, 39.0, 32.0, 37.0, 56.0, 39.0, 32.0, 38.0, 42.0, 55.0, 40.0, 47.0, 47.0, 46.0, 42.0, 43.0, 27.0, 29.0, 21.0, 24.0, 12.0, 15.0, 11.0, 12.0, 12.0, 7.0, 9.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-17.9888858795166, -17.45688819885254, -16.924890518188477, -16.39289093017578, -15.860894203186035, -15.328895568847656, -14.796897888183594, -14.264900207519531, -13.732902526855469, -13.200904846191406, -12.668906211853027, -12.136908531188965, -11.604910850524902, -11.072912216186523, -10.540914535522461, -10.008916854858398, -9.47691822052002, -8.944920539855957, -8.412921905517578, -7.880924224853516, -7.348926544189453, -6.816928386688232, -6.284930229187012, -5.752932548522949, -5.2209343910217285, -4.688936233520508, -4.156938552856445, -3.6249403953552246, -3.092942476272583, -2.5609445571899414, -2.0289463996887207, -1.496948480606079, -0.9649505615234375, -0.4329525828361511, 0.09904539585113525, 0.6310434341430664, 1.163041353225708, 1.6950392723083496, 2.2270374298095703, 2.759035348892212, 3.2910332679748535, 3.823031187057495, 4.355029106140137, 4.887027263641357, 5.419025421142578, 5.951023101806641, 6.483021259307861, 7.015019416809082, 7.5470170974731445, 8.079014778137207, 8.611013412475586, 9.143011093139648, 9.675008773803711, 10.207006454467773, 10.739005088806152, 11.271002769470215, 11.803001403808594, 12.334999084472656, 12.866997718811035, 13.398995399475098, 13.93099308013916, 14.462991714477539, 14.994989395141602, 15.526987075805664, 16.058984756469727]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 3.0, 6.0, 7.0, 8.0, 8.0, 19.0, 21.0, 22.0, 22.0, 24.0, 19.0, 23.0, 37.0, 39.0, 38.0, 23.0, 49.0, 31.0, 32.0, 38.0, 37.0, 31.0, 31.0, 39.0, 37.0, 29.0, 28.0, 26.0, 36.0, 28.0, 21.0, 25.0, 30.0, 22.0, 20.0, 15.0, 8.0, 15.0, 11.0, 8.0, 5.0, 4.0, 6.0, 8.0, 3.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.16267204284668, -17.577363967895508, -16.99205780029297, -16.406749725341797, -15.821443557739258, -15.236135482788086, -14.65082836151123, -14.065521240234375, -13.48021411895752, -12.894906997680664, -12.309599876403809, -11.724292755126953, -11.138984680175781, -10.553678512573242, -9.96837043762207, -9.383063316345215, -8.79775619506836, -8.212449073791504, -7.627141952514648, -7.041834354400635, -6.456527233123779, -5.871220111846924, -5.28591251373291, -4.700605392456055, -4.115298271179199, -3.5299911499023438, -2.944683790206909, -2.3593764305114746, -1.7740693092346191, -1.1887621879577637, -0.6034548282623291, -0.01814746856689453, 0.5671615600585938, 1.1524688005447388, 1.7377760410308838, 2.3230834007263184, 2.908390522003174, 3.4936976432800293, 4.079005241394043, 4.664312362670898, 5.249619483947754, 5.834926605224609, 6.420233726501465, 7.0055413246154785, 7.590848445892334, 8.176155090332031, 8.761463165283203, 9.346770286560059, 9.932077407836914, 10.51738452911377, 11.102691650390625, 11.68799877166748, 12.273305892944336, 12.858613967895508, 13.443921089172363, 14.029228210449219, 14.614535331726074, 15.19984245300293, 15.785149574279785, 16.37045669555664, 16.955764770507812, 17.54107093811035, 18.126379013061523, 18.711685180664062, 19.296993255615234]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 6.0, 11.0, 10.0, 36.0, 50.0, 72.0, 126.0, 203.0, 411.0, 638.0, 1143.0, 2001.0, 3438.0, 5742.0, 9660.0, 15927.0, 26273.0, 42343.0, 66239.0, 100653.0, 147327.0, 206589.0, 276843.0, 344624.0, 404988.0, 437610.0, 437684.0, 403990.0, 346258.0, 275350.0, 206942.0, 147989.0, 101445.0, 67406.0, 43460.0, 27731.0, 16960.0, 10506.0, 6425.0, 3775.0, 2278.0, 1328.0, 772.0, 452.0, 233.0, 153.0, 85.0, 45.0, 24.0, 12.0, 6.0, 13.0, 7.0, 1.0, 1.0, 1.0], "bins": [-14.078125, -13.664306640625, -13.25048828125, -12.836669921875, -12.4228515625, -12.009033203125, -11.59521484375, -11.181396484375, -10.767578125, -10.353759765625, -9.93994140625, -9.526123046875, -9.1123046875, -8.698486328125, -8.28466796875, -7.870849609375, -7.45703125, -7.043212890625, -6.62939453125, -6.215576171875, -5.8017578125, -5.387939453125, -4.97412109375, -4.560302734375, -4.146484375, -3.732666015625, -3.31884765625, -2.905029296875, -2.4912109375, -2.077392578125, -1.66357421875, -1.249755859375, -0.8359375, -0.422119140625, -0.00830078125, 0.405517578125, 0.8193359375, 1.233154296875, 1.64697265625, 2.060791015625, 2.474609375, 2.888427734375, 3.30224609375, 3.716064453125, 4.1298828125, 4.543701171875, 4.95751953125, 5.371337890625, 5.78515625, 6.198974609375, 6.61279296875, 7.026611328125, 7.4404296875, 7.854248046875, 8.26806640625, 8.681884765625, 9.095703125, 9.509521484375, 9.92333984375, 10.337158203125, 10.7509765625, 11.164794921875, 11.57861328125, 11.992431640625, 12.40625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 8.0, 0.0, 8.0, 7.0, 8.0, 13.0, 20.0, 24.0, 18.0, 25.0, 20.0, 21.0, 27.0, 36.0, 36.0, 38.0, 29.0, 36.0, 40.0, 35.0, 38.0, 29.0, 32.0, 33.0, 39.0, 30.0, 35.0, 26.0, 29.0, 35.0, 27.0, 25.0, 26.0, 21.0, 25.0, 19.0, 10.0, 13.0, 11.0, 15.0, 6.0, 6.0, 6.0, 6.0, 3.0, 5.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.90625, -15.3896484375, -14.873046875, -14.3564453125, -13.83984375, -13.3232421875, -12.806640625, -12.2900390625, -11.7734375, -11.2568359375, -10.740234375, -10.2236328125, -9.70703125, -9.1904296875, -8.673828125, -8.1572265625, -7.640625, -7.1240234375, -6.607421875, -6.0908203125, -5.57421875, -5.0576171875, -4.541015625, -4.0244140625, -3.5078125, -2.9912109375, -2.474609375, -1.9580078125, -1.44140625, -0.9248046875, -0.408203125, 0.1083984375, 0.625, 1.1416015625, 1.658203125, 2.1748046875, 2.69140625, 3.2080078125, 3.724609375, 4.2412109375, 4.7578125, 5.2744140625, 5.791015625, 6.3076171875, 6.82421875, 7.3408203125, 7.857421875, 8.3740234375, 8.890625, 9.4072265625, 9.923828125, 10.4404296875, 10.95703125, 11.4736328125, 11.990234375, 12.5068359375, 13.0234375, 13.5400390625, 14.056640625, 14.5732421875, 15.08984375, 15.6064453125, 16.123046875, 16.6396484375, 17.15625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 14.0, 25.0, 45.0, 75.0, 146.0, 279.0, 502.0, 1074.0, 2203.0, 4677.0, 9406.0, 18845.0, 37096.0, 68857.0, 122444.0, 201355.0, 304884.0, 417139.0, 514715.0, 560692.0, 540759.0, 460536.0, 352368.0, 240610.0, 150861.0, 87811.0, 47695.0, 24875.0, 12258.0, 6126.0, 3026.0, 1416.0, 733.0, 346.0, 159.0, 107.0, 41.0, 29.0, 16.0, 10.0, 17.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-21.953125, -21.370849609375, -20.78857421875, -20.206298828125, -19.6240234375, -19.041748046875, -18.45947265625, -17.877197265625, -17.294921875, -16.712646484375, -16.13037109375, -15.548095703125, -14.9658203125, -14.383544921875, -13.80126953125, -13.218994140625, -12.63671875, -12.054443359375, -11.47216796875, -10.889892578125, -10.3076171875, -9.725341796875, -9.14306640625, -8.560791015625, -7.978515625, -7.396240234375, -6.81396484375, -6.231689453125, -5.6494140625, -5.067138671875, -4.48486328125, -3.902587890625, -3.3203125, -2.738037109375, -2.15576171875, -1.573486328125, -0.9912109375, -0.408935546875, 0.17333984375, 0.755615234375, 1.337890625, 1.920166015625, 2.50244140625, 3.084716796875, 3.6669921875, 4.249267578125, 4.83154296875, 5.413818359375, 5.99609375, 6.578369140625, 7.16064453125, 7.742919921875, 8.3251953125, 8.907470703125, 9.48974609375, 10.072021484375, 10.654296875, 11.236572265625, 11.81884765625, 12.401123046875, 12.9833984375, 13.565673828125, 14.14794921875, 14.730224609375, 15.3125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 6.0, 6.0, 10.0, 17.0, 19.0, 18.0, 32.0, 36.0, 40.0, 52.0, 87.0, 75.0, 108.0, 98.0, 110.0, 141.0, 174.0, 141.0, 173.0, 180.0, 179.0, 212.0, 193.0, 190.0, 210.0, 185.0, 189.0, 149.0, 148.0, 118.0, 136.0, 116.0, 81.0, 76.0, 72.0, 48.0, 39.0, 35.0, 38.0, 29.0, 22.0, 20.0, 16.0, 17.0, 10.0, 6.0, 6.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.921875, -7.67401123046875, -7.4261474609375, -7.17828369140625, -6.930419921875, -6.68255615234375, -6.4346923828125, -6.18682861328125, -5.93896484375, -5.69110107421875, -5.4432373046875, -5.19537353515625, -4.947509765625, -4.69964599609375, -4.4517822265625, -4.20391845703125, -3.9560546875, -3.70819091796875, -3.4603271484375, -3.21246337890625, -2.964599609375, -2.71673583984375, -2.4688720703125, -2.22100830078125, -1.97314453125, -1.72528076171875, -1.4774169921875, -1.22955322265625, -0.981689453125, -0.73382568359375, -0.4859619140625, -0.23809814453125, 0.009765625, 0.25762939453125, 0.5054931640625, 0.75335693359375, 1.001220703125, 1.24908447265625, 1.4969482421875, 1.74481201171875, 1.99267578125, 2.24053955078125, 2.4884033203125, 2.73626708984375, 2.984130859375, 3.23199462890625, 3.4798583984375, 3.72772216796875, 3.9755859375, 4.22344970703125, 4.4713134765625, 4.71917724609375, 4.967041015625, 5.21490478515625, 5.4627685546875, 5.71063232421875, 5.95849609375, 6.20635986328125, 6.4542236328125, 6.70208740234375, 6.949951171875, 7.19781494140625, 7.4456787109375, 7.69354248046875, 7.94140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 7.0, 12.0, 7.0, 16.0, 19.0, 17.0, 17.0, 27.0, 23.0, 29.0, 29.0, 35.0, 30.0, 39.0, 46.0, 35.0, 39.0, 39.0, 45.0, 35.0, 47.0, 39.0, 44.0, 41.0, 46.0, 31.0, 26.0, 22.0, 28.0, 22.0, 19.0, 20.0, 15.0, 11.0, 7.0, 6.0, 9.0, 2.0, 0.0, 2.0, 4.0, 3.0, 0.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.820310592651367, -17.23609733581543, -16.651884078979492, -16.067670822143555, -15.483458518981934, -14.899245262145996, -14.315032958984375, -13.730819702148438, -13.1466064453125, -12.562393188476562, -11.978179931640625, -11.393967628479004, -10.809754371643066, -10.225541114807129, -9.641328811645508, -9.05711555480957, -8.472902297973633, -7.888689041137695, -7.304476261138916, -6.720263481140137, -6.136050224304199, -5.551836967468262, -4.967624187469482, -4.383411407470703, -3.7991981506347656, -3.2149851322174072, -2.630772113800049, -2.0465590953826904, -1.462346076965332, -0.8781330585479736, -0.29392004013061523, 0.29029273986816406, 0.8745079040527344, 1.4587209224700928, 2.042933940887451, 2.6271469593048096, 3.211359977722168, 3.7955729961395264, 4.379786014556885, 4.963998794555664, 5.548212051391602, 6.132425308227539, 6.716638088226318, 7.300850868225098, 7.885064125061035, 8.469277381896973, 9.053489685058594, 9.637702941894531, 10.221916198730469, 10.806129455566406, 11.390342712402344, 11.974555015563965, 12.558768272399902, 13.14298152923584, 13.727193832397461, 14.311407089233398, 14.895620346069336, 15.479833602905273, 16.06404685974121, 16.64826011657715, 17.232471466064453, 17.81668472290039, 18.400897979736328, 18.985111236572266, 19.569324493408203]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 8.0, 8.0, 4.0, 7.0, 12.0, 10.0, 11.0, 10.0, 13.0, 18.0, 21.0, 30.0, 21.0, 26.0, 32.0, 28.0, 28.0, 36.0, 24.0, 37.0, 30.0, 37.0, 38.0, 35.0, 28.0, 29.0, 28.0, 36.0, 31.0, 29.0, 25.0, 21.0, 27.0, 26.0, 29.0, 14.0, 16.0, 21.0, 14.0, 13.0, 18.0, 13.0, 19.0, 10.0, 5.0, 9.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 5.0, 0.0, 2.0], "bins": [-17.061779022216797, -16.507579803466797, -15.953380584716797, -15.399181365966797, -14.844982147216797, -14.290782928466797, -13.736583709716797, -13.182384490966797, -12.628185272216797, -12.073986053466797, -11.519786834716797, -10.965587615966797, -10.411388397216797, -9.857189178466797, -9.302989959716797, -8.748790740966797, -8.194591522216797, -7.640392303466797, -7.086193084716797, -6.531993865966797, -5.977794647216797, -5.423595428466797, -4.869396209716797, -4.315196990966797, -3.760997772216797, -3.206798553466797, -2.652599334716797, -2.098400115966797, -1.5442008972167969, -0.9900016784667969, -0.4358024597167969, 0.11839675903320312, 0.6725959777832031, 1.2267951965332031, 1.7809944152832031, 2.335193634033203, 2.889392852783203, 3.443592071533203, 3.997791290283203, 4.551990509033203, 5.106189727783203, 5.660388946533203, 6.214588165283203, 6.768787384033203, 7.322986602783203, 7.877185821533203, 8.431385040283203, 8.985584259033203, 9.539783477783203, 10.093982696533203, 10.648181915283203, 11.202381134033203, 11.756580352783203, 12.310779571533203, 12.864978790283203, 13.419178009033203, 13.973377227783203, 14.527576446533203, 15.081775665283203, 15.635974884033203, 16.190174102783203, 16.744373321533203, 17.298572540283203, 17.852771759033203, 18.406970977783203]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 6.0, 3.0, 2.0, 4.0, 12.0, 12.0, 33.0, 28.0, 61.0, 88.0, 151.0, 187.0, 297.0, 435.0, 577.0, 840.0, 1248.0, 1956.0, 2742.0, 4101.0, 6306.0, 9572.0, 14633.0, 22411.0, 34266.0, 52572.0, 79071.0, 113171.0, 147325.0, 155327.0, 128466.0, 92131.0, 62041.0, 40693.0, 26565.0, 17479.0, 11153.0, 7407.0, 4969.0, 3344.0, 2140.0, 1551.0, 1060.0, 738.0, 437.0, 284.0, 199.0, 131.0, 117.0, 73.0, 42.0, 39.0, 27.0, 13.0, 13.0, 6.0, 5.0, 4.0, 1.0, 1.0], "bins": [-9.609375, -9.3199462890625, -9.030517578125, -8.7410888671875, -8.45166015625, -8.1622314453125, -7.872802734375, -7.5833740234375, -7.2939453125, -7.0045166015625, -6.715087890625, -6.4256591796875, -6.13623046875, -5.8468017578125, -5.557373046875, -5.2679443359375, -4.978515625, -4.6890869140625, -4.399658203125, -4.1102294921875, -3.82080078125, -3.5313720703125, -3.241943359375, -2.9525146484375, -2.6630859375, -2.3736572265625, -2.084228515625, -1.7947998046875, -1.50537109375, -1.2159423828125, -0.926513671875, -0.6370849609375, -0.34765625, -0.0582275390625, 0.231201171875, 0.5206298828125, 0.81005859375, 1.0994873046875, 1.388916015625, 1.6783447265625, 1.9677734375, 2.2572021484375, 2.546630859375, 2.8360595703125, 3.12548828125, 3.4149169921875, 3.704345703125, 3.9937744140625, 4.283203125, 4.5726318359375, 4.862060546875, 5.1514892578125, 5.44091796875, 5.7303466796875, 6.019775390625, 6.3092041015625, 6.5986328125, 6.8880615234375, 7.177490234375, 7.4669189453125, 7.75634765625, 8.0457763671875, 8.335205078125, 8.6246337890625, 8.9140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 9.0, 8.0, 3.0, 8.0, 13.0, 8.0, 13.0, 9.0, 11.0, 24.0, 21.0, 30.0, 17.0, 28.0, 37.0, 24.0, 25.0, 40.0, 26.0, 36.0, 29.0, 37.0, 38.0, 33.0, 27.0, 30.0, 28.0, 40.0, 29.0, 29.0, 24.0, 20.0, 30.0, 23.0, 29.0, 13.0, 17.0, 22.0, 13.0, 16.0, 15.0, 12.0, 18.0, 12.0, 3.0, 9.0, 3.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-16.984375, -16.431640625, -15.87890625, -15.326171875, -14.7734375, -14.220703125, -13.66796875, -13.115234375, -12.5625, -12.009765625, -11.45703125, -10.904296875, -10.3515625, -9.798828125, -9.24609375, -8.693359375, -8.140625, -7.587890625, -7.03515625, -6.482421875, -5.9296875, -5.376953125, -4.82421875, -4.271484375, -3.71875, -3.166015625, -2.61328125, -2.060546875, -1.5078125, -0.955078125, -0.40234375, 0.150390625, 0.703125, 1.255859375, 1.80859375, 2.361328125, 2.9140625, 3.466796875, 4.01953125, 4.572265625, 5.125, 5.677734375, 6.23046875, 6.783203125, 7.3359375, 7.888671875, 8.44140625, 8.994140625, 9.546875, 10.099609375, 10.65234375, 11.205078125, 11.7578125, 12.310546875, 12.86328125, 13.416015625, 13.96875, 14.521484375, 15.07421875, 15.626953125, 16.1796875, 16.732421875, 17.28515625, 17.837890625, 18.390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 9.0, 7.0, 11.0, 23.0, 28.0, 32.0, 51.0, 82.0, 130.0, 190.0, 307.0, 480.0, 741.0, 1176.0, 2075.0, 3782.0, 6758.0, 12951.0, 26547.0, 60422.0, 146110.0, 311335.0, 266287.0, 114099.0, 48125.0, 22253.0, 10773.0, 5782.0, 3188.0, 1835.0, 1138.0, 664.0, 400.0, 248.0, 169.0, 116.0, 84.0, 41.0, 38.0, 27.0, 14.0, 7.0, 5.0, 6.0, 7.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.1640625, -12.737548828125, -12.31103515625, -11.884521484375, -11.4580078125, -11.031494140625, -10.60498046875, -10.178466796875, -9.751953125, -9.325439453125, -8.89892578125, -8.472412109375, -8.0458984375, -7.619384765625, -7.19287109375, -6.766357421875, -6.33984375, -5.913330078125, -5.48681640625, -5.060302734375, -4.6337890625, -4.207275390625, -3.78076171875, -3.354248046875, -2.927734375, -2.501220703125, -2.07470703125, -1.648193359375, -1.2216796875, -0.795166015625, -0.36865234375, 0.057861328125, 0.484375, 0.910888671875, 1.33740234375, 1.763916015625, 2.1904296875, 2.616943359375, 3.04345703125, 3.469970703125, 3.896484375, 4.322998046875, 4.74951171875, 5.176025390625, 5.6025390625, 6.029052734375, 6.45556640625, 6.882080078125, 7.30859375, 7.735107421875, 8.16162109375, 8.588134765625, 9.0146484375, 9.441162109375, 9.86767578125, 10.294189453125, 10.720703125, 11.147216796875, 11.57373046875, 12.000244140625, 12.4267578125, 12.853271484375, 13.27978515625, 13.706298828125, 14.1328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 10.0, 4.0, 3.0, 10.0, 6.0, 6.0, 13.0, 16.0, 8.0, 31.0, 25.0, 23.0, 29.0, 32.0, 33.0, 25.0, 47.0, 31.0, 28.0, 51.0, 28.0, 39.0, 30.0, 49.0, 48.0, 38.0, 42.0, 28.0, 47.0, 31.0, 28.0, 29.0, 25.0, 18.0, 12.0, 16.0, 15.0, 11.0, 4.0, 5.0, 5.0, 2.0, 7.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.015625, -13.55322265625, -13.0908203125, -12.62841796875, -12.166015625, -11.70361328125, -11.2412109375, -10.77880859375, -10.31640625, -9.85400390625, -9.3916015625, -8.92919921875, -8.466796875, -8.00439453125, -7.5419921875, -7.07958984375, -6.6171875, -6.15478515625, -5.6923828125, -5.22998046875, -4.767578125, -4.30517578125, -3.8427734375, -3.38037109375, -2.91796875, -2.45556640625, -1.9931640625, -1.53076171875, -1.068359375, -0.60595703125, -0.1435546875, 0.31884765625, 0.78125, 1.24365234375, 1.7060546875, 2.16845703125, 2.630859375, 3.09326171875, 3.5556640625, 4.01806640625, 4.48046875, 4.94287109375, 5.4052734375, 5.86767578125, 6.330078125, 6.79248046875, 7.2548828125, 7.71728515625, 8.1796875, 8.64208984375, 9.1044921875, 9.56689453125, 10.029296875, 10.49169921875, 10.9541015625, 11.41650390625, 11.87890625, 12.34130859375, 12.8037109375, 13.26611328125, 13.728515625, 14.19091796875, 14.6533203125, 15.11572265625, 15.578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 11.0, 15.0, 29.0, 32.0, 44.0, 52.0, 71.0, 95.0, 120.0, 168.0, 212.0, 290.0, 431.0, 582.0, 795.0, 1298.0, 1942.0, 3269.0, 6054.0, 12344.0, 32047.0, 122589.0, 636179.0, 161905.0, 37520.0, 14112.0, 6610.0, 3490.0, 1989.0, 1316.0, 804.0, 597.0, 396.0, 278.0, 220.0, 175.0, 97.0, 92.0, 67.0, 53.0, 48.0, 29.0, 18.0, 15.0, 13.0, 6.0, 8.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-17.078125, -16.48046875, -15.8828125, -15.28515625, -14.6875, -14.08984375, -13.4921875, -12.89453125, -12.296875, -11.69921875, -11.1015625, -10.50390625, -9.90625, -9.30859375, -8.7109375, -8.11328125, -7.515625, -6.91796875, -6.3203125, -5.72265625, -5.125, -4.52734375, -3.9296875, -3.33203125, -2.734375, -2.13671875, -1.5390625, -0.94140625, -0.34375, 0.25390625, 0.8515625, 1.44921875, 2.046875, 2.64453125, 3.2421875, 3.83984375, 4.4375, 5.03515625, 5.6328125, 6.23046875, 6.828125, 7.42578125, 8.0234375, 8.62109375, 9.21875, 9.81640625, 10.4140625, 11.01171875, 11.609375, 12.20703125, 12.8046875, 13.40234375, 14.0, 14.59765625, 15.1953125, 15.79296875, 16.390625, 16.98828125, 17.5859375, 18.18359375, 18.78125, 19.37890625, 19.9765625, 20.57421875, 21.171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 9.0, 13.0, 15.0, 14.0, 16.0, 18.0, 31.0, 44.0, 44.0, 64.0, 85.0, 125.0, 133.0, 93.0, 72.0, 60.0, 32.0, 36.0, 14.0, 20.0, 15.0, 7.0, 6.0, 8.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012845993041992188, -0.0012431889772415161, -0.0012017786502838135, -0.0011603683233261108, -0.0011189579963684082, -0.0010775476694107056, -0.001036137342453003, -0.0009947270154953003, -0.0009533166885375977, -0.000911906361579895, -0.0008704960346221924, -0.0008290857076644897, -0.0007876753807067871, -0.0007462650537490845, -0.0007048547267913818, -0.0006634443998336792, -0.0006220340728759766, -0.0005806237459182739, -0.0005392134189605713, -0.0004978030920028687, -0.000456392765045166, -0.0004149824380874634, -0.00037357211112976074, -0.0003321617841720581, -0.00029075145721435547, -0.00024934113025665283, -0.0002079308032989502, -0.00016652047634124756, -0.00012511014938354492, -8.369982242584229e-05, -4.228949546813965e-05, -8.791685104370117e-07, 4.0531158447265625e-05, 8.194148540496826e-05, 0.0001233518123626709, 0.00016476213932037354, 0.00020617246627807617, 0.0002475827932357788, 0.00028899312019348145, 0.0003304034471511841, 0.0003718137741088867, 0.00041322410106658936, 0.000454634428024292, 0.0004960447549819946, 0.0005374550819396973, 0.0005788654088973999, 0.0006202757358551025, 0.0006616860628128052, 0.0007030963897705078, 0.0007445067167282104, 0.0007859170436859131, 0.0008273273706436157, 0.0008687376976013184, 0.000910148024559021, 0.0009515583515167236, 0.0009929686784744263, 0.001034379005432129, 0.0010757893323898315, 0.0011171996593475342, 0.0011586099863052368, 0.0012000203132629395, 0.001241430640220642, 0.0012828409671783447, 0.0013242512941360474, 0.00136566162109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 8.0, 6.0, 10.0, 13.0, 18.0, 22.0, 39.0, 54.0, 71.0, 106.0, 138.0, 229.0, 319.0, 512.0, 749.0, 1111.0, 1639.0, 2586.0, 4034.0, 6333.0, 10214.0, 17132.0, 30351.0, 56415.0, 117507.0, 238220.0, 264402.0, 142183.0, 67278.0, 35317.0, 19815.0, 11538.0, 7313.0, 4505.0, 2826.0, 1848.0, 1180.0, 804.0, 565.0, 344.0, 252.0, 160.0, 110.0, 90.0, 68.0, 43.0, 28.0, 19.0, 14.0, 7.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 3.0], "bins": [-13.3359375, -12.933349609375, -12.53076171875, -12.128173828125, -11.7255859375, -11.322998046875, -10.92041015625, -10.517822265625, -10.115234375, -9.712646484375, -9.31005859375, -8.907470703125, -8.5048828125, -8.102294921875, -7.69970703125, -7.297119140625, -6.89453125, -6.491943359375, -6.08935546875, -5.686767578125, -5.2841796875, -4.881591796875, -4.47900390625, -4.076416015625, -3.673828125, -3.271240234375, -2.86865234375, -2.466064453125, -2.0634765625, -1.660888671875, -1.25830078125, -0.855712890625, -0.453125, -0.050537109375, 0.35205078125, 0.754638671875, 1.1572265625, 1.559814453125, 1.96240234375, 2.364990234375, 2.767578125, 3.170166015625, 3.57275390625, 3.975341796875, 4.3779296875, 4.780517578125, 5.18310546875, 5.585693359375, 5.98828125, 6.390869140625, 6.79345703125, 7.196044921875, 7.5986328125, 8.001220703125, 8.40380859375, 8.806396484375, 9.208984375, 9.611572265625, 10.01416015625, 10.416748046875, 10.8193359375, 11.221923828125, 11.62451171875, 12.027099609375, 12.4296875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 1.0, 5.0, 2.0, 8.0, 8.0, 14.0, 12.0, 12.0, 13.0, 19.0, 16.0, 25.0, 34.0, 45.0, 91.0, 95.0, 77.0, 102.0, 107.0, 84.0, 66.0, 45.0, 29.0, 21.0, 15.0, 10.0, 9.0, 6.0, 11.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.84375, -5.66253662109375, -5.4813232421875, -5.30010986328125, -5.118896484375, -4.93768310546875, -4.7564697265625, -4.57525634765625, -4.39404296875, -4.21282958984375, -4.0316162109375, -3.85040283203125, -3.669189453125, -3.48797607421875, -3.3067626953125, -3.12554931640625, -2.9443359375, -2.76312255859375, -2.5819091796875, -2.40069580078125, -2.219482421875, -2.03826904296875, -1.8570556640625, -1.67584228515625, -1.49462890625, -1.31341552734375, -1.1322021484375, -0.95098876953125, -0.769775390625, -0.58856201171875, -0.4073486328125, -0.22613525390625, -0.044921875, 0.13629150390625, 0.3175048828125, 0.49871826171875, 0.679931640625, 0.86114501953125, 1.0423583984375, 1.22357177734375, 1.40478515625, 1.58599853515625, 1.7672119140625, 1.94842529296875, 2.129638671875, 2.31085205078125, 2.4920654296875, 2.67327880859375, 2.8544921875, 3.03570556640625, 3.2169189453125, 3.39813232421875, 3.579345703125, 3.76055908203125, 3.9417724609375, 4.12298583984375, 4.30419921875, 4.48541259765625, 4.6666259765625, 4.84783935546875, 5.029052734375, 5.21026611328125, 5.3914794921875, 5.57269287109375, 5.75390625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 8.0, 10.0, 8.0, 16.0, 13.0, 18.0, 15.0, 26.0, 18.0, 29.0, 41.0, 25.0, 48.0, 30.0, 27.0, 41.0, 44.0, 43.0, 27.0, 43.0, 43.0, 47.0, 41.0, 51.0, 48.0, 27.0, 28.0, 21.0, 26.0, 22.0, 18.0, 14.0, 17.0, 9.0, 11.0, 10.0, 8.0, 7.0, 4.0, 3.0, 1.0, 0.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.178775787353516, -17.589969635009766, -17.001163482666016, -16.4123592376709, -15.823553085327148, -15.234746932983398, -14.645941734313965, -14.057136535644531, -13.468330383300781, -12.879524230957031, -12.290719032287598, -11.701913833618164, -11.113107681274414, -10.524301528930664, -9.93549633026123, -9.346691131591797, -8.757884979248047, -8.169078826904297, -7.580273628234863, -6.9914679527282715, -6.40266227722168, -5.813856601715088, -5.225050926208496, -4.636245250701904, -4.0474395751953125, -3.4586338996887207, -2.869828224182129, -2.281022548675537, -1.6922168731689453, -1.1034111976623535, -0.5146055221557617, 0.07420015335083008, 0.6630077362060547, 1.2518134117126465, 1.8406190872192383, 2.42942476272583, 3.018230438232422, 3.6070361137390137, 4.1958417892456055, 4.784647464752197, 5.373453140258789, 5.962258815765381, 6.551064491271973, 7.1398701667785645, 7.728675842285156, 8.317481994628906, 8.90628719329834, 9.495092391967773, 10.083898544311523, 10.672704696655273, 11.261509895324707, 11.85031509399414, 12.43912124633789, 13.02792739868164, 13.616732597351074, 14.205537796020508, 14.794343948364258, 15.383150100708008, 15.971955299377441, 16.560760498046875, 17.149566650390625, 17.738372802734375, 18.327178955078125, 18.915983200073242, 19.504789352416992]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 9.0, 8.0, 7.0, 10.0, 9.0, 10.0, 23.0, 20.0, 22.0, 23.0, 31.0, 18.0, 32.0, 37.0, 22.0, 31.0, 29.0, 35.0, 25.0, 33.0, 34.0, 40.0, 32.0, 33.0, 37.0, 26.0, 36.0, 23.0, 29.0, 22.0, 24.0, 37.0, 25.0, 18.0, 14.0, 15.0, 20.0, 10.0, 14.0, 14.0, 22.0, 9.0, 5.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-16.965547561645508, -16.394412994384766, -15.823278427124023, -15.252144813537598, -14.681010246276855, -14.109875679016113, -13.538742065429688, -12.967607498168945, -12.396472930908203, -11.825338363647461, -11.254203796386719, -10.683070182800293, -10.11193561553955, -9.540801048278809, -8.969667434692383, -8.39853286743164, -7.827398300170898, -7.256263732910156, -6.685129642486572, -6.113995552062988, -5.542860984802246, -4.971726417541504, -4.40059232711792, -3.829457998275757, -3.2583236694335938, -2.6871893405914307, -2.1160550117492676, -1.5449206829071045, -0.9737863540649414, -0.4026520252227783, 0.16848230361938477, 0.7396166324615479, 1.310750961303711, 1.881885290145874, 2.453019618988037, 3.0241539478302, 3.5952882766723633, 4.1664228439331055, 4.7375569343566895, 5.308691024780273, 5.879825592041016, 6.450960159301758, 7.022094249725342, 7.593228340148926, 8.164362907409668, 8.73549747467041, 9.306631088256836, 9.877765655517578, 10.44890022277832, 11.020034790039062, 11.591169357299805, 12.16230297088623, 12.733437538146973, 13.304572105407715, 13.87570571899414, 14.446840286254883, 15.017974853515625, 15.589109420776367, 16.16024398803711, 16.73137855529785, 17.302513122558594, 17.873645782470703, 18.444780349731445, 19.015914916992188, 19.58704948425293]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 1.0, 4.0, 10.0, 8.0, 15.0, 28.0, 62.0, 90.0, 139.0, 213.0, 417.0, 643.0, 1022.0, 1708.0, 2721.0, 4006.0, 6448.0, 9414.0, 13847.0, 20021.0, 27754.0, 37755.0, 49232.0, 61338.0, 73611.0, 83522.0, 90632.0, 92699.0, 89940.0, 82154.0, 71930.0, 59743.0, 47380.0, 36349.0, 26472.0, 18908.0, 13175.0, 8808.0, 5911.0, 3841.0, 2421.0, 1518.0, 1075.0, 638.0, 394.0, 227.0, 122.0, 88.0, 47.0, 23.0, 18.0, 11.0, 9.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.0546875, -12.6392822265625, -12.223876953125, -11.8084716796875, -11.39306640625, -10.9776611328125, -10.562255859375, -10.1468505859375, -9.7314453125, -9.3160400390625, -8.900634765625, -8.4852294921875, -8.06982421875, -7.6544189453125, -7.239013671875, -6.8236083984375, -6.408203125, -5.9927978515625, -5.577392578125, -5.1619873046875, -4.74658203125, -4.3311767578125, -3.915771484375, -3.5003662109375, -3.0849609375, -2.6695556640625, -2.254150390625, -1.8387451171875, -1.42333984375, -1.0079345703125, -0.592529296875, -0.1771240234375, 0.23828125, 0.6536865234375, 1.069091796875, 1.4844970703125, 1.89990234375, 2.3153076171875, 2.730712890625, 3.1461181640625, 3.5615234375, 3.9769287109375, 4.392333984375, 4.8077392578125, 5.22314453125, 5.6385498046875, 6.053955078125, 6.4693603515625, 6.884765625, 7.3001708984375, 7.715576171875, 8.1309814453125, 8.54638671875, 8.9617919921875, 9.377197265625, 9.7926025390625, 10.2080078125, 10.6234130859375, 11.038818359375, 11.4542236328125, 11.86962890625, 12.2850341796875, 12.700439453125, 13.1158447265625, 13.53125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 8.0, 6.0, 10.0, 10.0, 12.0, 18.0, 19.0, 23.0, 24.0, 29.0, 23.0, 31.0, 34.0, 23.0, 30.0, 31.0, 32.0, 28.0, 30.0, 36.0, 41.0, 31.0, 33.0, 38.0, 27.0, 33.0, 26.0, 28.0, 25.0, 21.0, 36.0, 23.0, 26.0, 12.0, 16.0, 18.0, 10.0, 14.0, 16.0, 20.0, 8.0, 5.0, 5.0, 6.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-16.71875, -16.159423828125, -15.60009765625, -15.040771484375, -14.4814453125, -13.922119140625, -13.36279296875, -12.803466796875, -12.244140625, -11.684814453125, -11.12548828125, -10.566162109375, -10.0068359375, -9.447509765625, -8.88818359375, -8.328857421875, -7.76953125, -7.210205078125, -6.65087890625, -6.091552734375, -5.5322265625, -4.972900390625, -4.41357421875, -3.854248046875, -3.294921875, -2.735595703125, -2.17626953125, -1.616943359375, -1.0576171875, -0.498291015625, 0.06103515625, 0.620361328125, 1.1796875, 1.739013671875, 2.29833984375, 2.857666015625, 3.4169921875, 3.976318359375, 4.53564453125, 5.094970703125, 5.654296875, 6.213623046875, 6.77294921875, 7.332275390625, 7.8916015625, 8.450927734375, 9.01025390625, 9.569580078125, 10.12890625, 10.688232421875, 11.24755859375, 11.806884765625, 12.3662109375, 12.925537109375, 13.48486328125, 14.044189453125, 14.603515625, 15.162841796875, 15.72216796875, 16.281494140625, 16.8408203125, 17.400146484375, 17.95947265625, 18.518798828125, 19.078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 1.0, 6.0, 9.0, 20.0, 26.0, 40.0, 56.0, 85.0, 114.0, 218.0, 292.0, 541.0, 766.0, 1167.0, 1846.0, 2655.0, 3965.0, 6255.0, 9082.0, 13175.0, 18878.0, 26412.0, 36035.0, 47580.0, 60634.0, 73124.0, 85064.0, 92352.0, 95679.0, 91944.0, 83563.0, 72260.0, 59756.0, 46820.0, 35345.0, 25618.0, 18310.0, 12819.0, 8675.0, 5959.0, 3914.0, 2580.0, 1735.0, 1159.0, 707.0, 450.0, 313.0, 182.0, 126.0, 82.0, 49.0, 52.0, 29.0, 15.0, 11.0, 9.0, 3.0, 2.0, 2.0, 2.0], "bins": [-15.2109375, -14.7423095703125, -14.273681640625, -13.8050537109375, -13.33642578125, -12.8677978515625, -12.399169921875, -11.9305419921875, -11.4619140625, -10.9932861328125, -10.524658203125, -10.0560302734375, -9.58740234375, -9.1187744140625, -8.650146484375, -8.1815185546875, -7.712890625, -7.2442626953125, -6.775634765625, -6.3070068359375, -5.83837890625, -5.3697509765625, -4.901123046875, -4.4324951171875, -3.9638671875, -3.4952392578125, -3.026611328125, -2.5579833984375, -2.08935546875, -1.6207275390625, -1.152099609375, -0.6834716796875, -0.21484375, 0.2537841796875, 0.722412109375, 1.1910400390625, 1.65966796875, 2.1282958984375, 2.596923828125, 3.0655517578125, 3.5341796875, 4.0028076171875, 4.471435546875, 4.9400634765625, 5.40869140625, 5.8773193359375, 6.345947265625, 6.8145751953125, 7.283203125, 7.7518310546875, 8.220458984375, 8.6890869140625, 9.15771484375, 9.6263427734375, 10.094970703125, 10.5635986328125, 11.0322265625, 11.5008544921875, 11.969482421875, 12.4381103515625, 12.90673828125, 13.3753662109375, 13.843994140625, 14.3126220703125, 14.78125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 6.0, 11.0, 9.0, 6.0, 8.0, 13.0, 17.0, 24.0, 21.0, 40.0, 25.0, 31.0, 47.0, 42.0, 41.0, 55.0, 40.0, 49.0, 57.0, 48.0, 40.0, 36.0, 45.0, 37.0, 52.0, 39.0, 19.0, 24.0, 23.0, 19.0, 12.0, 14.0, 4.0, 17.0, 11.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.5625, -16.03173828125, -15.5009765625, -14.97021484375, -14.439453125, -13.90869140625, -13.3779296875, -12.84716796875, -12.31640625, -11.78564453125, -11.2548828125, -10.72412109375, -10.193359375, -9.66259765625, -9.1318359375, -8.60107421875, -8.0703125, -7.53955078125, -7.0087890625, -6.47802734375, -5.947265625, -5.41650390625, -4.8857421875, -4.35498046875, -3.82421875, -3.29345703125, -2.7626953125, -2.23193359375, -1.701171875, -1.17041015625, -0.6396484375, -0.10888671875, 0.421875, 0.95263671875, 1.4833984375, 2.01416015625, 2.544921875, 3.07568359375, 3.6064453125, 4.13720703125, 4.66796875, 5.19873046875, 5.7294921875, 6.26025390625, 6.791015625, 7.32177734375, 7.8525390625, 8.38330078125, 8.9140625, 9.44482421875, 9.9755859375, 10.50634765625, 11.037109375, 11.56787109375, 12.0986328125, 12.62939453125, 13.16015625, 13.69091796875, 14.2216796875, 14.75244140625, 15.283203125, 15.81396484375, 16.3447265625, 16.87548828125, 17.40625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 9.0, 8.0, 11.0, 17.0, 28.0, 47.0, 68.0, 120.0, 206.0, 321.0, 454.0, 734.0, 1182.0, 1931.0, 3262.0, 5706.0, 10077.0, 18360.0, 34069.0, 61314.0, 103917.0, 151004.0, 180570.0, 168801.0, 126355.0, 79646.0, 44465.0, 24351.0, 13470.0, 7310.0, 4236.0, 2409.0, 1540.0, 939.0, 590.0, 370.0, 245.0, 159.0, 97.0, 57.0, 44.0, 17.0, 22.0, 9.0, 7.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8046875, -10.4412841796875, -10.077880859375, -9.7144775390625, -9.35107421875, -8.9876708984375, -8.624267578125, -8.2608642578125, -7.8974609375, -7.5340576171875, -7.170654296875, -6.8072509765625, -6.44384765625, -6.0804443359375, -5.717041015625, -5.3536376953125, -4.990234375, -4.6268310546875, -4.263427734375, -3.9000244140625, -3.53662109375, -3.1732177734375, -2.809814453125, -2.4464111328125, -2.0830078125, -1.7196044921875, -1.356201171875, -0.9927978515625, -0.62939453125, -0.2659912109375, 0.097412109375, 0.4608154296875, 0.82421875, 1.1876220703125, 1.551025390625, 1.9144287109375, 2.27783203125, 2.6412353515625, 3.004638671875, 3.3680419921875, 3.7314453125, 4.0948486328125, 4.458251953125, 4.8216552734375, 5.18505859375, 5.5484619140625, 5.911865234375, 6.2752685546875, 6.638671875, 7.0020751953125, 7.365478515625, 7.7288818359375, 8.09228515625, 8.4556884765625, 8.819091796875, 9.1824951171875, 9.5458984375, 9.9093017578125, 10.272705078125, 10.6361083984375, 10.99951171875, 11.3629150390625, 11.726318359375, 12.0897216796875, 12.453125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 6.0, 7.0, 12.0, 19.0, 10.0, 22.0, 34.0, 30.0, 29.0, 34.0, 53.0, 46.0, 51.0, 61.0, 52.0, 57.0, 58.0, 46.0, 58.0, 52.0, 32.0, 40.0, 29.0, 26.0, 19.0, 13.0, 24.0, 19.0, 10.0, 7.0, 10.0, 6.0, 5.0, 2.0, 1.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0010442733764648438, -0.0010117292404174805, -0.0009791851043701172, -0.0009466409683227539, -0.0009140968322753906, -0.0008815526962280273, -0.0008490085601806641, -0.0008164644241333008, -0.0007839202880859375, -0.0007513761520385742, -0.0007188320159912109, -0.0006862878799438477, -0.0006537437438964844, -0.0006211996078491211, -0.0005886554718017578, -0.0005561113357543945, -0.0005235671997070312, -0.000491023063659668, -0.0004584789276123047, -0.0004259347915649414, -0.0003933906555175781, -0.00036084651947021484, -0.00032830238342285156, -0.0002957582473754883, -0.000263214111328125, -0.00023066997528076172, -0.00019812583923339844, -0.00016558170318603516, -0.00013303756713867188, -0.0001004934310913086, -6.794929504394531e-05, -3.540515899658203e-05, -2.86102294921875e-06, 2.968311309814453e-05, 6.222724914550781e-05, 9.47713851928711e-05, 0.00012731552124023438, 0.00015985965728759766, 0.00019240379333496094, 0.00022494792938232422, 0.0002574920654296875, 0.0002900362014770508, 0.00032258033752441406, 0.00035512447357177734, 0.0003876686096191406, 0.0004202127456665039, 0.0004527568817138672, 0.00048530101776123047, 0.0005178451538085938, 0.000550389289855957, 0.0005829334259033203, 0.0006154775619506836, 0.0006480216979980469, 0.0006805658340454102, 0.0007131099700927734, 0.0007456541061401367, 0.0007781982421875, 0.0008107423782348633, 0.0008432865142822266, 0.0008758306503295898, 0.0009083747863769531, 0.0009409189224243164, 0.0009734630584716797, 0.001006007194519043, 0.0010385513305664062]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 9.0, 11.0, 12.0, 21.0, 31.0, 31.0, 56.0, 76.0, 107.0, 162.0, 253.0, 397.0, 585.0, 1031.0, 2023.0, 4045.0, 8980.0, 21491.0, 51848.0, 110883.0, 190372.0, 235130.0, 199104.0, 120850.0, 57184.0, 24284.0, 9945.0, 4529.0, 2090.0, 1186.0, 656.0, 380.0, 244.0, 171.0, 104.0, 87.0, 60.0, 35.0, 32.0, 19.0, 19.0, 9.0, 7.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3984375, -13.9422607421875, -13.486083984375, -13.0299072265625, -12.57373046875, -12.1175537109375, -11.661376953125, -11.2052001953125, -10.7490234375, -10.2928466796875, -9.836669921875, -9.3804931640625, -8.92431640625, -8.4681396484375, -8.011962890625, -7.5557861328125, -7.099609375, -6.6434326171875, -6.187255859375, -5.7310791015625, -5.27490234375, -4.8187255859375, -4.362548828125, -3.9063720703125, -3.4501953125, -2.9940185546875, -2.537841796875, -2.0816650390625, -1.62548828125, -1.1693115234375, -0.713134765625, -0.2569580078125, 0.19921875, 0.6553955078125, 1.111572265625, 1.5677490234375, 2.02392578125, 2.4801025390625, 2.936279296875, 3.3924560546875, 3.8486328125, 4.3048095703125, 4.760986328125, 5.2171630859375, 5.67333984375, 6.1295166015625, 6.585693359375, 7.0418701171875, 7.498046875, 7.9542236328125, 8.410400390625, 8.8665771484375, 9.32275390625, 9.7789306640625, 10.235107421875, 10.6912841796875, 11.1474609375, 11.6036376953125, 12.059814453125, 12.5159912109375, 12.97216796875, 13.4283447265625, 13.884521484375, 14.3406982421875, 14.796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 0.0, 5.0, 1.0, 2.0, 7.0, 8.0, 5.0, 5.0, 11.0, 13.0, 12.0, 18.0, 15.0, 19.0, 13.0, 27.0, 26.0, 32.0, 35.0, 53.0, 35.0, 54.0, 58.0, 51.0, 58.0, 62.0, 47.0, 40.0, 47.0, 36.0, 29.0, 36.0, 23.0, 21.0, 22.0, 16.0, 14.0, 10.0, 6.0, 4.0, 4.0, 8.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.46875, -3.363922119140625, -3.25909423828125, -3.154266357421875, -3.0494384765625, -2.944610595703125, -2.83978271484375, -2.734954833984375, -2.630126953125, -2.525299072265625, -2.42047119140625, -2.315643310546875, -2.2108154296875, -2.105987548828125, -2.00115966796875, -1.896331787109375, -1.79150390625, -1.686676025390625, -1.58184814453125, -1.477020263671875, -1.3721923828125, -1.267364501953125, -1.16253662109375, -1.057708740234375, -0.952880859375, -0.848052978515625, -0.74322509765625, -0.638397216796875, -0.5335693359375, -0.428741455078125, -0.32391357421875, -0.219085693359375, -0.1142578125, -0.009429931640625, 0.09539794921875, 0.200225830078125, 0.3050537109375, 0.409881591796875, 0.51470947265625, 0.619537353515625, 0.724365234375, 0.829193115234375, 0.93402099609375, 1.038848876953125, 1.1436767578125, 1.248504638671875, 1.35333251953125, 1.458160400390625, 1.56298828125, 1.667816162109375, 1.77264404296875, 1.877471923828125, 1.9822998046875, 2.087127685546875, 2.19195556640625, 2.296783447265625, 2.401611328125, 2.506439208984375, 2.61126708984375, 2.716094970703125, 2.8209228515625, 2.925750732421875, 3.03057861328125, 3.135406494140625, 3.240234375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 10.0, 7.0, 7.0, 14.0, 18.0, 17.0, 12.0, 15.0, 16.0, 31.0, 36.0, 38.0, 35.0, 41.0, 40.0, 42.0, 47.0, 44.0, 42.0, 42.0, 50.0, 52.0, 46.0, 35.0, 34.0, 36.0, 31.0, 17.0, 20.0, 21.0, 20.0, 18.0, 11.0, 8.0, 8.0, 13.0, 3.0, 4.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.405128479003906, -18.774864196777344, -18.144601821899414, -17.514339447021484, -16.884075164794922, -16.25381088256836, -15.62354850769043, -14.993285179138184, -14.363021850585938, -13.732758522033691, -13.102495193481445, -12.4722318649292, -11.841968536376953, -11.211705207824707, -10.581441879272461, -9.951178550720215, -9.320915222167969, -8.690651893615723, -8.060388565063477, -7.4301252365112305, -6.799861907958984, -6.169598579406738, -5.539335250854492, -4.909071922302246, -4.27880859375, -3.648545265197754, -3.018281936645508, -2.3880186080932617, -1.7577552795410156, -1.1274919509887695, -0.49722862243652344, 0.13303470611572266, 0.7632961273193359, 1.393559455871582, 2.023822784423828, 2.654086112976074, 3.2843494415283203, 3.9146127700805664, 4.5448760986328125, 5.175139427185059, 5.805402755737305, 6.435666084289551, 7.065929412841797, 7.696192741394043, 8.326456069946289, 8.956719398498535, 9.586982727050781, 10.217246055603027, 10.847509384155273, 11.47777271270752, 12.108036041259766, 12.738299369812012, 13.368562698364258, 13.998826026916504, 14.62908935546875, 15.259352684020996, 15.889616012573242, 16.519878387451172, 17.150142669677734, 17.780406951904297, 18.410669326782227, 19.040931701660156, 19.67119598388672, 20.30146026611328, 20.93172264099121]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 6.0, 3.0, 4.0, 2.0, 8.0, 5.0, 10.0, 15.0, 16.0, 16.0, 16.0, 11.0, 22.0, 12.0, 25.0, 24.0, 29.0, 32.0, 34.0, 22.0, 27.0, 32.0, 35.0, 33.0, 31.0, 33.0, 39.0, 44.0, 38.0, 28.0, 28.0, 36.0, 26.0, 25.0, 38.0, 19.0, 23.0, 16.0, 21.0, 19.0, 13.0, 13.0, 13.0, 13.0, 13.0, 8.0, 6.0, 6.0, 13.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-17.860816955566406, -17.26935577392578, -16.677894592285156, -16.0864315032959, -15.494970321655273, -14.903509140014648, -14.312047958374023, -13.720586776733398, -13.129124641418457, -12.537663459777832, -11.94620132446289, -11.354740142822266, -10.76327896118164, -10.1718168258667, -9.580355644226074, -8.988893508911133, -8.397432327270508, -7.805970668792725, -7.214509010314941, -6.623047828674316, -6.031586170196533, -5.44012451171875, -4.848663330078125, -4.257201671600342, -3.6657400131225586, -3.0742783546447754, -2.4828169345855713, -1.8913553953170776, -1.299893856048584, -0.7084321975708008, -0.11697077751159668, 0.4744906425476074, 1.0659503936767578, 1.6574119329452515, 2.248873472213745, 2.840334892272949, 3.4317965507507324, 4.023258209228516, 4.614719390869141, 5.206181049346924, 5.797642707824707, 6.38910436630249, 6.980566024780273, 7.572027206420898, 8.163488388061523, 8.754950523376465, 9.34641170501709, 9.937873840332031, 10.529335021972656, 11.120796203613281, 11.712258338928223, 12.303719520568848, 12.895181655883789, 13.486642837524414, 14.078104019165039, 14.669565200805664, 15.261027336120605, 15.85248851776123, 16.443950653076172, 17.035411834716797, 17.626873016357422, 18.218334197998047, 18.809797286987305, 19.40125846862793, 19.992719650268555]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 3.0, 9.0, 10.0, 20.0, 32.0, 67.0, 98.0, 156.0, 280.0, 446.0, 843.0, 1340.0, 2276.0, 3778.0, 6258.0, 10086.0, 16988.0, 26968.0, 42793.0, 65528.0, 98174.0, 141441.0, 197148.0, 260304.0, 323932.0, 380567.0, 414847.0, 423189.0, 400672.0, 352604.0, 291194.0, 225339.0, 166075.0, 117938.0, 80060.0, 52426.0, 34666.0, 21587.0, 13329.0, 8300.0, 4956.0, 3092.0, 1754.0, 1103.0, 664.0, 389.0, 226.0, 130.0, 83.0, 46.0, 25.0, 22.0, 14.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.7421875, -13.3023681640625, -12.862548828125, -12.4227294921875, -11.98291015625, -11.5430908203125, -11.103271484375, -10.6634521484375, -10.2236328125, -9.7838134765625, -9.343994140625, -8.9041748046875, -8.46435546875, -8.0245361328125, -7.584716796875, -7.1448974609375, -6.705078125, -6.2652587890625, -5.825439453125, -5.3856201171875, -4.94580078125, -4.5059814453125, -4.066162109375, -3.6263427734375, -3.1865234375, -2.7467041015625, -2.306884765625, -1.8670654296875, -1.42724609375, -0.9874267578125, -0.547607421875, -0.1077880859375, 0.33203125, 0.7718505859375, 1.211669921875, 1.6514892578125, 2.09130859375, 2.5311279296875, 2.970947265625, 3.4107666015625, 3.8505859375, 4.2904052734375, 4.730224609375, 5.1700439453125, 5.60986328125, 6.0496826171875, 6.489501953125, 6.9293212890625, 7.369140625, 7.8089599609375, 8.248779296875, 8.6885986328125, 9.12841796875, 9.5682373046875, 10.008056640625, 10.4478759765625, 10.8876953125, 11.3275146484375, 11.767333984375, 12.2071533203125, 12.64697265625, 13.0867919921875, 13.526611328125, 13.9664306640625, 14.40625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 3.0, 7.0, 5.0, 20.0, 9.0, 20.0, 15.0, 16.0, 16.0, 16.0, 16.0, 27.0, 27.0, 35.0, 30.0, 26.0, 28.0, 23.0, 37.0, 34.0, 38.0, 32.0, 36.0, 41.0, 38.0, 33.0, 25.0, 28.0, 34.0, 25.0, 35.0, 30.0, 17.0, 20.0, 21.0, 15.0, 14.0, 14.0, 15.0, 10.0, 16.0, 11.0, 8.0, 3.0, 15.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-15.9140625, -15.3902587890625, -14.866455078125, -14.3426513671875, -13.81884765625, -13.2950439453125, -12.771240234375, -12.2474365234375, -11.7236328125, -11.1998291015625, -10.676025390625, -10.1522216796875, -9.62841796875, -9.1046142578125, -8.580810546875, -8.0570068359375, -7.533203125, -7.0093994140625, -6.485595703125, -5.9617919921875, -5.43798828125, -4.9141845703125, -4.390380859375, -3.8665771484375, -3.3427734375, -2.8189697265625, -2.295166015625, -1.7713623046875, -1.24755859375, -0.7237548828125, -0.199951171875, 0.3238525390625, 0.84765625, 1.3714599609375, 1.895263671875, 2.4190673828125, 2.94287109375, 3.4666748046875, 3.990478515625, 4.5142822265625, 5.0380859375, 5.5618896484375, 6.085693359375, 6.6094970703125, 7.13330078125, 7.6571044921875, 8.180908203125, 8.7047119140625, 9.228515625, 9.7523193359375, 10.276123046875, 10.7999267578125, 11.32373046875, 11.8475341796875, 12.371337890625, 12.8951416015625, 13.4189453125, 13.9427490234375, 14.466552734375, 14.9903564453125, 15.51416015625, 16.0379638671875, 16.561767578125, 17.0855712890625, 17.609375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 9.0, 14.0, 21.0, 36.0, 61.0, 90.0, 179.0, 264.0, 462.0, 748.0, 1283.0, 2164.0, 3551.0, 5898.0, 9580.0, 15229.0, 23180.0, 36013.0, 53270.0, 76998.0, 108523.0, 148912.0, 194167.0, 243763.0, 292575.0, 333822.0, 362067.0, 370575.0, 361256.0, 333724.0, 291769.0, 243915.0, 194275.0, 148237.0, 109118.0, 77378.0, 53162.0, 35244.0, 23385.0, 14883.0, 9730.0, 5775.0, 3605.0, 2140.0, 1324.0, 799.0, 480.0, 271.0, 142.0, 104.0, 50.0, 31.0, 18.0, 6.0, 10.0, 3.0, 1.0, 3.0], "bins": [-14.5859375, -14.1505126953125, -13.715087890625, -13.2796630859375, -12.84423828125, -12.4088134765625, -11.973388671875, -11.5379638671875, -11.1025390625, -10.6671142578125, -10.231689453125, -9.7962646484375, -9.36083984375, -8.9254150390625, -8.489990234375, -8.0545654296875, -7.619140625, -7.1837158203125, -6.748291015625, -6.3128662109375, -5.87744140625, -5.4420166015625, -5.006591796875, -4.5711669921875, -4.1357421875, -3.7003173828125, -3.264892578125, -2.8294677734375, -2.39404296875, -1.9586181640625, -1.523193359375, -1.0877685546875, -0.65234375, -0.2169189453125, 0.218505859375, 0.6539306640625, 1.08935546875, 1.5247802734375, 1.960205078125, 2.3956298828125, 2.8310546875, 3.2664794921875, 3.701904296875, 4.1373291015625, 4.57275390625, 5.0081787109375, 5.443603515625, 5.8790283203125, 6.314453125, 6.7498779296875, 7.185302734375, 7.6207275390625, 8.05615234375, 8.4915771484375, 8.927001953125, 9.3624267578125, 9.7978515625, 10.2332763671875, 10.668701171875, 11.1041259765625, 11.53955078125, 11.9749755859375, 12.410400390625, 12.8458251953125, 13.28125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 3.0, 10.0, 6.0, 22.0, 20.0, 27.0, 24.0, 50.0, 50.0, 71.0, 76.0, 79.0, 97.0, 120.0, 160.0, 165.0, 176.0, 207.0, 221.0, 201.0, 213.0, 219.0, 213.0, 196.0, 198.0, 192.0, 160.0, 131.0, 156.0, 121.0, 102.0, 79.0, 70.0, 48.0, 48.0, 35.0, 31.0, 21.0, 21.0, 15.0, 9.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.81396484375, -7.5185546875, -7.22314453125, -6.927734375, -6.63232421875, -6.3369140625, -6.04150390625, -5.74609375, -5.45068359375, -5.1552734375, -4.85986328125, -4.564453125, -4.26904296875, -3.9736328125, -3.67822265625, -3.3828125, -3.08740234375, -2.7919921875, -2.49658203125, -2.201171875, -1.90576171875, -1.6103515625, -1.31494140625, -1.01953125, -0.72412109375, -0.4287109375, -0.13330078125, 0.162109375, 0.45751953125, 0.7529296875, 1.04833984375, 1.34375, 1.63916015625, 1.9345703125, 2.22998046875, 2.525390625, 2.82080078125, 3.1162109375, 3.41162109375, 3.70703125, 4.00244140625, 4.2978515625, 4.59326171875, 4.888671875, 5.18408203125, 5.4794921875, 5.77490234375, 6.0703125, 6.36572265625, 6.6611328125, 6.95654296875, 7.251953125, 7.54736328125, 7.8427734375, 8.13818359375, 8.43359375, 8.72900390625, 9.0244140625, 9.31982421875, 9.615234375, 9.91064453125, 10.2060546875, 10.50146484375, 10.796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 1.0, 4.0, 6.0, 8.0, 11.0, 12.0, 12.0, 13.0, 18.0, 17.0, 23.0, 39.0, 32.0, 47.0, 40.0, 45.0, 46.0, 41.0, 60.0, 56.0, 60.0, 40.0, 46.0, 35.0, 41.0, 40.0, 21.0, 30.0, 28.0, 22.0, 20.0, 17.0, 13.0, 13.0, 9.0, 5.0, 4.0, 6.0, 3.0, 6.0, 1.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.633602142333984, -20.90798568725586, -20.182371139526367, -19.456754684448242, -18.731138229370117, -18.005523681640625, -17.2799072265625, -16.554290771484375, -15.828675270080566, -15.103059768676758, -14.377443313598633, -13.651827812194824, -12.926212310791016, -12.20059585571289, -11.474980354309082, -10.749364852905273, -10.023748397827148, -9.29813289642334, -8.572516441345215, -7.846900939941406, -7.1212849617004395, -6.395668983459473, -5.670053482055664, -4.944437503814697, -4.2188215255737305, -3.4932055473327637, -2.767589807510376, -2.0419740676879883, -1.3163580894470215, -0.5907421112060547, 0.1348733901977539, 0.8604893684387207, 1.5861072540283203, 2.311723232269287, 3.037338972091675, 3.7629547119140625, 4.488570690155029, 5.214186668395996, 5.939802169799805, 6.6654181480407715, 7.391034126281738, 8.116649627685547, 8.842266082763672, 9.56788158416748, 10.293497085571289, 11.019113540649414, 11.744729042053223, 12.470344543457031, 13.195960998535156, 13.921576499938965, 14.64719295501709, 15.372808456420898, 16.098424911499023, 16.824039459228516, 17.54965591430664, 18.275272369384766, 19.00088882446289, 19.726505279541016, 20.452119827270508, 21.177736282348633, 21.903352737426758, 22.62896728515625, 23.354583740234375, 24.0802001953125, 24.805814743041992]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 0.0, 9.0, 4.0, 12.0, 13.0, 14.0, 13.0, 21.0, 24.0, 23.0, 22.0, 20.0, 26.0, 28.0, 47.0, 30.0, 35.0, 43.0, 41.0, 29.0, 30.0, 43.0, 52.0, 36.0, 45.0, 36.0, 33.0, 30.0, 33.0, 29.0, 19.0, 21.0, 24.0, 19.0, 21.0, 13.0, 16.0, 13.0, 7.0, 4.0, 7.0, 5.0, 2.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.035367965698242, -19.320941925048828, -18.606515884399414, -17.89208984375, -17.177661895751953, -16.46323585510254, -15.748809814453125, -15.034383773803711, -14.319957733154297, -13.605531692504883, -12.891105651855469, -12.176678657531738, -11.462252616882324, -10.74782657623291, -10.03339958190918, -9.318973541259766, -8.604547500610352, -7.8901214599609375, -7.175694942474365, -6.461268424987793, -5.746842384338379, -5.032416343688965, -4.317989826202393, -3.6035633087158203, -2.8891372680664062, -2.174710988998413, -1.46028470993042, -0.7458584308624268, -0.031432151794433594, 0.6829941272735596, 1.3974204063415527, 2.111846923828125, 2.826272964477539, 3.5406992435455322, 4.255125522613525, 4.969552040100098, 5.683978080749512, 6.398404121398926, 7.112830638885498, 7.82725715637207, 8.541683197021484, 9.256109237670898, 9.970535278320312, 10.684962272644043, 11.399388313293457, 12.113814353942871, 12.828241348266602, 13.542667388916016, 14.25709342956543, 14.971519470214844, 15.685945510864258, 16.400371551513672, 17.11479949951172, 17.829225540161133, 18.543651580810547, 19.25807762145996, 19.972503662109375, 20.68692970275879, 21.401355743408203, 22.115781784057617, 22.83020782470703, 23.544635772705078, 24.259061813354492, 24.973487854003906, 25.68791389465332]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 12.0, 13.0, 25.0, 21.0, 40.0, 34.0, 80.0, 95.0, 143.0, 187.0, 263.0, 419.0, 624.0, 904.0, 1376.0, 2135.0, 3445.0, 5445.0, 9015.0, 15509.0, 27878.0, 51872.0, 97475.0, 177372.0, 242722.0, 184660.0, 102335.0, 53720.0, 29131.0, 16349.0, 9350.0, 5739.0, 3535.0, 2206.0, 1472.0, 917.0, 626.0, 420.0, 305.0, 230.0, 134.0, 99.0, 77.0, 56.0, 28.0, 24.0, 10.0, 14.0, 8.0, 1.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.6015625, -13.1702880859375, -12.739013671875, -12.3077392578125, -11.87646484375, -11.4451904296875, -11.013916015625, -10.5826416015625, -10.1513671875, -9.7200927734375, -9.288818359375, -8.8575439453125, -8.42626953125, -7.9949951171875, -7.563720703125, -7.1324462890625, -6.701171875, -6.2698974609375, -5.838623046875, -5.4073486328125, -4.97607421875, -4.5447998046875, -4.113525390625, -3.6822509765625, -3.2509765625, -2.8197021484375, -2.388427734375, -1.9571533203125, -1.52587890625, -1.0946044921875, -0.663330078125, -0.2320556640625, 0.19921875, 0.6304931640625, 1.061767578125, 1.4930419921875, 1.92431640625, 2.3555908203125, 2.786865234375, 3.2181396484375, 3.6494140625, 4.0806884765625, 4.511962890625, 4.9432373046875, 5.37451171875, 5.8057861328125, 6.237060546875, 6.6683349609375, 7.099609375, 7.5308837890625, 7.962158203125, 8.3934326171875, 8.82470703125, 9.2559814453125, 9.687255859375, 10.1185302734375, 10.5498046875, 10.9810791015625, 11.412353515625, 11.8436279296875, 12.27490234375, 12.7061767578125, 13.137451171875, 13.5687255859375, 14.0]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 3.0, 7.0, 6.0, 15.0, 14.0, 12.0, 15.0, 22.0, 23.0, 22.0, 18.0, 24.0, 25.0, 33.0, 42.0, 33.0, 39.0, 43.0, 34.0, 26.0, 36.0, 50.0, 38.0, 39.0, 46.0, 29.0, 36.0, 33.0, 30.0, 26.0, 24.0, 20.0, 19.0, 22.0, 20.0, 12.0, 16.0, 14.0, 6.0, 7.0, 5.0, 6.0, 2.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5625, -18.861328125, -18.16015625, -17.458984375, -16.7578125, -16.056640625, -15.35546875, -14.654296875, -13.953125, -13.251953125, -12.55078125, -11.849609375, -11.1484375, -10.447265625, -9.74609375, -9.044921875, -8.34375, -7.642578125, -6.94140625, -6.240234375, -5.5390625, -4.837890625, -4.13671875, -3.435546875, -2.734375, -2.033203125, -1.33203125, -0.630859375, 0.0703125, 0.771484375, 1.47265625, 2.173828125, 2.875, 3.576171875, 4.27734375, 4.978515625, 5.6796875, 6.380859375, 7.08203125, 7.783203125, 8.484375, 9.185546875, 9.88671875, 10.587890625, 11.2890625, 11.990234375, 12.69140625, 13.392578125, 14.09375, 14.794921875, 15.49609375, 16.197265625, 16.8984375, 17.599609375, 18.30078125, 19.001953125, 19.703125, 20.404296875, 21.10546875, 21.806640625, 22.5078125, 23.208984375, 23.91015625, 24.611328125, 25.3125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 8.0, 10.0, 7.0, 21.0, 16.0, 32.0, 42.0, 61.0, 83.0, 119.0, 157.0, 261.0, 379.0, 537.0, 791.0, 1078.0, 1753.0, 2725.0, 4662.0, 8043.0, 14850.0, 29986.0, 70239.0, 204975.0, 399276.0, 183015.0, 63966.0, 27897.0, 13953.0, 7521.0, 4435.0, 2699.0, 1728.0, 1024.0, 662.0, 460.0, 318.0, 221.0, 168.0, 110.0, 71.0, 48.0, 36.0, 34.0, 20.0, 20.0, 7.0, 9.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-15.390625, -14.9012451171875, -14.411865234375, -13.9224853515625, -13.43310546875, -12.9437255859375, -12.454345703125, -11.9649658203125, -11.4755859375, -10.9862060546875, -10.496826171875, -10.0074462890625, -9.51806640625, -9.0286865234375, -8.539306640625, -8.0499267578125, -7.560546875, -7.0711669921875, -6.581787109375, -6.0924072265625, -5.60302734375, -5.1136474609375, -4.624267578125, -4.1348876953125, -3.6455078125, -3.1561279296875, -2.666748046875, -2.1773681640625, -1.68798828125, -1.1986083984375, -0.709228515625, -0.2198486328125, 0.26953125, 0.7589111328125, 1.248291015625, 1.7376708984375, 2.22705078125, 2.7164306640625, 3.205810546875, 3.6951904296875, 4.1845703125, 4.6739501953125, 5.163330078125, 5.6527099609375, 6.14208984375, 6.6314697265625, 7.120849609375, 7.6102294921875, 8.099609375, 8.5889892578125, 9.078369140625, 9.5677490234375, 10.05712890625, 10.5465087890625, 11.035888671875, 11.5252685546875, 12.0146484375, 12.5040283203125, 12.993408203125, 13.4827880859375, 13.97216796875, 14.4615478515625, 14.950927734375, 15.4403076171875, 15.9296875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 10.0, 10.0, 13.0, 10.0, 19.0, 17.0, 21.0, 26.0, 28.0, 21.0, 36.0, 30.0, 46.0, 33.0, 46.0, 41.0, 43.0, 38.0, 46.0, 47.0, 42.0, 36.0, 34.0, 40.0, 43.0, 24.0, 27.0, 20.0, 24.0, 15.0, 21.0, 14.0, 12.0, 22.0, 5.0, 10.0, 5.0, 10.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.125, -17.561279296875, -16.99755859375, -16.433837890625, -15.8701171875, -15.306396484375, -14.74267578125, -14.178955078125, -13.615234375, -13.051513671875, -12.48779296875, -11.924072265625, -11.3603515625, -10.796630859375, -10.23291015625, -9.669189453125, -9.10546875, -8.541748046875, -7.97802734375, -7.414306640625, -6.8505859375, -6.286865234375, -5.72314453125, -5.159423828125, -4.595703125, -4.031982421875, -3.46826171875, -2.904541015625, -2.3408203125, -1.777099609375, -1.21337890625, -0.649658203125, -0.0859375, 0.477783203125, 1.04150390625, 1.605224609375, 2.1689453125, 2.732666015625, 3.29638671875, 3.860107421875, 4.423828125, 4.987548828125, 5.55126953125, 6.114990234375, 6.6787109375, 7.242431640625, 7.80615234375, 8.369873046875, 8.93359375, 9.497314453125, 10.06103515625, 10.624755859375, 11.1884765625, 11.752197265625, 12.31591796875, 12.879638671875, 13.443359375, 14.007080078125, 14.57080078125, 15.134521484375, 15.6982421875, 16.261962890625, 16.82568359375, 17.389404296875, 17.953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 11.0, 14.0, 14.0, 20.0, 28.0, 54.0, 43.0, 84.0, 97.0, 177.0, 226.0, 423.0, 582.0, 1015.0, 1675.0, 3554.0, 11948.0, 549713.0, 459569.0, 11483.0, 3383.0, 1692.0, 989.0, 584.0, 353.0, 256.0, 178.0, 124.0, 85.0, 63.0, 35.0, 28.0, 11.0, 16.0, 4.0, 4.0, 8.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.3125, -78.84765625, -76.3828125, -73.91796875, -71.453125, -68.98828125, -66.5234375, -64.05859375, -61.59375, -59.12890625, -56.6640625, -54.19921875, -51.734375, -49.26953125, -46.8046875, -44.33984375, -41.875, -39.41015625, -36.9453125, -34.48046875, -32.015625, -29.55078125, -27.0859375, -24.62109375, -22.15625, -19.69140625, -17.2265625, -14.76171875, -12.296875, -9.83203125, -7.3671875, -4.90234375, -2.4375, 0.02734375, 2.4921875, 4.95703125, 7.421875, 9.88671875, 12.3515625, 14.81640625, 17.28125, 19.74609375, 22.2109375, 24.67578125, 27.140625, 29.60546875, 32.0703125, 34.53515625, 37.0, 39.46484375, 41.9296875, 44.39453125, 46.859375, 49.32421875, 51.7890625, 54.25390625, 56.71875, 59.18359375, 61.6484375, 64.11328125, 66.578125, 69.04296875, 71.5078125, 73.97265625, 76.4375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 4.0, 6.0, 4.0, 3.0, 9.0, 16.0, 46.0, 125.0, 466.0, 191.0, 58.0, 24.0, 10.0, 9.0, 11.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003421783447265625, -0.0032829642295837402, -0.0031441450119018555, -0.0030053257942199707, -0.002866506576538086, -0.002727687358856201, -0.0025888681411743164, -0.0024500489234924316, -0.002311229705810547, -0.002172410488128662, -0.0020335912704467773, -0.0018947720527648926, -0.0017559528350830078, -0.001617133617401123, -0.0014783143997192383, -0.0013394951820373535, -0.0012006759643554688, -0.001061856746673584, -0.0009230375289916992, -0.0007842183113098145, -0.0006453990936279297, -0.0005065798759460449, -0.00036776065826416016, -0.0002289414405822754, -9.012222290039062e-05, 4.869699478149414e-05, 0.0001875162124633789, 0.00032633543014526367, 0.00046515464782714844, 0.0006039738655090332, 0.000742793083190918, 0.0008816123008728027, 0.0010204315185546875, 0.0011592507362365723, 0.001298069953918457, 0.0014368891716003418, 0.0015757083892822266, 0.0017145276069641113, 0.001853346824645996, 0.001992166042327881, 0.0021309852600097656, 0.0022698044776916504, 0.002408623695373535, 0.00254744291305542, 0.0026862621307373047, 0.0028250813484191895, 0.0029639005661010742, 0.003102719783782959, 0.0032415390014648438, 0.0033803582191467285, 0.0035191774368286133, 0.003657996654510498, 0.003796815872192383, 0.003935635089874268, 0.004074454307556152, 0.004213273525238037, 0.004352092742919922, 0.004490911960601807, 0.004629731178283691, 0.004768550395965576, 0.004907369613647461, 0.005046188831329346, 0.0051850080490112305, 0.005323827266693115, 0.005462646484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 8.0, 9.0, 21.0, 35.0, 48.0, 61.0, 83.0, 122.0, 154.0, 250.0, 284.0, 408.0, 574.0, 768.0, 1142.0, 1507.0, 2188.0, 3336.0, 5915.0, 15236.0, 97407.0, 733517.0, 148376.0, 18914.0, 6448.0, 3593.0, 2322.0, 1652.0, 1166.0, 826.0, 603.0, 460.0, 339.0, 216.0, 171.0, 127.0, 86.0, 59.0, 37.0, 21.0, 22.0, 21.0, 12.0, 5.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.28125, -48.8271484375, -47.373046875, -45.9189453125, -44.46484375, -43.0107421875, -41.556640625, -40.1025390625, -38.6484375, -37.1943359375, -35.740234375, -34.2861328125, -32.83203125, -31.3779296875, -29.923828125, -28.4697265625, -27.015625, -25.5615234375, -24.107421875, -22.6533203125, -21.19921875, -19.7451171875, -18.291015625, -16.8369140625, -15.3828125, -13.9287109375, -12.474609375, -11.0205078125, -9.56640625, -8.1123046875, -6.658203125, -5.2041015625, -3.75, -2.2958984375, -0.841796875, 0.6123046875, 2.06640625, 3.5205078125, 4.974609375, 6.4287109375, 7.8828125, 9.3369140625, 10.791015625, 12.2451171875, 13.69921875, 15.1533203125, 16.607421875, 18.0615234375, 19.515625, 20.9697265625, 22.423828125, 23.8779296875, 25.33203125, 26.7861328125, 28.240234375, 29.6943359375, 31.1484375, 32.6025390625, 34.056640625, 35.5107421875, 36.96484375, 38.4189453125, 39.873046875, 41.3271484375, 42.78125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 0.0, 10.0, 13.0, 13.0, 32.0, 51.0, 113.0, 165.0, 237.0, 168.0, 83.0, 49.0, 20.0, 13.0, 7.0, 5.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-14.6328125, -14.2177734375, -13.802734375, -13.3876953125, -12.97265625, -12.5576171875, -12.142578125, -11.7275390625, -11.3125, -10.8974609375, -10.482421875, -10.0673828125, -9.65234375, -9.2373046875, -8.822265625, -8.4072265625, -7.9921875, -7.5771484375, -7.162109375, -6.7470703125, -6.33203125, -5.9169921875, -5.501953125, -5.0869140625, -4.671875, -4.2568359375, -3.841796875, -3.4267578125, -3.01171875, -2.5966796875, -2.181640625, -1.7666015625, -1.3515625, -0.9365234375, -0.521484375, -0.1064453125, 0.30859375, 0.7236328125, 1.138671875, 1.5537109375, 1.96875, 2.3837890625, 2.798828125, 3.2138671875, 3.62890625, 4.0439453125, 4.458984375, 4.8740234375, 5.2890625, 5.7041015625, 6.119140625, 6.5341796875, 6.94921875, 7.3642578125, 7.779296875, 8.1943359375, 8.609375, 9.0244140625, 9.439453125, 9.8544921875, 10.26953125, 10.6845703125, 11.099609375, 11.5146484375, 11.9296875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 2.0, 16.0, 7.0, 12.0, 17.0, 19.0, 16.0, 17.0, 19.0, 31.0, 38.0, 31.0, 38.0, 56.0, 46.0, 48.0, 58.0, 50.0, 51.0, 49.0, 49.0, 29.0, 29.0, 33.0, 38.0, 28.0, 27.0, 20.0, 22.0, 17.0, 13.0, 9.0, 11.0, 11.0, 7.0, 6.0, 3.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-22.07265281677246, -21.362104415893555, -20.651554107666016, -19.94100570678711, -19.230457305908203, -18.519908905029297, -17.809358596801758, -17.09881019592285, -16.388261795043945, -15.677712440490723, -14.967164039611816, -14.256614685058594, -13.546066284179688, -12.835516929626465, -12.124967575073242, -11.414419174194336, -10.703869819641113, -9.99332046508789, -9.282772064208984, -8.572222709655762, -7.8616743087768555, -7.151124954223633, -6.440576076507568, -5.730027198791504, -5.0194783210754395, -4.308929443359375, -3.5983805656433105, -2.887831449508667, -2.1772825717926025, -1.466733694076538, -0.7561845779418945, -0.04563570022583008, 0.6649131774902344, 1.3754620552062988, 2.0860109329223633, 2.796560049057007, 3.5071089267730713, 4.217658042907715, 4.928206920623779, 5.638755798339844, 6.349304676055908, 7.059853553771973, 7.770402431488037, 8.480951309204102, 9.191500663757324, 9.90204906463623, 10.612598419189453, 11.32314682006836, 12.033696174621582, 12.744245529174805, 13.454793930053711, 14.165343284606934, 14.87589168548584, 15.586441040039062, 16.29698944091797, 17.007537841796875, 17.718088150024414, 18.42863655090332, 19.13918685913086, 19.849735260009766, 20.560283660888672, 21.270832061767578, 21.981382369995117, 22.691930770874023, 23.40247917175293]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 10.0, 10.0, 8.0, 13.0, 19.0, 17.0, 23.0, 28.0, 24.0, 25.0, 31.0, 35.0, 26.0, 35.0, 40.0, 28.0, 29.0, 46.0, 40.0, 36.0, 43.0, 39.0, 40.0, 44.0, 30.0, 24.0, 36.0, 40.0, 25.0, 24.0, 25.0, 19.0, 9.0, 11.0, 14.0, 11.0, 5.0, 8.0, 9.0, 6.0, 5.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.815587997436523, -19.05364418029785, -18.291698455810547, -17.529754638671875, -16.767810821533203, -16.0058650970459, -15.243921279907227, -14.481976509094238, -13.72003173828125, -12.958086967468262, -12.19614315032959, -11.434198379516602, -10.672253608703613, -9.910308837890625, -9.148365020751953, -8.386420249938965, -7.624476432800293, -6.862532138824463, -6.100587368011475, -5.3386430740356445, -4.576698303222656, -3.814754009246826, -3.052809715270996, -2.290864944458008, -1.5289206504821777, -0.7669761776924133, -0.005031704902648926, 0.7569127082824707, 1.5188572406768799, 2.280801773071289, 3.042746067047119, 3.8046908378601074, 4.5666351318359375, 5.328579425811768, 6.090524196624756, 6.852468490600586, 7.614413261413574, 8.376358032226562, 9.138301849365234, 9.900246620178223, 10.662191390991211, 11.4241361618042, 12.186079978942871, 12.94802474975586, 13.709969520568848, 14.471914291381836, 15.233858108520508, 15.995802879333496, 16.757747650146484, 17.519691467285156, 18.28163719177246, 19.043581008911133, 19.805524826049805, 20.56747055053711, 21.32941436767578, 22.091358184814453, 22.853302001953125, 23.615245819091797, 24.3771915435791, 25.139135360717773, 25.901079177856445, 26.66302490234375, 27.424968719482422, 28.186912536621094, 28.9488582611084]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 16.0, 24.0, 50.0, 67.0, 107.0, 195.0, 262.0, 456.0, 713.0, 1149.0, 1863.0, 2888.0, 4542.0, 6691.0, 10217.0, 14893.0, 21324.0, 29212.0, 39214.0, 51289.0, 62866.0, 74962.0, 84032.0, 90446.0, 92106.0, 88508.0, 80548.0, 69946.0, 57603.0, 45879.0, 34821.0, 26132.0, 18216.0, 12632.0, 8627.0, 5729.0, 3748.0, 2395.0, 1565.0, 984.0, 603.0, 416.0, 234.0, 156.0, 102.0, 45.0, 34.0, 23.0, 10.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.5, -13.0543212890625, -12.608642578125, -12.1629638671875, -11.71728515625, -11.2716064453125, -10.825927734375, -10.3802490234375, -9.9345703125, -9.4888916015625, -9.043212890625, -8.5975341796875, -8.15185546875, -7.7061767578125, -7.260498046875, -6.8148193359375, -6.369140625, -5.9234619140625, -5.477783203125, -5.0321044921875, -4.58642578125, -4.1407470703125, -3.695068359375, -3.2493896484375, -2.8037109375, -2.3580322265625, -1.912353515625, -1.4666748046875, -1.02099609375, -0.5753173828125, -0.129638671875, 0.3160400390625, 0.76171875, 1.2073974609375, 1.653076171875, 2.0987548828125, 2.54443359375, 2.9901123046875, 3.435791015625, 3.8814697265625, 4.3271484375, 4.7728271484375, 5.218505859375, 5.6641845703125, 6.10986328125, 6.5555419921875, 7.001220703125, 7.4468994140625, 7.892578125, 8.3382568359375, 8.783935546875, 9.2296142578125, 9.67529296875, 10.1209716796875, 10.566650390625, 11.0123291015625, 11.4580078125, 11.9036865234375, 12.349365234375, 12.7950439453125, 13.24072265625, 13.6864013671875, 14.132080078125, 14.5777587890625, 15.0234375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 1.0, 5.0, 4.0, 8.0, 10.0, 8.0, 13.0, 17.0, 18.0, 20.0, 30.0, 25.0, 23.0, 34.0, 35.0, 27.0, 34.0, 41.0, 27.0, 33.0, 41.0, 34.0, 42.0, 44.0, 40.0, 31.0, 44.0, 41.0, 22.0, 34.0, 39.0, 26.0, 25.0, 24.0, 17.0, 14.0, 10.0, 13.0, 10.0, 8.0, 8.0, 10.0, 4.0, 7.0, 2.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.421875, -18.679443359375, -17.93701171875, -17.194580078125, -16.4521484375, -15.709716796875, -14.96728515625, -14.224853515625, -13.482421875, -12.739990234375, -11.99755859375, -11.255126953125, -10.5126953125, -9.770263671875, -9.02783203125, -8.285400390625, -7.54296875, -6.800537109375, -6.05810546875, -5.315673828125, -4.5732421875, -3.830810546875, -3.08837890625, -2.345947265625, -1.603515625, -0.861083984375, -0.11865234375, 0.623779296875, 1.3662109375, 2.108642578125, 2.85107421875, 3.593505859375, 4.3359375, 5.078369140625, 5.82080078125, 6.563232421875, 7.3056640625, 8.048095703125, 8.79052734375, 9.532958984375, 10.275390625, 11.017822265625, 11.76025390625, 12.502685546875, 13.2451171875, 13.987548828125, 14.72998046875, 15.472412109375, 16.21484375, 16.957275390625, 17.69970703125, 18.442138671875, 19.1845703125, 19.927001953125, 20.66943359375, 21.411865234375, 22.154296875, 22.896728515625, 23.63916015625, 24.381591796875, 25.1240234375, 25.866455078125, 26.60888671875, 27.351318359375, 28.09375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 12.0, 13.0, 19.0, 21.0, 44.0, 42.0, 114.0, 147.0, 251.0, 460.0, 795.0, 1396.0, 2395.0, 4104.0, 6685.0, 10984.0, 17439.0, 27450.0, 40988.0, 57617.0, 76869.0, 95660.0, 110726.0, 116019.0, 112333.0, 99087.0, 81591.0, 61450.0, 44065.0, 29905.0, 19241.0, 12134.0, 7437.0, 4603.0, 2701.0, 1560.0, 898.0, 512.0, 328.0, 163.0, 108.0, 60.0, 47.0, 37.0, 14.0, 7.0, 8.0, 10.0, 6.0, 4.0, 0.0, 2.0], "bins": [-20.984375, -20.39501953125, -19.8056640625, -19.21630859375, -18.626953125, -18.03759765625, -17.4482421875, -16.85888671875, -16.26953125, -15.68017578125, -15.0908203125, -14.50146484375, -13.912109375, -13.32275390625, -12.7333984375, -12.14404296875, -11.5546875, -10.96533203125, -10.3759765625, -9.78662109375, -9.197265625, -8.60791015625, -8.0185546875, -7.42919921875, -6.83984375, -6.25048828125, -5.6611328125, -5.07177734375, -4.482421875, -3.89306640625, -3.3037109375, -2.71435546875, -2.125, -1.53564453125, -0.9462890625, -0.35693359375, 0.232421875, 0.82177734375, 1.4111328125, 2.00048828125, 2.58984375, 3.17919921875, 3.7685546875, 4.35791015625, 4.947265625, 5.53662109375, 6.1259765625, 6.71533203125, 7.3046875, 7.89404296875, 8.4833984375, 9.07275390625, 9.662109375, 10.25146484375, 10.8408203125, 11.43017578125, 12.01953125, 12.60888671875, 13.1982421875, 13.78759765625, 14.376953125, 14.96630859375, 15.5556640625, 16.14501953125, 16.734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 1.0, 6.0, 5.0, 7.0, 5.0, 10.0, 5.0, 16.0, 21.0, 26.0, 19.0, 24.0, 27.0, 33.0, 37.0, 34.0, 43.0, 59.0, 37.0, 41.0, 52.0, 50.0, 48.0, 59.0, 36.0, 32.0, 33.0, 32.0, 25.0, 22.0, 27.0, 24.0, 22.0, 14.0, 10.0, 17.0, 15.0, 4.0, 10.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.3125, -15.74609375, -15.1796875, -14.61328125, -14.046875, -13.48046875, -12.9140625, -12.34765625, -11.78125, -11.21484375, -10.6484375, -10.08203125, -9.515625, -8.94921875, -8.3828125, -7.81640625, -7.25, -6.68359375, -6.1171875, -5.55078125, -4.984375, -4.41796875, -3.8515625, -3.28515625, -2.71875, -2.15234375, -1.5859375, -1.01953125, -0.453125, 0.11328125, 0.6796875, 1.24609375, 1.8125, 2.37890625, 2.9453125, 3.51171875, 4.078125, 4.64453125, 5.2109375, 5.77734375, 6.34375, 6.91015625, 7.4765625, 8.04296875, 8.609375, 9.17578125, 9.7421875, 10.30859375, 10.875, 11.44140625, 12.0078125, 12.57421875, 13.140625, 13.70703125, 14.2734375, 14.83984375, 15.40625, 15.97265625, 16.5390625, 17.10546875, 17.671875, 18.23828125, 18.8046875, 19.37109375, 19.9375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 8.0, 15.0, 14.0, 16.0, 26.0, 38.0, 46.0, 61.0, 88.0, 152.0, 170.0, 280.0, 379.0, 515.0, 690.0, 1015.0, 1645.0, 2972.0, 5568.0, 12873.0, 32008.0, 82038.0, 176172.0, 262708.0, 236170.0, 134304.0, 56317.0, 22184.0, 9066.0, 4276.0, 2300.0, 1390.0, 883.0, 612.0, 442.0, 330.0, 208.0, 178.0, 102.0, 98.0, 66.0, 34.0, 27.0, 21.0, 13.0, 11.0, 10.0, 7.0, 6.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-18.03125, -17.44580078125, -16.8603515625, -16.27490234375, -15.689453125, -15.10400390625, -14.5185546875, -13.93310546875, -13.34765625, -12.76220703125, -12.1767578125, -11.59130859375, -11.005859375, -10.42041015625, -9.8349609375, -9.24951171875, -8.6640625, -8.07861328125, -7.4931640625, -6.90771484375, -6.322265625, -5.73681640625, -5.1513671875, -4.56591796875, -3.98046875, -3.39501953125, -2.8095703125, -2.22412109375, -1.638671875, -1.05322265625, -0.4677734375, 0.11767578125, 0.703125, 1.28857421875, 1.8740234375, 2.45947265625, 3.044921875, 3.63037109375, 4.2158203125, 4.80126953125, 5.38671875, 5.97216796875, 6.5576171875, 7.14306640625, 7.728515625, 8.31396484375, 8.8994140625, 9.48486328125, 10.0703125, 10.65576171875, 11.2412109375, 11.82666015625, 12.412109375, 12.99755859375, 13.5830078125, 14.16845703125, 14.75390625, 15.33935546875, 15.9248046875, 16.51025390625, 17.095703125, 17.68115234375, 18.2666015625, 18.85205078125, 19.4375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 4.0, 4.0, 10.0, 10.0, 23.0, 22.0, 43.0, 43.0, 42.0, 63.0, 72.0, 82.0, 71.0, 84.0, 75.0, 58.0, 77.0, 62.0, 47.0, 31.0, 31.0, 16.0, 12.0, 6.0, 5.0, 1.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016622543334960938, -0.0016087591648101807, -0.0015552639961242676, -0.0015017688274383545, -0.0014482736587524414, -0.0013947784900665283, -0.0013412833213806152, -0.0012877881526947021, -0.001234292984008789, -0.001180797815322876, -0.0011273026466369629, -0.0010738074779510498, -0.0010203123092651367, -0.0009668171405792236, -0.0009133219718933105, -0.0008598268032073975, -0.0008063316345214844, -0.0007528364658355713, -0.0006993412971496582, -0.0006458461284637451, -0.000592350959777832, -0.0005388557910919189, -0.00048536062240600586, -0.0004318654537200928, -0.0003783702850341797, -0.0003248751163482666, -0.0002713799476623535, -0.00021788477897644043, -0.00016438961029052734, -0.00011089444160461426, -5.739927291870117e-05, -3.904104232788086e-06, 4.9591064453125e-05, 0.00010308623313903809, 0.00015658140182495117, 0.00021007657051086426, 0.00026357173919677734, 0.00031706690788269043, 0.0003705620765686035, 0.0004240572452545166, 0.0004775524139404297, 0.0005310475826263428, 0.0005845427513122559, 0.0006380379199981689, 0.000691533088684082, 0.0007450282573699951, 0.0007985234260559082, 0.0008520185947418213, 0.0009055137634277344, 0.0009590089321136475, 0.0010125041007995605, 0.0010659992694854736, 0.0011194944381713867, 0.0011729896068572998, 0.0012264847755432129, 0.001279979944229126, 0.001333475112915039, 0.0013869702816009521, 0.0014404654502868652, 0.0014939606189727783, 0.0015474557876586914, 0.0016009509563446045, 0.0016544461250305176, 0.0017079412937164307, 0.0017614364624023438]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 3.0, 1.0, 7.0, 4.0, 4.0, 4.0, 12.0, 14.0, 24.0, 40.0, 44.0, 68.0, 97.0, 145.0, 229.0, 367.0, 515.0, 768.0, 1262.0, 2160.0, 3747.0, 6916.0, 13715.0, 28132.0, 56587.0, 106913.0, 169030.0, 206330.0, 185021.0, 125040.0, 69424.0, 34982.0, 17136.0, 8549.0, 4517.0, 2483.0, 1521.0, 928.0, 587.0, 408.0, 257.0, 176.0, 143.0, 64.0, 49.0, 41.0, 34.0, 23.0, 8.0, 8.0, 6.0, 6.0, 6.0, 3.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8125, -13.3466796875, -12.880859375, -12.4150390625, -11.94921875, -11.4833984375, -11.017578125, -10.5517578125, -10.0859375, -9.6201171875, -9.154296875, -8.6884765625, -8.22265625, -7.7568359375, -7.291015625, -6.8251953125, -6.359375, -5.8935546875, -5.427734375, -4.9619140625, -4.49609375, -4.0302734375, -3.564453125, -3.0986328125, -2.6328125, -2.1669921875, -1.701171875, -1.2353515625, -0.76953125, -0.3037109375, 0.162109375, 0.6279296875, 1.09375, 1.5595703125, 2.025390625, 2.4912109375, 2.95703125, 3.4228515625, 3.888671875, 4.3544921875, 4.8203125, 5.2861328125, 5.751953125, 6.2177734375, 6.68359375, 7.1494140625, 7.615234375, 8.0810546875, 8.546875, 9.0126953125, 9.478515625, 9.9443359375, 10.41015625, 10.8759765625, 11.341796875, 11.8076171875, 12.2734375, 12.7392578125, 13.205078125, 13.6708984375, 14.13671875, 14.6025390625, 15.068359375, 15.5341796875, 16.0]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 4.0, 7.0, 3.0, 9.0, 9.0, 13.0, 16.0, 17.0, 18.0, 34.0, 24.0, 39.0, 52.0, 68.0, 79.0, 87.0, 71.0, 63.0, 56.0, 65.0, 46.0, 35.0, 38.0, 26.0, 33.0, 16.0, 11.0, 12.0, 11.0, 8.0, 4.0, 9.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1171875, -4.93707275390625, -4.7569580078125, -4.57684326171875, -4.396728515625, -4.21661376953125, -4.0364990234375, -3.85638427734375, -3.67626953125, -3.49615478515625, -3.3160400390625, -3.13592529296875, -2.955810546875, -2.77569580078125, -2.5955810546875, -2.41546630859375, -2.2353515625, -2.05523681640625, -1.8751220703125, -1.69500732421875, -1.514892578125, -1.33477783203125, -1.1546630859375, -0.97454833984375, -0.79443359375, -0.61431884765625, -0.4342041015625, -0.25408935546875, -0.073974609375, 0.10614013671875, 0.2862548828125, 0.46636962890625, 0.646484375, 0.82659912109375, 1.0067138671875, 1.18682861328125, 1.366943359375, 1.54705810546875, 1.7271728515625, 1.90728759765625, 2.08740234375, 2.26751708984375, 2.4476318359375, 2.62774658203125, 2.807861328125, 2.98797607421875, 3.1680908203125, 3.34820556640625, 3.5283203125, 3.70843505859375, 3.8885498046875, 4.06866455078125, 4.248779296875, 4.42889404296875, 4.6090087890625, 4.78912353515625, 4.96923828125, 5.14935302734375, 5.3294677734375, 5.50958251953125, 5.689697265625, 5.86981201171875, 6.0499267578125, 6.23004150390625, 6.41015625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 5.0, 5.0, 5.0, 3.0, 15.0, 14.0, 19.0, 27.0, 19.0, 32.0, 30.0, 30.0, 43.0, 42.0, 45.0, 46.0, 57.0, 53.0, 60.0, 44.0, 48.0, 52.0, 32.0, 42.0, 50.0, 28.0, 12.0, 23.0, 24.0, 19.0, 14.0, 11.0, 7.0, 10.0, 8.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.198631286621094, -24.416845321655273, -23.635061264038086, -22.853275299072266, -22.071489334106445, -21.289703369140625, -20.507919311523438, -19.726133346557617, -18.944347381591797, -18.162561416625977, -17.38077735900879, -16.59899139404297, -15.817205429077148, -15.035420417785645, -14.25363540649414, -13.47184944152832, -12.690065383911133, -11.908280372619629, -11.126494407653809, -10.344709396362305, -9.562923431396484, -8.78113842010498, -7.999353408813477, -7.2175679206848145, -6.435782432556152, -5.65399694442749, -4.872211456298828, -4.090426445007324, -3.308640956878662, -2.52685546875, -1.745070457458496, -0.963284969329834, -0.18149948120117188, 0.6002858877182007, 1.3820712566375732, 2.1638565063476562, 2.9456419944763184, 3.7274274826049805, 4.509212493896484, 5.2909979820251465, 6.072783470153809, 6.854568958282471, 7.636354446411133, 8.418139457702637, 9.19992446899414, 9.981710433959961, 10.763495445251465, 11.545280456542969, 12.327066421508789, 13.108851432800293, 13.890637397766113, 14.672422409057617, 15.454208374023438, 16.235992431640625, 17.017778396606445, 17.799564361572266, 18.581348419189453, 19.363134384155273, 20.14491844177246, 20.92670440673828, 21.7084903717041, 22.490276336669922, 23.27206039428711, 24.05384635925293, 24.83563232421875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 3.0, 4.0, 5.0, 12.0, 11.0, 14.0, 11.0, 10.0, 20.0, 20.0, 19.0, 21.0, 20.0, 23.0, 19.0, 34.0, 25.0, 32.0, 27.0, 32.0, 31.0, 36.0, 33.0, 29.0, 35.0, 32.0, 32.0, 34.0, 37.0, 42.0, 29.0, 27.0, 36.0, 20.0, 18.0, 25.0, 25.0, 20.0, 18.0, 13.0, 10.0, 9.0, 10.0, 7.0, 6.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-21.15036964416504, -20.481014251708984, -19.81165885925293, -19.142303466796875, -18.472949981689453, -17.8035945892334, -17.134239196777344, -16.46488380432129, -15.795528411865234, -15.12617301940918, -14.456817626953125, -13.787463188171387, -13.118107795715332, -12.448752403259277, -11.779397964477539, -11.110042572021484, -10.44068717956543, -9.771331787109375, -9.10197639465332, -8.432621955871582, -7.763266563415527, -7.093911170959473, -6.424556255340576, -5.75520133972168, -5.085845947265625, -4.41649055480957, -3.747135639190674, -3.0777804851531982, -2.4084253311157227, -1.739070177078247, -1.0697150230407715, -0.400360107421875, 0.2689952850341797, 0.9383504390716553, 1.6077055931091309, 2.2770607471466064, 2.946415901184082, 3.6157710552215576, 4.285126209259033, 4.95448112487793, 5.623836517333984, 6.293191909790039, 6.9625468254089355, 7.631901741027832, 8.301257133483887, 8.970612525939941, 9.63996696472168, 10.309322357177734, 10.978677749633789, 11.648033142089844, 12.317388534545898, 12.986742973327637, 13.656098365783691, 14.325453758239746, 14.994808197021484, 15.664163589477539, 16.333518981933594, 17.00287437438965, 17.672229766845703, 18.341585159301758, 19.010940551757812, 19.680294036865234, 20.34964942932129, 21.019004821777344, 21.6883602142334]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [3.0, 3.0, 7.0, 7.0, 12.0, 19.0, 31.0, 33.0, 86.0, 146.0, 187.0, 353.0, 588.0, 937.0, 1544.0, 2450.0, 4149.0, 6342.0, 10420.0, 16475.0, 26045.0, 39857.0, 61607.0, 89479.0, 127845.0, 177793.0, 234733.0, 294359.0, 351701.0, 391177.0, 409108.0, 399254.0, 362479.0, 311333.0, 250852.0, 191614.0, 140592.0, 99206.0, 68019.0, 44551.0, 28833.0, 18812.0, 11821.0, 7630.0, 4513.0, 2872.0, 1685.0, 1114.0, 635.0, 351.0, 247.0, 144.0, 102.0, 54.0, 44.0, 17.0, 16.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-14.53125, -14.056884765625, -13.58251953125, -13.108154296875, -12.6337890625, -12.159423828125, -11.68505859375, -11.210693359375, -10.736328125, -10.261962890625, -9.78759765625, -9.313232421875, -8.8388671875, -8.364501953125, -7.89013671875, -7.415771484375, -6.94140625, -6.467041015625, -5.99267578125, -5.518310546875, -5.0439453125, -4.569580078125, -4.09521484375, -3.620849609375, -3.146484375, -2.672119140625, -2.19775390625, -1.723388671875, -1.2490234375, -0.774658203125, -0.30029296875, 0.174072265625, 0.6484375, 1.122802734375, 1.59716796875, 2.071533203125, 2.5458984375, 3.020263671875, 3.49462890625, 3.968994140625, 4.443359375, 4.917724609375, 5.39208984375, 5.866455078125, 6.3408203125, 6.815185546875, 7.28955078125, 7.763916015625, 8.23828125, 8.712646484375, 9.18701171875, 9.661376953125, 10.1357421875, 10.610107421875, 11.08447265625, 11.558837890625, 12.033203125, 12.507568359375, 12.98193359375, 13.456298828125, 13.9306640625, 14.405029296875, 14.87939453125, 15.353759765625, 15.828125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 5.0, 3.0, 5.0, 11.0, 14.0, 14.0, 9.0, 16.0, 15.0, 21.0, 18.0, 21.0, 17.0, 27.0, 19.0, 33.0, 26.0, 32.0, 32.0, 30.0, 33.0, 34.0, 27.0, 37.0, 32.0, 25.0, 44.0, 38.0, 28.0, 42.0, 26.0, 33.0, 30.0, 23.0, 18.0, 23.0, 24.0, 18.0, 20.0, 10.0, 11.0, 10.0, 10.0, 7.0, 6.0, 6.0, 2.0, 3.0, 5.0, 1.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0], "bins": [-18.875, -18.27685546875, -17.6787109375, -17.08056640625, -16.482421875, -15.88427734375, -15.2861328125, -14.68798828125, -14.08984375, -13.49169921875, -12.8935546875, -12.29541015625, -11.697265625, -11.09912109375, -10.5009765625, -9.90283203125, -9.3046875, -8.70654296875, -8.1083984375, -7.51025390625, -6.912109375, -6.31396484375, -5.7158203125, -5.11767578125, -4.51953125, -3.92138671875, -3.3232421875, -2.72509765625, -2.126953125, -1.52880859375, -0.9306640625, -0.33251953125, 0.265625, 0.86376953125, 1.4619140625, 2.06005859375, 2.658203125, 3.25634765625, 3.8544921875, 4.45263671875, 5.05078125, 5.64892578125, 6.2470703125, 6.84521484375, 7.443359375, 8.04150390625, 8.6396484375, 9.23779296875, 9.8359375, 10.43408203125, 11.0322265625, 11.63037109375, 12.228515625, 12.82666015625, 13.4248046875, 14.02294921875, 14.62109375, 15.21923828125, 15.8173828125, 16.41552734375, 17.013671875, 17.61181640625, 18.2099609375, 18.80810546875, 19.40625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 8.0, 11.0, 19.0, 41.0, 61.0, 117.0, 203.0, 328.0, 565.0, 952.0, 1564.0, 2693.0, 4289.0, 7239.0, 11311.0, 17850.0, 27378.0, 41327.0, 61608.0, 86146.0, 119107.0, 160455.0, 205664.0, 254951.0, 299388.0, 337130.0, 359313.0, 364122.0, 350017.0, 321554.0, 278834.0, 231601.0, 184797.0, 139950.0, 103724.0, 74085.0, 50812.0, 34181.0, 22257.0, 14759.0, 9134.0, 5711.0, 3635.0, 2209.0, 1289.0, 787.0, 430.0, 273.0, 174.0, 102.0, 46.0, 36.0, 21.0, 20.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-15.2109375, -14.7244873046875, -14.238037109375, -13.7515869140625, -13.26513671875, -12.7786865234375, -12.292236328125, -11.8057861328125, -11.3193359375, -10.8328857421875, -10.346435546875, -9.8599853515625, -9.37353515625, -8.8870849609375, -8.400634765625, -7.9141845703125, -7.427734375, -6.9412841796875, -6.454833984375, -5.9683837890625, -5.48193359375, -4.9954833984375, -4.509033203125, -4.0225830078125, -3.5361328125, -3.0496826171875, -2.563232421875, -2.0767822265625, -1.59033203125, -1.1038818359375, -0.617431640625, -0.1309814453125, 0.35546875, 0.8419189453125, 1.328369140625, 1.8148193359375, 2.30126953125, 2.7877197265625, 3.274169921875, 3.7606201171875, 4.2470703125, 4.7335205078125, 5.219970703125, 5.7064208984375, 6.19287109375, 6.6793212890625, 7.165771484375, 7.6522216796875, 8.138671875, 8.6251220703125, 9.111572265625, 9.5980224609375, 10.08447265625, 10.5709228515625, 11.057373046875, 11.5438232421875, 12.0302734375, 12.5167236328125, 13.003173828125, 13.4896240234375, 13.97607421875, 14.4625244140625, 14.948974609375, 15.4354248046875, 15.921875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 7.0, 12.0, 20.0, 28.0, 25.0, 30.0, 45.0, 47.0, 46.0, 81.0, 72.0, 104.0, 125.0, 112.0, 142.0, 169.0, 205.0, 196.0, 200.0, 173.0, 202.0, 189.0, 201.0, 218.0, 180.0, 158.0, 153.0, 129.0, 130.0, 140.0, 106.0, 82.0, 69.0, 62.0, 47.0, 40.0, 33.0, 18.0, 13.0, 22.0, 8.0, 9.0, 8.0, 9.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.60546875, -8.296875, -7.98828125, -7.6796875, -7.37109375, -7.0625, -6.75390625, -6.4453125, -6.13671875, -5.828125, -5.51953125, -5.2109375, -4.90234375, -4.59375, -4.28515625, -3.9765625, -3.66796875, -3.359375, -3.05078125, -2.7421875, -2.43359375, -2.125, -1.81640625, -1.5078125, -1.19921875, -0.890625, -0.58203125, -0.2734375, 0.03515625, 0.34375, 0.65234375, 0.9609375, 1.26953125, 1.578125, 1.88671875, 2.1953125, 2.50390625, 2.8125, 3.12109375, 3.4296875, 3.73828125, 4.046875, 4.35546875, 4.6640625, 4.97265625, 5.28125, 5.58984375, 5.8984375, 6.20703125, 6.515625, 6.82421875, 7.1328125, 7.44140625, 7.75, 8.05859375, 8.3671875, 8.67578125, 8.984375, 9.29296875, 9.6015625, 9.91015625, 10.21875, 10.52734375, 10.8359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 5.0, 7.0, 3.0, 8.0, 16.0, 10.0, 14.0, 16.0, 17.0, 24.0, 27.0, 36.0, 28.0, 24.0, 47.0, 49.0, 51.0, 41.0, 39.0, 38.0, 47.0, 42.0, 53.0, 36.0, 32.0, 35.0, 34.0, 34.0, 21.0, 25.0, 29.0, 20.0, 14.0, 9.0, 17.0, 17.0, 11.0, 9.0, 7.0, 3.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.3278751373291, -23.574804306030273, -22.821733474731445, -22.068662643432617, -21.31559181213379, -20.562522888183594, -19.809452056884766, -19.056381225585938, -18.30331039428711, -17.55023956298828, -16.797168731689453, -16.044097900390625, -15.291028022766113, -14.537957191467285, -13.784886360168457, -13.031816482543945, -12.2787446975708, -11.525673866271973, -10.772603034973145, -10.019533157348633, -9.266462326049805, -8.513391494750977, -7.760320663452148, -7.0072503089904785, -6.25417947769165, -5.501108646392822, -4.748038291931152, -3.994967460632324, -3.241896867752075, -2.488826274871826, -1.735755443572998, -0.9826850891113281, -0.2296142578125, 0.5234563946723938, 1.2765270471572876, 2.029597759246826, 2.782668352127075, 3.535738945007324, 4.288809776306152, 5.041880130767822, 5.79495096206665, 6.5480217933654785, 7.301092147827148, 8.054162979125977, 8.807233810424805, 9.560304641723633, 10.313375473022461, 11.066445350646973, 11.8195161819458, 12.572587013244629, 13.325657844543457, 14.078727722167969, 14.831798553466797, 15.584869384765625, 16.337940216064453, 17.09101104736328, 17.84408187866211, 18.597152709960938, 19.350223541259766, 20.103294372558594, 20.856365203857422, 21.60943603515625, 22.362506866455078, 23.115575790405273, 23.8686466217041]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 9.0, 6.0, 14.0, 13.0, 14.0, 12.0, 15.0, 20.0, 26.0, 26.0, 24.0, 23.0, 23.0, 38.0, 36.0, 42.0, 30.0, 43.0, 48.0, 30.0, 41.0, 27.0, 45.0, 34.0, 37.0, 37.0, 50.0, 27.0, 25.0, 24.0, 21.0, 20.0, 20.0, 10.0, 15.0, 16.0, 14.0, 11.0, 5.0, 5.0, 3.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-25.413476943969727, -24.641132354736328, -23.868785858154297, -23.0964412689209, -22.3240966796875, -21.5517520904541, -20.779407501220703, -20.007061004638672, -19.234716415405273, -18.462371826171875, -17.690025329589844, -16.917680740356445, -16.145336151123047, -15.372991561889648, -14.600646018981934, -13.828300476074219, -13.05595588684082, -12.283611297607422, -11.511265754699707, -10.738920211791992, -9.966575622558594, -9.194231033325195, -8.42188549041748, -7.649540424346924, -6.877195358276367, -6.1048502922058105, -5.332505226135254, -4.560160160064697, -3.7878150939941406, -3.015470027923584, -2.2431249618530273, -1.4707798957824707, -0.6984348297119141, 0.07391023635864258, 0.8462553024291992, 1.6186003684997559, 2.3909454345703125, 3.163290500640869, 3.935635566711426, 4.707980632781982, 5.480325698852539, 6.252670764923096, 7.025015830993652, 7.797360897064209, 8.569705963134766, 9.342050552368164, 10.114396095275879, 10.886741638183594, 11.659086227416992, 12.43143081665039, 13.203776359558105, 13.97612190246582, 14.748466491699219, 15.520811080932617, 16.293155670166016, 17.065502166748047, 17.837846755981445, 18.610191345214844, 19.382537841796875, 20.154882431030273, 20.927227020263672, 21.69957160949707, 22.47191619873047, 23.2442626953125, 24.0166072845459]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 6.0, 9.0, 9.0, 26.0, 42.0, 57.0, 104.0, 155.0, 249.0, 427.0, 658.0, 1158.0, 1800.0, 3017.0, 4805.0, 7820.0, 12455.0, 19263.0, 30219.0, 46887.0, 69924.0, 98558.0, 129280.0, 146720.0, 137867.0, 108962.0, 78968.0, 53641.0, 34879.0, 22445.0, 14401.0, 8961.0, 5595.0, 3534.0, 2109.0, 1296.0, 866.0, 524.0, 306.0, 207.0, 132.0, 78.0, 38.0, 26.0, 22.0, 20.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-9.875, -9.5816650390625, -9.288330078125, -8.9949951171875, -8.70166015625, -8.4083251953125, -8.114990234375, -7.8216552734375, -7.5283203125, -7.2349853515625, -6.941650390625, -6.6483154296875, -6.35498046875, -6.0616455078125, -5.768310546875, -5.4749755859375, -5.181640625, -4.8883056640625, -4.594970703125, -4.3016357421875, -4.00830078125, -3.7149658203125, -3.421630859375, -3.1282958984375, -2.8349609375, -2.5416259765625, -2.248291015625, -1.9549560546875, -1.66162109375, -1.3682861328125, -1.074951171875, -0.7816162109375, -0.48828125, -0.1949462890625, 0.098388671875, 0.3917236328125, 0.68505859375, 0.9783935546875, 1.271728515625, 1.5650634765625, 1.8583984375, 2.1517333984375, 2.445068359375, 2.7384033203125, 3.03173828125, 3.3250732421875, 3.618408203125, 3.9117431640625, 4.205078125, 4.4984130859375, 4.791748046875, 5.0850830078125, 5.37841796875, 5.6717529296875, 5.965087890625, 6.2584228515625, 6.5517578125, 6.8450927734375, 7.138427734375, 7.4317626953125, 7.72509765625, 8.0184326171875, 8.311767578125, 8.6051025390625, 8.8984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 8.0, 7.0, 12.0, 14.0, 15.0, 11.0, 14.0, 22.0, 25.0, 26.0, 24.0, 22.0, 26.0, 36.0, 37.0, 42.0, 32.0, 41.0, 46.0, 30.0, 43.0, 31.0, 39.0, 35.0, 35.0, 38.0, 48.0, 28.0, 26.0, 26.0, 22.0, 18.0, 19.0, 11.0, 17.0, 16.0, 12.0, 13.0, 3.0, 6.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-25.5, -24.726806640625, -23.95361328125, -23.180419921875, -22.4072265625, -21.634033203125, -20.86083984375, -20.087646484375, -19.314453125, -18.541259765625, -17.76806640625, -16.994873046875, -16.2216796875, -15.448486328125, -14.67529296875, -13.902099609375, -13.12890625, -12.355712890625, -11.58251953125, -10.809326171875, -10.0361328125, -9.262939453125, -8.48974609375, -7.716552734375, -6.943359375, -6.170166015625, -5.39697265625, -4.623779296875, -3.8505859375, -3.077392578125, -2.30419921875, -1.531005859375, -0.7578125, 0.015380859375, 0.78857421875, 1.561767578125, 2.3349609375, 3.108154296875, 3.88134765625, 4.654541015625, 5.427734375, 6.200927734375, 6.97412109375, 7.747314453125, 8.5205078125, 9.293701171875, 10.06689453125, 10.840087890625, 11.61328125, 12.386474609375, 13.15966796875, 13.932861328125, 14.7060546875, 15.479248046875, 16.25244140625, 17.025634765625, 17.798828125, 18.572021484375, 19.34521484375, 20.118408203125, 20.8916015625, 21.664794921875, 22.43798828125, 23.211181640625, 23.984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 7.0, 12.0, 15.0, 22.0, 30.0, 31.0, 62.0, 67.0, 121.0, 164.0, 264.0, 391.0, 564.0, 813.0, 1427.0, 2080.0, 3392.0, 5935.0, 10170.0, 18986.0, 37219.0, 79821.0, 181041.0, 313079.0, 208980.0, 91979.0, 42465.0, 21326.0, 11404.0, 6313.0, 3803.0, 2262.0, 1486.0, 903.0, 639.0, 369.0, 294.0, 185.0, 131.0, 103.0, 55.0, 39.0, 36.0, 20.0, 16.0, 17.0, 5.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0], "bins": [-14.15625, -13.7081298828125, -13.260009765625, -12.8118896484375, -12.36376953125, -11.9156494140625, -11.467529296875, -11.0194091796875, -10.5712890625, -10.1231689453125, -9.675048828125, -9.2269287109375, -8.77880859375, -8.3306884765625, -7.882568359375, -7.4344482421875, -6.986328125, -6.5382080078125, -6.090087890625, -5.6419677734375, -5.19384765625, -4.7457275390625, -4.297607421875, -3.8494873046875, -3.4013671875, -2.9532470703125, -2.505126953125, -2.0570068359375, -1.60888671875, -1.1607666015625, -0.712646484375, -0.2645263671875, 0.18359375, 0.6317138671875, 1.079833984375, 1.5279541015625, 1.97607421875, 2.4241943359375, 2.872314453125, 3.3204345703125, 3.7685546875, 4.2166748046875, 4.664794921875, 5.1129150390625, 5.56103515625, 6.0091552734375, 6.457275390625, 6.9053955078125, 7.353515625, 7.8016357421875, 8.249755859375, 8.6978759765625, 9.14599609375, 9.5941162109375, 10.042236328125, 10.4903564453125, 10.9384765625, 11.3865966796875, 11.834716796875, 12.2828369140625, 12.73095703125, 13.1790771484375, 13.627197265625, 14.0753173828125, 14.5234375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 6.0, 10.0, 7.0, 10.0, 17.0, 12.0, 14.0, 15.0, 22.0, 18.0, 29.0, 35.0, 33.0, 30.0, 28.0, 27.0, 45.0, 56.0, 35.0, 40.0, 47.0, 50.0, 38.0, 50.0, 40.0, 37.0, 34.0, 37.0, 33.0, 26.0, 28.0, 16.0, 13.0, 17.0, 15.0, 8.0, 6.0, 5.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.03125, -22.3837890625, -21.736328125, -21.0888671875, -20.44140625, -19.7939453125, -19.146484375, -18.4990234375, -17.8515625, -17.2041015625, -16.556640625, -15.9091796875, -15.26171875, -14.6142578125, -13.966796875, -13.3193359375, -12.671875, -12.0244140625, -11.376953125, -10.7294921875, -10.08203125, -9.4345703125, -8.787109375, -8.1396484375, -7.4921875, -6.8447265625, -6.197265625, -5.5498046875, -4.90234375, -4.2548828125, -3.607421875, -2.9599609375, -2.3125, -1.6650390625, -1.017578125, -0.3701171875, 0.27734375, 0.9248046875, 1.572265625, 2.2197265625, 2.8671875, 3.5146484375, 4.162109375, 4.8095703125, 5.45703125, 6.1044921875, 6.751953125, 7.3994140625, 8.046875, 8.6943359375, 9.341796875, 9.9892578125, 10.63671875, 11.2841796875, 11.931640625, 12.5791015625, 13.2265625, 13.8740234375, 14.521484375, 15.1689453125, 15.81640625, 16.4638671875, 17.111328125, 17.7587890625, 18.40625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 9.0, 5.0, 6.0, 8.0, 11.0, 11.0, 24.0, 45.0, 56.0, 88.0, 148.0, 240.0, 435.0, 739.0, 1508.0, 3006.0, 6354.0, 14743.0, 40935.0, 152550.0, 559286.0, 189411.0, 47933.0, 16976.0, 7090.0, 3359.0, 1650.0, 786.0, 458.0, 267.0, 170.0, 86.0, 56.0, 48.0, 19.0, 10.0, 16.0, 5.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.6640625, -15.1678466796875, -14.671630859375, -14.1754150390625, -13.67919921875, -13.1829833984375, -12.686767578125, -12.1905517578125, -11.6943359375, -11.1981201171875, -10.701904296875, -10.2056884765625, -9.70947265625, -9.2132568359375, -8.717041015625, -8.2208251953125, -7.724609375, -7.2283935546875, -6.732177734375, -6.2359619140625, -5.73974609375, -5.2435302734375, -4.747314453125, -4.2510986328125, -3.7548828125, -3.2586669921875, -2.762451171875, -2.2662353515625, -1.77001953125, -1.2738037109375, -0.777587890625, -0.2813720703125, 0.21484375, 0.7110595703125, 1.207275390625, 1.7034912109375, 2.19970703125, 2.6959228515625, 3.192138671875, 3.6883544921875, 4.1845703125, 4.6807861328125, 5.177001953125, 5.6732177734375, 6.16943359375, 6.6656494140625, 7.161865234375, 7.6580810546875, 8.154296875, 8.6505126953125, 9.146728515625, 9.6429443359375, 10.13916015625, 10.6353759765625, 11.131591796875, 11.6278076171875, 12.1240234375, 12.6202392578125, 13.116455078125, 13.6126708984375, 14.10888671875, 14.6051025390625, 15.101318359375, 15.5975341796875, 16.09375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 1.0, 8.0, 6.0, 5.0, 17.0, 22.0, 24.0, 38.0, 61.0, 75.0, 92.0, 134.0, 116.0, 103.0, 77.0, 62.0, 40.0, 19.0, 22.0, 18.0, 16.0, 10.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.001338958740234375, -0.0013018399477005005, -0.001264721155166626, -0.0012276023626327515, -0.001190483570098877, -0.0011533647775650024, -0.001116245985031128, -0.0010791271924972534, -0.001042008399963379, -0.0010048896074295044, -0.0009677708148956299, -0.0009306520223617554, -0.0008935332298278809, -0.0008564144372940063, -0.0008192956447601318, -0.0007821768522262573, -0.0007450580596923828, -0.0007079392671585083, -0.0006708204746246338, -0.0006337016820907593, -0.0005965828895568848, -0.0005594640970230103, -0.0005223453044891357, -0.00048522651195526123, -0.0004481077194213867, -0.0004109889268875122, -0.0003738701343536377, -0.0003367513418197632, -0.00029963254928588867, -0.00026251375675201416, -0.00022539496421813965, -0.00018827617168426514, -0.00015115737915039062, -0.00011403858661651611, -7.69197940826416e-05, -3.980100154876709e-05, -2.682209014892578e-06, 3.4436583518981934e-05, 7.155537605285645e-05, 0.00010867416858673096, 0.00014579296112060547, 0.00018291175365447998, 0.0002200305461883545, 0.000257149338722229, 0.0002942681312561035, 0.00033138692378997803, 0.00036850571632385254, 0.00040562450885772705, 0.00044274330139160156, 0.0004798620939254761, 0.0005169808864593506, 0.0005540996789932251, 0.0005912184715270996, 0.0006283372640609741, 0.0006654560565948486, 0.0007025748491287231, 0.0007396936416625977, 0.0007768124341964722, 0.0008139312267303467, 0.0008510500192642212, 0.0008881688117980957, 0.0009252876043319702, 0.0009624063968658447, 0.0009995251893997192, 0.0010366439819335938]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 14.0, 13.0, 17.0, 29.0, 29.0, 57.0, 87.0, 128.0, 222.0, 318.0, 551.0, 885.0, 1530.0, 2619.0, 4593.0, 8719.0, 16104.0, 30188.0, 55233.0, 99065.0, 162164.0, 210677.0, 184236.0, 120181.0, 68746.0, 37467.0, 19957.0, 11013.0, 5852.0, 3270.0, 1878.0, 1012.0, 635.0, 380.0, 245.0, 128.0, 86.0, 69.0, 41.0, 19.0, 25.0, 23.0, 14.0, 11.0, 7.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9609375, -9.6561279296875, -9.351318359375, -9.0465087890625, -8.74169921875, -8.4368896484375, -8.132080078125, -7.8272705078125, -7.5224609375, -7.2176513671875, -6.912841796875, -6.6080322265625, -6.30322265625, -5.9984130859375, -5.693603515625, -5.3887939453125, -5.083984375, -4.7791748046875, -4.474365234375, -4.1695556640625, -3.86474609375, -3.5599365234375, -3.255126953125, -2.9503173828125, -2.6455078125, -2.3406982421875, -2.035888671875, -1.7310791015625, -1.42626953125, -1.1214599609375, -0.816650390625, -0.5118408203125, -0.20703125, 0.0977783203125, 0.402587890625, 0.7073974609375, 1.01220703125, 1.3170166015625, 1.621826171875, 1.9266357421875, 2.2314453125, 2.5362548828125, 2.841064453125, 3.1458740234375, 3.45068359375, 3.7554931640625, 4.060302734375, 4.3651123046875, 4.669921875, 4.9747314453125, 5.279541015625, 5.5843505859375, 5.88916015625, 6.1939697265625, 6.498779296875, 6.8035888671875, 7.1083984375, 7.4132080078125, 7.718017578125, 8.0228271484375, 8.32763671875, 8.6324462890625, 8.937255859375, 9.2420654296875, 9.546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 6.0, 9.0, 10.0, 8.0, 9.0, 22.0, 19.0, 25.0, 27.0, 47.0, 41.0, 60.0, 66.0, 58.0, 59.0, 64.0, 60.0, 54.0, 44.0, 54.0, 37.0, 31.0, 35.0, 31.0, 19.0, 13.0, 18.0, 18.0, 7.0, 5.0, 8.0, 4.0, 1.0, 9.0, 1.0, 7.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.94140625, -3.8251953125, -3.708984375, -3.5927734375, -3.4765625, -3.3603515625, -3.244140625, -3.1279296875, -3.01171875, -2.8955078125, -2.779296875, -2.6630859375, -2.546875, -2.4306640625, -2.314453125, -2.1982421875, -2.08203125, -1.9658203125, -1.849609375, -1.7333984375, -1.6171875, -1.5009765625, -1.384765625, -1.2685546875, -1.15234375, -1.0361328125, -0.919921875, -0.8037109375, -0.6875, -0.5712890625, -0.455078125, -0.3388671875, -0.22265625, -0.1064453125, 0.009765625, 0.1259765625, 0.2421875, 0.3583984375, 0.474609375, 0.5908203125, 0.70703125, 0.8232421875, 0.939453125, 1.0556640625, 1.171875, 1.2880859375, 1.404296875, 1.5205078125, 1.63671875, 1.7529296875, 1.869140625, 1.9853515625, 2.1015625, 2.2177734375, 2.333984375, 2.4501953125, 2.56640625, 2.6826171875, 2.798828125, 2.9150390625, 3.03125, 3.1474609375, 3.263671875, 3.3798828125, 3.49609375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 9.0, 18.0, 6.0, 20.0, 18.0, 21.0, 25.0, 32.0, 29.0, 27.0, 42.0, 50.0, 47.0, 50.0, 46.0, 35.0, 49.0, 45.0, 45.0, 44.0, 39.0, 29.0, 25.0, 42.0, 31.0, 29.0, 23.0, 19.0, 15.0, 11.0, 17.0, 15.0, 7.0, 10.0, 4.0, 9.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-26.9354248046875, -26.152223587036133, -25.369022369384766, -24.5858211517334, -23.80261993408203, -23.01941680908203, -22.236215591430664, -21.453014373779297, -20.66981315612793, -19.886611938476562, -19.103410720825195, -18.320209503173828, -17.537006378173828, -16.75380516052246, -15.970603942871094, -15.187402725219727, -14.40420150756836, -13.621000289916992, -12.837799072265625, -12.054596900939941, -11.271395683288574, -10.488194465637207, -9.704992294311523, -8.921791076660156, -8.138589859008789, -7.355388641357422, -6.5721869468688965, -5.788985252380371, -5.005784034729004, -4.222582817077637, -3.4393811225891113, -2.656179428100586, -1.8729782104492188, -1.0897767543792725, -0.30657529830932617, 0.4766261577606201, 1.2598276138305664, 2.0430290699005127, 2.826230525970459, 3.6094322204589844, 4.392633438110352, 5.175834655761719, 5.959036350250244, 6.7422380447387695, 7.525439262390137, 8.308640480041504, 9.091842651367188, 9.875043869018555, 10.658245086669922, 11.441446304321289, 12.224647521972656, 13.00784969329834, 13.791050910949707, 14.574252128601074, 15.357454299926758, 16.140655517578125, 16.923856735229492, 17.70705795288086, 18.490259170532227, 19.273460388183594, 20.056663513183594, 20.83986473083496, 21.623065948486328, 22.406267166137695, 23.189468383789062]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 11.0, 10.0, 12.0, 17.0, 6.0, 13.0, 23.0, 22.0, 28.0, 33.0, 22.0, 21.0, 27.0, 34.0, 42.0, 30.0, 40.0, 40.0, 36.0, 29.0, 45.0, 33.0, 34.0, 53.0, 39.0, 35.0, 32.0, 34.0, 26.0, 25.0, 22.0, 11.0, 15.0, 16.0, 15.0, 14.0, 11.0, 10.0, 5.0, 8.0, 2.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.940406799316406, -25.166536331176758, -24.392667770385742, -23.618797302246094, -22.844928741455078, -22.07105827331543, -21.29718780517578, -20.523319244384766, -19.74945068359375, -18.9755802154541, -18.201711654663086, -17.427841186523438, -16.653972625732422, -15.880102157592773, -15.106232643127441, -14.33236312866211, -13.558492660522461, -12.784623146057129, -12.010753631591797, -11.236883163452148, -10.463014602661133, -9.689144134521484, -8.915274620056152, -8.14140510559082, -7.367535591125488, -6.593666076660156, -5.819796562194824, -5.045926570892334, -4.272057056427002, -3.49818754196167, -2.7243175506591797, -1.9504480361938477, -1.1765785217285156, -0.40270888805389404, 0.37116074562072754, 1.1450304985046387, 1.9189000129699707, 2.6927695274353027, 3.466639518737793, 4.240509033203125, 5.014378547668457, 5.788248062133789, 6.562117576599121, 7.335987567901611, 8.109857559204102, 8.883726119995117, 9.657596588134766, 10.431466102600098, 11.20533561706543, 11.979205131530762, 12.753074645996094, 13.526945114135742, 14.300813674926758, 15.074684143066406, 15.848553657531738, 16.62242317199707, 17.39629364013672, 18.170164108276367, 18.944032669067383, 19.71790313720703, 20.491771697998047, 21.265642166137695, 22.039512634277344, 22.81338119506836, 23.587249755859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 8.0, 9.0, 16.0, 29.0, 41.0, 68.0, 99.0, 158.0, 298.0, 484.0, 800.0, 1252.0, 2068.0, 3278.0, 5191.0, 8032.0, 12088.0, 18102.0, 25640.0, 35872.0, 48289.0, 60574.0, 74325.0, 85538.0, 93189.0, 96181.0, 93711.0, 85917.0, 73847.0, 61001.0, 47918.0, 35952.0, 26063.0, 18078.0, 12383.0, 8171.0, 5269.0, 3274.0, 2023.0, 1336.0, 774.0, 482.0, 310.0, 163.0, 99.0, 70.0, 42.0, 26.0, 9.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5703125, -15.0599365234375, -14.549560546875, -14.0391845703125, -13.52880859375, -13.0184326171875, -12.508056640625, -11.9976806640625, -11.4873046875, -10.9769287109375, -10.466552734375, -9.9561767578125, -9.44580078125, -8.9354248046875, -8.425048828125, -7.9146728515625, -7.404296875, -6.8939208984375, -6.383544921875, -5.8731689453125, -5.36279296875, -4.8524169921875, -4.342041015625, -3.8316650390625, -3.3212890625, -2.8109130859375, -2.300537109375, -1.7901611328125, -1.27978515625, -0.7694091796875, -0.259033203125, 0.2513427734375, 0.76171875, 1.2720947265625, 1.782470703125, 2.2928466796875, 2.80322265625, 3.3135986328125, 3.823974609375, 4.3343505859375, 4.8447265625, 5.3551025390625, 5.865478515625, 6.3758544921875, 6.88623046875, 7.3966064453125, 7.906982421875, 8.4173583984375, 8.927734375, 9.4381103515625, 9.948486328125, 10.4588623046875, 10.96923828125, 11.4796142578125, 11.989990234375, 12.5003662109375, 13.0107421875, 13.5211181640625, 14.031494140625, 14.5418701171875, 15.05224609375, 15.5626220703125, 16.072998046875, 16.5833740234375, 17.09375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 10.0, 9.0, 17.0, 15.0, 6.0, 16.0, 19.0, 26.0, 28.0, 26.0, 23.0, 26.0, 26.0, 39.0, 37.0, 30.0, 45.0, 30.0, 43.0, 30.0, 41.0, 35.0, 34.0, 49.0, 41.0, 28.0, 40.0, 33.0, 25.0, 22.0, 23.0, 14.0, 12.0, 20.0, 12.0, 13.0, 13.0, 9.0, 4.0, 9.0, 2.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.140625, -24.388916015625, -23.63720703125, -22.885498046875, -22.1337890625, -21.382080078125, -20.63037109375, -19.878662109375, -19.126953125, -18.375244140625, -17.62353515625, -16.871826171875, -16.1201171875, -15.368408203125, -14.61669921875, -13.864990234375, -13.11328125, -12.361572265625, -11.60986328125, -10.858154296875, -10.1064453125, -9.354736328125, -8.60302734375, -7.851318359375, -7.099609375, -6.347900390625, -5.59619140625, -4.844482421875, -4.0927734375, -3.341064453125, -2.58935546875, -1.837646484375, -1.0859375, -0.334228515625, 0.41748046875, 1.169189453125, 1.9208984375, 2.672607421875, 3.42431640625, 4.176025390625, 4.927734375, 5.679443359375, 6.43115234375, 7.182861328125, 7.9345703125, 8.686279296875, 9.43798828125, 10.189697265625, 10.94140625, 11.693115234375, 12.44482421875, 13.196533203125, 13.9482421875, 14.699951171875, 15.45166015625, 16.203369140625, 16.955078125, 17.706787109375, 18.45849609375, 19.210205078125, 19.9619140625, 20.713623046875, 21.46533203125, 22.217041015625, 22.96875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 12.0, 13.0, 27.0, 45.0, 83.0, 115.0, 225.0, 306.0, 514.0, 819.0, 1340.0, 2166.0, 3518.0, 5477.0, 8672.0, 13307.0, 19777.0, 28801.0, 40012.0, 53712.0, 68779.0, 82576.0, 93601.0, 99517.0, 99803.0, 94032.0, 83717.0, 68328.0, 54085.0, 39959.0, 28928.0, 19735.0, 13117.0, 8608.0, 5483.0, 3570.0, 2173.0, 1373.0, 868.0, 530.0, 326.0, 196.0, 93.0, 70.0, 62.0, 35.0, 17.0, 15.0, 10.0, 3.0, 5.0, 2.0, 1.0, 2.0], "bins": [-19.359375, -18.7900390625, -18.220703125, -17.6513671875, -17.08203125, -16.5126953125, -15.943359375, -15.3740234375, -14.8046875, -14.2353515625, -13.666015625, -13.0966796875, -12.52734375, -11.9580078125, -11.388671875, -10.8193359375, -10.25, -9.6806640625, -9.111328125, -8.5419921875, -7.97265625, -7.4033203125, -6.833984375, -6.2646484375, -5.6953125, -5.1259765625, -4.556640625, -3.9873046875, -3.41796875, -2.8486328125, -2.279296875, -1.7099609375, -1.140625, -0.5712890625, -0.001953125, 0.5673828125, 1.13671875, 1.7060546875, 2.275390625, 2.8447265625, 3.4140625, 3.9833984375, 4.552734375, 5.1220703125, 5.69140625, 6.2607421875, 6.830078125, 7.3994140625, 7.96875, 8.5380859375, 9.107421875, 9.6767578125, 10.24609375, 10.8154296875, 11.384765625, 11.9541015625, 12.5234375, 13.0927734375, 13.662109375, 14.2314453125, 14.80078125, 15.3701171875, 15.939453125, 16.5087890625, 17.078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 7.0, 7.0, 6.0, 6.0, 16.0, 21.0, 21.0, 20.0, 19.0, 26.0, 26.0, 34.0, 37.0, 30.0, 39.0, 38.0, 38.0, 44.0, 37.0, 48.0, 40.0, 37.0, 37.0, 44.0, 44.0, 27.0, 34.0, 18.0, 30.0, 26.0, 24.0, 25.0, 12.0, 11.0, 7.0, 12.0, 9.0, 9.0, 5.0, 7.0, 3.0, 3.0, 0.0, 2.0, 3.0], "bins": [-20.03125, -19.4989013671875, -18.966552734375, -18.4342041015625, -17.90185546875, -17.3695068359375, -16.837158203125, -16.3048095703125, -15.7724609375, -15.2401123046875, -14.707763671875, -14.1754150390625, -13.64306640625, -13.1107177734375, -12.578369140625, -12.0460205078125, -11.513671875, -10.9813232421875, -10.448974609375, -9.9166259765625, -9.38427734375, -8.8519287109375, -8.319580078125, -7.7872314453125, -7.2548828125, -6.7225341796875, -6.190185546875, -5.6578369140625, -5.12548828125, -4.5931396484375, -4.060791015625, -3.5284423828125, -2.99609375, -2.4637451171875, -1.931396484375, -1.3990478515625, -0.86669921875, -0.3343505859375, 0.197998046875, 0.7303466796875, 1.2626953125, 1.7950439453125, 2.327392578125, 2.8597412109375, 3.39208984375, 3.9244384765625, 4.456787109375, 4.9891357421875, 5.521484375, 6.0538330078125, 6.586181640625, 7.1185302734375, 7.65087890625, 8.1832275390625, 8.715576171875, 9.2479248046875, 9.7802734375, 10.3126220703125, 10.844970703125, 11.3773193359375, 11.90966796875, 12.4420166015625, 12.974365234375, 13.5067138671875, 14.0390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 10.0, 12.0, 18.0, 25.0, 47.0, 59.0, 100.0, 145.0, 230.0, 354.0, 485.0, 802.0, 1325.0, 2064.0, 3274.0, 5582.0, 9375.0, 16178.0, 28214.0, 46706.0, 74368.0, 107177.0, 137896.0, 151233.0, 141926.0, 112899.0, 80444.0, 51137.0, 31368.0, 18432.0, 10762.0, 6122.0, 3672.0, 2273.0, 1373.0, 879.0, 536.0, 362.0, 261.0, 141.0, 87.0, 74.0, 34.0, 35.0, 20.0, 19.0, 6.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.984375, -11.6051025390625, -11.225830078125, -10.8465576171875, -10.46728515625, -10.0880126953125, -9.708740234375, -9.3294677734375, -8.9501953125, -8.5709228515625, -8.191650390625, -7.8123779296875, -7.43310546875, -7.0538330078125, -6.674560546875, -6.2952880859375, -5.916015625, -5.5367431640625, -5.157470703125, -4.7781982421875, -4.39892578125, -4.0196533203125, -3.640380859375, -3.2611083984375, -2.8818359375, -2.5025634765625, -2.123291015625, -1.7440185546875, -1.36474609375, -0.9854736328125, -0.606201171875, -0.2269287109375, 0.15234375, 0.5316162109375, 0.910888671875, 1.2901611328125, 1.66943359375, 2.0487060546875, 2.427978515625, 2.8072509765625, 3.1865234375, 3.5657958984375, 3.945068359375, 4.3243408203125, 4.70361328125, 5.0828857421875, 5.462158203125, 5.8414306640625, 6.220703125, 6.5999755859375, 6.979248046875, 7.3585205078125, 7.73779296875, 8.1170654296875, 8.496337890625, 8.8756103515625, 9.2548828125, 9.6341552734375, 10.013427734375, 10.3927001953125, 10.77197265625, 11.1512451171875, 11.530517578125, 11.9097900390625, 12.2890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 3.0, 5.0, 6.0, 7.0, 18.0, 16.0, 25.0, 31.0, 34.0, 36.0, 44.0, 51.0, 63.0, 82.0, 67.0, 81.0, 71.0, 81.0, 55.0, 44.0, 40.0, 23.0, 24.0, 24.0, 16.0, 20.0, 12.0, 5.0, 3.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014066696166992188, -0.0013528019189834595, -0.0012989342212677002, -0.001245066523551941, -0.0011911988258361816, -0.0011373311281204224, -0.001083463430404663, -0.0010295957326889038, -0.0009757280349731445, -0.0009218603372573853, -0.000867992639541626, -0.0008141249418258667, -0.0007602572441101074, -0.0007063895463943481, -0.0006525218486785889, -0.0005986541509628296, -0.0005447864532470703, -0.000490918755531311, -0.00043705105781555176, -0.0003831833600997925, -0.0003293156623840332, -0.0002754479646682739, -0.00022158026695251465, -0.00016771256923675537, -0.0001138448715209961, -5.9977173805236816e-05, -6.109476089477539e-06, 4.775822162628174e-05, 0.00010162591934204102, 0.0001554936170578003, 0.00020936131477355957, 0.00026322901248931885, 0.0003170967102050781, 0.0003709644079208374, 0.0004248321056365967, 0.00047869980335235596, 0.0005325675010681152, 0.0005864351987838745, 0.0006403028964996338, 0.0006941705942153931, 0.0007480382919311523, 0.0008019059896469116, 0.0008557736873626709, 0.0009096413850784302, 0.0009635090827941895, 0.0010173767805099487, 0.001071244478225708, 0.0011251121759414673, 0.0011789798736572266, 0.0012328475713729858, 0.0012867152690887451, 0.0013405829668045044, 0.0013944506645202637, 0.001448318362236023, 0.0015021860599517822, 0.0015560537576675415, 0.0016099214553833008, 0.00166378915309906, 0.0017176568508148193, 0.0017715245485305786, 0.0018253922462463379, 0.0018792599439620972, 0.0019331276416778564, 0.0019869953393936157, 0.002040863037109375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 4.0, 9.0, 21.0, 21.0, 33.0, 42.0, 70.0, 90.0, 158.0, 228.0, 352.0, 559.0, 822.0, 1240.0, 1915.0, 2760.0, 4356.0, 6278.0, 9342.0, 13838.0, 20510.0, 29375.0, 41734.0, 56745.0, 74251.0, 90292.0, 102892.0, 108147.0, 104146.0, 93698.0, 77543.0, 60928.0, 45560.0, 32149.0, 22483.0, 14997.0, 10268.0, 6890.0, 4571.0, 3090.0, 2055.0, 1331.0, 900.0, 626.0, 403.0, 284.0, 192.0, 122.0, 94.0, 52.0, 32.0, 18.0, 10.0, 17.0, 9.0, 3.0, 4.0, 3.0, 1.0, 3.0], "bins": [-9.03125, -8.74560546875, -8.4599609375, -8.17431640625, -7.888671875, -7.60302734375, -7.3173828125, -7.03173828125, -6.74609375, -6.46044921875, -6.1748046875, -5.88916015625, -5.603515625, -5.31787109375, -5.0322265625, -4.74658203125, -4.4609375, -4.17529296875, -3.8896484375, -3.60400390625, -3.318359375, -3.03271484375, -2.7470703125, -2.46142578125, -2.17578125, -1.89013671875, -1.6044921875, -1.31884765625, -1.033203125, -0.74755859375, -0.4619140625, -0.17626953125, 0.109375, 0.39501953125, 0.6806640625, 0.96630859375, 1.251953125, 1.53759765625, 1.8232421875, 2.10888671875, 2.39453125, 2.68017578125, 2.9658203125, 3.25146484375, 3.537109375, 3.82275390625, 4.1083984375, 4.39404296875, 4.6796875, 4.96533203125, 5.2509765625, 5.53662109375, 5.822265625, 6.10791015625, 6.3935546875, 6.67919921875, 6.96484375, 7.25048828125, 7.5361328125, 7.82177734375, 8.107421875, 8.39306640625, 8.6787109375, 8.96435546875, 9.25]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 4.0, 9.0, 8.0, 10.0, 13.0, 7.0, 11.0, 10.0, 29.0, 26.0, 32.0, 22.0, 36.0, 38.0, 41.0, 41.0, 61.0, 37.0, 59.0, 55.0, 52.0, 60.0, 32.0, 46.0, 31.0, 41.0, 35.0, 28.0, 27.0, 27.0, 14.0, 12.0, 13.0, 5.0, 9.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.34765625, -4.20733642578125, -4.0670166015625, -3.92669677734375, -3.786376953125, -3.64605712890625, -3.5057373046875, -3.36541748046875, -3.22509765625, -3.08477783203125, -2.9444580078125, -2.80413818359375, -2.663818359375, -2.52349853515625, -2.3831787109375, -2.24285888671875, -2.1025390625, -1.96221923828125, -1.8218994140625, -1.68157958984375, -1.541259765625, -1.40093994140625, -1.2606201171875, -1.12030029296875, -0.97998046875, -0.83966064453125, -0.6993408203125, -0.55902099609375, -0.418701171875, -0.27838134765625, -0.1380615234375, 0.00225830078125, 0.142578125, 0.28289794921875, 0.4232177734375, 0.56353759765625, 0.703857421875, 0.84417724609375, 0.9844970703125, 1.12481689453125, 1.26513671875, 1.40545654296875, 1.5457763671875, 1.68609619140625, 1.826416015625, 1.96673583984375, 2.1070556640625, 2.24737548828125, 2.3876953125, 2.52801513671875, 2.6683349609375, 2.80865478515625, 2.948974609375, 3.08929443359375, 3.2296142578125, 3.36993408203125, 3.51025390625, 3.65057373046875, 3.7908935546875, 3.93121337890625, 4.071533203125, 4.21185302734375, 4.3521728515625, 4.49249267578125, 4.6328125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 8.0, 6.0, 11.0, 10.0, 14.0, 16.0, 13.0, 12.0, 25.0, 21.0, 34.0, 37.0, 40.0, 52.0, 48.0, 48.0, 50.0, 49.0, 44.0, 47.0, 46.0, 46.0, 43.0, 33.0, 37.0, 30.0, 26.0, 31.0, 25.0, 18.0, 16.0, 17.0, 12.0, 12.0, 6.0, 6.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.349365234375, -27.52082061767578, -26.692276000976562, -25.863731384277344, -25.035186767578125, -24.206642150878906, -23.378097534179688, -22.5495548248291, -21.721010208129883, -20.892465591430664, -20.063920974731445, -19.235376358032227, -18.406831741333008, -17.578289031982422, -16.749744415283203, -15.921199798583984, -15.09265422821045, -14.26410961151123, -13.435564994812012, -12.60702133178711, -11.77847671508789, -10.949932098388672, -10.121387481689453, -9.292842864990234, -8.464298248291016, -7.635753631591797, -6.807209491729736, -5.978664875030518, -5.150120735168457, -4.321576118469238, -3.4930315017700195, -2.664487361907959, -1.8359432220458984, -1.0073988437652588, -0.1788543462753296, 0.6496901512145996, 1.4782345294952393, 2.306778907775879, 3.1353235244750977, 3.963867664337158, 4.792412281036377, 5.620956897735596, 6.449501037597656, 7.278045654296875, 8.106590270996094, 8.935134887695312, 9.763679504394531, 10.592223167419434, 11.420767784118652, 12.249312400817871, 13.07785701751709, 13.906400680541992, 14.734945297241211, 15.56348991394043, 16.39203453063965, 17.220579147338867, 18.049123764038086, 18.877668380737305, 19.706212997436523, 20.534757614135742, 21.36330223083496, 22.191844940185547, 23.020389556884766, 23.848934173583984, 24.677478790283203]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 9.0, 2.0, 8.0, 7.0, 7.0, 18.0, 15.0, 13.0, 10.0, 21.0, 20.0, 23.0, 28.0, 24.0, 18.0, 26.0, 31.0, 35.0, 27.0, 39.0, 31.0, 40.0, 32.0, 38.0, 42.0, 36.0, 29.0, 29.0, 34.0, 39.0, 39.0, 26.0, 32.0, 22.0, 23.0, 19.0, 21.0, 15.0, 16.0, 7.0, 7.0, 9.0, 9.0, 6.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-22.60373878479004, -21.873626708984375, -21.143516540527344, -20.41340446472168, -19.68329429626465, -18.953182220458984, -18.223072052001953, -17.49295997619629, -16.762849807739258, -16.032737731933594, -15.302627563476562, -14.572516441345215, -13.842405319213867, -13.11229419708252, -12.382183074951172, -11.652070999145508, -10.92195987701416, -10.191848754882812, -9.461737632751465, -8.731626510620117, -8.00151538848877, -7.271404266357422, -6.541292667388916, -5.811181545257568, -5.081070423126221, -4.350959300994873, -3.6208481788635254, -2.8907368183135986, -2.160625696182251, -1.4305145740509033, -0.7004032135009766, 0.029707908630371094, 0.7598190307617188, 1.4899301528930664, 2.220041275024414, 2.950152635574341, 3.6802637577056885, 4.410374641418457, 5.140486240386963, 5.8705973625183105, 6.600708484649658, 7.330819606781006, 8.060931205749512, 8.79104232788086, 9.521153450012207, 10.251264572143555, 10.981375694274902, 11.71148681640625, 12.441597938537598, 13.171709060668945, 13.901820182800293, 14.63193130493164, 15.362042427062988, 16.092153549194336, 16.822265625, 17.55237579345703, 18.282487869262695, 19.01259994506836, 19.74271011352539, 20.472822189331055, 21.202932357788086, 21.93304443359375, 22.66315460205078, 23.393266677856445, 24.123376846313477]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 6.0, 12.0, 23.0, 29.0, 38.0, 66.0, 133.0, 225.0, 327.0, 555.0, 989.0, 1565.0, 2666.0, 4488.0, 7238.0, 11684.0, 18788.0, 29714.0, 46231.0, 69931.0, 102921.0, 145775.0, 197836.0, 257454.0, 317753.0, 366843.0, 401118.0, 407516.0, 386722.0, 346661.0, 289487.0, 231028.0, 173813.0, 125493.0, 86993.0, 58614.0, 38345.0, 24644.0, 15813.0, 9686.0, 5962.0, 3640.0, 2195.0, 1327.0, 757.0, 515.0, 267.0, 169.0, 95.0, 58.0, 35.0, 20.0, 10.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-15.984375, -15.473388671875, -14.96240234375, -14.451416015625, -13.9404296875, -13.429443359375, -12.91845703125, -12.407470703125, -11.896484375, -11.385498046875, -10.87451171875, -10.363525390625, -9.8525390625, -9.341552734375, -8.83056640625, -8.319580078125, -7.80859375, -7.297607421875, -6.78662109375, -6.275634765625, -5.7646484375, -5.253662109375, -4.74267578125, -4.231689453125, -3.720703125, -3.209716796875, -2.69873046875, -2.187744140625, -1.6767578125, -1.165771484375, -0.65478515625, -0.143798828125, 0.3671875, 0.878173828125, 1.38916015625, 1.900146484375, 2.4111328125, 2.922119140625, 3.43310546875, 3.944091796875, 4.455078125, 4.966064453125, 5.47705078125, 5.988037109375, 6.4990234375, 7.010009765625, 7.52099609375, 8.031982421875, 8.54296875, 9.053955078125, 9.56494140625, 10.075927734375, 10.5869140625, 11.097900390625, 11.60888671875, 12.119873046875, 12.630859375, 13.141845703125, 13.65283203125, 14.163818359375, 14.6748046875, 15.185791015625, 15.69677734375, 16.207763671875, 16.71875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 4.0, 7.0, 6.0, 16.0, 13.0, 15.0, 11.0, 16.0, 19.0, 21.0, 26.0, 23.0, 22.0, 22.0, 29.0, 26.0, 35.0, 38.0, 31.0, 30.0, 42.0, 36.0, 34.0, 45.0, 33.0, 28.0, 44.0, 20.0, 50.0, 27.0, 29.0, 29.0, 15.0, 24.0, 23.0, 21.0, 12.0, 14.0, 7.0, 8.0, 10.0, 5.0, 8.0, 6.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-20.03125, -19.381591796875, -18.73193359375, -18.082275390625, -17.4326171875, -16.782958984375, -16.13330078125, -15.483642578125, -14.833984375, -14.184326171875, -13.53466796875, -12.885009765625, -12.2353515625, -11.585693359375, -10.93603515625, -10.286376953125, -9.63671875, -8.987060546875, -8.33740234375, -7.687744140625, -7.0380859375, -6.388427734375, -5.73876953125, -5.089111328125, -4.439453125, -3.789794921875, -3.14013671875, -2.490478515625, -1.8408203125, -1.191162109375, -0.54150390625, 0.108154296875, 0.7578125, 1.407470703125, 2.05712890625, 2.706787109375, 3.3564453125, 4.006103515625, 4.65576171875, 5.305419921875, 5.955078125, 6.604736328125, 7.25439453125, 7.904052734375, 8.5537109375, 9.203369140625, 9.85302734375, 10.502685546875, 11.15234375, 11.802001953125, 12.45166015625, 13.101318359375, 13.7509765625, 14.400634765625, 15.05029296875, 15.699951171875, 16.349609375, 16.999267578125, 17.64892578125, 18.298583984375, 18.9482421875, 19.597900390625, 20.24755859375, 20.897216796875, 21.546875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 6.0, 6.0, 24.0, 35.0, 57.0, 112.0, 171.0, 295.0, 484.0, 846.0, 1368.0, 2274.0, 3721.0, 6320.0, 9894.0, 15211.0, 24183.0, 35972.0, 52865.0, 76538.0, 106224.0, 142806.0, 186179.0, 232599.0, 278069.0, 317094.0, 346122.0, 360209.0, 353416.0, 332170.0, 295527.0, 252739.0, 206458.0, 161965.0, 120711.0, 88502.0, 62367.0, 42412.0, 28668.0, 18499.0, 11939.0, 7525.0, 4714.0, 2866.0, 1631.0, 1026.0, 605.0, 388.0, 201.0, 118.0, 70.0, 37.0, 32.0, 12.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-15.875, -15.358154296875, -14.84130859375, -14.324462890625, -13.8076171875, -13.290771484375, -12.77392578125, -12.257080078125, -11.740234375, -11.223388671875, -10.70654296875, -10.189697265625, -9.6728515625, -9.156005859375, -8.63916015625, -8.122314453125, -7.60546875, -7.088623046875, -6.57177734375, -6.054931640625, -5.5380859375, -5.021240234375, -4.50439453125, -3.987548828125, -3.470703125, -2.953857421875, -2.43701171875, -1.920166015625, -1.4033203125, -0.886474609375, -0.36962890625, 0.147216796875, 0.6640625, 1.180908203125, 1.69775390625, 2.214599609375, 2.7314453125, 3.248291015625, 3.76513671875, 4.281982421875, 4.798828125, 5.315673828125, 5.83251953125, 6.349365234375, 6.8662109375, 7.383056640625, 7.89990234375, 8.416748046875, 8.93359375, 9.450439453125, 9.96728515625, 10.484130859375, 11.0009765625, 11.517822265625, 12.03466796875, 12.551513671875, 13.068359375, 13.585205078125, 14.10205078125, 14.618896484375, 15.1357421875, 15.652587890625, 16.16943359375, 16.686279296875, 17.203125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 11.0, 12.0, 11.0, 25.0, 37.0, 34.0, 49.0, 44.0, 70.0, 73.0, 92.0, 100.0, 115.0, 114.0, 125.0, 154.0, 174.0, 194.0, 199.0, 214.0, 185.0, 187.0, 168.0, 173.0, 199.0, 176.0, 156.0, 135.0, 123.0, 132.0, 121.0, 90.0, 71.0, 63.0, 56.0, 26.0, 31.0, 33.0, 23.0, 12.0, 10.0, 16.0, 11.0, 9.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1796875, -9.863037109375, -9.54638671875, -9.229736328125, -8.9130859375, -8.596435546875, -8.27978515625, -7.963134765625, -7.646484375, -7.329833984375, -7.01318359375, -6.696533203125, -6.3798828125, -6.063232421875, -5.74658203125, -5.429931640625, -5.11328125, -4.796630859375, -4.47998046875, -4.163330078125, -3.8466796875, -3.530029296875, -3.21337890625, -2.896728515625, -2.580078125, -2.263427734375, -1.94677734375, -1.630126953125, -1.3134765625, -0.996826171875, -0.68017578125, -0.363525390625, -0.046875, 0.269775390625, 0.58642578125, 0.903076171875, 1.2197265625, 1.536376953125, 1.85302734375, 2.169677734375, 2.486328125, 2.802978515625, 3.11962890625, 3.436279296875, 3.7529296875, 4.069580078125, 4.38623046875, 4.702880859375, 5.01953125, 5.336181640625, 5.65283203125, 5.969482421875, 6.2861328125, 6.602783203125, 6.91943359375, 7.236083984375, 7.552734375, 7.869384765625, 8.18603515625, 8.502685546875, 8.8193359375, 9.135986328125, 9.45263671875, 9.769287109375, 10.0859375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 10.0, 18.0, 17.0, 23.0, 26.0, 23.0, 35.0, 24.0, 36.0, 37.0, 44.0, 40.0, 52.0, 37.0, 52.0, 51.0, 45.0, 59.0, 38.0, 44.0, 31.0, 37.0, 43.0, 33.0, 23.0, 26.0, 24.0, 13.0, 12.0, 13.0, 8.0, 5.0, 3.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.2209358215332, -31.280160903930664, -30.339387893676758, -29.39861297607422, -28.45783805847168, -27.51706314086914, -26.576290130615234, -25.635515213012695, -24.694740295410156, -23.753965377807617, -22.81319236755371, -21.872417449951172, -20.931642532348633, -19.990867614746094, -19.050094604492188, -18.10931968688965, -17.16854476928711, -16.22776985168457, -15.286995887756348, -14.346221923828125, -13.405447006225586, -12.464673042297363, -11.52389907836914, -10.583124160766602, -9.642351150512695, -8.701577186584473, -7.760802268981934, -6.820028305053711, -5.879253387451172, -4.938479423522949, -3.9977049827575684, -3.0569305419921875, -2.1161556243896484, -1.1753811836242676, -0.23460686206817627, 0.706167459487915, 1.646941900253296, 2.5877161026000977, 3.5284905433654785, 4.469264984130859, 5.41003942489624, 6.350813865661621, 7.291588306427002, 8.232362747192383, 9.173136711120605, 10.113910675048828, 11.054685592651367, 11.995460510253906, 12.936234474182129, 13.877008438110352, 14.81778335571289, 15.758557319641113, 16.699331283569336, 17.640106201171875, 18.580881118774414, 19.521656036376953, 20.46242904663086, 21.4032039642334, 22.343976974487305, 23.284751892089844, 24.225526809692383, 25.166301727294922, 26.107074737548828, 27.047849655151367, 27.988624572753906]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 2.0, 4.0, 10.0, 11.0, 10.0, 13.0, 13.0, 12.0, 21.0, 24.0, 27.0, 30.0, 25.0, 36.0, 36.0, 30.0, 31.0, 51.0, 43.0, 27.0, 37.0, 45.0, 46.0, 51.0, 38.0, 34.0, 35.0, 39.0, 31.0, 20.0, 31.0, 23.0, 23.0, 18.0, 19.0, 8.0, 11.0, 6.0, 11.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.168256759643555, -24.31243133544922, -23.456605911254883, -22.600778579711914, -21.744953155517578, -20.889127731323242, -20.033302307128906, -19.177474975585938, -18.3216495513916, -17.465824127197266, -16.60999870300293, -15.754172325134277, -14.898345947265625, -14.042520523071289, -13.186695098876953, -12.3308687210083, -11.475043296813965, -10.619217872619629, -9.763391494750977, -8.90756607055664, -8.051739692687988, -7.195914268493652, -6.340088367462158, -5.484262466430664, -4.62843656539917, -3.772610664367676, -2.9167847633361816, -2.0609591007232666, -1.2051331996917725, -0.3493075370788574, 0.5065183639526367, 1.3623442649841309, 2.218170166015625, 3.073996067047119, 3.9298219680786133, 4.785647392272949, 5.641473770141602, 6.4972991943359375, 7.353125095367432, 8.208950996398926, 9.064777374267578, 9.920602798461914, 10.776429176330566, 11.632254600524902, 12.488080978393555, 13.34390640258789, 14.199731826782227, 15.055558204650879, 15.911383628845215, 16.767210006713867, 17.623035430908203, 18.47886085510254, 19.334686279296875, 20.190513610839844, 21.04633903503418, 21.902164459228516, 22.75798988342285, 23.613815307617188, 24.469640731811523, 25.325468063354492, 26.181293487548828, 27.037118911743164, 27.8929443359375, 28.74877166748047, 29.604597091674805]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 13.0, 19.0, 19.0, 31.0, 54.0, 65.0, 120.0, 171.0, 275.0, 412.0, 580.0, 920.0, 1328.0, 2060.0, 3407.0, 5042.0, 7835.0, 11983.0, 18192.0, 28018.0, 42846.0, 65623.0, 97523.0, 134092.0, 154792.0, 143835.0, 110267.0, 75854.0, 49834.0, 32656.0, 21340.0, 13894.0, 8673.0, 5835.0, 3820.0, 2431.0, 1596.0, 1054.0, 707.0, 475.0, 294.0, 182.0, 131.0, 87.0, 57.0, 38.0, 27.0, 20.0, 9.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.0390625, -8.753662109375, -8.46826171875, -8.182861328125, -7.8974609375, -7.612060546875, -7.32666015625, -7.041259765625, -6.755859375, -6.470458984375, -6.18505859375, -5.899658203125, -5.6142578125, -5.328857421875, -5.04345703125, -4.758056640625, -4.47265625, -4.187255859375, -3.90185546875, -3.616455078125, -3.3310546875, -3.045654296875, -2.76025390625, -2.474853515625, -2.189453125, -1.904052734375, -1.61865234375, -1.333251953125, -1.0478515625, -0.762451171875, -0.47705078125, -0.191650390625, 0.09375, 0.379150390625, 0.66455078125, 0.949951171875, 1.2353515625, 1.520751953125, 1.80615234375, 2.091552734375, 2.376953125, 2.662353515625, 2.94775390625, 3.233154296875, 3.5185546875, 3.803955078125, 4.08935546875, 4.374755859375, 4.66015625, 4.945556640625, 5.23095703125, 5.516357421875, 5.8017578125, 6.087158203125, 6.37255859375, 6.657958984375, 6.943359375, 7.228759765625, 7.51416015625, 7.799560546875, 8.0849609375, 8.370361328125, 8.65576171875, 8.941162109375, 9.2265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 7.0, 5.0, 2.0, 5.0, 10.0, 9.0, 11.0, 13.0, 14.0, 11.0, 20.0, 25.0, 27.0, 30.0, 26.0, 35.0, 33.0, 36.0, 27.0, 55.0, 37.0, 34.0, 37.0, 43.0, 47.0, 49.0, 38.0, 37.0, 29.0, 44.0, 32.0, 17.0, 29.0, 24.0, 24.0, 19.0, 19.0, 7.0, 10.0, 7.0, 10.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.328125, -24.469970703125, -23.61181640625, -22.753662109375, -21.8955078125, -21.037353515625, -20.17919921875, -19.321044921875, -18.462890625, -17.604736328125, -16.74658203125, -15.888427734375, -15.0302734375, -14.172119140625, -13.31396484375, -12.455810546875, -11.59765625, -10.739501953125, -9.88134765625, -9.023193359375, -8.1650390625, -7.306884765625, -6.44873046875, -5.590576171875, -4.732421875, -3.874267578125, -3.01611328125, -2.157958984375, -1.2998046875, -0.441650390625, 0.41650390625, 1.274658203125, 2.1328125, 2.990966796875, 3.84912109375, 4.707275390625, 5.5654296875, 6.423583984375, 7.28173828125, 8.139892578125, 8.998046875, 9.856201171875, 10.71435546875, 11.572509765625, 12.4306640625, 13.288818359375, 14.14697265625, 15.005126953125, 15.86328125, 16.721435546875, 17.57958984375, 18.437744140625, 19.2958984375, 20.154052734375, 21.01220703125, 21.870361328125, 22.728515625, 23.586669921875, 24.44482421875, 25.302978515625, 26.1611328125, 27.019287109375, 27.87744140625, 28.735595703125, 29.59375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 8.0, 8.0, 10.0, 10.0, 18.0, 28.0, 39.0, 52.0, 69.0, 127.0, 185.0, 285.0, 444.0, 677.0, 1029.0, 1713.0, 2870.0, 4774.0, 8497.0, 16037.0, 32643.0, 74630.0, 199282.0, 370232.0, 193583.0, 72870.0, 32071.0, 15778.0, 8353.0, 4877.0, 2740.0, 1681.0, 992.0, 688.0, 424.0, 291.0, 176.0, 105.0, 75.0, 58.0, 33.0, 25.0, 21.0, 14.0, 13.0, 5.0, 4.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-16.40625, -15.916259765625, -15.42626953125, -14.936279296875, -14.4462890625, -13.956298828125, -13.46630859375, -12.976318359375, -12.486328125, -11.996337890625, -11.50634765625, -11.016357421875, -10.5263671875, -10.036376953125, -9.54638671875, -9.056396484375, -8.56640625, -8.076416015625, -7.58642578125, -7.096435546875, -6.6064453125, -6.116455078125, -5.62646484375, -5.136474609375, -4.646484375, -4.156494140625, -3.66650390625, -3.176513671875, -2.6865234375, -2.196533203125, -1.70654296875, -1.216552734375, -0.7265625, -0.236572265625, 0.25341796875, 0.743408203125, 1.2333984375, 1.723388671875, 2.21337890625, 2.703369140625, 3.193359375, 3.683349609375, 4.17333984375, 4.663330078125, 5.1533203125, 5.643310546875, 6.13330078125, 6.623291015625, 7.11328125, 7.603271484375, 8.09326171875, 8.583251953125, 9.0732421875, 9.563232421875, 10.05322265625, 10.543212890625, 11.033203125, 11.523193359375, 12.01318359375, 12.503173828125, 12.9931640625, 13.483154296875, 13.97314453125, 14.463134765625, 14.953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 2.0, 4.0, 9.0, 8.0, 8.0, 17.0, 12.0, 15.0, 13.0, 28.0, 26.0, 22.0, 28.0, 35.0, 27.0, 32.0, 36.0, 27.0, 42.0, 29.0, 47.0, 40.0, 30.0, 39.0, 43.0, 34.0, 36.0, 29.0, 23.0, 39.0, 29.0, 23.0, 24.0, 25.0, 11.0, 13.0, 13.0, 6.0, 19.0, 8.0, 6.0, 6.0, 6.0, 14.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-17.984375, -17.449462890625, -16.91455078125, -16.379638671875, -15.8447265625, -15.309814453125, -14.77490234375, -14.239990234375, -13.705078125, -13.170166015625, -12.63525390625, -12.100341796875, -11.5654296875, -11.030517578125, -10.49560546875, -9.960693359375, -9.42578125, -8.890869140625, -8.35595703125, -7.821044921875, -7.2861328125, -6.751220703125, -6.21630859375, -5.681396484375, -5.146484375, -4.611572265625, -4.07666015625, -3.541748046875, -3.0068359375, -2.471923828125, -1.93701171875, -1.402099609375, -0.8671875, -0.332275390625, 0.20263671875, 0.737548828125, 1.2724609375, 1.807373046875, 2.34228515625, 2.877197265625, 3.412109375, 3.947021484375, 4.48193359375, 5.016845703125, 5.5517578125, 6.086669921875, 6.62158203125, 7.156494140625, 7.69140625, 8.226318359375, 8.76123046875, 9.296142578125, 9.8310546875, 10.365966796875, 10.90087890625, 11.435791015625, 11.970703125, 12.505615234375, 13.04052734375, 13.575439453125, 14.1103515625, 14.645263671875, 15.18017578125, 15.715087890625, 16.25]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 3.0, 5.0, 11.0, 8.0, 9.0, 14.0, 20.0, 30.0, 45.0, 60.0, 56.0, 120.0, 121.0, 195.0, 287.0, 436.0, 613.0, 1064.0, 1861.0, 3350.0, 6439.0, 14001.0, 37756.0, 160265.0, 632929.0, 129563.0, 33089.0, 12747.0, 5895.0, 3073.0, 1687.0, 946.0, 622.0, 389.0, 251.0, 164.0, 139.0, 99.0, 59.0, 38.0, 29.0, 20.0, 14.0, 4.0, 10.0, 4.0, 7.0, 2.0, 5.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.640625, -16.093994140625, -15.54736328125, -15.000732421875, -14.4541015625, -13.907470703125, -13.36083984375, -12.814208984375, -12.267578125, -11.720947265625, -11.17431640625, -10.627685546875, -10.0810546875, -9.534423828125, -8.98779296875, -8.441162109375, -7.89453125, -7.347900390625, -6.80126953125, -6.254638671875, -5.7080078125, -5.161376953125, -4.61474609375, -4.068115234375, -3.521484375, -2.974853515625, -2.42822265625, -1.881591796875, -1.3349609375, -0.788330078125, -0.24169921875, 0.304931640625, 0.8515625, 1.398193359375, 1.94482421875, 2.491455078125, 3.0380859375, 3.584716796875, 4.13134765625, 4.677978515625, 5.224609375, 5.771240234375, 6.31787109375, 6.864501953125, 7.4111328125, 7.957763671875, 8.50439453125, 9.051025390625, 9.59765625, 10.144287109375, 10.69091796875, 11.237548828125, 11.7841796875, 12.330810546875, 12.87744140625, 13.424072265625, 13.970703125, 14.517333984375, 15.06396484375, 15.610595703125, 16.1572265625, 16.703857421875, 17.25048828125, 17.797119140625, 18.34375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 4.0, 8.0, 8.0, 10.0, 28.0, 39.0, 82.0, 153.0, 213.0, 187.0, 121.0, 50.0, 27.0, 22.0, 16.0, 5.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0017261505126953125, -0.0016749203205108643, -0.001623690128326416, -0.0015724599361419678, -0.0015212297439575195, -0.0014699995517730713, -0.001418769359588623, -0.0013675391674041748, -0.0013163089752197266, -0.0012650787830352783, -0.00121384859085083, -0.0011626183986663818, -0.0011113882064819336, -0.0010601580142974854, -0.0010089278221130371, -0.0009576976299285889, -0.0009064674377441406, -0.0008552372455596924, -0.0008040070533752441, -0.0007527768611907959, -0.0007015466690063477, -0.0006503164768218994, -0.0005990862846374512, -0.0005478560924530029, -0.0004966259002685547, -0.00044539570808410645, -0.0003941655158996582, -0.00034293532371520996, -0.0002917051315307617, -0.00024047493934631348, -0.00018924474716186523, -0.000138014554977417, -8.678436279296875e-05, -3.555417060852051e-05, 1.5676021575927734e-05, 6.690621376037598e-05, 0.00011813640594482422, 0.00016936659812927246, 0.0002205967903137207, 0.00027182698249816895, 0.0003230571746826172, 0.00037428736686706543, 0.00042551755905151367, 0.0004767477512359619, 0.0005279779434204102, 0.0005792081356048584, 0.0006304383277893066, 0.0006816685199737549, 0.0007328987121582031, 0.0007841289043426514, 0.0008353590965270996, 0.0008865892887115479, 0.0009378194808959961, 0.0009890496730804443, 0.0010402798652648926, 0.0010915100574493408, 0.001142740249633789, 0.0011939704418182373, 0.0012452006340026855, 0.0012964308261871338, 0.001347661018371582, 0.0013988912105560303, 0.0014501214027404785, 0.0015013515949249268, 0.001552581787109375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 6.0, 3.0, 10.0, 5.0, 14.0, 24.0, 19.0, 27.0, 29.0, 51.0, 60.0, 91.0, 141.0, 168.0, 271.0, 383.0, 538.0, 872.0, 1328.0, 2120.0, 3308.0, 5652.0, 10050.0, 18369.0, 35537.0, 71537.0, 145550.0, 245043.0, 234903.0, 133565.0, 65749.0, 32599.0, 17006.0, 9364.0, 5318.0, 3188.0, 1919.0, 1223.0, 770.0, 558.0, 369.0, 230.0, 165.0, 104.0, 77.0, 69.0, 51.0, 28.0, 28.0, 22.0, 16.0, 8.0, 9.0, 6.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.3359375, -10.957275390625, -10.57861328125, -10.199951171875, -9.8212890625, -9.442626953125, -9.06396484375, -8.685302734375, -8.306640625, -7.927978515625, -7.54931640625, -7.170654296875, -6.7919921875, -6.413330078125, -6.03466796875, -5.656005859375, -5.27734375, -4.898681640625, -4.52001953125, -4.141357421875, -3.7626953125, -3.384033203125, -3.00537109375, -2.626708984375, -2.248046875, -1.869384765625, -1.49072265625, -1.112060546875, -0.7333984375, -0.354736328125, 0.02392578125, 0.402587890625, 0.78125, 1.159912109375, 1.53857421875, 1.917236328125, 2.2958984375, 2.674560546875, 3.05322265625, 3.431884765625, 3.810546875, 4.189208984375, 4.56787109375, 4.946533203125, 5.3251953125, 5.703857421875, 6.08251953125, 6.461181640625, 6.83984375, 7.218505859375, 7.59716796875, 7.975830078125, 8.3544921875, 8.733154296875, 9.11181640625, 9.490478515625, 9.869140625, 10.247802734375, 10.62646484375, 11.005126953125, 11.3837890625, 11.762451171875, 12.14111328125, 12.519775390625, 12.8984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 9.0, 7.0, 19.0, 15.0, 19.0, 22.0, 27.0, 33.0, 46.0, 45.0, 53.0, 64.0, 73.0, 75.0, 81.0, 64.0, 49.0, 43.0, 41.0, 38.0, 39.0, 21.0, 16.0, 16.0, 20.0, 4.0, 8.0, 7.0, 9.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.0390625, -3.9146728515625, -3.790283203125, -3.6658935546875, -3.54150390625, -3.4171142578125, -3.292724609375, -3.1683349609375, -3.0439453125, -2.9195556640625, -2.795166015625, -2.6707763671875, -2.54638671875, -2.4219970703125, -2.297607421875, -2.1732177734375, -2.048828125, -1.9244384765625, -1.800048828125, -1.6756591796875, -1.55126953125, -1.4268798828125, -1.302490234375, -1.1781005859375, -1.0537109375, -0.9293212890625, -0.804931640625, -0.6805419921875, -0.55615234375, -0.4317626953125, -0.307373046875, -0.1829833984375, -0.05859375, 0.0657958984375, 0.190185546875, 0.3145751953125, 0.43896484375, 0.5633544921875, 0.687744140625, 0.8121337890625, 0.9365234375, 1.0609130859375, 1.185302734375, 1.3096923828125, 1.43408203125, 1.5584716796875, 1.682861328125, 1.8072509765625, 1.931640625, 2.0560302734375, 2.180419921875, 2.3048095703125, 2.42919921875, 2.5535888671875, 2.677978515625, 2.8023681640625, 2.9267578125, 3.0511474609375, 3.175537109375, 3.2999267578125, 3.42431640625, 3.5487060546875, 3.673095703125, 3.7974853515625, 3.921875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 4.0, 11.0, 11.0, 16.0, 19.0, 20.0, 27.0, 36.0, 32.0, 22.0, 37.0, 34.0, 42.0, 41.0, 44.0, 44.0, 49.0, 59.0, 53.0, 44.0, 42.0, 46.0, 25.0, 26.0, 46.0, 32.0, 31.0, 24.0, 14.0, 18.0, 12.0, 11.0, 8.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-32.32973098754883, -31.400022506713867, -30.470312118530273, -29.540603637695312, -28.61089324951172, -27.681184768676758, -26.751476287841797, -25.821765899658203, -24.89205551147461, -23.96234703063965, -23.032636642456055, -22.102928161621094, -21.1732177734375, -20.24350929260254, -19.313800811767578, -18.384090423583984, -17.454381942749023, -16.524673461914062, -15.594963073730469, -14.665254592895508, -13.735544204711914, -12.805835723876953, -11.876126289367676, -10.946416854858398, -10.016707420349121, -9.086997985839844, -8.157288551330566, -7.227579593658447, -6.29787015914917, -5.368160724639893, -4.438451766967773, -3.508742332458496, -2.5790348052978516, -1.6493254899978638, -0.719616174697876, 0.21009302139282227, 1.1398024559020996, 2.069511890411377, 2.999220848083496, 3.9289302825927734, 4.858639717102051, 5.788349151611328, 6.7180585861206055, 7.647767543792725, 8.577476501464844, 9.507186889648438, 10.436895370483398, 11.366604804992676, 12.296314239501953, 13.22602367401123, 14.155733108520508, 15.085441589355469, 16.015151977539062, 16.944860458374023, 17.874568939208984, 18.804279327392578, 19.733989715576172, 20.663698196411133, 21.593408584594727, 22.523117065429688, 23.45282745361328, 24.382535934448242, 25.312244415283203, 26.241954803466797, 27.171663284301758]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 7.0, 8.0, 5.0, 5.0, 10.0, 15.0, 13.0, 9.0, 16.0, 19.0, 18.0, 28.0, 25.0, 30.0, 34.0, 33.0, 42.0, 31.0, 38.0, 42.0, 41.0, 45.0, 28.0, 49.0, 55.0, 39.0, 39.0, 31.0, 39.0, 20.0, 28.0, 32.0, 22.0, 24.0, 17.0, 13.0, 21.0, 6.0, 7.0, 8.0, 3.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.670787811279297, -24.803524017333984, -23.936262130737305, -23.068998336791992, -22.201736450195312, -21.33447265625, -20.467208862304688, -19.599945068359375, -18.732683181762695, -17.865419387817383, -16.998157501220703, -16.13089370727539, -15.263630867004395, -14.396368026733398, -13.529104232788086, -12.66184139251709, -11.794578552246094, -10.927315711975098, -10.060052871704102, -9.192789077758789, -8.325526237487793, -7.458263397216797, -6.591000080108643, -5.723736763000488, -4.856473922729492, -3.989210844039917, -3.121947765350342, -2.2546846866607666, -1.3874216079711914, -0.5201587677001953, 0.347104549407959, 1.2143678665161133, 2.0816307067871094, 2.9488937854766846, 3.8161568641662598, 4.683420181274414, 5.55068302154541, 6.417945861816406, 7.2852091789245605, 8.152472496032715, 9.019735336303711, 9.886998176574707, 10.754261016845703, 11.621524810791016, 12.488787651062012, 13.356050491333008, 14.22331428527832, 15.090577125549316, 15.957839965820312, 16.825103759765625, 17.692365646362305, 18.559629440307617, 19.426891326904297, 20.29415512084961, 21.161418914794922, 22.028682708740234, 22.895944595336914, 23.763208389282227, 24.630470275878906, 25.49773406982422, 26.36499786376953, 27.23225975036621, 28.099523544311523, 28.966785430908203, 29.834049224853516]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 2.0, 8.0, 12.0, 23.0, 38.0, 67.0, 84.0, 122.0, 240.0, 403.0, 638.0, 1040.0, 1694.0, 2651.0, 4169.0, 6247.0, 9689.0, 14080.0, 20335.0, 28361.0, 37853.0, 49218.0, 61670.0, 72886.0, 82813.0, 88754.0, 91065.0, 88848.0, 81626.0, 71829.0, 59801.0, 48322.0, 37030.0, 27368.0, 19751.0, 13730.0, 9290.0, 5987.0, 3996.0, 2550.0, 1607.0, 1019.0, 621.0, 415.0, 262.0, 141.0, 90.0, 55.0, 27.0, 16.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-15.7734375, -15.2554931640625, -14.737548828125, -14.2196044921875, -13.70166015625, -13.1837158203125, -12.665771484375, -12.1478271484375, -11.6298828125, -11.1119384765625, -10.593994140625, -10.0760498046875, -9.55810546875, -9.0401611328125, -8.522216796875, -8.0042724609375, -7.486328125, -6.9683837890625, -6.450439453125, -5.9324951171875, -5.41455078125, -4.8966064453125, -4.378662109375, -3.8607177734375, -3.3427734375, -2.8248291015625, -2.306884765625, -1.7889404296875, -1.27099609375, -0.7530517578125, -0.235107421875, 0.2828369140625, 0.80078125, 1.3187255859375, 1.836669921875, 2.3546142578125, 2.87255859375, 3.3905029296875, 3.908447265625, 4.4263916015625, 4.9443359375, 5.4622802734375, 5.980224609375, 6.4981689453125, 7.01611328125, 7.5340576171875, 8.052001953125, 8.5699462890625, 9.087890625, 9.6058349609375, 10.123779296875, 10.6417236328125, 11.15966796875, 11.6776123046875, 12.195556640625, 12.7135009765625, 13.2314453125, 13.7493896484375, 14.267333984375, 14.7852783203125, 15.30322265625, 15.8211669921875, 16.339111328125, 16.8570556640625, 17.375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 9.0, 5.0, 5.0, 8.0, 9.0, 17.0, 12.0, 7.0, 18.0, 19.0, 19.0, 26.0, 31.0, 27.0, 35.0, 32.0, 42.0, 31.0, 41.0, 42.0, 39.0, 44.0, 33.0, 46.0, 51.0, 37.0, 41.0, 36.0, 34.0, 20.0, 31.0, 28.0, 22.0, 23.0, 17.0, 13.0, 19.0, 6.0, 9.0, 7.0, 3.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.78125, -23.940673828125, -23.10009765625, -22.259521484375, -21.4189453125, -20.578369140625, -19.73779296875, -18.897216796875, -18.056640625, -17.216064453125, -16.37548828125, -15.534912109375, -14.6943359375, -13.853759765625, -13.01318359375, -12.172607421875, -11.33203125, -10.491455078125, -9.65087890625, -8.810302734375, -7.9697265625, -7.129150390625, -6.28857421875, -5.447998046875, -4.607421875, -3.766845703125, -2.92626953125, -2.085693359375, -1.2451171875, -0.404541015625, 0.43603515625, 1.276611328125, 2.1171875, 2.957763671875, 3.79833984375, 4.638916015625, 5.4794921875, 6.320068359375, 7.16064453125, 8.001220703125, 8.841796875, 9.682373046875, 10.52294921875, 11.363525390625, 12.2041015625, 13.044677734375, 13.88525390625, 14.725830078125, 15.56640625, 16.406982421875, 17.24755859375, 18.088134765625, 18.9287109375, 19.769287109375, 20.60986328125, 21.450439453125, 22.291015625, 23.131591796875, 23.97216796875, 24.812744140625, 25.6533203125, 26.493896484375, 27.33447265625, 28.175048828125, 29.015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 8.0, 18.0, 17.0, 38.0, 61.0, 117.0, 156.0, 284.0, 502.0, 872.0, 1386.0, 2473.0, 4055.0, 6798.0, 10983.0, 17762.0, 27313.0, 40938.0, 57359.0, 76424.0, 94648.0, 109226.0, 115077.0, 111222.0, 99074.0, 82015.0, 62242.0, 45033.0, 30732.0, 20246.0, 12549.0, 7589.0, 4652.0, 2768.0, 1567.0, 937.0, 554.0, 345.0, 214.0, 140.0, 66.0, 42.0, 20.0, 22.0, 3.0, 5.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.515625, -21.84619140625, -21.1767578125, -20.50732421875, -19.837890625, -19.16845703125, -18.4990234375, -17.82958984375, -17.16015625, -16.49072265625, -15.8212890625, -15.15185546875, -14.482421875, -13.81298828125, -13.1435546875, -12.47412109375, -11.8046875, -11.13525390625, -10.4658203125, -9.79638671875, -9.126953125, -8.45751953125, -7.7880859375, -7.11865234375, -6.44921875, -5.77978515625, -5.1103515625, -4.44091796875, -3.771484375, -3.10205078125, -2.4326171875, -1.76318359375, -1.09375, -0.42431640625, 0.2451171875, 0.91455078125, 1.583984375, 2.25341796875, 2.9228515625, 3.59228515625, 4.26171875, 4.93115234375, 5.6005859375, 6.27001953125, 6.939453125, 7.60888671875, 8.2783203125, 8.94775390625, 9.6171875, 10.28662109375, 10.9560546875, 11.62548828125, 12.294921875, 12.96435546875, 13.6337890625, 14.30322265625, 14.97265625, 15.64208984375, 16.3115234375, 16.98095703125, 17.650390625, 18.31982421875, 18.9892578125, 19.65869140625, 20.328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 7.0, 4.0, 7.0, 9.0, 9.0, 23.0, 21.0, 13.0, 25.0, 23.0, 41.0, 37.0, 41.0, 42.0, 34.0, 37.0, 51.0, 44.0, 48.0, 45.0, 41.0, 41.0, 40.0, 35.0, 45.0, 43.0, 25.0, 25.0, 22.0, 19.0, 18.0, 17.0, 14.0, 12.0, 7.0, 5.0, 8.0, 6.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.71875, -17.11279296875, -16.5068359375, -15.90087890625, -15.294921875, -14.68896484375, -14.0830078125, -13.47705078125, -12.87109375, -12.26513671875, -11.6591796875, -11.05322265625, -10.447265625, -9.84130859375, -9.2353515625, -8.62939453125, -8.0234375, -7.41748046875, -6.8115234375, -6.20556640625, -5.599609375, -4.99365234375, -4.3876953125, -3.78173828125, -3.17578125, -2.56982421875, -1.9638671875, -1.35791015625, -0.751953125, -0.14599609375, 0.4599609375, 1.06591796875, 1.671875, 2.27783203125, 2.8837890625, 3.48974609375, 4.095703125, 4.70166015625, 5.3076171875, 5.91357421875, 6.51953125, 7.12548828125, 7.7314453125, 8.33740234375, 8.943359375, 9.54931640625, 10.1552734375, 10.76123046875, 11.3671875, 11.97314453125, 12.5791015625, 13.18505859375, 13.791015625, 14.39697265625, 15.0029296875, 15.60888671875, 16.21484375, 16.82080078125, 17.4267578125, 18.03271484375, 18.638671875, 19.24462890625, 19.8505859375, 20.45654296875, 21.0625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 12.0, 13.0, 18.0, 27.0, 34.0, 53.0, 67.0, 99.0, 144.0, 209.0, 290.0, 448.0, 669.0, 1163.0, 1730.0, 2913.0, 5039.0, 8493.0, 14807.0, 25656.0, 42405.0, 66335.0, 95925.0, 124950.0, 142822.0, 141457.0, 120986.0, 92040.0, 62808.0, 39393.0, 23813.0, 13674.0, 7981.0, 4612.0, 2851.0, 1690.0, 902.0, 656.0, 433.0, 279.0, 201.0, 132.0, 107.0, 58.0, 55.0, 28.0, 23.0, 29.0, 14.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.421875, -11.0526123046875, -10.683349609375, -10.3140869140625, -9.94482421875, -9.5755615234375, -9.206298828125, -8.8370361328125, -8.4677734375, -8.0985107421875, -7.729248046875, -7.3599853515625, -6.99072265625, -6.6214599609375, -6.252197265625, -5.8829345703125, -5.513671875, -5.1444091796875, -4.775146484375, -4.4058837890625, -4.03662109375, -3.6673583984375, -3.298095703125, -2.9288330078125, -2.5595703125, -2.1903076171875, -1.821044921875, -1.4517822265625, -1.08251953125, -0.7132568359375, -0.343994140625, 0.0252685546875, 0.39453125, 0.7637939453125, 1.133056640625, 1.5023193359375, 1.87158203125, 2.2408447265625, 2.610107421875, 2.9793701171875, 3.3486328125, 3.7178955078125, 4.087158203125, 4.4564208984375, 4.82568359375, 5.1949462890625, 5.564208984375, 5.9334716796875, 6.302734375, 6.6719970703125, 7.041259765625, 7.4105224609375, 7.77978515625, 8.1490478515625, 8.518310546875, 8.8875732421875, 9.2568359375, 9.6260986328125, 9.995361328125, 10.3646240234375, 10.73388671875, 11.1031494140625, 11.472412109375, 11.8416748046875, 12.2109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 4.0, 6.0, 4.0, 18.0, 19.0, 31.0, 39.0, 41.0, 53.0, 98.0, 82.0, 77.0, 98.0, 79.0, 60.0, 83.0, 60.0, 37.0, 41.0, 21.0, 13.0, 13.0, 13.0, 11.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002044677734375, -0.00197717547416687, -0.0019096732139587402, -0.0018421709537506104, -0.0017746686935424805, -0.0017071664333343506, -0.0016396641731262207, -0.0015721619129180908, -0.001504659652709961, -0.001437157392501831, -0.0013696551322937012, -0.0013021528720855713, -0.0012346506118774414, -0.0011671483516693115, -0.0010996460914611816, -0.0010321438312530518, -0.0009646415710449219, -0.000897139310836792, -0.0008296370506286621, -0.0007621347904205322, -0.0006946325302124023, -0.0006271302700042725, -0.0005596280097961426, -0.0004921257495880127, -0.0004246234893798828, -0.00035712122917175293, -0.00028961896896362305, -0.00022211670875549316, -0.00015461444854736328, -8.71121883392334e-05, -1.9609928131103516e-05, 4.789233207702637e-05, 0.00011539459228515625, 0.00018289685249328613, 0.000250399112701416, 0.0003179013729095459, 0.0003854036331176758, 0.00045290589332580566, 0.0005204081535339355, 0.0005879104137420654, 0.0006554126739501953, 0.0007229149341583252, 0.0007904171943664551, 0.000857919454574585, 0.0009254217147827148, 0.0009929239749908447, 0.0010604262351989746, 0.0011279284954071045, 0.0011954307556152344, 0.0012629330158233643, 0.0013304352760314941, 0.001397937536239624, 0.001465439796447754, 0.0015329420566558838, 0.0016004443168640137, 0.0016679465770721436, 0.0017354488372802734, 0.0018029510974884033, 0.0018704533576965332, 0.001937955617904663, 0.002005457878112793, 0.002072960138320923, 0.0021404623985290527, 0.0022079646587371826, 0.0022754669189453125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 10.0, 20.0, 17.0, 24.0, 46.0, 75.0, 127.0, 175.0, 326.0, 485.0, 761.0, 1229.0, 2159.0, 3641.0, 6071.0, 9960.0, 16291.0, 26533.0, 42414.0, 63036.0, 86859.0, 110844.0, 127252.0, 128841.0, 118142.0, 97392.0, 72338.0, 49957.0, 32641.0, 20008.0, 12302.0, 7361.0, 4402.0, 2636.0, 1625.0, 944.0, 622.0, 347.0, 236.0, 147.0, 93.0, 58.0, 35.0, 26.0, 19.0, 8.0, 7.0, 8.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-12.3046875, -11.9449462890625, -11.585205078125, -11.2254638671875, -10.86572265625, -10.5059814453125, -10.146240234375, -9.7864990234375, -9.4267578125, -9.0670166015625, -8.707275390625, -8.3475341796875, -7.98779296875, -7.6280517578125, -7.268310546875, -6.9085693359375, -6.548828125, -6.1890869140625, -5.829345703125, -5.4696044921875, -5.10986328125, -4.7501220703125, -4.390380859375, -4.0306396484375, -3.6708984375, -3.3111572265625, -2.951416015625, -2.5916748046875, -2.23193359375, -1.8721923828125, -1.512451171875, -1.1527099609375, -0.79296875, -0.4332275390625, -0.073486328125, 0.2862548828125, 0.64599609375, 1.0057373046875, 1.365478515625, 1.7252197265625, 2.0849609375, 2.4447021484375, 2.804443359375, 3.1641845703125, 3.52392578125, 3.8836669921875, 4.243408203125, 4.6031494140625, 4.962890625, 5.3226318359375, 5.682373046875, 6.0421142578125, 6.40185546875, 6.7615966796875, 7.121337890625, 7.4810791015625, 7.8408203125, 8.2005615234375, 8.560302734375, 8.9200439453125, 9.27978515625, 9.6395263671875, 9.999267578125, 10.3590087890625, 10.71875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 9.0, 13.0, 10.0, 8.0, 15.0, 24.0, 24.0, 30.0, 26.0, 39.0, 49.0, 35.0, 47.0, 57.0, 55.0, 64.0, 57.0, 63.0, 62.0, 54.0, 54.0, 36.0, 38.0, 29.0, 19.0, 24.0, 15.0, 14.0, 6.0, 8.0, 6.0, 1.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.19140625, -6.01123046875, -5.8310546875, -5.65087890625, -5.470703125, -5.29052734375, -5.1103515625, -4.93017578125, -4.75, -4.56982421875, -4.3896484375, -4.20947265625, -4.029296875, -3.84912109375, -3.6689453125, -3.48876953125, -3.30859375, -3.12841796875, -2.9482421875, -2.76806640625, -2.587890625, -2.40771484375, -2.2275390625, -2.04736328125, -1.8671875, -1.68701171875, -1.5068359375, -1.32666015625, -1.146484375, -0.96630859375, -0.7861328125, -0.60595703125, -0.42578125, -0.24560546875, -0.0654296875, 0.11474609375, 0.294921875, 0.47509765625, 0.6552734375, 0.83544921875, 1.015625, 1.19580078125, 1.3759765625, 1.55615234375, 1.736328125, 1.91650390625, 2.0966796875, 2.27685546875, 2.45703125, 2.63720703125, 2.8173828125, 2.99755859375, 3.177734375, 3.35791015625, 3.5380859375, 3.71826171875, 3.8984375, 4.07861328125, 4.2587890625, 4.43896484375, 4.619140625, 4.79931640625, 4.9794921875, 5.15966796875, 5.33984375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 5.0, 6.0, 4.0, 10.0, 17.0, 18.0, 18.0, 16.0, 18.0, 21.0, 34.0, 19.0, 39.0, 30.0, 28.0, 44.0, 40.0, 44.0, 35.0, 42.0, 37.0, 32.0, 36.0, 37.0, 46.0, 39.0, 19.0, 33.0, 32.0, 18.0, 26.0, 16.0, 27.0, 14.0, 14.0, 16.0, 13.0, 13.0, 11.0, 6.0, 8.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.643314361572266, -21.868803024291992, -21.09429168701172, -20.319780349731445, -19.545269012451172, -18.7707576751709, -17.996246337890625, -17.22173500061035, -16.447223663330078, -15.672712326049805, -14.898200988769531, -14.123689651489258, -13.349178314208984, -12.574666976928711, -11.800155639648438, -11.025644302368164, -10.251133918762207, -9.476622581481934, -8.70211124420166, -7.927599906921387, -7.153088569641113, -6.37857723236084, -5.604066371917725, -4.829555034637451, -4.055043697357178, -3.2805323600769043, -2.506021022796631, -1.7315099239349365, -0.9569985866546631, -0.18248724937438965, 0.5920238494873047, 1.3665351867675781, 2.1410465240478516, 2.915557861328125, 3.6900691986083984, 4.464580535888672, 5.239091873168945, 6.013603210449219, 6.788114070892334, 7.562625408172607, 8.337137222290039, 9.111648559570312, 9.886159896850586, 10.66067123413086, 11.435182571411133, 12.209693908691406, 12.98420524597168, 13.758716583251953, 14.53322696685791, 15.307738304138184, 16.08224868774414, 16.856760025024414, 17.631271362304688, 18.40578269958496, 19.180294036865234, 19.954805374145508, 20.72931671142578, 21.503828048706055, 22.278339385986328, 23.0528507232666, 23.827362060546875, 24.60187339782715, 25.376384735107422, 26.150896072387695, 26.92540740966797]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 5.0, 9.0, 14.0, 6.0, 6.0, 7.0, 17.0, 20.0, 27.0, 29.0, 28.0, 26.0, 37.0, 40.0, 36.0, 22.0, 47.0, 49.0, 38.0, 36.0, 42.0, 44.0, 38.0, 45.0, 25.0, 31.0, 24.0, 35.0, 30.0, 27.0, 27.0, 22.0, 22.0, 7.0, 12.0, 13.0, 13.0, 12.0, 4.0, 9.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.092042922973633, -26.248403549194336, -25.404762268066406, -24.56112289428711, -23.717483520507812, -22.873844146728516, -22.030202865600586, -21.18656349182129, -20.34292221069336, -19.499282836914062, -18.655641555786133, -17.812002182006836, -16.96836280822754, -16.12472152709961, -15.281082153320312, -14.437442779541016, -13.593803405761719, -12.750163078308105, -11.906523704528809, -11.062883377075195, -10.219244003295898, -9.375603675842285, -8.531963348388672, -7.688323497772217, -6.844683647155762, -6.001043796539307, -5.157403945922852, -4.313763618469238, -3.470123767852783, -2.626483917236328, -1.7828435897827148, -0.9392037391662598, -0.09556388854980469, 0.7480760812759399, 1.5917160511016846, 2.4353561401367188, 3.278995990753174, 4.122635841369629, 4.966276168823242, 5.809916019439697, 6.653555870056152, 7.497195720672607, 8.340835571289062, 9.184475898742676, 10.028116226196289, 10.871755599975586, 11.7153959274292, 12.559036254882812, 13.40267562866211, 14.246315956115723, 15.08995532989502, 15.933595657348633, 16.77723503112793, 17.62087631225586, 18.464515686035156, 19.308155059814453, 20.15179443359375, 20.995433807373047, 21.839075088500977, 22.682714462280273, 23.52635383605957, 24.3699951171875, 25.213634490966797, 26.057273864746094, 26.900915145874023]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 12.0, 17.0, 22.0, 29.0, 53.0, 86.0, 144.0, 267.0, 428.0, 735.0, 1217.0, 1899.0, 3125.0, 4982.0, 8104.0, 12578.0, 19556.0, 30395.0, 45263.0, 66994.0, 96538.0, 135359.0, 180066.0, 232783.0, 287972.0, 336456.0, 371137.0, 386491.0, 379120.0, 350516.0, 305784.0, 253065.0, 198143.0, 149532.0, 108376.0, 76919.0, 52327.0, 35064.0, 22858.0, 14670.0, 9519.0, 5846.0, 3832.0, 2276.0, 1482.0, 890.0, 554.0, 329.0, 191.0, 86.0, 81.0, 44.0, 26.0, 19.0, 15.0, 9.0, 5.0, 4.0], "bins": [-17.5, -16.9803466796875, -16.460693359375, -15.9410400390625, -15.42138671875, -14.9017333984375, -14.382080078125, -13.8624267578125, -13.3427734375, -12.8231201171875, -12.303466796875, -11.7838134765625, -11.26416015625, -10.7445068359375, -10.224853515625, -9.7052001953125, -9.185546875, -8.6658935546875, -8.146240234375, -7.6265869140625, -7.10693359375, -6.5872802734375, -6.067626953125, -5.5479736328125, -5.0283203125, -4.5086669921875, -3.989013671875, -3.4693603515625, -2.94970703125, -2.4300537109375, -1.910400390625, -1.3907470703125, -0.87109375, -0.3514404296875, 0.168212890625, 0.6878662109375, 1.20751953125, 1.7271728515625, 2.246826171875, 2.7664794921875, 3.2861328125, 3.8057861328125, 4.325439453125, 4.8450927734375, 5.36474609375, 5.8843994140625, 6.404052734375, 6.9237060546875, 7.443359375, 7.9630126953125, 8.482666015625, 9.0023193359375, 9.52197265625, 10.0416259765625, 10.561279296875, 11.0809326171875, 11.6005859375, 12.1202392578125, 12.639892578125, 13.1595458984375, 13.67919921875, 14.1988525390625, 14.718505859375, 15.2381591796875, 15.7578125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 8.0, 9.0, 12.0, 5.0, 5.0, 10.0, 19.0, 28.0, 26.0, 25.0, 21.0, 43.0, 30.0, 39.0, 44.0, 28.0, 50.0, 36.0, 36.0, 39.0, 37.0, 51.0, 49.0, 27.0, 25.0, 34.0, 24.0, 35.0, 30.0, 28.0, 23.0, 17.0, 21.0, 9.0, 13.0, 12.0, 13.0, 6.0, 8.0, 6.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.75, -22.99609375, -22.2421875, -21.48828125, -20.734375, -19.98046875, -19.2265625, -18.47265625, -17.71875, -16.96484375, -16.2109375, -15.45703125, -14.703125, -13.94921875, -13.1953125, -12.44140625, -11.6875, -10.93359375, -10.1796875, -9.42578125, -8.671875, -7.91796875, -7.1640625, -6.41015625, -5.65625, -4.90234375, -4.1484375, -3.39453125, -2.640625, -1.88671875, -1.1328125, -0.37890625, 0.375, 1.12890625, 1.8828125, 2.63671875, 3.390625, 4.14453125, 4.8984375, 5.65234375, 6.40625, 7.16015625, 7.9140625, 8.66796875, 9.421875, 10.17578125, 10.9296875, 11.68359375, 12.4375, 13.19140625, 13.9453125, 14.69921875, 15.453125, 16.20703125, 16.9609375, 17.71484375, 18.46875, 19.22265625, 19.9765625, 20.73046875, 21.484375, 22.23828125, 22.9921875, 23.74609375, 24.5]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 9.0, 21.0, 41.0, 61.0, 99.0, 199.0, 281.0, 539.0, 861.0, 1531.0, 2500.0, 3986.0, 6555.0, 10441.0, 16224.0, 25023.0, 37400.0, 54577.0, 78310.0, 108625.0, 144809.0, 186957.0, 232030.0, 276923.0, 316734.0, 343247.0, 355102.0, 349463.0, 327900.0, 293277.0, 251231.0, 205232.0, 161985.0, 122341.0, 90352.0, 63860.0, 43647.0, 29558.0, 19425.0, 12595.0, 7925.0, 4875.0, 3038.0, 1849.0, 1114.0, 656.0, 390.0, 232.0, 118.0, 64.0, 37.0, 14.0, 11.0, 5.0, 6.0, 1.0, 0.0, 3.0], "bins": [-17.765625, -17.222412109375, -16.67919921875, -16.135986328125, -15.5927734375, -15.049560546875, -14.50634765625, -13.963134765625, -13.419921875, -12.876708984375, -12.33349609375, -11.790283203125, -11.2470703125, -10.703857421875, -10.16064453125, -9.617431640625, -9.07421875, -8.531005859375, -7.98779296875, -7.444580078125, -6.9013671875, -6.358154296875, -5.81494140625, -5.271728515625, -4.728515625, -4.185302734375, -3.64208984375, -3.098876953125, -2.5556640625, -2.012451171875, -1.46923828125, -0.926025390625, -0.3828125, 0.160400390625, 0.70361328125, 1.246826171875, 1.7900390625, 2.333251953125, 2.87646484375, 3.419677734375, 3.962890625, 4.506103515625, 5.04931640625, 5.592529296875, 6.1357421875, 6.678955078125, 7.22216796875, 7.765380859375, 8.30859375, 8.851806640625, 9.39501953125, 9.938232421875, 10.4814453125, 11.024658203125, 11.56787109375, 12.111083984375, 12.654296875, 13.197509765625, 13.74072265625, 14.283935546875, 14.8271484375, 15.370361328125, 15.91357421875, 16.456787109375, 17.0]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 1.0, 8.0, 11.0, 11.0, 15.0, 17.0, 23.0, 27.0, 42.0, 44.0, 57.0, 71.0, 84.0, 109.0, 94.0, 124.0, 148.0, 143.0, 178.0, 180.0, 188.0, 196.0, 178.0, 223.0, 174.0, 207.0, 170.0, 181.0, 174.0, 126.0, 120.0, 124.0, 122.0, 93.0, 78.0, 65.0, 61.0, 48.0, 28.0, 29.0, 24.0, 16.0, 14.0, 15.0, 7.0, 9.0, 9.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-10.28125, -9.9534912109375, -9.625732421875, -9.2979736328125, -8.97021484375, -8.6424560546875, -8.314697265625, -7.9869384765625, -7.6591796875, -7.3314208984375, -7.003662109375, -6.6759033203125, -6.34814453125, -6.0203857421875, -5.692626953125, -5.3648681640625, -5.037109375, -4.7093505859375, -4.381591796875, -4.0538330078125, -3.72607421875, -3.3983154296875, -3.070556640625, -2.7427978515625, -2.4150390625, -2.0872802734375, -1.759521484375, -1.4317626953125, -1.10400390625, -0.7762451171875, -0.448486328125, -0.1207275390625, 0.20703125, 0.5347900390625, 0.862548828125, 1.1903076171875, 1.51806640625, 1.8458251953125, 2.173583984375, 2.5013427734375, 2.8291015625, 3.1568603515625, 3.484619140625, 3.8123779296875, 4.14013671875, 4.4678955078125, 4.795654296875, 5.1234130859375, 5.451171875, 5.7789306640625, 6.106689453125, 6.4344482421875, 6.76220703125, 7.0899658203125, 7.417724609375, 7.7454833984375, 8.0732421875, 8.4010009765625, 8.728759765625, 9.0565185546875, 9.38427734375, 9.7120361328125, 10.039794921875, 10.3675537109375, 10.6953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 5.0, 5.0, 8.0, 9.0, 11.0, 10.0, 10.0, 16.0, 12.0, 17.0, 29.0, 27.0, 31.0, 36.0, 25.0, 32.0, 34.0, 52.0, 38.0, 27.0, 43.0, 50.0, 37.0, 42.0, 42.0, 29.0, 39.0, 36.0, 26.0, 27.0, 28.0, 21.0, 13.0, 16.0, 23.0, 16.0, 15.0, 9.0, 10.0, 9.0, 11.0, 6.0, 4.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-26.139440536499023, -25.35384750366211, -24.568254470825195, -23.78266143798828, -22.997066497802734, -22.21147346496582, -21.425880432128906, -20.640287399291992, -19.854694366455078, -19.069101333618164, -18.28350830078125, -17.497913360595703, -16.71232032775879, -15.926727294921875, -15.141134262084961, -14.355541229248047, -13.569947242736816, -12.784354209899902, -11.998760223388672, -11.213167190551758, -10.427574157714844, -9.64198112487793, -8.8563871383667, -8.070794105529785, -7.285200595855713, -6.499607086181641, -5.714014053344727, -4.928420543670654, -4.142827033996582, -3.357234001159668, -2.5716404914855957, -1.7860474586486816, -1.0004539489746094, -0.21486061811447144, 0.5707327127456665, 1.3563261032104492, 2.1419193744659424, 2.9275126457214355, 3.713106155395508, 4.498699188232422, 5.284292697906494, 6.069886207580566, 6.8554792404174805, 7.641072750091553, 8.426666259765625, 9.212259292602539, 9.997852325439453, 10.783445358276367, 11.569039344787598, 12.354632377624512, 13.140226364135742, 13.925819396972656, 14.71141242980957, 15.497005462646484, 16.28260040283203, 17.068191528320312, 17.85378646850586, 18.639379501342773, 19.424972534179688, 20.210567474365234, 20.99616050720215, 21.781753540039062, 22.567346572875977, 23.35293960571289, 24.138532638549805]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 6.0, 2.0, 5.0, 3.0, 9.0, 9.0, 12.0, 11.0, 9.0, 15.0, 18.0, 7.0, 26.0, 21.0, 29.0, 36.0, 34.0, 33.0, 35.0, 34.0, 37.0, 43.0, 34.0, 45.0, 47.0, 37.0, 26.0, 18.0, 37.0, 34.0, 27.0, 29.0, 29.0, 26.0, 23.0, 21.0, 24.0, 19.0, 22.0, 7.0, 12.0, 8.0, 7.0, 10.0, 10.0, 5.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-24.923303604125977, -24.14080238342285, -23.358299255371094, -22.57579803466797, -21.793296813964844, -21.010793685913086, -20.22829246520996, -19.445789337158203, -18.663288116455078, -17.880786895751953, -17.098283767700195, -16.31578254699707, -15.533280372619629, -14.750778198242188, -13.968276977539062, -13.185774803161621, -12.403273582458496, -11.620771408081055, -10.83827018737793, -10.055768013000488, -9.273265838623047, -8.490764617919922, -7.7082624435424805, -6.925760269165039, -6.143258571624756, -5.360756874084473, -4.578254699707031, -3.795753002166748, -3.0132510662078857, -2.2307491302490234, -1.4482474327087402, -0.6657452583312988, 0.11675643920898438, 0.8992583155632019, 1.6817601919174194, 2.464262008666992, 3.2467639446258545, 4.029265880584717, 4.811767578125, 5.594269752502441, 6.376771450042725, 7.159273147583008, 7.941775321960449, 8.72427749633789, 9.506778717041016, 10.289280891418457, 11.071783065795898, 11.854284286499023, 12.636786460876465, 13.419288635253906, 14.201789855957031, 14.984292030334473, 15.766794204711914, 16.54929542541504, 17.331798553466797, 18.114299774169922, 18.896800994873047, 19.679302215576172, 20.46180534362793, 21.244306564331055, 22.02680778503418, 22.809310913085938, 23.591812133789062, 24.374313354492188, 25.156816482543945]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 1.0, 5.0, 2.0, 9.0, 14.0, 10.0, 10.0, 8.0, 20.0, 38.0, 54.0, 67.0, 110.0, 146.0, 188.0, 291.0, 431.0, 742.0, 1337.0, 2298.0, 4415.0, 8864.0, 18799.0, 42451.0, 97766.0, 205958.0, 285955.0, 202986.0, 96704.0, 41592.0, 18636.0, 8720.0, 4309.0, 2223.0, 1261.0, 744.0, 439.0, 294.0, 183.0, 137.0, 89.0, 71.0, 53.0, 33.0, 26.0, 14.0, 12.0, 17.0, 4.0, 3.0, 8.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-16.609375, -16.09814453125, -15.5869140625, -15.07568359375, -14.564453125, -14.05322265625, -13.5419921875, -13.03076171875, -12.51953125, -12.00830078125, -11.4970703125, -10.98583984375, -10.474609375, -9.96337890625, -9.4521484375, -8.94091796875, -8.4296875, -7.91845703125, -7.4072265625, -6.89599609375, -6.384765625, -5.87353515625, -5.3623046875, -4.85107421875, -4.33984375, -3.82861328125, -3.3173828125, -2.80615234375, -2.294921875, -1.78369140625, -1.2724609375, -0.76123046875, -0.25, 0.26123046875, 0.7724609375, 1.28369140625, 1.794921875, 2.30615234375, 2.8173828125, 3.32861328125, 3.83984375, 4.35107421875, 4.8623046875, 5.37353515625, 5.884765625, 6.39599609375, 6.9072265625, 7.41845703125, 7.9296875, 8.44091796875, 8.9521484375, 9.46337890625, 9.974609375, 10.48583984375, 10.9970703125, 11.50830078125, 12.01953125, 12.53076171875, 13.0419921875, 13.55322265625, 14.064453125, 14.57568359375, 15.0869140625, 15.59814453125, 16.109375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 6.0, 2.0, 5.0, 3.0, 10.0, 8.0, 11.0, 10.0, 10.0, 12.0, 21.0, 9.0, 21.0, 25.0, 29.0, 34.0, 35.0, 34.0, 37.0, 31.0, 37.0, 43.0, 35.0, 47.0, 47.0, 35.0, 28.0, 19.0, 37.0, 30.0, 30.0, 30.0, 26.0, 26.0, 24.0, 23.0, 25.0, 18.0, 18.0, 9.0, 13.0, 7.0, 9.0, 9.0, 9.0, 6.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-25.0625, -24.278076171875, -23.49365234375, -22.709228515625, -21.9248046875, -21.140380859375, -20.35595703125, -19.571533203125, -18.787109375, -18.002685546875, -17.21826171875, -16.433837890625, -15.6494140625, -14.864990234375, -14.08056640625, -13.296142578125, -12.51171875, -11.727294921875, -10.94287109375, -10.158447265625, -9.3740234375, -8.589599609375, -7.80517578125, -7.020751953125, -6.236328125, -5.451904296875, -4.66748046875, -3.883056640625, -3.0986328125, -2.314208984375, -1.52978515625, -0.745361328125, 0.0390625, 0.823486328125, 1.60791015625, 2.392333984375, 3.1767578125, 3.961181640625, 4.74560546875, 5.530029296875, 6.314453125, 7.098876953125, 7.88330078125, 8.667724609375, 9.4521484375, 10.236572265625, 11.02099609375, 11.805419921875, 12.58984375, 13.374267578125, 14.15869140625, 14.943115234375, 15.7275390625, 16.511962890625, 17.29638671875, 18.080810546875, 18.865234375, 19.649658203125, 20.43408203125, 21.218505859375, 22.0029296875, 22.787353515625, 23.57177734375, 24.356201171875, 25.140625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 5.0, 8.0, 13.0, 11.0, 8.0, 20.0, 16.0, 33.0, 71.0, 68.0, 136.0, 221.0, 319.0, 557.0, 905.0, 1682.0, 3319.0, 6738.0, 16241.0, 48788.0, 196097.0, 497690.0, 196434.0, 48921.0, 16124.0, 6760.0, 3241.0, 1703.0, 948.0, 514.0, 343.0, 202.0, 132.0, 74.0, 66.0, 35.0, 29.0, 22.0, 12.0, 19.0, 9.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.171875, -19.510498046875, -18.84912109375, -18.187744140625, -17.5263671875, -16.864990234375, -16.20361328125, -15.542236328125, -14.880859375, -14.219482421875, -13.55810546875, -12.896728515625, -12.2353515625, -11.573974609375, -10.91259765625, -10.251220703125, -9.58984375, -8.928466796875, -8.26708984375, -7.605712890625, -6.9443359375, -6.282958984375, -5.62158203125, -4.960205078125, -4.298828125, -3.637451171875, -2.97607421875, -2.314697265625, -1.6533203125, -0.991943359375, -0.33056640625, 0.330810546875, 0.9921875, 1.653564453125, 2.31494140625, 2.976318359375, 3.6376953125, 4.299072265625, 4.96044921875, 5.621826171875, 6.283203125, 6.944580078125, 7.60595703125, 8.267333984375, 8.9287109375, 9.590087890625, 10.25146484375, 10.912841796875, 11.57421875, 12.235595703125, 12.89697265625, 13.558349609375, 14.2197265625, 14.881103515625, 15.54248046875, 16.203857421875, 16.865234375, 17.526611328125, 18.18798828125, 18.849365234375, 19.5107421875, 20.172119140625, 20.83349609375, 21.494873046875, 22.15625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 2.0, 2.0, 6.0, 4.0, 9.0, 5.0, 10.0, 10.0, 8.0, 9.0, 14.0, 17.0, 18.0, 19.0, 26.0, 28.0, 29.0, 33.0, 42.0, 21.0, 24.0, 42.0, 39.0, 43.0, 35.0, 31.0, 40.0, 37.0, 32.0, 27.0, 28.0, 35.0, 38.0, 29.0, 26.0, 18.0, 28.0, 26.0, 14.0, 17.0, 19.0, 9.0, 12.0, 8.0, 5.0, 9.0, 7.0, 5.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.296875, -14.767822265625, -14.23876953125, -13.709716796875, -13.1806640625, -12.651611328125, -12.12255859375, -11.593505859375, -11.064453125, -10.535400390625, -10.00634765625, -9.477294921875, -8.9482421875, -8.419189453125, -7.89013671875, -7.361083984375, -6.83203125, -6.302978515625, -5.77392578125, -5.244873046875, -4.7158203125, -4.186767578125, -3.65771484375, -3.128662109375, -2.599609375, -2.070556640625, -1.54150390625, -1.012451171875, -0.4833984375, 0.045654296875, 0.57470703125, 1.103759765625, 1.6328125, 2.161865234375, 2.69091796875, 3.219970703125, 3.7490234375, 4.278076171875, 4.80712890625, 5.336181640625, 5.865234375, 6.394287109375, 6.92333984375, 7.452392578125, 7.9814453125, 8.510498046875, 9.03955078125, 9.568603515625, 10.09765625, 10.626708984375, 11.15576171875, 11.684814453125, 12.2138671875, 12.742919921875, 13.27197265625, 13.801025390625, 14.330078125, 14.859130859375, 15.38818359375, 15.917236328125, 16.4462890625, 16.975341796875, 17.50439453125, 18.033447265625, 18.5625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 3.0, 4.0, 9.0, 13.0, 22.0, 21.0, 29.0, 49.0, 63.0, 79.0, 131.0, 215.0, 306.0, 453.0, 714.0, 1125.0, 1865.0, 3083.0, 5871.0, 12727.0, 33551.0, 132661.0, 603317.0, 181337.0, 40702.0, 14712.0, 6651.0, 3545.0, 1946.0, 1135.0, 735.0, 445.0, 348.0, 209.0, 154.0, 106.0, 72.0, 32.0, 35.0, 27.0, 14.0, 19.0, 6.0, 3.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.6796875, -13.2598876953125, -12.840087890625, -12.4202880859375, -12.00048828125, -11.5806884765625, -11.160888671875, -10.7410888671875, -10.3212890625, -9.9014892578125, -9.481689453125, -9.0618896484375, -8.64208984375, -8.2222900390625, -7.802490234375, -7.3826904296875, -6.962890625, -6.5430908203125, -6.123291015625, -5.7034912109375, -5.28369140625, -4.8638916015625, -4.444091796875, -4.0242919921875, -3.6044921875, -3.1846923828125, -2.764892578125, -2.3450927734375, -1.92529296875, -1.5054931640625, -1.085693359375, -0.6658935546875, -0.24609375, 0.1737060546875, 0.593505859375, 1.0133056640625, 1.43310546875, 1.8529052734375, 2.272705078125, 2.6925048828125, 3.1123046875, 3.5321044921875, 3.951904296875, 4.3717041015625, 4.79150390625, 5.2113037109375, 5.631103515625, 6.0509033203125, 6.470703125, 6.8905029296875, 7.310302734375, 7.7301025390625, 8.14990234375, 8.5697021484375, 8.989501953125, 9.4093017578125, 9.8291015625, 10.2489013671875, 10.668701171875, 11.0885009765625, 11.50830078125, 11.9281005859375, 12.347900390625, 12.7677001953125, 13.1875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 3.0, 9.0, 5.0, 7.0, 8.0, 7.0, 14.0, 15.0, 22.0, 37.0, 38.0, 59.0, 69.0, 69.0, 70.0, 100.0, 65.0, 76.0, 74.0, 55.0, 48.0, 39.0, 21.0, 29.0, 11.0, 12.0, 6.0, 11.0, 5.0, 2.0, 5.0, 0.0, 3.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006546974182128906, -0.0006364732980728149, -0.0006182491779327393, -0.0006000250577926636, -0.0005818009376525879, -0.0005635768175125122, -0.0005453526973724365, -0.0005271285772323608, -0.0005089044570922852, -0.0004906803369522095, -0.0004724562168121338, -0.0004542320966720581, -0.0004360079765319824, -0.00041778385639190674, -0.00039955973625183105, -0.00038133561611175537, -0.0003631114959716797, -0.000344887375831604, -0.0003266632556915283, -0.00030843913555145264, -0.00029021501541137695, -0.00027199089527130127, -0.0002537667751312256, -0.0002355426549911499, -0.00021731853485107422, -0.00019909441471099854, -0.00018087029457092285, -0.00016264617443084717, -0.00014442205429077148, -0.0001261979341506958, -0.00010797381401062012, -8.974969387054443e-05, -7.152557373046875e-05, -5.3301453590393066e-05, -3.507733345031738e-05, -1.68532133102417e-05, 1.3709068298339844e-06, 1.9595026969909668e-05, 3.781914710998535e-05, 5.6043267250061035e-05, 7.426738739013672e-05, 9.24915075302124e-05, 0.00011071562767028809, 0.00012893974781036377, 0.00014716386795043945, 0.00016538798809051514, 0.00018361210823059082, 0.0002018362283706665, 0.0002200603485107422, 0.00023828446865081787, 0.00025650858879089355, 0.00027473270893096924, 0.0002929568290710449, 0.0003111809492111206, 0.0003294050693511963, 0.00034762918949127197, 0.00036585330963134766, 0.00038407742977142334, 0.000402301549911499, 0.0004205256700515747, 0.0004387497901916504, 0.0004569739103317261, 0.00047519803047180176, 0.0004934221506118774, 0.0005116462707519531]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 9.0, 15.0, 21.0, 17.0, 20.0, 34.0, 45.0, 56.0, 83.0, 111.0, 187.0, 243.0, 311.0, 496.0, 737.0, 988.0, 1481.0, 2275.0, 3458.0, 5467.0, 9098.0, 16031.0, 29756.0, 58566.0, 119634.0, 219002.0, 250824.0, 159738.0, 78986.0, 39307.0, 20738.0, 11543.0, 6794.0, 4086.0, 2717.0, 1817.0, 1172.0, 798.0, 587.0, 402.0, 253.0, 183.0, 116.0, 86.0, 80.0, 49.0, 40.0, 27.0, 20.0, 14.0, 13.0, 10.0, 10.0, 5.0, 2.0, 3.0, 1.0], "bins": [-11.03125, -10.6990966796875, -10.366943359375, -10.0347900390625, -9.70263671875, -9.3704833984375, -9.038330078125, -8.7061767578125, -8.3740234375, -8.0418701171875, -7.709716796875, -7.3775634765625, -7.04541015625, -6.7132568359375, -6.381103515625, -6.0489501953125, -5.716796875, -5.3846435546875, -5.052490234375, -4.7203369140625, -4.38818359375, -4.0560302734375, -3.723876953125, -3.3917236328125, -3.0595703125, -2.7274169921875, -2.395263671875, -2.0631103515625, -1.73095703125, -1.3988037109375, -1.066650390625, -0.7344970703125, -0.40234375, -0.0701904296875, 0.261962890625, 0.5941162109375, 0.92626953125, 1.2584228515625, 1.590576171875, 1.9227294921875, 2.2548828125, 2.5870361328125, 2.919189453125, 3.2513427734375, 3.58349609375, 3.9156494140625, 4.247802734375, 4.5799560546875, 4.912109375, 5.2442626953125, 5.576416015625, 5.9085693359375, 6.24072265625, 6.5728759765625, 6.905029296875, 7.2371826171875, 7.5693359375, 7.9014892578125, 8.233642578125, 8.5657958984375, 8.89794921875, 9.2301025390625, 9.562255859375, 9.8944091796875, 10.2265625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 6.0, 4.0, 6.0, 5.0, 7.0, 19.0, 19.0, 32.0, 38.0, 60.0, 80.0, 93.0, 119.0, 110.0, 115.0, 76.0, 48.0, 43.0, 30.0, 26.0, 14.0, 14.0, 6.0, 12.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.578125, -5.41046142578125, -5.2427978515625, -5.07513427734375, -4.907470703125, -4.73980712890625, -4.5721435546875, -4.40447998046875, -4.23681640625, -4.06915283203125, -3.9014892578125, -3.73382568359375, -3.566162109375, -3.39849853515625, -3.2308349609375, -3.06317138671875, -2.8955078125, -2.72784423828125, -2.5601806640625, -2.39251708984375, -2.224853515625, -2.05718994140625, -1.8895263671875, -1.72186279296875, -1.55419921875, -1.38653564453125, -1.2188720703125, -1.05120849609375, -0.883544921875, -0.71588134765625, -0.5482177734375, -0.38055419921875, -0.212890625, -0.04522705078125, 0.1224365234375, 0.29010009765625, 0.457763671875, 0.62542724609375, 0.7930908203125, 0.96075439453125, 1.12841796875, 1.29608154296875, 1.4637451171875, 1.63140869140625, 1.799072265625, 1.96673583984375, 2.1343994140625, 2.30206298828125, 2.4697265625, 2.63739013671875, 2.8050537109375, 2.97271728515625, 3.140380859375, 3.30804443359375, 3.4757080078125, 3.64337158203125, 3.81103515625, 3.97869873046875, 4.1463623046875, 4.31402587890625, 4.481689453125, 4.64935302734375, 4.8170166015625, 4.98468017578125, 5.15234375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 6.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 2.0, 4.0, 12.0, 2.0, 10.0, 12.0, 12.0, 10.0, 15.0, 15.0, 24.0, 24.0, 32.0, 26.0, 29.0, 35.0, 34.0, 31.0, 36.0, 42.0, 33.0, 33.0, 45.0, 43.0, 32.0, 42.0, 36.0, 36.0, 38.0, 25.0, 23.0, 33.0, 20.0, 16.0, 16.0, 24.0, 16.0, 20.0, 10.0, 8.0, 6.0, 12.0, 6.0, 3.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.39115333557129, -24.62701416015625, -23.86287498474121, -23.098735809326172, -22.3345947265625, -21.57045555114746, -20.806316375732422, -20.042177200317383, -19.278038024902344, -18.513898849487305, -17.749759674072266, -16.985620498657227, -16.221481323242188, -15.457341194152832, -14.693201065063477, -13.929061889648438, -13.164922714233398, -12.40078353881836, -11.63664436340332, -10.872504234313965, -10.108365058898926, -9.344225883483887, -8.580085754394531, -7.815946578979492, -7.051807403564453, -6.287668228149414, -5.523528575897217, -4.7593889236450195, -3.9952497482299805, -3.2311103343963623, -2.466970920562744, -1.7028312683105469, -0.9386940002441406, -0.17455458641052246, 0.5895848274230957, 1.3537242412567139, 2.117863655090332, 2.88200306892395, 3.6461424827575684, 4.410282135009766, 5.174421310424805, 5.938560485839844, 6.702700138092041, 7.466839790344238, 8.230978965759277, 8.995118141174316, 9.759258270263672, 10.523397445678711, 11.28753662109375, 12.051675796508789, 12.815814971923828, 13.579955101013184, 14.344094276428223, 15.108233451843262, 15.872373580932617, 16.636512756347656, 17.400651931762695, 18.164791107177734, 18.928930282592773, 19.693069458007812, 20.457210540771484, 21.221349716186523, 21.985488891601562, 22.7496280670166, 23.51376724243164]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 6.0, 1.0, 8.0, 11.0, 14.0, 6.0, 15.0, 20.0, 13.0, 23.0, 18.0, 30.0, 31.0, 37.0, 33.0, 32.0, 37.0, 43.0, 44.0, 42.0, 42.0, 38.0, 37.0, 28.0, 34.0, 29.0, 23.0, 33.0, 33.0, 24.0, 29.0, 25.0, 19.0, 26.0, 15.0, 19.0, 11.0, 14.0, 11.0, 7.0, 9.0, 7.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.519662857055664, -24.72125816345215, -23.922853469848633, -23.124448776245117, -22.3260440826416, -21.527637481689453, -20.729232788085938, -19.930828094482422, -19.132423400878906, -18.33401870727539, -17.535614013671875, -16.73720932006836, -15.938803672790527, -15.140398979187012, -14.341994285583496, -13.543588638305664, -12.745184898376465, -11.94678020477295, -11.148375511169434, -10.349969863891602, -9.551565170288086, -8.75316047668457, -7.954755783081055, -7.156350612640381, -6.357945919036865, -5.55954122543335, -4.761136054992676, -3.96273136138916, -3.1643264293670654, -2.3659214973449707, -1.567516803741455, -0.7691116333007812, 0.029293060302734375, 0.8276979327201843, 1.6261028051376343, 2.4245076179504395, 3.222912549972534, 4.021317481994629, 4.8197221755981445, 5.618127346038818, 6.416532039642334, 7.21493673324585, 8.013341903686523, 8.811746597290039, 9.610151290893555, 10.40855598449707, 11.206960678100586, 12.005366325378418, 12.803771018981934, 13.60217571258545, 14.400580406188965, 15.198986053466797, 15.997390747070312, 16.795795440673828, 17.594200134277344, 18.39260482788086, 19.191009521484375, 19.98941421508789, 20.787818908691406, 21.586223602294922, 22.384628295898438, 23.183032989501953, 23.98143768310547, 24.779844284057617, 25.578248977661133]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 9.0, 7.0, 27.0, 45.0, 88.0, 144.0, 236.0, 371.0, 587.0, 1072.0, 1706.0, 2798.0, 4420.0, 6981.0, 10736.0, 16342.0, 23800.0, 33438.0, 45220.0, 58754.0, 71729.0, 83531.0, 92827.0, 96623.0, 95314.0, 88358.0, 76765.0, 64493.0, 51424.0, 38250.0, 27403.0, 19246.0, 13204.0, 8490.0, 5489.0, 3442.0, 2072.0, 1239.0, 756.0, 456.0, 271.0, 170.0, 105.0, 48.0, 28.0, 18.0, 13.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.671875, -16.146240234375, -15.62060546875, -15.094970703125, -14.5693359375, -14.043701171875, -13.51806640625, -12.992431640625, -12.466796875, -11.941162109375, -11.41552734375, -10.889892578125, -10.3642578125, -9.838623046875, -9.31298828125, -8.787353515625, -8.26171875, -7.736083984375, -7.21044921875, -6.684814453125, -6.1591796875, -5.633544921875, -5.10791015625, -4.582275390625, -4.056640625, -3.531005859375, -3.00537109375, -2.479736328125, -1.9541015625, -1.428466796875, -0.90283203125, -0.377197265625, 0.1484375, 0.674072265625, 1.19970703125, 1.725341796875, 2.2509765625, 2.776611328125, 3.30224609375, 3.827880859375, 4.353515625, 4.879150390625, 5.40478515625, 5.930419921875, 6.4560546875, 6.981689453125, 7.50732421875, 8.032958984375, 8.55859375, 9.084228515625, 9.60986328125, 10.135498046875, 10.6611328125, 11.186767578125, 11.71240234375, 12.238037109375, 12.763671875, 13.289306640625, 13.81494140625, 14.340576171875, 14.8662109375, 15.391845703125, 15.91748046875, 16.443115234375, 16.96875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 6.0, 5.0, 5.0, 2.0, 9.0, 12.0, 13.0, 8.0, 13.0, 21.0, 10.0, 24.0, 23.0, 30.0, 32.0, 32.0, 35.0, 35.0, 38.0, 40.0, 43.0, 45.0, 43.0, 32.0, 38.0, 31.0, 33.0, 26.0, 25.0, 33.0, 35.0, 21.0, 28.0, 31.0, 18.0, 21.0, 14.0, 23.0, 10.0, 12.0, 11.0, 6.0, 10.0, 7.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.859375, -24.078125, -23.296875, -22.515625, -21.734375, -20.953125, -20.171875, -19.390625, -18.609375, -17.828125, -17.046875, -16.265625, -15.484375, -14.703125, -13.921875, -13.140625, -12.359375, -11.578125, -10.796875, -10.015625, -9.234375, -8.453125, -7.671875, -6.890625, -6.109375, -5.328125, -4.546875, -3.765625, -2.984375, -2.203125, -1.421875, -0.640625, 0.140625, 0.921875, 1.703125, 2.484375, 3.265625, 4.046875, 4.828125, 5.609375, 6.390625, 7.171875, 7.953125, 8.734375, 9.515625, 10.296875, 11.078125, 11.859375, 12.640625, 13.421875, 14.203125, 14.984375, 15.765625, 16.546875, 17.328125, 18.109375, 18.890625, 19.671875, 20.453125, 21.234375, 22.015625, 22.796875, 23.578125, 24.359375, 25.140625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 10.0, 8.0, 7.0, 21.0, 31.0, 64.0, 68.0, 143.0, 227.0, 424.0, 666.0, 1133.0, 1924.0, 3111.0, 5063.0, 8168.0, 12665.0, 19241.0, 28297.0, 39535.0, 54166.0, 68685.0, 83473.0, 95016.0, 101788.0, 101645.0, 95405.0, 83840.0, 68650.0, 53946.0, 40072.0, 28558.0, 18990.0, 12620.0, 8089.0, 5029.0, 3086.0, 1867.0, 1127.0, 657.0, 414.0, 254.0, 137.0, 94.0, 49.0, 39.0, 23.0, 10.0, 14.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.546875, -17.98486328125, -17.4228515625, -16.86083984375, -16.298828125, -15.73681640625, -15.1748046875, -14.61279296875, -14.05078125, -13.48876953125, -12.9267578125, -12.36474609375, -11.802734375, -11.24072265625, -10.6787109375, -10.11669921875, -9.5546875, -8.99267578125, -8.4306640625, -7.86865234375, -7.306640625, -6.74462890625, -6.1826171875, -5.62060546875, -5.05859375, -4.49658203125, -3.9345703125, -3.37255859375, -2.810546875, -2.24853515625, -1.6865234375, -1.12451171875, -0.5625, -0.00048828125, 0.5615234375, 1.12353515625, 1.685546875, 2.24755859375, 2.8095703125, 3.37158203125, 3.93359375, 4.49560546875, 5.0576171875, 5.61962890625, 6.181640625, 6.74365234375, 7.3056640625, 7.86767578125, 8.4296875, 8.99169921875, 9.5537109375, 10.11572265625, 10.677734375, 11.23974609375, 11.8017578125, 12.36376953125, 12.92578125, 13.48779296875, 14.0498046875, 14.61181640625, 15.173828125, 15.73583984375, 16.2978515625, 16.85986328125, 17.421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 0.0, 5.0, 8.0, 8.0, 13.0, 11.0, 9.0, 17.0, 18.0, 24.0, 29.0, 38.0, 45.0, 33.0, 44.0, 40.0, 48.0, 30.0, 52.0, 48.0, 38.0, 65.0, 42.0, 35.0, 47.0, 36.0, 39.0, 19.0, 29.0, 22.0, 23.0, 18.0, 14.0, 16.0, 9.0, 6.0, 6.0, 6.0, 6.0, 2.0, 3.0, 4.0, 0.0, 5.0, 1.0, 0.0, 1.0], "bins": [-22.90625, -22.280029296875, -21.65380859375, -21.027587890625, -20.4013671875, -19.775146484375, -19.14892578125, -18.522705078125, -17.896484375, -17.270263671875, -16.64404296875, -16.017822265625, -15.3916015625, -14.765380859375, -14.13916015625, -13.512939453125, -12.88671875, -12.260498046875, -11.63427734375, -11.008056640625, -10.3818359375, -9.755615234375, -9.12939453125, -8.503173828125, -7.876953125, -7.250732421875, -6.62451171875, -5.998291015625, -5.3720703125, -4.745849609375, -4.11962890625, -3.493408203125, -2.8671875, -2.240966796875, -1.61474609375, -0.988525390625, -0.3623046875, 0.263916015625, 0.89013671875, 1.516357421875, 2.142578125, 2.768798828125, 3.39501953125, 4.021240234375, 4.6474609375, 5.273681640625, 5.89990234375, 6.526123046875, 7.15234375, 7.778564453125, 8.40478515625, 9.031005859375, 9.6572265625, 10.283447265625, 10.90966796875, 11.535888671875, 12.162109375, 12.788330078125, 13.41455078125, 14.040771484375, 14.6669921875, 15.293212890625, 15.91943359375, 16.545654296875, 17.171875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 2.0, 6.0, 4.0, 15.0, 25.0, 48.0, 82.0, 129.0, 230.0, 482.0, 897.0, 1712.0, 3644.0, 7633.0, 16150.0, 33337.0, 63050.0, 106247.0, 152951.0, 182008.0, 171860.0, 131889.0, 84051.0, 46486.0, 23614.0, 11448.0, 5365.0, 2547.0, 1238.0, 630.0, 339.0, 186.0, 88.0, 61.0, 43.0, 23.0, 12.0, 6.0, 9.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.65625, -13.2122802734375, -12.768310546875, -12.3243408203125, -11.88037109375, -11.4364013671875, -10.992431640625, -10.5484619140625, -10.1044921875, -9.6605224609375, -9.216552734375, -8.7725830078125, -8.32861328125, -7.8846435546875, -7.440673828125, -6.9967041015625, -6.552734375, -6.1087646484375, -5.664794921875, -5.2208251953125, -4.77685546875, -4.3328857421875, -3.888916015625, -3.4449462890625, -3.0009765625, -2.5570068359375, -2.113037109375, -1.6690673828125, -1.22509765625, -0.7811279296875, -0.337158203125, 0.1068115234375, 0.55078125, 0.9947509765625, 1.438720703125, 1.8826904296875, 2.32666015625, 2.7706298828125, 3.214599609375, 3.6585693359375, 4.1025390625, 4.5465087890625, 4.990478515625, 5.4344482421875, 5.87841796875, 6.3223876953125, 6.766357421875, 7.2103271484375, 7.654296875, 8.0982666015625, 8.542236328125, 8.9862060546875, 9.43017578125, 9.8741455078125, 10.318115234375, 10.7620849609375, 11.2060546875, 11.6500244140625, 12.093994140625, 12.5379638671875, 12.98193359375, 13.4259033203125, 13.869873046875, 14.3138427734375, 14.7578125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 8.0, 6.0, 6.0, 11.0, 14.0, 15.0, 19.0, 39.0, 34.0, 38.0, 55.0, 67.0, 62.0, 68.0, 83.0, 69.0, 66.0, 57.0, 57.0, 47.0, 43.0, 27.0, 22.0, 16.0, 26.0, 11.0, 11.0, 10.0, 3.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013408660888671875, -0.0012922883033752441, -0.0012437105178833008, -0.0011951327323913574, -0.001146554946899414, -0.0010979771614074707, -0.0010493993759155273, -0.001000821590423584, -0.0009522438049316406, -0.0009036660194396973, -0.0008550882339477539, -0.0008065104484558105, -0.0007579326629638672, -0.0007093548774719238, -0.0006607770919799805, -0.0006121993064880371, -0.0005636215209960938, -0.0005150437355041504, -0.00046646595001220703, -0.00041788816452026367, -0.0003693103790283203, -0.00032073259353637695, -0.0002721548080444336, -0.00022357702255249023, -0.00017499923706054688, -0.00012642145156860352, -7.784366607666016e-05, -2.9265880584716797e-05, 1.9311904907226562e-05, 6.788969039916992e-05, 0.00011646747589111328, 0.00016504526138305664, 0.000213623046875, 0.00026220083236694336, 0.0003107786178588867, 0.0003593564033508301, 0.00040793418884277344, 0.0004565119743347168, 0.0005050897598266602, 0.0005536675453186035, 0.0006022453308105469, 0.0006508231163024902, 0.0006994009017944336, 0.000747978687286377, 0.0007965564727783203, 0.0008451342582702637, 0.000893712043762207, 0.0009422898292541504, 0.0009908676147460938, 0.0010394454002380371, 0.0010880231857299805, 0.0011366009712219238, 0.0011851787567138672, 0.0012337565422058105, 0.001282334327697754, 0.0013309121131896973, 0.0013794898986816406, 0.001428067684173584, 0.0014766454696655273, 0.0015252232551574707, 0.001573801040649414, 0.0016223788261413574, 0.0016709566116333008, 0.0017195343971252441, 0.0017681121826171875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 10.0, 10.0, 15.0, 41.0, 45.0, 77.0, 109.0, 168.0, 282.0, 474.0, 711.0, 1257.0, 2310.0, 3746.0, 6595.0, 11161.0, 18977.0, 31323.0, 50499.0, 76615.0, 105347.0, 129943.0, 141536.0, 133966.0, 111056.0, 81863.0, 55207.0, 34786.0, 21015.0, 12245.0, 7090.0, 4121.0, 2410.0, 1403.0, 855.0, 472.0, 292.0, 187.0, 119.0, 73.0, 39.0, 41.0, 26.0, 11.0, 11.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-12.6171875, -12.2301025390625, -11.843017578125, -11.4559326171875, -11.06884765625, -10.6817626953125, -10.294677734375, -9.9075927734375, -9.5205078125, -9.1334228515625, -8.746337890625, -8.3592529296875, -7.97216796875, -7.5850830078125, -7.197998046875, -6.8109130859375, -6.423828125, -6.0367431640625, -5.649658203125, -5.2625732421875, -4.87548828125, -4.4884033203125, -4.101318359375, -3.7142333984375, -3.3271484375, -2.9400634765625, -2.552978515625, -2.1658935546875, -1.77880859375, -1.3917236328125, -1.004638671875, -0.6175537109375, -0.23046875, 0.1566162109375, 0.543701171875, 0.9307861328125, 1.31787109375, 1.7049560546875, 2.092041015625, 2.4791259765625, 2.8662109375, 3.2532958984375, 3.640380859375, 4.0274658203125, 4.41455078125, 4.8016357421875, 5.188720703125, 5.5758056640625, 5.962890625, 6.3499755859375, 6.737060546875, 7.1241455078125, 7.51123046875, 7.8983154296875, 8.285400390625, 8.6724853515625, 9.0595703125, 9.4466552734375, 9.833740234375, 10.2208251953125, 10.60791015625, 10.9949951171875, 11.382080078125, 11.7691650390625, 12.15625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 3.0, 7.0, 8.0, 10.0, 16.0, 14.0, 13.0, 20.0, 21.0, 35.0, 36.0, 35.0, 44.0, 49.0, 41.0, 48.0, 53.0, 53.0, 68.0, 54.0, 47.0, 40.0, 49.0, 39.0, 33.0, 28.0, 27.0, 22.0, 20.0, 11.0, 8.0, 12.0, 5.0, 9.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-5.296875, -5.1484375, -5.0, -4.8515625, -4.703125, -4.5546875, -4.40625, -4.2578125, -4.109375, -3.9609375, -3.8125, -3.6640625, -3.515625, -3.3671875, -3.21875, -3.0703125, -2.921875, -2.7734375, -2.625, -2.4765625, -2.328125, -2.1796875, -2.03125, -1.8828125, -1.734375, -1.5859375, -1.4375, -1.2890625, -1.140625, -0.9921875, -0.84375, -0.6953125, -0.546875, -0.3984375, -0.25, -0.1015625, 0.046875, 0.1953125, 0.34375, 0.4921875, 0.640625, 0.7890625, 0.9375, 1.0859375, 1.234375, 1.3828125, 1.53125, 1.6796875, 1.828125, 1.9765625, 2.125, 2.2734375, 2.421875, 2.5703125, 2.71875, 2.8671875, 3.015625, 3.1640625, 3.3125, 3.4609375, 3.609375, 3.7578125, 3.90625, 4.0546875, 4.203125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 6.0, 1.0, 2.0, 6.0, 10.0, 13.0, 19.0, 11.0, 23.0, 28.0, 20.0, 22.0, 25.0, 28.0, 37.0, 30.0, 28.0, 34.0, 44.0, 54.0, 52.0, 39.0, 37.0, 35.0, 44.0, 30.0, 29.0, 26.0, 37.0, 29.0, 30.0, 23.0, 18.0, 14.0, 21.0, 18.0, 15.0, 11.0, 12.0, 9.0, 5.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.296188354492188, -25.5085506439209, -24.72091293334961, -23.933277130126953, -23.145639419555664, -22.358001708984375, -21.570363998413086, -20.782726287841797, -19.99509048461914, -19.20745277404785, -18.419815063476562, -17.632179260253906, -16.844541549682617, -16.056903839111328, -15.269266128540039, -14.48162841796875, -13.693990707397461, -12.906352996826172, -12.1187162399292, -11.33107852935791, -10.543441772460938, -9.755804061889648, -8.96816635131836, -8.18052864074707, -7.392891883850098, -6.605254650115967, -5.817617416381836, -5.029979705810547, -4.242342472076416, -3.454705238342285, -2.667067527770996, -1.8794302940368652, -1.0917930603027344, -0.30415570735931396, 0.48348164558410645, 1.2711191177368164, 2.0587563514709473, 2.846393585205078, 3.634031295776367, 4.421668529510498, 5.209305763244629, 5.99694299697876, 6.784580230712891, 7.57221794128418, 8.359855651855469, 9.147492408752441, 9.93513011932373, 10.722766876220703, 11.510404586791992, 12.298042297363281, 13.085679054260254, 13.873316764831543, 14.660953521728516, 15.448591232299805, 16.236228942871094, 17.023866653442383, 17.811504364013672, 18.59914207458496, 19.38677978515625, 20.174415588378906, 20.962053298950195, 21.749691009521484, 22.537328720092773, 23.324966430664062, 24.11260223388672]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 9.0, 9.0, 4.0, 5.0, 9.0, 10.0, 9.0, 12.0, 16.0, 19.0, 19.0, 39.0, 22.0, 32.0, 24.0, 25.0, 29.0, 40.0, 34.0, 38.0, 42.0, 45.0, 41.0, 37.0, 41.0, 40.0, 34.0, 31.0, 21.0, 25.0, 28.0, 39.0, 23.0, 37.0, 20.0, 13.0, 11.0, 5.0, 13.0, 7.0, 8.0, 13.0, 7.0, 6.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-26.40523910522461, -25.58992576599121, -24.774612426757812, -23.95929718017578, -23.143983840942383, -22.328670501708984, -21.513357162475586, -20.698043823242188, -19.882728576660156, -19.067415237426758, -18.25210189819336, -17.436786651611328, -16.62147331237793, -15.806159973144531, -14.990846633911133, -14.175533294677734, -13.360219955444336, -12.544906616210938, -11.729592323303223, -10.914278984069824, -10.09896469116211, -9.283651351928711, -8.468338012695312, -7.653024196624756, -6.837710380554199, -6.022396564483643, -5.207082748413086, -4.3917694091796875, -3.576455593109131, -2.761141777038574, -1.9458284378051758, -1.1305146217346191, -0.3151988983154297, 0.5001147985458374, 1.3154284954071045, 2.130742073059082, 2.9460558891296387, 3.7613697052001953, 4.576683044433594, 5.39199686050415, 6.207310676574707, 7.022624492645264, 7.83793830871582, 8.653251647949219, 9.468564987182617, 10.283879280090332, 11.09919261932373, 11.914506912231445, 12.729820251464844, 13.545133590698242, 14.360447883605957, 15.175761222839355, 15.99107551574707, 16.80638885498047, 17.621702194213867, 18.437015533447266, 19.252330780029297, 20.067644119262695, 20.882957458496094, 21.698272705078125, 22.513586044311523, 23.328899383544922, 24.14421272277832, 24.95952606201172, 25.774839401245117]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 12.0, 18.0, 32.0, 45.0, 71.0, 138.0, 213.0, 396.0, 674.0, 1135.0, 1830.0, 3146.0, 5011.0, 8019.0, 12919.0, 20525.0, 31115.0, 47136.0, 69333.0, 98692.0, 136732.0, 182577.0, 233325.0, 283903.0, 330689.0, 365677.0, 378214.0, 372988.0, 346517.0, 303477.0, 253627.0, 201898.0, 153807.0, 113166.0, 79633.0, 54925.0, 37096.0, 24070.0, 15774.0, 10014.0, 6013.0, 3781.0, 2334.0, 1433.0, 904.0, 515.0, 297.0, 171.0, 110.0, 72.0, 36.0, 16.0, 17.0, 9.0, 2.0, 3.0], "bins": [-18.828125, -18.2855224609375, -17.742919921875, -17.2003173828125, -16.65771484375, -16.1151123046875, -15.572509765625, -15.0299072265625, -14.4873046875, -13.9447021484375, -13.402099609375, -12.8594970703125, -12.31689453125, -11.7742919921875, -11.231689453125, -10.6890869140625, -10.146484375, -9.6038818359375, -9.061279296875, -8.5186767578125, -7.97607421875, -7.4334716796875, -6.890869140625, -6.3482666015625, -5.8056640625, -5.2630615234375, -4.720458984375, -4.1778564453125, -3.63525390625, -3.0926513671875, -2.550048828125, -2.0074462890625, -1.46484375, -0.9222412109375, -0.379638671875, 0.1629638671875, 0.70556640625, 1.2481689453125, 1.790771484375, 2.3333740234375, 2.8759765625, 3.4185791015625, 3.961181640625, 4.5037841796875, 5.04638671875, 5.5889892578125, 6.131591796875, 6.6741943359375, 7.216796875, 7.7593994140625, 8.302001953125, 8.8446044921875, 9.38720703125, 9.9298095703125, 10.472412109375, 11.0150146484375, 11.5576171875, 12.1002197265625, 12.642822265625, 13.1854248046875, 13.72802734375, 14.2706298828125, 14.813232421875, 15.3558349609375, 15.8984375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 9.0, 7.0, 6.0, 7.0, 5.0, 8.0, 7.0, 12.0, 17.0, 19.0, 16.0, 28.0, 38.0, 29.0, 24.0, 32.0, 20.0, 39.0, 37.0, 30.0, 39.0, 33.0, 54.0, 35.0, 44.0, 36.0, 43.0, 30.0, 23.0, 20.0, 28.0, 30.0, 31.0, 30.0, 30.0, 21.0, 11.0, 7.0, 11.0, 8.0, 10.0, 7.0, 12.0, 6.0, 4.0, 5.0, 3.0, 0.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-22.90625, -22.1845703125, -21.462890625, -20.7412109375, -20.01953125, -19.2978515625, -18.576171875, -17.8544921875, -17.1328125, -16.4111328125, -15.689453125, -14.9677734375, -14.24609375, -13.5244140625, -12.802734375, -12.0810546875, -11.359375, -10.6376953125, -9.916015625, -9.1943359375, -8.47265625, -7.7509765625, -7.029296875, -6.3076171875, -5.5859375, -4.8642578125, -4.142578125, -3.4208984375, -2.69921875, -1.9775390625, -1.255859375, -0.5341796875, 0.1875, 0.9091796875, 1.630859375, 2.3525390625, 3.07421875, 3.7958984375, 4.517578125, 5.2392578125, 5.9609375, 6.6826171875, 7.404296875, 8.1259765625, 8.84765625, 9.5693359375, 10.291015625, 11.0126953125, 11.734375, 12.4560546875, 13.177734375, 13.8994140625, 14.62109375, 15.3427734375, 16.064453125, 16.7861328125, 17.5078125, 18.2294921875, 18.951171875, 19.6728515625, 20.39453125, 21.1162109375, 21.837890625, 22.5595703125, 23.28125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 6.0, 10.0, 21.0, 32.0, 53.0, 116.0, 180.0, 312.0, 532.0, 924.0, 1492.0, 2603.0, 3919.0, 6599.0, 10187.0, 15887.0, 24582.0, 36339.0, 53094.0, 75578.0, 102651.0, 137646.0, 176701.0, 218070.0, 260707.0, 297696.0, 326412.0, 340483.0, 340821.0, 326533.0, 297773.0, 262461.0, 219250.0, 178227.0, 138210.0, 103690.0, 74990.0, 53658.0, 37047.0, 24913.0, 16449.0, 10648.0, 6493.0, 4065.0, 2477.0, 1600.0, 873.0, 571.0, 316.0, 170.0, 88.0, 51.0, 52.0, 18.0, 10.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.1875, -16.63330078125, -16.0791015625, -15.52490234375, -14.970703125, -14.41650390625, -13.8623046875, -13.30810546875, -12.75390625, -12.19970703125, -11.6455078125, -11.09130859375, -10.537109375, -9.98291015625, -9.4287109375, -8.87451171875, -8.3203125, -7.76611328125, -7.2119140625, -6.65771484375, -6.103515625, -5.54931640625, -4.9951171875, -4.44091796875, -3.88671875, -3.33251953125, -2.7783203125, -2.22412109375, -1.669921875, -1.11572265625, -0.5615234375, -0.00732421875, 0.546875, 1.10107421875, 1.6552734375, 2.20947265625, 2.763671875, 3.31787109375, 3.8720703125, 4.42626953125, 4.98046875, 5.53466796875, 6.0888671875, 6.64306640625, 7.197265625, 7.75146484375, 8.3056640625, 8.85986328125, 9.4140625, 9.96826171875, 10.5224609375, 11.07666015625, 11.630859375, 12.18505859375, 12.7392578125, 13.29345703125, 13.84765625, 14.40185546875, 14.9560546875, 15.51025390625, 16.064453125, 16.61865234375, 17.1728515625, 17.72705078125, 18.28125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 8.0, 8.0, 9.0, 13.0, 23.0, 21.0, 21.0, 40.0, 46.0, 61.0, 69.0, 71.0, 87.0, 93.0, 94.0, 129.0, 170.0, 156.0, 182.0, 195.0, 163.0, 202.0, 187.0, 190.0, 199.0, 154.0, 186.0, 171.0, 147.0, 141.0, 126.0, 135.0, 93.0, 89.0, 84.0, 56.0, 53.0, 46.0, 35.0, 32.0, 22.0, 12.0, 15.0, 12.0, 10.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-11.3125, -10.968994140625, -10.62548828125, -10.281982421875, -9.9384765625, -9.594970703125, -9.25146484375, -8.907958984375, -8.564453125, -8.220947265625, -7.87744140625, -7.533935546875, -7.1904296875, -6.846923828125, -6.50341796875, -6.159912109375, -5.81640625, -5.472900390625, -5.12939453125, -4.785888671875, -4.4423828125, -4.098876953125, -3.75537109375, -3.411865234375, -3.068359375, -2.724853515625, -2.38134765625, -2.037841796875, -1.6943359375, -1.350830078125, -1.00732421875, -0.663818359375, -0.3203125, 0.023193359375, 0.36669921875, 0.710205078125, 1.0537109375, 1.397216796875, 1.74072265625, 2.084228515625, 2.427734375, 2.771240234375, 3.11474609375, 3.458251953125, 3.8017578125, 4.145263671875, 4.48876953125, 4.832275390625, 5.17578125, 5.519287109375, 5.86279296875, 6.206298828125, 6.5498046875, 6.893310546875, 7.23681640625, 7.580322265625, 7.923828125, 8.267333984375, 8.61083984375, 8.954345703125, 9.2978515625, 9.641357421875, 9.98486328125, 10.328369140625, 10.671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 9.0, 9.0, 13.0, 24.0, 17.0, 17.0, 20.0, 28.0, 28.0, 30.0, 29.0, 50.0, 40.0, 39.0, 39.0, 55.0, 58.0, 51.0, 38.0, 43.0, 42.0, 34.0, 37.0, 38.0, 29.0, 28.0, 35.0, 13.0, 24.0, 14.0, 9.0, 8.0, 14.0, 15.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.165422439575195, -30.222684860229492, -29.279945373535156, -28.337207794189453, -27.39447021484375, -26.451732635498047, -25.508995056152344, -24.566255569458008, -23.623517990112305, -22.6807804107666, -21.738040924072266, -20.795303344726562, -19.85256576538086, -18.909828186035156, -17.967090606689453, -17.024351119995117, -16.081613540649414, -15.138875961303711, -14.196137428283691, -13.253398895263672, -12.310661315917969, -11.367923736572266, -10.425185203552246, -9.482446670532227, -8.539709091186523, -7.596971035003662, -6.654232978820801, -5.7114949226379395, -4.768756866455078, -3.826018810272217, -2.8832807540893555, -1.9405426979064941, -0.9978065490722656, -0.0550684928894043, 0.887669563293457, 1.8304076194763184, 2.7731456756591797, 3.715883731842041, 4.658621788024902, 5.601359844207764, 6.544097900390625, 7.486835956573486, 8.429574012756348, 9.372312545776367, 10.31505012512207, 11.257787704467773, 12.200526237487793, 13.143264770507812, 14.086002349853516, 15.028739929199219, 15.971478462219238, 16.914216995239258, 17.85695457458496, 18.799692153930664, 19.742431640625, 20.685169219970703, 21.627906799316406, 22.57064437866211, 23.513381958007812, 24.45612144470215, 25.39885902404785, 26.341596603393555, 27.28433609008789, 28.227073669433594, 29.169811248779297]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 8.0, 9.0, 5.0, 8.0, 12.0, 12.0, 15.0, 13.0, 24.0, 12.0, 19.0, 29.0, 19.0, 36.0, 36.0, 29.0, 42.0, 35.0, 45.0, 38.0, 34.0, 47.0, 38.0, 37.0, 32.0, 38.0, 39.0, 27.0, 27.0, 32.0, 26.0, 23.0, 18.0, 14.0, 16.0, 14.0, 23.0, 19.0, 15.0, 6.0, 7.0, 8.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-26.97835350036621, -26.145578384399414, -25.312803268432617, -24.480030059814453, -23.647254943847656, -22.81447982788086, -21.981704711914062, -21.148929595947266, -20.31615447998047, -19.483379364013672, -18.650604248046875, -17.817829132080078, -16.985055923461914, -16.152280807495117, -15.31950569152832, -14.486730575561523, -13.65395736694336, -12.821182250976562, -11.988408088684082, -11.155632972717285, -10.322858810424805, -9.490083694458008, -8.657308578491211, -7.824533939361572, -6.991759300231934, -6.158984661102295, -5.326210021972656, -4.493434906005859, -3.6606602668762207, -2.827885627746582, -1.9951105117797852, -1.1623358726501465, -0.329559326171875, 0.5032154321670532, 1.3359901905059814, 2.168765068054199, 3.001539707183838, 3.8343143463134766, 4.667089462280273, 5.499864101409912, 6.332638740539551, 7.1654133796691895, 7.998188018798828, 8.830963134765625, 9.663738250732422, 10.496512413024902, 11.3292875289917, 12.16206169128418, 12.994836807250977, 13.827611923217773, 14.660386085510254, 15.49316120147705, 16.32593536376953, 17.158710479736328, 17.991485595703125, 18.824260711669922, 19.65703582763672, 20.489810943603516, 21.322586059570312, 22.15536117553711, 22.988134384155273, 23.82090950012207, 24.653684616088867, 25.486459732055664, 26.319232940673828]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 10.0, 17.0, 17.0, 28.0, 31.0, 78.0, 88.0, 155.0, 184.0, 268.0, 435.0, 616.0, 962.0, 1484.0, 2287.0, 3499.0, 5482.0, 8988.0, 14002.0, 23156.0, 36385.0, 56449.0, 83436.0, 114822.0, 139948.0, 145925.0, 127230.0, 96760.0, 66761.0, 43965.0, 27918.0, 17468.0, 10724.0, 6708.0, 4245.0, 2726.0, 1785.0, 1154.0, 799.0, 515.0, 326.0, 221.0, 152.0, 111.0, 79.0, 52.0, 43.0, 16.0, 13.0, 9.0, 15.0, 3.0, 3.0, 5.0, 3.0], "bins": [-7.5234375, -7.30352783203125, -7.0836181640625, -6.86370849609375, -6.643798828125, -6.42388916015625, -6.2039794921875, -5.98406982421875, -5.76416015625, -5.54425048828125, -5.3243408203125, -5.10443115234375, -4.884521484375, -4.66461181640625, -4.4447021484375, -4.22479248046875, -4.0048828125, -3.78497314453125, -3.5650634765625, -3.34515380859375, -3.125244140625, -2.90533447265625, -2.6854248046875, -2.46551513671875, -2.24560546875, -2.02569580078125, -1.8057861328125, -1.58587646484375, -1.365966796875, -1.14605712890625, -0.9261474609375, -0.70623779296875, -0.486328125, -0.26641845703125, -0.0465087890625, 0.17340087890625, 0.393310546875, 0.61322021484375, 0.8331298828125, 1.05303955078125, 1.27294921875, 1.49285888671875, 1.7127685546875, 1.93267822265625, 2.152587890625, 2.37249755859375, 2.5924072265625, 2.81231689453125, 3.0322265625, 3.25213623046875, 3.4720458984375, 3.69195556640625, 3.911865234375, 4.13177490234375, 4.3516845703125, 4.57159423828125, 4.79150390625, 5.01141357421875, 5.2313232421875, 5.45123291015625, 5.671142578125, 5.89105224609375, 6.1109619140625, 6.33087158203125, 6.55078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 8.0, 9.0, 5.0, 6.0, 14.0, 8.0, 17.0, 13.0, 24.0, 13.0, 18.0, 31.0, 18.0, 35.0, 35.0, 28.0, 41.0, 39.0, 42.0, 39.0, 37.0, 46.0, 37.0, 38.0, 29.0, 39.0, 39.0, 29.0, 26.0, 33.0, 25.0, 23.0, 17.0, 15.0, 17.0, 15.0, 20.0, 19.0, 16.0, 7.0, 8.0, 8.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-26.9375, -26.10498046875, -25.2724609375, -24.43994140625, -23.607421875, -22.77490234375, -21.9423828125, -21.10986328125, -20.27734375, -19.44482421875, -18.6123046875, -17.77978515625, -16.947265625, -16.11474609375, -15.2822265625, -14.44970703125, -13.6171875, -12.78466796875, -11.9521484375, -11.11962890625, -10.287109375, -9.45458984375, -8.6220703125, -7.78955078125, -6.95703125, -6.12451171875, -5.2919921875, -4.45947265625, -3.626953125, -2.79443359375, -1.9619140625, -1.12939453125, -0.296875, 0.53564453125, 1.3681640625, 2.20068359375, 3.033203125, 3.86572265625, 4.6982421875, 5.53076171875, 6.36328125, 7.19580078125, 8.0283203125, 8.86083984375, 9.693359375, 10.52587890625, 11.3583984375, 12.19091796875, 13.0234375, 13.85595703125, 14.6884765625, 15.52099609375, 16.353515625, 17.18603515625, 18.0185546875, 18.85107421875, 19.68359375, 20.51611328125, 21.3486328125, 22.18115234375, 23.013671875, 23.84619140625, 24.6787109375, 25.51123046875, 26.34375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 11.0, 13.0, 20.0, 38.0, 39.0, 67.0, 102.0, 107.0, 148.0, 289.0, 412.0, 630.0, 1038.0, 1696.0, 2723.0, 4838.0, 8859.0, 18277.0, 40279.0, 96205.0, 227295.0, 320512.0, 184003.0, 75671.0, 32027.0, 14921.0, 7671.0, 4204.0, 2361.0, 1458.0, 924.0, 585.0, 375.0, 227.0, 167.0, 122.0, 55.0, 52.0, 40.0, 34.0, 15.0, 16.0, 3.0, 6.0, 8.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-10.65625, -10.3270263671875, -9.997802734375, -9.6685791015625, -9.33935546875, -9.0101318359375, -8.680908203125, -8.3516845703125, -8.0224609375, -7.6932373046875, -7.364013671875, -7.0347900390625, -6.70556640625, -6.3763427734375, -6.047119140625, -5.7178955078125, -5.388671875, -5.0594482421875, -4.730224609375, -4.4010009765625, -4.07177734375, -3.7425537109375, -3.413330078125, -3.0841064453125, -2.7548828125, -2.4256591796875, -2.096435546875, -1.7672119140625, -1.43798828125, -1.1087646484375, -0.779541015625, -0.4503173828125, -0.12109375, 0.2081298828125, 0.537353515625, 0.8665771484375, 1.19580078125, 1.5250244140625, 1.854248046875, 2.1834716796875, 2.5126953125, 2.8419189453125, 3.171142578125, 3.5003662109375, 3.82958984375, 4.1588134765625, 4.488037109375, 4.8172607421875, 5.146484375, 5.4757080078125, 5.804931640625, 6.1341552734375, 6.46337890625, 6.7926025390625, 7.121826171875, 7.4510498046875, 7.7802734375, 8.1094970703125, 8.438720703125, 8.7679443359375, 9.09716796875, 9.4263916015625, 9.755615234375, 10.0848388671875, 10.4140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 9.0, 7.0, 9.0, 15.0, 12.0, 17.0, 19.0, 36.0, 18.0, 19.0, 26.0, 23.0, 35.0, 51.0, 39.0, 35.0, 45.0, 31.0, 41.0, 38.0, 30.0, 40.0, 50.0, 43.0, 40.0, 42.0, 39.0, 18.0, 16.0, 26.0, 29.0, 20.0, 10.0, 17.0, 10.0, 16.0, 2.0, 10.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-19.734375, -19.1822509765625, -18.630126953125, -18.0780029296875, -17.52587890625, -16.9737548828125, -16.421630859375, -15.8695068359375, -15.3173828125, -14.7652587890625, -14.213134765625, -13.6610107421875, -13.10888671875, -12.5567626953125, -12.004638671875, -11.4525146484375, -10.900390625, -10.3482666015625, -9.796142578125, -9.2440185546875, -8.69189453125, -8.1397705078125, -7.587646484375, -7.0355224609375, -6.4833984375, -5.9312744140625, -5.379150390625, -4.8270263671875, -4.27490234375, -3.7227783203125, -3.170654296875, -2.6185302734375, -2.06640625, -1.5142822265625, -0.962158203125, -0.4100341796875, 0.14208984375, 0.6942138671875, 1.246337890625, 1.7984619140625, 2.3505859375, 2.9027099609375, 3.454833984375, 4.0069580078125, 4.55908203125, 5.1112060546875, 5.663330078125, 6.2154541015625, 6.767578125, 7.3197021484375, 7.871826171875, 8.4239501953125, 8.97607421875, 9.5281982421875, 10.080322265625, 10.6324462890625, 11.1845703125, 11.7366943359375, 12.288818359375, 12.8409423828125, 13.39306640625, 13.9451904296875, 14.497314453125, 15.0494384765625, 15.6015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 9.0, 10.0, 8.0, 23.0, 23.0, 31.0, 54.0, 65.0, 84.0, 147.0, 207.0, 309.0, 417.0, 687.0, 1056.0, 1771.0, 3088.0, 5660.0, 10891.0, 23703.0, 61845.0, 230671.0, 481613.0, 144120.0, 44116.0, 18037.0, 8670.0, 4490.0, 2502.0, 1485.0, 926.0, 578.0, 396.0, 262.0, 199.0, 138.0, 87.0, 50.0, 41.0, 24.0, 18.0, 8.0, 14.0, 4.0, 3.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.3046875, -8.0396728515625, -7.774658203125, -7.5096435546875, -7.24462890625, -6.9796142578125, -6.714599609375, -6.4495849609375, -6.1845703125, -5.9195556640625, -5.654541015625, -5.3895263671875, -5.12451171875, -4.8594970703125, -4.594482421875, -4.3294677734375, -4.064453125, -3.7994384765625, -3.534423828125, -3.2694091796875, -3.00439453125, -2.7393798828125, -2.474365234375, -2.2093505859375, -1.9443359375, -1.6793212890625, -1.414306640625, -1.1492919921875, -0.88427734375, -0.6192626953125, -0.354248046875, -0.0892333984375, 0.17578125, 0.4407958984375, 0.705810546875, 0.9708251953125, 1.23583984375, 1.5008544921875, 1.765869140625, 2.0308837890625, 2.2958984375, 2.5609130859375, 2.825927734375, 3.0909423828125, 3.35595703125, 3.6209716796875, 3.885986328125, 4.1510009765625, 4.416015625, 4.6810302734375, 4.946044921875, 5.2110595703125, 5.47607421875, 5.7410888671875, 6.006103515625, 6.2711181640625, 6.5361328125, 6.8011474609375, 7.066162109375, 7.3311767578125, 7.59619140625, 7.8612060546875, 8.126220703125, 8.3912353515625, 8.65625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 8.0, 3.0, 4.0, 11.0, 16.0, 23.0, 36.0, 35.0, 37.0, 34.0, 31.0, 46.0, 65.0, 63.0, 77.0, 60.0, 56.0, 72.0, 47.0, 52.0, 41.0, 37.0, 37.0, 21.0, 28.0, 12.0, 17.0, 9.0, 11.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022339820861816406, -0.00021230056881904602, -0.00020120292901992798, -0.00019010528922080994, -0.0001790076494216919, -0.00016791000962257385, -0.0001568123698234558, -0.00014571473002433777, -0.00013461709022521973, -0.00012351945042610168, -0.00011242181062698364, -0.0001013241708278656, -9.022653102874756e-05, -7.912889122962952e-05, -6.803125143051147e-05, -5.693361163139343e-05, -4.583597183227539e-05, -3.473833203315735e-05, -2.3640692234039307e-05, -1.2543052434921265e-05, -1.4454126358032227e-06, 9.65222716331482e-06, 2.074986696243286e-05, 3.18475067615509e-05, 4.2945146560668945e-05, 5.404278635978699e-05, 6.514042615890503e-05, 7.623806595802307e-05, 8.733570575714111e-05, 9.843334555625916e-05, 0.0001095309853553772, 0.00012062862515449524, 0.00013172626495361328, 0.00014282390475273132, 0.00015392154455184937, 0.0001650191843509674, 0.00017611682415008545, 0.0001872144639492035, 0.00019831210374832153, 0.00020940974354743958, 0.00022050738334655762, 0.00023160502314567566, 0.0002427026629447937, 0.00025380030274391174, 0.0002648979425430298, 0.00027599558234214783, 0.00028709322214126587, 0.0002981908619403839, 0.00030928850173950195, 0.00032038614153862, 0.00033148378133773804, 0.0003425814211368561, 0.0003536790609359741, 0.00036477670073509216, 0.0003758743405342102, 0.00038697198033332825, 0.0003980696201324463, 0.00040916725993156433, 0.0004202648997306824, 0.0004313625395298004, 0.00044246017932891846, 0.0004535578191280365, 0.00046465545892715454, 0.0004757530987262726, 0.0004868507385253906]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 10.0, 14.0, 20.0, 18.0, 27.0, 33.0, 53.0, 59.0, 99.0, 143.0, 194.0, 308.0, 384.0, 642.0, 916.0, 1584.0, 2449.0, 3978.0, 6587.0, 11270.0, 20818.0, 38503.0, 72630.0, 130963.0, 196796.0, 209977.0, 153393.0, 89365.0, 47723.0, 25163.0, 13926.0, 7869.0, 4612.0, 2795.0, 1825.0, 1114.0, 726.0, 485.0, 328.0, 209.0, 170.0, 115.0, 67.0, 48.0, 42.0, 25.0, 17.0, 17.0, 10.0, 9.0, 9.0, 3.0, 5.0, 4.0, 2.0, 3.0, 2.0], "bins": [-8.3828125, -8.1221923828125, -7.861572265625, -7.6009521484375, -7.34033203125, -7.0797119140625, -6.819091796875, -6.5584716796875, -6.2978515625, -6.0372314453125, -5.776611328125, -5.5159912109375, -5.25537109375, -4.9947509765625, -4.734130859375, -4.4735107421875, -4.212890625, -3.9522705078125, -3.691650390625, -3.4310302734375, -3.17041015625, -2.9097900390625, -2.649169921875, -2.3885498046875, -2.1279296875, -1.8673095703125, -1.606689453125, -1.3460693359375, -1.08544921875, -0.8248291015625, -0.564208984375, -0.3035888671875, -0.04296875, 0.2176513671875, 0.478271484375, 0.7388916015625, 0.99951171875, 1.2601318359375, 1.520751953125, 1.7813720703125, 2.0419921875, 2.3026123046875, 2.563232421875, 2.8238525390625, 3.08447265625, 3.3450927734375, 3.605712890625, 3.8663330078125, 4.126953125, 4.3875732421875, 4.648193359375, 4.9088134765625, 5.16943359375, 5.4300537109375, 5.690673828125, 5.9512939453125, 6.2119140625, 6.4725341796875, 6.733154296875, 6.9937744140625, 7.25439453125, 7.5150146484375, 7.775634765625, 8.0362548828125, 8.296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 3.0, 11.0, 5.0, 3.0, 18.0, 8.0, 14.0, 14.0, 20.0, 37.0, 37.0, 48.0, 54.0, 68.0, 70.0, 72.0, 62.0, 85.0, 50.0, 61.0, 40.0, 42.0, 32.0, 19.0, 23.0, 21.0, 14.0, 7.0, 13.0, 11.0, 11.0, 4.0, 10.0, 0.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.99609375, -2.90826416015625, -2.8204345703125, -2.73260498046875, -2.644775390625, -2.55694580078125, -2.4691162109375, -2.38128662109375, -2.29345703125, -2.20562744140625, -2.1177978515625, -2.02996826171875, -1.942138671875, -1.85430908203125, -1.7664794921875, -1.67864990234375, -1.5908203125, -1.50299072265625, -1.4151611328125, -1.32733154296875, -1.239501953125, -1.15167236328125, -1.0638427734375, -0.97601318359375, -0.88818359375, -0.80035400390625, -0.7125244140625, -0.62469482421875, -0.536865234375, -0.44903564453125, -0.3612060546875, -0.27337646484375, -0.185546875, -0.09771728515625, -0.0098876953125, 0.07794189453125, 0.165771484375, 0.25360107421875, 0.3414306640625, 0.42926025390625, 0.51708984375, 0.60491943359375, 0.6927490234375, 0.78057861328125, 0.868408203125, 0.95623779296875, 1.0440673828125, 1.13189697265625, 1.2197265625, 1.30755615234375, 1.3953857421875, 1.48321533203125, 1.571044921875, 1.65887451171875, 1.7467041015625, 1.83453369140625, 1.92236328125, 2.01019287109375, 2.0980224609375, 2.18585205078125, 2.273681640625, 2.36151123046875, 2.4493408203125, 2.53717041015625, 2.625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 9.0, 8.0, 9.0, 20.0, 16.0, 21.0, 21.0, 23.0, 23.0, 30.0, 34.0, 29.0, 54.0, 47.0, 32.0, 44.0, 64.0, 45.0, 44.0, 41.0, 43.0, 44.0, 33.0, 34.0, 40.0, 28.0, 33.0, 26.0, 13.0, 21.0, 8.0, 10.0, 15.0, 9.0, 12.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.470264434814453, -30.52984046936035, -29.58941650390625, -28.64899253845215, -27.708568572998047, -26.768142700195312, -25.827720642089844, -24.88729476928711, -23.946870803833008, -23.006446838378906, -22.066022872924805, -21.125598907470703, -20.1851749420166, -19.2447509765625, -18.304325103759766, -17.363901138305664, -16.423477172851562, -15.483053207397461, -14.54262924194336, -13.602205276489258, -12.66178035736084, -11.721356391906738, -10.780932426452637, -9.840507507324219, -8.90008544921875, -7.959661483764648, -7.019237041473389, -6.078813076019287, -5.138388633728027, -4.197964668273926, -3.257540702819824, -2.3171162605285645, -1.3766918182373047, -0.4362676739692688, 0.5041564702987671, 1.4445805549621582, 2.385004758834839, 3.3254289627075195, 4.265852928161621, 5.206277370452881, 6.146701335906982, 7.087125301361084, 8.027549743652344, 8.967973709106445, 9.908397674560547, 10.848821640014648, 11.78924560546875, 12.729670524597168, 13.67009449005127, 14.610518455505371, 15.550942420959473, 16.49136734008789, 17.431791305541992, 18.372215270996094, 19.312639236450195, 20.253063201904297, 21.1934871673584, 22.1339111328125, 23.0743350982666, 24.014759063720703, 24.955183029174805, 25.895606994628906, 26.83603286743164, 27.776456832885742, 28.716880798339844]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 7.0, 4.0, 8.0, 8.0, 7.0, 11.0, 7.0, 15.0, 12.0, 23.0, 17.0, 18.0, 21.0, 27.0, 29.0, 37.0, 31.0, 41.0, 33.0, 40.0, 42.0, 34.0, 46.0, 38.0, 34.0, 35.0, 38.0, 39.0, 29.0, 26.0, 27.0, 34.0, 23.0, 25.0, 11.0, 16.0, 18.0, 19.0, 18.0, 16.0, 13.0, 8.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-27.368040084838867, -26.532081604003906, -25.696123123168945, -24.860164642333984, -24.024206161499023, -23.188247680664062, -22.3522891998291, -21.51633071899414, -20.68037223815918, -19.84441375732422, -19.008455276489258, -18.172496795654297, -17.336538314819336, -16.500579833984375, -15.664621353149414, -14.828662872314453, -13.992705345153809, -13.156746864318848, -12.320788383483887, -11.484829902648926, -10.648871421813965, -9.81291389465332, -8.97695541381836, -8.140996932983398, -7.305037975311279, -6.469079494476318, -5.633121013641357, -4.797163009643555, -3.9612042903900146, -3.125246047973633, -2.289287567138672, -1.453329086303711, -0.61737060546875, 0.21858781576156616, 1.0545462369918823, 1.8905045986175537, 2.7264630794525146, 3.5624213218688965, 4.398379802703857, 5.234338283538818, 6.070296764373779, 6.90625524520874, 7.742213726043701, 8.578171730041504, 9.414130210876465, 10.250088691711426, 11.086047172546387, 11.922005653381348, 12.757964134216309, 13.59392261505127, 14.42988109588623, 15.265839576721191, 16.101797103881836, 16.937755584716797, 17.773714065551758, 18.60967254638672, 19.44563102722168, 20.28158950805664, 21.1175479888916, 21.953506469726562, 22.789464950561523, 23.625423431396484, 24.461381912231445, 25.297340393066406, 26.133298873901367]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 15.0, 30.0, 52.0, 55.0, 152.0, 185.0, 345.0, 509.0, 868.0, 1421.0, 2304.0, 3619.0, 5615.0, 8447.0, 12601.0, 17982.0, 25563.0, 34325.0, 45300.0, 57325.0, 68928.0, 78624.0, 86293.0, 89564.0, 89553.0, 83989.0, 75304.0, 64224.0, 52650.0, 41393.0, 30952.0, 22610.0, 16169.0, 11281.0, 7448.0, 4774.0, 2968.0, 1883.0, 1222.0, 806.0, 449.0, 297.0, 178.0, 93.0, 71.0, 37.0, 34.0, 23.0, 10.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.984375, -15.4658203125, -14.947265625, -14.4287109375, -13.91015625, -13.3916015625, -12.873046875, -12.3544921875, -11.8359375, -11.3173828125, -10.798828125, -10.2802734375, -9.76171875, -9.2431640625, -8.724609375, -8.2060546875, -7.6875, -7.1689453125, -6.650390625, -6.1318359375, -5.61328125, -5.0947265625, -4.576171875, -4.0576171875, -3.5390625, -3.0205078125, -2.501953125, -1.9833984375, -1.46484375, -0.9462890625, -0.427734375, 0.0908203125, 0.609375, 1.1279296875, 1.646484375, 2.1650390625, 2.68359375, 3.2021484375, 3.720703125, 4.2392578125, 4.7578125, 5.2763671875, 5.794921875, 6.3134765625, 6.83203125, 7.3505859375, 7.869140625, 8.3876953125, 8.90625, 9.4248046875, 9.943359375, 10.4619140625, 10.98046875, 11.4990234375, 12.017578125, 12.5361328125, 13.0546875, 13.5732421875, 14.091796875, 14.6103515625, 15.12890625, 15.6474609375, 16.166015625, 16.6845703125, 17.203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 7.0, 3.0, 8.0, 7.0, 7.0, 12.0, 7.0, 16.0, 12.0, 22.0, 17.0, 18.0, 22.0, 25.0, 29.0, 38.0, 32.0, 40.0, 35.0, 40.0, 39.0, 35.0, 47.0, 36.0, 33.0, 34.0, 40.0, 40.0, 26.0, 28.0, 30.0, 30.0, 26.0, 21.0, 15.0, 16.0, 16.0, 19.0, 19.0, 16.0, 12.0, 8.0, 3.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-26.625, -25.8115234375, -24.998046875, -24.1845703125, -23.37109375, -22.5576171875, -21.744140625, -20.9306640625, -20.1171875, -19.3037109375, -18.490234375, -17.6767578125, -16.86328125, -16.0498046875, -15.236328125, -14.4228515625, -13.609375, -12.7958984375, -11.982421875, -11.1689453125, -10.35546875, -9.5419921875, -8.728515625, -7.9150390625, -7.1015625, -6.2880859375, -5.474609375, -4.6611328125, -3.84765625, -3.0341796875, -2.220703125, -1.4072265625, -0.59375, 0.2197265625, 1.033203125, 1.8466796875, 2.66015625, 3.4736328125, 4.287109375, 5.1005859375, 5.9140625, 6.7275390625, 7.541015625, 8.3544921875, 9.16796875, 9.9814453125, 10.794921875, 11.6083984375, 12.421875, 13.2353515625, 14.048828125, 14.8623046875, 15.67578125, 16.4892578125, 17.302734375, 18.1162109375, 18.9296875, 19.7431640625, 20.556640625, 21.3701171875, 22.18359375, 22.9970703125, 23.810546875, 24.6240234375, 25.4375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 0.0, 7.0, 5.0, 14.0, 15.0, 28.0, 38.0, 66.0, 92.0, 162.0, 278.0, 403.0, 639.0, 996.0, 1634.0, 2543.0, 3792.0, 5891.0, 8877.0, 12890.0, 18374.0, 25356.0, 34072.0, 44810.0, 55645.0, 66968.0, 77205.0, 84211.0, 87824.0, 88189.0, 83424.0, 75339.0, 64835.0, 53633.0, 42063.0, 32041.0, 23659.0, 17165.0, 11855.0, 7976.0, 5527.0, 3561.0, 2386.0, 1532.0, 944.0, 596.0, 352.0, 254.0, 134.0, 103.0, 60.0, 40.0, 33.0, 13.0, 6.0, 6.0, 4.0, 0.0, 3.0, 1.0], "bins": [-16.734375, -16.2257080078125, -15.717041015625, -15.2083740234375, -14.69970703125, -14.1910400390625, -13.682373046875, -13.1737060546875, -12.6650390625, -12.1563720703125, -11.647705078125, -11.1390380859375, -10.63037109375, -10.1217041015625, -9.613037109375, -9.1043701171875, -8.595703125, -8.0870361328125, -7.578369140625, -7.0697021484375, -6.56103515625, -6.0523681640625, -5.543701171875, -5.0350341796875, -4.5263671875, -4.0177001953125, -3.509033203125, -3.0003662109375, -2.49169921875, -1.9830322265625, -1.474365234375, -0.9656982421875, -0.45703125, 0.0516357421875, 0.560302734375, 1.0689697265625, 1.57763671875, 2.0863037109375, 2.594970703125, 3.1036376953125, 3.6123046875, 4.1209716796875, 4.629638671875, 5.1383056640625, 5.64697265625, 6.1556396484375, 6.664306640625, 7.1729736328125, 7.681640625, 8.1903076171875, 8.698974609375, 9.2076416015625, 9.71630859375, 10.2249755859375, 10.733642578125, 11.2423095703125, 11.7509765625, 12.2596435546875, 12.768310546875, 13.2769775390625, 13.78564453125, 14.2943115234375, 14.802978515625, 15.3116455078125, 15.8203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 7.0, 8.0, 13.0, 6.0, 8.0, 19.0, 23.0, 21.0, 19.0, 25.0, 28.0, 35.0, 42.0, 44.0, 46.0, 49.0, 39.0, 48.0, 42.0, 65.0, 48.0, 41.0, 42.0, 41.0, 31.0, 31.0, 36.0, 37.0, 20.0, 20.0, 15.0, 12.0, 10.0, 4.0, 6.0, 4.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.921875, -18.25830078125, -17.5947265625, -16.93115234375, -16.267578125, -15.60400390625, -14.9404296875, -14.27685546875, -13.61328125, -12.94970703125, -12.2861328125, -11.62255859375, -10.958984375, -10.29541015625, -9.6318359375, -8.96826171875, -8.3046875, -7.64111328125, -6.9775390625, -6.31396484375, -5.650390625, -4.98681640625, -4.3232421875, -3.65966796875, -2.99609375, -2.33251953125, -1.6689453125, -1.00537109375, -0.341796875, 0.32177734375, 0.9853515625, 1.64892578125, 2.3125, 2.97607421875, 3.6396484375, 4.30322265625, 4.966796875, 5.63037109375, 6.2939453125, 6.95751953125, 7.62109375, 8.28466796875, 8.9482421875, 9.61181640625, 10.275390625, 10.93896484375, 11.6025390625, 12.26611328125, 12.9296875, 13.59326171875, 14.2568359375, 14.92041015625, 15.583984375, 16.24755859375, 16.9111328125, 17.57470703125, 18.23828125, 18.90185546875, 19.5654296875, 20.22900390625, 20.892578125, 21.55615234375, 22.2197265625, 22.88330078125, 23.546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 9.0, 7.0, 12.0, 21.0, 26.0, 31.0, 51.0, 83.0, 90.0, 177.0, 270.0, 445.0, 731.0, 1138.0, 1959.0, 3181.0, 5309.0, 8914.0, 15264.0, 24384.0, 38801.0, 57175.0, 80471.0, 102918.0, 120236.0, 126588.0, 120066.0, 103346.0, 79720.0, 57358.0, 38352.0, 24308.0, 14739.0, 8997.0, 5273.0, 3236.0, 1873.0, 1100.0, 658.0, 423.0, 280.0, 215.0, 106.0, 69.0, 59.0, 28.0, 21.0, 16.0, 12.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.15625, -9.833740234375, -9.51123046875, -9.188720703125, -8.8662109375, -8.543701171875, -8.22119140625, -7.898681640625, -7.576171875, -7.253662109375, -6.93115234375, -6.608642578125, -6.2861328125, -5.963623046875, -5.64111328125, -5.318603515625, -4.99609375, -4.673583984375, -4.35107421875, -4.028564453125, -3.7060546875, -3.383544921875, -3.06103515625, -2.738525390625, -2.416015625, -2.093505859375, -1.77099609375, -1.448486328125, -1.1259765625, -0.803466796875, -0.48095703125, -0.158447265625, 0.1640625, 0.486572265625, 0.80908203125, 1.131591796875, 1.4541015625, 1.776611328125, 2.09912109375, 2.421630859375, 2.744140625, 3.066650390625, 3.38916015625, 3.711669921875, 4.0341796875, 4.356689453125, 4.67919921875, 5.001708984375, 5.32421875, 5.646728515625, 5.96923828125, 6.291748046875, 6.6142578125, 6.936767578125, 7.25927734375, 7.581787109375, 7.904296875, 8.226806640625, 8.54931640625, 8.871826171875, 9.1943359375, 9.516845703125, 9.83935546875, 10.161865234375, 10.484375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 4.0, 3.0, 8.0, 6.0, 12.0, 11.0, 11.0, 14.0, 18.0, 21.0, 21.0, 27.0, 21.0, 32.0, 25.0, 35.0, 36.0, 30.0, 41.0, 36.0, 42.0, 44.0, 27.0, 56.0, 49.0, 36.0, 31.0, 34.0, 19.0, 34.0, 36.0, 22.0, 34.0, 18.0, 17.0, 12.0, 12.0, 12.0, 10.0, 4.0, 11.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0009489059448242188, -0.0009185820817947388, -0.0008882582187652588, -0.0008579343557357788, -0.0008276104927062988, -0.0007972866296768188, -0.0007669627666473389, -0.0007366389036178589, -0.0007063150405883789, -0.0006759911775588989, -0.0006456673145294189, -0.000615343451499939, -0.000585019588470459, -0.000554695725440979, -0.000524371862411499, -0.000494047999382019, -0.00046372413635253906, -0.0004334002733230591, -0.0004030764102935791, -0.0003727525472640991, -0.00034242868423461914, -0.00031210482120513916, -0.0002817809581756592, -0.0002514570951461792, -0.00022113323211669922, -0.00019080936908721924, -0.00016048550605773926, -0.00013016164302825928, -9.98377799987793e-05, -6.951391696929932e-05, -3.9190053939819336e-05, -8.866190910339355e-06, 2.1457672119140625e-05, 5.1781535148620605e-05, 8.210539817810059e-05, 0.00011242926120758057, 0.00014275312423706055, 0.00017307698726654053, 0.0002034008502960205, 0.0002337247133255005, 0.00026404857635498047, 0.00029437243938446045, 0.00032469630241394043, 0.0003550201654434204, 0.0003853440284729004, 0.00041566789150238037, 0.00044599175453186035, 0.00047631561756134033, 0.0005066394805908203, 0.0005369633436203003, 0.0005672872066497803, 0.0005976110696792603, 0.0006279349327087402, 0.0006582587957382202, 0.0006885826587677002, 0.0007189065217971802, 0.0007492303848266602, 0.0007795542478561401, 0.0008098781108856201, 0.0008402019739151001, 0.0008705258369445801, 0.0009008496999740601, 0.00093117356300354, 0.00096149742603302, 0.0009918212890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 5.0, 6.0, 12.0, 13.0, 29.0, 31.0, 55.0, 61.0, 95.0, 155.0, 240.0, 376.0, 570.0, 884.0, 1343.0, 2081.0, 3192.0, 5072.0, 7622.0, 11605.0, 17784.0, 25481.0, 35867.0, 49337.0, 64711.0, 79771.0, 92910.0, 101402.0, 102841.0, 97665.0, 85849.0, 71493.0, 56545.0, 41699.0, 29979.0, 21053.0, 13920.0, 9370.0, 6102.0, 3958.0, 2594.0, 1656.0, 1133.0, 658.0, 454.0, 292.0, 195.0, 125.0, 87.0, 52.0, 39.0, 32.0, 24.0, 16.0, 8.0, 5.0, 6.0, 4.0], "bins": [-10.5546875, -10.246337890625, -9.93798828125, -9.629638671875, -9.3212890625, -9.012939453125, -8.70458984375, -8.396240234375, -8.087890625, -7.779541015625, -7.47119140625, -7.162841796875, -6.8544921875, -6.546142578125, -6.23779296875, -5.929443359375, -5.62109375, -5.312744140625, -5.00439453125, -4.696044921875, -4.3876953125, -4.079345703125, -3.77099609375, -3.462646484375, -3.154296875, -2.845947265625, -2.53759765625, -2.229248046875, -1.9208984375, -1.612548828125, -1.30419921875, -0.995849609375, -0.6875, -0.379150390625, -0.07080078125, 0.237548828125, 0.5458984375, 0.854248046875, 1.16259765625, 1.470947265625, 1.779296875, 2.087646484375, 2.39599609375, 2.704345703125, 3.0126953125, 3.321044921875, 3.62939453125, 3.937744140625, 4.24609375, 4.554443359375, 4.86279296875, 5.171142578125, 5.4794921875, 5.787841796875, 6.09619140625, 6.404541015625, 6.712890625, 7.021240234375, 7.32958984375, 7.637939453125, 7.9462890625, 8.254638671875, 8.56298828125, 8.871337890625, 9.1796875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 3.0, 4.0, 3.0, 14.0, 6.0, 11.0, 21.0, 27.0, 19.0, 20.0, 21.0, 33.0, 43.0, 44.0, 51.0, 61.0, 58.0, 42.0, 44.0, 60.0, 57.0, 45.0, 39.0, 31.0, 31.0, 29.0, 34.0, 31.0, 20.0, 20.0, 12.0, 18.0, 11.0, 9.0, 8.0, 7.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.3203125, -4.17437744140625, -4.0284423828125, -3.88250732421875, -3.736572265625, -3.59063720703125, -3.4447021484375, -3.29876708984375, -3.15283203125, -3.00689697265625, -2.8609619140625, -2.71502685546875, -2.569091796875, -2.42315673828125, -2.2772216796875, -2.13128662109375, -1.9853515625, -1.83941650390625, -1.6934814453125, -1.54754638671875, -1.401611328125, -1.25567626953125, -1.1097412109375, -0.96380615234375, -0.81787109375, -0.67193603515625, -0.5260009765625, -0.38006591796875, -0.234130859375, -0.08819580078125, 0.0577392578125, 0.20367431640625, 0.349609375, 0.49554443359375, 0.6414794921875, 0.78741455078125, 0.933349609375, 1.07928466796875, 1.2252197265625, 1.37115478515625, 1.51708984375, 1.66302490234375, 1.8089599609375, 1.95489501953125, 2.100830078125, 2.24676513671875, 2.3927001953125, 2.53863525390625, 2.6845703125, 2.83050537109375, 2.9764404296875, 3.12237548828125, 3.268310546875, 3.41424560546875, 3.5601806640625, 3.70611572265625, 3.85205078125, 3.99798583984375, 4.1439208984375, 4.28985595703125, 4.435791015625, 4.58172607421875, 4.7276611328125, 4.87359619140625, 5.01953125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 9.0, 13.0, 10.0, 20.0, 20.0, 20.0, 32.0, 34.0, 37.0, 34.0, 44.0, 54.0, 48.0, 56.0, 46.0, 48.0, 48.0, 50.0, 58.0, 38.0, 51.0, 39.0, 28.0, 26.0, 28.0, 22.0, 21.0, 11.0, 17.0, 12.0, 7.0, 5.0, 5.0, 2.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.083290100097656, -36.036983489990234, -34.99068069458008, -33.944374084472656, -32.8980712890625, -31.85176658630371, -30.805461883544922, -29.7591552734375, -28.712852478027344, -27.666547775268555, -26.620243072509766, -25.573938369750977, -24.527633666992188, -23.4813289642334, -22.43502426147461, -21.388717651367188, -20.3424129486084, -19.29610824584961, -18.24980354309082, -17.20349884033203, -16.157194137573242, -15.110889434814453, -14.064583778381348, -13.018279075622559, -11.97197437286377, -10.92566967010498, -9.879364967346191, -8.833059310913086, -7.786755084991455, -6.740450382232666, -5.694145202636719, -4.64784049987793, -3.6015357971191406, -2.5552310943603516, -1.5089261531829834, -0.46262121200561523, 0.5836834907531738, 1.629988193511963, 2.67629337310791, 3.722598075866699, 4.768902778625488, 5.815207481384277, 6.861512184143066, 7.907817363739014, 8.954122543334961, 10.00042724609375, 11.046731948852539, 12.093036651611328, 13.139341354370117, 14.185646057128906, 15.231950759887695, 16.278255462646484, 17.324560165405273, 18.370864868164062, 19.417171478271484, 20.46347427368164, 21.509780883789062, 22.55608558654785, 23.60239028930664, 24.64869499206543, 25.69499969482422, 26.741304397583008, 27.787609100341797, 28.83391571044922, 29.880218505859375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 10.0, 9.0, 11.0, 16.0, 13.0, 9.0, 11.0, 27.0, 20.0, 17.0, 29.0, 18.0, 32.0, 26.0, 33.0, 34.0, 43.0, 29.0, 32.0, 41.0, 46.0, 48.0, 45.0, 48.0, 37.0, 35.0, 36.0, 29.0, 32.0, 21.0, 29.0, 20.0, 15.0, 20.0, 17.0, 16.0, 11.0, 6.0, 9.0, 6.0, 3.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.72342300415039, -27.80643653869629, -26.889450073242188, -25.972463607788086, -25.055477142333984, -24.13848876953125, -23.22150230407715, -22.304515838623047, -21.387529373168945, -20.470542907714844, -19.553556442260742, -18.63656997680664, -17.719581604003906, -16.802597045898438, -15.885608673095703, -14.968622207641602, -14.0516357421875, -13.134649276733398, -12.217662811279297, -11.300675392150879, -10.383688926696777, -9.466702461242676, -8.549715042114258, -7.632728576660156, -6.715742111206055, -5.798755645751953, -4.881768703460693, -3.9647819995880127, -3.047795295715332, -2.1308088302612305, -1.2138218879699707, -0.29683494567871094, 0.6201515197753906, 1.5371382236480713, 2.454124927520752, 3.3711116313934326, 4.288098335266113, 5.205084800720215, 6.122071743011475, 7.039058685302734, 7.956045150756836, 8.873031616210938, 9.790018081665039, 10.707005500793457, 11.623991966247559, 12.54097843170166, 13.457965850830078, 14.37495231628418, 15.291938781738281, 16.208925247192383, 17.125911712646484, 18.042898178100586, 18.959884643554688, 19.876873016357422, 20.793859481811523, 21.710845947265625, 22.627832412719727, 23.544818878173828, 24.46180534362793, 25.37879180908203, 26.295780181884766, 27.212764739990234, 28.12975311279297, 29.04673957824707, 29.963726043701172]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 6.0, 9.0, 21.0, 36.0, 56.0, 73.0, 174.0, 296.0, 454.0, 838.0, 1491.0, 2342.0, 3887.0, 6342.0, 10007.0, 16208.0, 25037.0, 38971.0, 57470.0, 84472.0, 119302.0, 162530.0, 211630.0, 264146.0, 314522.0, 355121.0, 377694.0, 381237.0, 361870.0, 325560.0, 276141.0, 223604.0, 172891.0, 127875.0, 91264.0, 63308.0, 42400.0, 27920.0, 18063.0, 11303.0, 7002.0, 4259.0, 2597.0, 1600.0, 885.0, 565.0, 332.0, 209.0, 121.0, 67.0, 38.0, 20.0, 9.0, 11.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.8125, -17.239990234375, -16.66748046875, -16.094970703125, -15.5224609375, -14.949951171875, -14.37744140625, -13.804931640625, -13.232421875, -12.659912109375, -12.08740234375, -11.514892578125, -10.9423828125, -10.369873046875, -9.79736328125, -9.224853515625, -8.65234375, -8.079833984375, -7.50732421875, -6.934814453125, -6.3623046875, -5.789794921875, -5.21728515625, -4.644775390625, -4.072265625, -3.499755859375, -2.92724609375, -2.354736328125, -1.7822265625, -1.209716796875, -0.63720703125, -0.064697265625, 0.5078125, 1.080322265625, 1.65283203125, 2.225341796875, 2.7978515625, 3.370361328125, 3.94287109375, 4.515380859375, 5.087890625, 5.660400390625, 6.23291015625, 6.805419921875, 7.3779296875, 7.950439453125, 8.52294921875, 9.095458984375, 9.66796875, 10.240478515625, 10.81298828125, 11.385498046875, 11.9580078125, 12.530517578125, 13.10302734375, 13.675537109375, 14.248046875, 14.820556640625, 15.39306640625, 15.965576171875, 16.5380859375, 17.110595703125, 17.68310546875, 18.255615234375, 18.828125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 11.0, 9.0, 19.0, 8.0, 14.0, 12.0, 22.0, 22.0, 19.0, 24.0, 24.0, 28.0, 29.0, 28.0, 36.0, 38.0, 37.0, 27.0, 52.0, 36.0, 48.0, 55.0, 32.0, 48.0, 34.0, 29.0, 39.0, 23.0, 24.0, 27.0, 24.0, 16.0, 21.0, 19.0, 12.0, 10.0, 7.0, 9.0, 7.0, 5.0, 2.0, 4.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.671875, -24.85595703125, -24.0400390625, -23.22412109375, -22.408203125, -21.59228515625, -20.7763671875, -19.96044921875, -19.14453125, -18.32861328125, -17.5126953125, -16.69677734375, -15.880859375, -15.06494140625, -14.2490234375, -13.43310546875, -12.6171875, -11.80126953125, -10.9853515625, -10.16943359375, -9.353515625, -8.53759765625, -7.7216796875, -6.90576171875, -6.08984375, -5.27392578125, -4.4580078125, -3.64208984375, -2.826171875, -2.01025390625, -1.1943359375, -0.37841796875, 0.4375, 1.25341796875, 2.0693359375, 2.88525390625, 3.701171875, 4.51708984375, 5.3330078125, 6.14892578125, 6.96484375, 7.78076171875, 8.5966796875, 9.41259765625, 10.228515625, 11.04443359375, 11.8603515625, 12.67626953125, 13.4921875, 14.30810546875, 15.1240234375, 15.93994140625, 16.755859375, 17.57177734375, 18.3876953125, 19.20361328125, 20.01953125, 20.83544921875, 21.6513671875, 22.46728515625, 23.283203125, 24.09912109375, 24.9150390625, 25.73095703125, 26.546875]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 13.0, 13.0, 18.0, 33.0, 66.0, 118.0, 221.0, 373.0, 695.0, 1162.0, 1911.0, 3156.0, 4719.0, 8091.0, 12256.0, 18793.0, 28505.0, 41605.0, 59078.0, 83076.0, 110702.0, 144903.0, 182580.0, 222605.0, 261385.0, 294722.0, 318347.0, 332010.0, 329612.0, 315427.0, 288049.0, 253835.0, 214278.0, 175485.0, 137171.0, 104725.0, 76445.0, 55838.0, 38627.0, 26232.0, 17308.0, 11282.0, 7251.0, 4529.0, 2746.0, 1722.0, 1063.0, 656.0, 374.0, 195.0, 133.0, 77.0, 37.0, 11.0, 11.0, 12.0, 6.0, 1.0, 2.0, 0.0, 1.0], "bins": [-17.09375, -16.54052734375, -15.9873046875, -15.43408203125, -14.880859375, -14.32763671875, -13.7744140625, -13.22119140625, -12.66796875, -12.11474609375, -11.5615234375, -11.00830078125, -10.455078125, -9.90185546875, -9.3486328125, -8.79541015625, -8.2421875, -7.68896484375, -7.1357421875, -6.58251953125, -6.029296875, -5.47607421875, -4.9228515625, -4.36962890625, -3.81640625, -3.26318359375, -2.7099609375, -2.15673828125, -1.603515625, -1.05029296875, -0.4970703125, 0.05615234375, 0.609375, 1.16259765625, 1.7158203125, 2.26904296875, 2.822265625, 3.37548828125, 3.9287109375, 4.48193359375, 5.03515625, 5.58837890625, 6.1416015625, 6.69482421875, 7.248046875, 7.80126953125, 8.3544921875, 8.90771484375, 9.4609375, 10.01416015625, 10.5673828125, 11.12060546875, 11.673828125, 12.22705078125, 12.7802734375, 13.33349609375, 13.88671875, 14.43994140625, 14.9931640625, 15.54638671875, 16.099609375, 16.65283203125, 17.2060546875, 17.75927734375, 18.3125]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 0.0, 5.0, 9.0, 15.0, 17.0, 22.0, 31.0, 23.0, 36.0, 54.0, 59.0, 75.0, 105.0, 109.0, 102.0, 128.0, 145.0, 162.0, 175.0, 167.0, 154.0, 237.0, 195.0, 202.0, 192.0, 187.0, 209.0, 185.0, 160.0, 150.0, 138.0, 108.0, 96.0, 81.0, 61.0, 62.0, 48.0, 37.0, 39.0, 19.0, 19.0, 19.0, 11.0, 11.0, 4.0, 4.0, 7.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.03125, -10.6634521484375, -10.295654296875, -9.9278564453125, -9.56005859375, -9.1922607421875, -8.824462890625, -8.4566650390625, -8.0888671875, -7.7210693359375, -7.353271484375, -6.9854736328125, -6.61767578125, -6.2498779296875, -5.882080078125, -5.5142822265625, -5.146484375, -4.7786865234375, -4.410888671875, -4.0430908203125, -3.67529296875, -3.3074951171875, -2.939697265625, -2.5718994140625, -2.2041015625, -1.8363037109375, -1.468505859375, -1.1007080078125, -0.73291015625, -0.3651123046875, 0.002685546875, 0.3704833984375, 0.73828125, 1.1060791015625, 1.473876953125, 1.8416748046875, 2.20947265625, 2.5772705078125, 2.945068359375, 3.3128662109375, 3.6806640625, 4.0484619140625, 4.416259765625, 4.7840576171875, 5.15185546875, 5.5196533203125, 5.887451171875, 6.2552490234375, 6.623046875, 6.9908447265625, 7.358642578125, 7.7264404296875, 8.09423828125, 8.4620361328125, 8.829833984375, 9.1976318359375, 9.5654296875, 9.9332275390625, 10.301025390625, 10.6688232421875, 11.03662109375, 11.4044189453125, 11.772216796875, 12.1400146484375, 12.5078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 6.0, 5.0, 8.0, 10.0, 7.0, 8.0, 21.0, 14.0, 16.0, 21.0, 23.0, 26.0, 26.0, 20.0, 30.0, 41.0, 54.0, 33.0, 29.0, 27.0, 42.0, 42.0, 31.0, 44.0, 46.0, 38.0, 34.0, 30.0, 26.0, 33.0, 26.0, 27.0, 24.0, 24.0, 16.0, 12.0, 12.0, 9.0, 12.0, 13.0, 7.0, 9.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.968320846557617, -26.146636962890625, -25.324951171875, -24.503267288208008, -23.681583404541016, -22.859899520874023, -22.03821563720703, -21.216529846191406, -20.394845962524414, -19.573162078857422, -18.751476287841797, -17.929792404174805, -17.108108520507812, -16.28642463684082, -15.464739799499512, -14.643054962158203, -13.821371078491211, -12.999687194824219, -12.17800235748291, -11.356317520141602, -10.53463363647461, -9.712949752807617, -8.891264915466309, -8.069580078125, -7.247896194458008, -6.426211833953857, -5.604527473449707, -4.782843112945557, -3.9611587524414062, -3.139474391937256, -2.3177900314331055, -1.496105670928955, -0.6744213104248047, 0.1472630500793457, 0.9689474105834961, 1.7906317710876465, 2.612316131591797, 3.4340004920959473, 4.255684852600098, 5.077369213104248, 5.899053573608398, 6.720737934112549, 7.542422294616699, 8.364107131958008, 9.185791015625, 10.007474899291992, 10.8291597366333, 11.65084457397461, 12.472528457641602, 13.294212341308594, 14.115897178649902, 14.937582015991211, 15.759265899658203, 16.580949783325195, 17.402633666992188, 18.224319458007812, 19.046003341674805, 19.867687225341797, 20.689373016357422, 21.511056900024414, 22.332740783691406, 23.1544246673584, 23.97610855102539, 24.797794342041016, 25.619478225708008]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 6.0, 5.0, 2.0, 6.0, 8.0, 10.0, 6.0, 9.0, 17.0, 12.0, 11.0, 21.0, 17.0, 25.0, 22.0, 30.0, 28.0, 27.0, 32.0, 30.0, 34.0, 31.0, 47.0, 40.0, 42.0, 34.0, 33.0, 29.0, 32.0, 37.0, 35.0, 34.0, 25.0, 24.0, 19.0, 19.0, 15.0, 21.0, 16.0, 23.0, 19.0, 17.0, 3.0, 14.0, 10.0, 9.0, 4.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-24.797746658325195, -23.99693489074707, -23.196123123168945, -22.395309448242188, -21.594497680664062, -20.793685913085938, -19.992874145507812, -19.192062377929688, -18.391250610351562, -17.590438842773438, -16.789627075195312, -15.988814353942871, -15.188002586364746, -14.387189865112305, -13.58637809753418, -12.785566329956055, -11.984753608703613, -11.183941841125488, -10.383129119873047, -9.582317352294922, -8.781505584716797, -7.980693340301514, -7.1798810958862305, -6.3790693283081055, -5.578257083892822, -4.777444839477539, -3.976633071899414, -3.175820827484131, -2.3750088214874268, -1.5741968154907227, -0.7733845710754395, 0.027427196502685547, 0.8282394409179688, 1.6290514469146729, 2.429863452911377, 3.23067569732666, 4.031487464904785, 4.832299709320068, 5.633111953735352, 6.433923721313477, 7.23473596572876, 8.035548210144043, 8.836359977722168, 9.63717269897461, 10.437984466552734, 11.23879623413086, 12.039608001708984, 12.84041976928711, 13.64123249053955, 14.442044258117676, 15.242856979370117, 16.043668746948242, 16.844480514526367, 17.645292282104492, 18.44610595703125, 19.246917724609375, 20.0477294921875, 20.848541259765625, 21.64935302734375, 22.450164794921875, 23.250978469848633, 24.051790237426758, 24.852602005004883, 25.653413772583008, 26.454225540161133]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 11.0, 8.0, 18.0, 23.0, 41.0, 66.0, 105.0, 153.0, 239.0, 316.0, 536.0, 774.0, 1190.0, 1767.0, 2806.0, 4439.0, 6916.0, 10819.0, 16784.0, 26227.0, 40712.0, 59675.0, 86063.0, 114397.0, 135351.0, 137085.0, 119674.0, 92198.0, 65912.0, 43668.0, 28910.0, 18562.0, 11710.0, 7629.0, 4827.0, 3139.0, 1967.0, 1314.0, 816.0, 538.0, 417.0, 250.0, 161.0, 103.0, 66.0, 62.0, 31.0, 27.0, 16.0, 14.0, 12.0, 6.0, 3.0, 1.0, 6.0, 2.0, 0.0, 1.0], "bins": [-5.9921875, -5.799560546875, -5.60693359375, -5.414306640625, -5.2216796875, -5.029052734375, -4.83642578125, -4.643798828125, -4.451171875, -4.258544921875, -4.06591796875, -3.873291015625, -3.6806640625, -3.488037109375, -3.29541015625, -3.102783203125, -2.91015625, -2.717529296875, -2.52490234375, -2.332275390625, -2.1396484375, -1.947021484375, -1.75439453125, -1.561767578125, -1.369140625, -1.176513671875, -0.98388671875, -0.791259765625, -0.5986328125, -0.406005859375, -0.21337890625, -0.020751953125, 0.171875, 0.364501953125, 0.55712890625, 0.749755859375, 0.9423828125, 1.135009765625, 1.32763671875, 1.520263671875, 1.712890625, 1.905517578125, 2.09814453125, 2.290771484375, 2.4833984375, 2.676025390625, 2.86865234375, 3.061279296875, 3.25390625, 3.446533203125, 3.63916015625, 3.831787109375, 4.0244140625, 4.217041015625, 4.40966796875, 4.602294921875, 4.794921875, 4.987548828125, 5.18017578125, 5.372802734375, 5.5654296875, 5.758056640625, 5.95068359375, 6.143310546875, 6.3359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 6.0, 4.0, 3.0, 6.0, 9.0, 10.0, 6.0, 9.0, 17.0, 11.0, 11.0, 21.0, 16.0, 24.0, 26.0, 26.0, 29.0, 29.0, 31.0, 31.0, 32.0, 34.0, 44.0, 41.0, 43.0, 30.0, 37.0, 26.0, 34.0, 38.0, 34.0, 32.0, 26.0, 25.0, 19.0, 19.0, 14.0, 21.0, 17.0, 22.0, 20.0, 17.0, 2.0, 16.0, 9.0, 8.0, 5.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-24.84375, -24.044189453125, -23.24462890625, -22.445068359375, -21.6455078125, -20.845947265625, -20.04638671875, -19.246826171875, -18.447265625, -17.647705078125, -16.84814453125, -16.048583984375, -15.2490234375, -14.449462890625, -13.64990234375, -12.850341796875, -12.05078125, -11.251220703125, -10.45166015625, -9.652099609375, -8.8525390625, -8.052978515625, -7.25341796875, -6.453857421875, -5.654296875, -4.854736328125, -4.05517578125, -3.255615234375, -2.4560546875, -1.656494140625, -0.85693359375, -0.057373046875, 0.7421875, 1.541748046875, 2.34130859375, 3.140869140625, 3.9404296875, 4.739990234375, 5.53955078125, 6.339111328125, 7.138671875, 7.938232421875, 8.73779296875, 9.537353515625, 10.3369140625, 11.136474609375, 11.93603515625, 12.735595703125, 13.53515625, 14.334716796875, 15.13427734375, 15.933837890625, 16.7333984375, 17.532958984375, 18.33251953125, 19.132080078125, 19.931640625, 20.731201171875, 21.53076171875, 22.330322265625, 23.1298828125, 23.929443359375, 24.72900390625, 25.528564453125, 26.328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 19.0, 15.0, 34.0, 47.0, 59.0, 65.0, 134.0, 184.0, 224.0, 362.0, 514.0, 798.0, 1167.0, 1891.0, 2892.0, 4733.0, 8038.0, 13639.0, 24833.0, 46610.0, 91610.0, 172724.0, 245429.0, 198331.0, 109144.0, 55413.0, 29117.0, 16081.0, 9242.0, 5591.0, 3322.0, 2174.0, 1361.0, 915.0, 584.0, 396.0, 273.0, 191.0, 108.0, 95.0, 57.0, 38.0, 35.0, 24.0, 14.0, 11.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-7.95703125, -7.71319580078125, -7.4693603515625, -7.22552490234375, -6.981689453125, -6.73785400390625, -6.4940185546875, -6.25018310546875, -6.00634765625, -5.76251220703125, -5.5186767578125, -5.27484130859375, -5.031005859375, -4.78717041015625, -4.5433349609375, -4.29949951171875, -4.0556640625, -3.81182861328125, -3.5679931640625, -3.32415771484375, -3.080322265625, -2.83648681640625, -2.5926513671875, -2.34881591796875, -2.10498046875, -1.86114501953125, -1.6173095703125, -1.37347412109375, -1.129638671875, -0.88580322265625, -0.6419677734375, -0.39813232421875, -0.154296875, 0.08953857421875, 0.3333740234375, 0.57720947265625, 0.821044921875, 1.06488037109375, 1.3087158203125, 1.55255126953125, 1.79638671875, 2.04022216796875, 2.2840576171875, 2.52789306640625, 2.771728515625, 3.01556396484375, 3.2593994140625, 3.50323486328125, 3.7470703125, 3.99090576171875, 4.2347412109375, 4.47857666015625, 4.722412109375, 4.96624755859375, 5.2100830078125, 5.45391845703125, 5.69775390625, 5.94158935546875, 6.1854248046875, 6.42926025390625, 6.673095703125, 6.91693115234375, 7.1607666015625, 7.40460205078125, 7.6484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 4.0, 4.0, 1.0, 6.0, 4.0, 9.0, 4.0, 9.0, 6.0, 7.0, 13.0, 15.0, 14.0, 23.0, 18.0, 20.0, 23.0, 25.0, 24.0, 40.0, 34.0, 34.0, 33.0, 37.0, 41.0, 42.0, 52.0, 40.0, 45.0, 49.0, 33.0, 28.0, 45.0, 32.0, 28.0, 26.0, 13.0, 14.0, 26.0, 18.0, 13.0, 16.0, 7.0, 8.0, 2.0, 5.0, 5.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.03125, -16.4697265625, -15.908203125, -15.3466796875, -14.78515625, -14.2236328125, -13.662109375, -13.1005859375, -12.5390625, -11.9775390625, -11.416015625, -10.8544921875, -10.29296875, -9.7314453125, -9.169921875, -8.6083984375, -8.046875, -7.4853515625, -6.923828125, -6.3623046875, -5.80078125, -5.2392578125, -4.677734375, -4.1162109375, -3.5546875, -2.9931640625, -2.431640625, -1.8701171875, -1.30859375, -0.7470703125, -0.185546875, 0.3759765625, 0.9375, 1.4990234375, 2.060546875, 2.6220703125, 3.18359375, 3.7451171875, 4.306640625, 4.8681640625, 5.4296875, 5.9912109375, 6.552734375, 7.1142578125, 7.67578125, 8.2373046875, 8.798828125, 9.3603515625, 9.921875, 10.4833984375, 11.044921875, 11.6064453125, 12.16796875, 12.7294921875, 13.291015625, 13.8525390625, 14.4140625, 14.9755859375, 15.537109375, 16.0986328125, 16.66015625, 17.2216796875, 17.783203125, 18.3447265625, 18.90625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 9.0, 11.0, 11.0, 20.0, 39.0, 59.0, 88.0, 106.0, 169.0, 234.0, 325.0, 506.0, 736.0, 1039.0, 1643.0, 2576.0, 4123.0, 6803.0, 12334.0, 23518.0, 52015.0, 140963.0, 395909.0, 250231.0, 80940.0, 33898.0, 16528.0, 9088.0, 5229.0, 3210.0, 2042.0, 1346.0, 914.0, 583.0, 391.0, 273.0, 212.0, 147.0, 78.0, 70.0, 49.0, 30.0, 21.0, 8.0, 15.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16796875, -5.9736328125, -5.779296875, -5.5849609375, -5.390625, -5.1962890625, -5.001953125, -4.8076171875, -4.61328125, -4.4189453125, -4.224609375, -4.0302734375, -3.8359375, -3.6416015625, -3.447265625, -3.2529296875, -3.05859375, -2.8642578125, -2.669921875, -2.4755859375, -2.28125, -2.0869140625, -1.892578125, -1.6982421875, -1.50390625, -1.3095703125, -1.115234375, -0.9208984375, -0.7265625, -0.5322265625, -0.337890625, -0.1435546875, 0.05078125, 0.2451171875, 0.439453125, 0.6337890625, 0.828125, 1.0224609375, 1.216796875, 1.4111328125, 1.60546875, 1.7998046875, 1.994140625, 2.1884765625, 2.3828125, 2.5771484375, 2.771484375, 2.9658203125, 3.16015625, 3.3544921875, 3.548828125, 3.7431640625, 3.9375, 4.1318359375, 4.326171875, 4.5205078125, 4.71484375, 4.9091796875, 5.103515625, 5.2978515625, 5.4921875, 5.6865234375, 5.880859375, 6.0751953125, 6.26953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 8.0, 7.0, 18.0, 15.0, 12.0, 14.0, 25.0, 27.0, 30.0, 37.0, 42.0, 41.0, 47.0, 40.0, 50.0, 48.0, 57.0, 50.0, 52.0, 40.0, 46.0, 35.0, 58.0, 25.0, 32.0, 21.0, 20.0, 10.0, 13.0, 15.0, 11.0, 7.0, 9.0, 4.0, 3.0, 2.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026988983154296875, -0.0002611801028251648, -0.00025247037410736084, -0.00024376064538955688, -0.00023505091667175293, -0.00022634118795394897, -0.00021763145923614502, -0.00020892173051834106, -0.0002002120018005371, -0.00019150227308273315, -0.0001827925443649292, -0.00017408281564712524, -0.0001653730869293213, -0.00015666335821151733, -0.00014795362949371338, -0.00013924390077590942, -0.00013053417205810547, -0.00012182444334030151, -0.00011311471462249756, -0.0001044049859046936, -9.569525718688965e-05, -8.69855284690857e-05, -7.827579975128174e-05, -6.956607103347778e-05, -6.085634231567383e-05, -5.214661359786987e-05, -4.343688488006592e-05, -3.472715616226196e-05, -2.6017427444458008e-05, -1.7307698726654053e-05, -8.597970008850098e-06, 1.1175870895385742e-07, 8.821487426757812e-06, 1.7531216144561768e-05, 2.6240944862365723e-05, 3.495067358016968e-05, 4.366040229797363e-05, 5.237013101577759e-05, 6.107985973358154e-05, 6.97895884513855e-05, 7.849931716918945e-05, 8.720904588699341e-05, 9.591877460479736e-05, 0.00010462850332260132, 0.00011333823204040527, 0.00012204796075820923, 0.00013075768947601318, 0.00013946741819381714, 0.0001481771469116211, 0.00015688687562942505, 0.000165596604347229, 0.00017430633306503296, 0.00018301606178283691, 0.00019172579050064087, 0.00020043551921844482, 0.00020914524793624878, 0.00021785497665405273, 0.0002265647053718567, 0.00023527443408966064, 0.0002439841628074646, 0.00025269389152526855, 0.0002614036202430725, 0.00027011334896087646, 0.0002788230776786804, 0.0002875328063964844]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 6.0, 5.0, 13.0, 19.0, 18.0, 36.0, 43.0, 76.0, 109.0, 152.0, 226.0, 355.0, 547.0, 859.0, 1307.0, 2058.0, 3340.0, 5324.0, 8606.0, 14619.0, 24187.0, 40833.0, 68561.0, 110616.0, 160068.0, 181987.0, 154767.0, 106107.0, 65751.0, 38805.0, 22985.0, 13871.0, 8515.0, 4948.0, 3214.0, 2008.0, 1288.0, 757.0, 523.0, 339.0, 246.0, 144.0, 109.0, 68.0, 46.0, 34.0, 24.0, 15.0, 10.0, 8.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-6.87890625, -6.67327880859375, -6.4676513671875, -6.26202392578125, -6.056396484375, -5.85076904296875, -5.6451416015625, -5.43951416015625, -5.23388671875, -5.02825927734375, -4.8226318359375, -4.61700439453125, -4.411376953125, -4.20574951171875, -4.0001220703125, -3.79449462890625, -3.5888671875, -3.38323974609375, -3.1776123046875, -2.97198486328125, -2.766357421875, -2.56072998046875, -2.3551025390625, -2.14947509765625, -1.94384765625, -1.73822021484375, -1.5325927734375, -1.32696533203125, -1.121337890625, -0.91571044921875, -0.7100830078125, -0.50445556640625, -0.298828125, -0.09320068359375, 0.1124267578125, 0.31805419921875, 0.523681640625, 0.72930908203125, 0.9349365234375, 1.14056396484375, 1.34619140625, 1.55181884765625, 1.7574462890625, 1.96307373046875, 2.168701171875, 2.37432861328125, 2.5799560546875, 2.78558349609375, 2.9912109375, 3.19683837890625, 3.4024658203125, 3.60809326171875, 3.813720703125, 4.01934814453125, 4.2249755859375, 4.43060302734375, 4.63623046875, 4.84185791015625, 5.0474853515625, 5.25311279296875, 5.458740234375, 5.66436767578125, 5.8699951171875, 6.07562255859375, 6.28125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 11.0, 8.0, 16.0, 14.0, 20.0, 28.0, 48.0, 44.0, 48.0, 62.0, 71.0, 77.0, 86.0, 81.0, 78.0, 68.0, 40.0, 41.0, 31.0, 23.0, 17.0, 8.0, 12.0, 14.0, 10.0, 6.0, 5.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.365234375, -2.28192138671875, -2.1986083984375, -2.11529541015625, -2.031982421875, -1.94866943359375, -1.8653564453125, -1.78204345703125, -1.69873046875, -1.61541748046875, -1.5321044921875, -1.44879150390625, -1.365478515625, -1.28216552734375, -1.1988525390625, -1.11553955078125, -1.0322265625, -0.94891357421875, -0.8656005859375, -0.78228759765625, -0.698974609375, -0.61566162109375, -0.5323486328125, -0.44903564453125, -0.36572265625, -0.28240966796875, -0.1990966796875, -0.11578369140625, -0.032470703125, 0.05084228515625, 0.1341552734375, 0.21746826171875, 0.30078125, 0.38409423828125, 0.4674072265625, 0.55072021484375, 0.634033203125, 0.71734619140625, 0.8006591796875, 0.88397216796875, 0.96728515625, 1.05059814453125, 1.1339111328125, 1.21722412109375, 1.300537109375, 1.38385009765625, 1.4671630859375, 1.55047607421875, 1.6337890625, 1.71710205078125, 1.8004150390625, 1.88372802734375, 1.967041015625, 2.05035400390625, 2.1336669921875, 2.21697998046875, 2.30029296875, 2.38360595703125, 2.4669189453125, 2.55023193359375, 2.633544921875, 2.71685791015625, 2.8001708984375, 2.88348388671875, 2.966796875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 5.0, 8.0, 6.0, 6.0, 6.0, 14.0, 15.0, 12.0, 17.0, 27.0, 21.0, 22.0, 23.0, 24.0, 25.0, 37.0, 50.0, 38.0, 30.0, 29.0, 35.0, 27.0, 47.0, 42.0, 46.0, 44.0, 28.0, 29.0, 24.0, 28.0, 34.0, 26.0, 26.0, 25.0, 17.0, 15.0, 9.0, 14.0, 10.0, 13.0, 13.0, 9.0, 4.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.71864128112793, -24.91893196105957, -24.119220733642578, -23.31951141357422, -22.519800186157227, -21.720090866088867, -20.920379638671875, -20.120670318603516, -19.320960998535156, -18.521251678466797, -17.721540451049805, -16.921831130981445, -16.122119903564453, -15.322410583496094, -14.522700309753418, -13.722990036010742, -12.92327880859375, -12.123568534851074, -11.323858261108398, -10.524148941040039, -9.724437713623047, -8.924728393554688, -8.125018119812012, -7.325307846069336, -6.52559757232666, -5.725887298583984, -4.926177024841309, -4.126467227935791, -3.3267569541931152, -2.5270466804504395, -1.7273368835449219, -0.9276266098022461, -0.1279163360595703, 0.6717938184738159, 1.4715039730072021, 2.271214008331299, 3.0709242820739746, 3.8706345558166504, 4.670344352722168, 5.470054626464844, 6.2697649002075195, 7.069475173950195, 7.869185447692871, 8.668895721435547, 9.468605041503906, 10.268316268920898, 11.068025588989258, 11.867735862731934, 12.66744613647461, 13.467156410217285, 14.266866683959961, 15.06657600402832, 15.866287231445312, 16.665996551513672, 17.46570587158203, 18.265417098999023, 19.065128326416016, 19.864837646484375, 20.664548873901367, 21.464258193969727, 22.26396942138672, 23.063678741455078, 23.863388061523438, 24.66309928894043, 25.46280860900879]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 5.0, 10.0, 8.0, 8.0, 5.0, 13.0, 15.0, 12.0, 10.0, 21.0, 22.0, 28.0, 19.0, 29.0, 32.0, 25.0, 35.0, 30.0, 33.0, 31.0, 49.0, 39.0, 32.0, 32.0, 33.0, 32.0, 41.0, 27.0, 34.0, 29.0, 26.0, 21.0, 23.0, 16.0, 16.0, 18.0, 21.0, 22.0, 17.0, 16.0, 6.0, 10.0, 11.0, 8.0, 7.0, 3.0, 4.0, 3.0, 2.0, 6.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-24.910968780517578, -24.126188278198242, -23.341405868530273, -22.556625366210938, -21.77184295654297, -20.987062454223633, -20.202281951904297, -19.417499542236328, -18.63271713256836, -17.847936630249023, -17.063154220581055, -16.27837371826172, -15.49359130859375, -14.708810806274414, -13.924029350280762, -13.13924789428711, -12.354467391967773, -11.569685935974121, -10.784904479980469, -10.000123977661133, -9.215341567993164, -8.430561065673828, -7.645779609680176, -6.860998153686523, -6.076216697692871, -5.291435241699219, -4.506653785705566, -3.7218728065490723, -2.93709135055542, -2.1523098945617676, -1.3675289154052734, -0.5827474594116211, 0.20203590393066406, 0.9868172407150269, 1.7715985774993896, 2.556379795074463, 3.3411612510681152, 4.125942707061768, 4.910723686218262, 5.695505142211914, 6.480286598205566, 7.265068054199219, 8.049849510192871, 8.834630966186523, 9.61941146850586, 10.404193878173828, 11.188974380493164, 11.973755836486816, 12.758537292480469, 13.543318748474121, 14.328100204467773, 15.11288070678711, 15.897663116455078, 16.682443618774414, 17.46722412109375, 18.25200653076172, 19.036788940429688, 19.821569442749023, 20.606351852416992, 21.391132354736328, 22.175914764404297, 22.960695266723633, 23.74547576904297, 24.530258178710938, 25.315038681030273]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 7.0, 9.0, 22.0, 33.0, 55.0, 90.0, 121.0, 212.0, 359.0, 539.0, 901.0, 1367.0, 2083.0, 3149.0, 4547.0, 6987.0, 10018.0, 14448.0, 19447.0, 26455.0, 34581.0, 43770.0, 53978.0, 63042.0, 71916.0, 78099.0, 82251.0, 81559.0, 79268.0, 73166.0, 64385.0, 55038.0, 45033.0, 36089.0, 27365.0, 20611.0, 14636.0, 10698.0, 7481.0, 5083.0, 3449.0, 2228.0, 1443.0, 966.0, 588.0, 388.0, 242.0, 147.0, 79.0, 55.0, 39.0, 14.0, 12.0, 11.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-13.796875, -13.338134765625, -12.87939453125, -12.420654296875, -11.9619140625, -11.503173828125, -11.04443359375, -10.585693359375, -10.126953125, -9.668212890625, -9.20947265625, -8.750732421875, -8.2919921875, -7.833251953125, -7.37451171875, -6.915771484375, -6.45703125, -5.998291015625, -5.53955078125, -5.080810546875, -4.6220703125, -4.163330078125, -3.70458984375, -3.245849609375, -2.787109375, -2.328369140625, -1.86962890625, -1.410888671875, -0.9521484375, -0.493408203125, -0.03466796875, 0.424072265625, 0.8828125, 1.341552734375, 1.80029296875, 2.259033203125, 2.7177734375, 3.176513671875, 3.63525390625, 4.093994140625, 4.552734375, 5.011474609375, 5.47021484375, 5.928955078125, 6.3876953125, 6.846435546875, 7.30517578125, 7.763916015625, 8.22265625, 8.681396484375, 9.14013671875, 9.598876953125, 10.0576171875, 10.516357421875, 10.97509765625, 11.433837890625, 11.892578125, 12.351318359375, 12.81005859375, 13.268798828125, 13.7275390625, 14.186279296875, 14.64501953125, 15.103759765625, 15.5625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 9.0, 8.0, 5.0, 7.0, 13.0, 14.0, 14.0, 10.0, 22.0, 21.0, 24.0, 25.0, 27.0, 33.0, 27.0, 30.0, 31.0, 33.0, 31.0, 49.0, 35.0, 35.0, 36.0, 31.0, 30.0, 41.0, 28.0, 32.0, 28.0, 30.0, 24.0, 19.0, 16.0, 19.0, 15.0, 22.0, 21.0, 19.0, 15.0, 6.0, 10.0, 9.0, 12.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-24.328125, -23.562744140625, -22.79736328125, -22.031982421875, -21.2666015625, -20.501220703125, -19.73583984375, -18.970458984375, -18.205078125, -17.439697265625, -16.67431640625, -15.908935546875, -15.1435546875, -14.378173828125, -13.61279296875, -12.847412109375, -12.08203125, -11.316650390625, -10.55126953125, -9.785888671875, -9.0205078125, -8.255126953125, -7.48974609375, -6.724365234375, -5.958984375, -5.193603515625, -4.42822265625, -3.662841796875, -2.8974609375, -2.132080078125, -1.36669921875, -0.601318359375, 0.1640625, 0.929443359375, 1.69482421875, 2.460205078125, 3.2255859375, 3.990966796875, 4.75634765625, 5.521728515625, 6.287109375, 7.052490234375, 7.81787109375, 8.583251953125, 9.3486328125, 10.114013671875, 10.87939453125, 11.644775390625, 12.41015625, 13.175537109375, 13.94091796875, 14.706298828125, 15.4716796875, 16.237060546875, 17.00244140625, 17.767822265625, 18.533203125, 19.298583984375, 20.06396484375, 20.829345703125, 21.5947265625, 22.360107421875, 23.12548828125, 23.890869140625, 24.65625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 9.0, 20.0, 30.0, 50.0, 57.0, 120.0, 185.0, 318.0, 515.0, 789.0, 1291.0, 1860.0, 2921.0, 4455.0, 6512.0, 9775.0, 14065.0, 19344.0, 27242.0, 35598.0, 46446.0, 57016.0, 67059.0, 76908.0, 83711.0, 87046.0, 86469.0, 80940.0, 73074.0, 63306.0, 51923.0, 41469.0, 31375.0, 23494.0, 17101.0, 11967.0, 8189.0, 5523.0, 3648.0, 2444.0, 1641.0, 971.0, 641.0, 393.0, 236.0, 158.0, 100.0, 67.0, 31.0, 24.0, 18.0, 7.0, 6.0, 0.0, 2.0, 0.0, 3.0], "bins": [-15.7890625, -15.307373046875, -14.82568359375, -14.343994140625, -13.8623046875, -13.380615234375, -12.89892578125, -12.417236328125, -11.935546875, -11.453857421875, -10.97216796875, -10.490478515625, -10.0087890625, -9.527099609375, -9.04541015625, -8.563720703125, -8.08203125, -7.600341796875, -7.11865234375, -6.636962890625, -6.1552734375, -5.673583984375, -5.19189453125, -4.710205078125, -4.228515625, -3.746826171875, -3.26513671875, -2.783447265625, -2.3017578125, -1.820068359375, -1.33837890625, -0.856689453125, -0.375, 0.106689453125, 0.58837890625, 1.070068359375, 1.5517578125, 2.033447265625, 2.51513671875, 2.996826171875, 3.478515625, 3.960205078125, 4.44189453125, 4.923583984375, 5.4052734375, 5.886962890625, 6.36865234375, 6.850341796875, 7.33203125, 7.813720703125, 8.29541015625, 8.777099609375, 9.2587890625, 9.740478515625, 10.22216796875, 10.703857421875, 11.185546875, 11.667236328125, 12.14892578125, 12.630615234375, 13.1123046875, 13.593994140625, 14.07568359375, 14.557373046875, 15.0390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 9.0, 5.0, 8.0, 15.0, 9.0, 13.0, 9.0, 13.0, 14.0, 18.0, 21.0, 30.0, 40.0, 30.0, 42.0, 35.0, 39.0, 46.0, 52.0, 48.0, 39.0, 52.0, 42.0, 37.0, 37.0, 31.0, 31.0, 32.0, 23.0, 22.0, 29.0, 25.0, 19.0, 10.0, 11.0, 18.0, 8.0, 14.0, 6.0, 3.0, 7.0, 7.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-22.28125, -21.656494140625, -21.03173828125, -20.406982421875, -19.7822265625, -19.157470703125, -18.53271484375, -17.907958984375, -17.283203125, -16.658447265625, -16.03369140625, -15.408935546875, -14.7841796875, -14.159423828125, -13.53466796875, -12.909912109375, -12.28515625, -11.660400390625, -11.03564453125, -10.410888671875, -9.7861328125, -9.161376953125, -8.53662109375, -7.911865234375, -7.287109375, -6.662353515625, -6.03759765625, -5.412841796875, -4.7880859375, -4.163330078125, -3.53857421875, -2.913818359375, -2.2890625, -1.664306640625, -1.03955078125, -0.414794921875, 0.2099609375, 0.834716796875, 1.45947265625, 2.084228515625, 2.708984375, 3.333740234375, 3.95849609375, 4.583251953125, 5.2080078125, 5.832763671875, 6.45751953125, 7.082275390625, 7.70703125, 8.331787109375, 8.95654296875, 9.581298828125, 10.2060546875, 10.830810546875, 11.45556640625, 12.080322265625, 12.705078125, 13.329833984375, 13.95458984375, 14.579345703125, 15.2041015625, 15.828857421875, 16.45361328125, 17.078369140625, 17.703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 10.0, 15.0, 23.0, 33.0, 54.0, 78.0, 164.0, 237.0, 417.0, 664.0, 1196.0, 1962.0, 3162.0, 5274.0, 8623.0, 13672.0, 21497.0, 32116.0, 46106.0, 62506.0, 80325.0, 95246.0, 107181.0, 110116.0, 105192.0, 93080.0, 76312.0, 58832.0, 42724.0, 29510.0, 19498.0, 12572.0, 7908.0, 4973.0, 2988.0, 1707.0, 1079.0, 592.0, 347.0, 205.0, 152.0, 83.0, 47.0, 36.0, 19.0, 7.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.2421875, -8.9654541015625, -8.688720703125, -8.4119873046875, -8.13525390625, -7.8585205078125, -7.581787109375, -7.3050537109375, -7.0283203125, -6.7515869140625, -6.474853515625, -6.1981201171875, -5.92138671875, -5.6446533203125, -5.367919921875, -5.0911865234375, -4.814453125, -4.5377197265625, -4.260986328125, -3.9842529296875, -3.70751953125, -3.4307861328125, -3.154052734375, -2.8773193359375, -2.6005859375, -2.3238525390625, -2.047119140625, -1.7703857421875, -1.49365234375, -1.2169189453125, -0.940185546875, -0.6634521484375, -0.38671875, -0.1099853515625, 0.166748046875, 0.4434814453125, 0.72021484375, 0.9969482421875, 1.273681640625, 1.5504150390625, 1.8271484375, 2.1038818359375, 2.380615234375, 2.6573486328125, 2.93408203125, 3.2108154296875, 3.487548828125, 3.7642822265625, 4.041015625, 4.3177490234375, 4.594482421875, 4.8712158203125, 5.14794921875, 5.4246826171875, 5.701416015625, 5.9781494140625, 6.2548828125, 6.5316162109375, 6.808349609375, 7.0850830078125, 7.36181640625, 7.6385498046875, 7.915283203125, 8.1920166015625, 8.46875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 2.0, 4.0, 8.0, 9.0, 8.0, 8.0, 17.0, 12.0, 16.0, 21.0, 16.0, 26.0, 43.0, 32.0, 36.0, 44.0, 40.0, 55.0, 49.0, 45.0, 68.0, 43.0, 48.0, 38.0, 36.0, 43.0, 40.0, 37.0, 26.0, 22.0, 23.0, 27.0, 12.0, 11.0, 7.0, 6.0, 6.0, 7.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012416839599609375, -0.0012052804231643677, -0.0011688768863677979, -0.001132473349571228, -0.0010960698127746582, -0.0010596662759780884, -0.0010232627391815186, -0.0009868592023849487, -0.0009504556655883789, -0.0009140521287918091, -0.0008776485919952393, -0.0008412450551986694, -0.0008048415184020996, -0.0007684379816055298, -0.00073203444480896, -0.0006956309080123901, -0.0006592273712158203, -0.0006228238344192505, -0.0005864202976226807, -0.0005500167608261108, -0.000513613224029541, -0.0004772096872329712, -0.00044080615043640137, -0.00040440261363983154, -0.0003679990768432617, -0.0003315955400466919, -0.00029519200325012207, -0.00025878846645355225, -0.00022238492965698242, -0.0001859813928604126, -0.00014957785606384277, -0.00011317431926727295, -7.677078247070312e-05, -4.03672456741333e-05, -3.9637088775634766e-06, 3.243982791900635e-05, 6.884336471557617e-05, 0.000105246901512146, 0.00014165043830871582, 0.00017805397510528564, 0.00021445751190185547, 0.0002508610486984253, 0.0002872645854949951, 0.00032366812229156494, 0.00036007165908813477, 0.0003964751958847046, 0.0004328787326812744, 0.00046928226947784424, 0.0005056858062744141, 0.0005420893430709839, 0.0005784928798675537, 0.0006148964166641235, 0.0006512999534606934, 0.0006877034902572632, 0.000724107027053833, 0.0007605105638504028, 0.0007969141006469727, 0.0008333176374435425, 0.0008697211742401123, 0.0009061247110366821, 0.000942528247833252, 0.0009789317846298218, 0.0010153353214263916, 0.0010517388582229614, 0.0010881423950195312]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 13.0, 17.0, 25.0, 39.0, 57.0, 104.0, 152.0, 256.0, 404.0, 590.0, 1026.0, 1624.0, 2413.0, 3778.0, 5998.0, 9516.0, 14138.0, 21040.0, 30404.0, 42866.0, 57851.0, 73622.0, 88221.0, 99070.0, 104450.0, 102020.0, 93024.0, 78908.0, 62681.0, 48375.0, 34985.0, 24226.0, 16461.0, 10784.0, 7018.0, 4616.0, 2851.0, 1808.0, 1141.0, 730.0, 479.0, 302.0, 193.0, 104.0, 80.0, 46.0, 18.0, 12.0, 12.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.4140625, -10.1048583984375, -9.795654296875, -9.4864501953125, -9.17724609375, -8.8680419921875, -8.558837890625, -8.2496337890625, -7.9404296875, -7.6312255859375, -7.322021484375, -7.0128173828125, -6.70361328125, -6.3944091796875, -6.085205078125, -5.7760009765625, -5.466796875, -5.1575927734375, -4.848388671875, -4.5391845703125, -4.22998046875, -3.9207763671875, -3.611572265625, -3.3023681640625, -2.9931640625, -2.6839599609375, -2.374755859375, -2.0655517578125, -1.75634765625, -1.4471435546875, -1.137939453125, -0.8287353515625, -0.51953125, -0.2103271484375, 0.098876953125, 0.4080810546875, 0.71728515625, 1.0264892578125, 1.335693359375, 1.6448974609375, 1.9541015625, 2.2633056640625, 2.572509765625, 2.8817138671875, 3.19091796875, 3.5001220703125, 3.809326171875, 4.1185302734375, 4.427734375, 4.7369384765625, 5.046142578125, 5.3553466796875, 5.66455078125, 5.9737548828125, 6.282958984375, 6.5921630859375, 6.9013671875, 7.2105712890625, 7.519775390625, 7.8289794921875, 8.13818359375, 8.4473876953125, 8.756591796875, 9.0657958984375, 9.375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 7.0, 8.0, 6.0, 6.0, 9.0, 16.0, 18.0, 21.0, 13.0, 27.0, 24.0, 33.0, 31.0, 38.0, 46.0, 34.0, 53.0, 48.0, 47.0, 52.0, 45.0, 47.0, 39.0, 46.0, 40.0, 35.0, 26.0, 27.0, 26.0, 13.0, 32.0, 15.0, 13.0, 12.0, 8.0, 9.0, 8.0, 9.0, 5.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6640625, -4.51397705078125, -4.3638916015625, -4.21380615234375, -4.063720703125, -3.91363525390625, -3.7635498046875, -3.61346435546875, -3.46337890625, -3.31329345703125, -3.1632080078125, -3.01312255859375, -2.863037109375, -2.71295166015625, -2.5628662109375, -2.41278076171875, -2.2626953125, -2.11260986328125, -1.9625244140625, -1.81243896484375, -1.662353515625, -1.51226806640625, -1.3621826171875, -1.21209716796875, -1.06201171875, -0.91192626953125, -0.7618408203125, -0.61175537109375, -0.461669921875, -0.31158447265625, -0.1614990234375, -0.01141357421875, 0.138671875, 0.28875732421875, 0.4388427734375, 0.58892822265625, 0.739013671875, 0.88909912109375, 1.0391845703125, 1.18927001953125, 1.33935546875, 1.48944091796875, 1.6395263671875, 1.78961181640625, 1.939697265625, 2.08978271484375, 2.2398681640625, 2.38995361328125, 2.5400390625, 2.69012451171875, 2.8402099609375, 2.99029541015625, 3.140380859375, 3.29046630859375, 3.4405517578125, 3.59063720703125, 3.74072265625, 3.89080810546875, 4.0408935546875, 4.19097900390625, 4.341064453125, 4.49114990234375, 4.6412353515625, 4.79132080078125, 4.94140625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 8.0, 7.0, 9.0, 10.0, 16.0, 10.0, 22.0, 19.0, 28.0, 23.0, 26.0, 31.0, 40.0, 44.0, 42.0, 37.0, 37.0, 39.0, 45.0, 33.0, 51.0, 43.0, 46.0, 29.0, 40.0, 38.0, 27.0, 27.0, 22.0, 27.0, 31.0, 16.0, 17.0, 12.0, 7.0, 5.0, 8.0, 11.0, 3.0, 9.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.640209197998047, -28.715333938598633, -27.790456771850586, -26.865581512451172, -25.940704345703125, -25.01582908630371, -24.090953826904297, -23.16607666015625, -22.241201400756836, -21.316326141357422, -20.391448974609375, -19.46657371520996, -18.541698455810547, -17.6168212890625, -16.691946029663086, -15.767069816589355, -14.842193603515625, -13.917317390441895, -12.992441177368164, -12.06756591796875, -11.14268970489502, -10.217813491821289, -9.292938232421875, -8.368062019348145, -7.443185806274414, -6.518309593200684, -5.593433856964111, -4.668558120727539, -3.7436819076538086, -2.818805694580078, -1.8939299583435059, -0.9690542221069336, -0.04417610168457031, 0.880699872970581, 1.8055758476257324, 2.730451822280884, 3.655327796936035, 4.580204010009766, 5.505079746246338, 6.42995548248291, 7.354831695556641, 8.279707908630371, 9.204584121704102, 10.129459381103516, 11.054335594177246, 11.979211807250977, 12.90408706665039, 13.828963279724121, 14.753839492797852, 15.678715705871582, 16.603591918945312, 17.528467178344727, 18.45334243774414, 19.378219604492188, 20.3030948638916, 21.227970123291016, 22.152847290039062, 23.077722549438477, 24.002599716186523, 24.927474975585938, 25.852352142333984, 26.7772274017334, 27.702102661132812, 28.62697982788086, 29.551855087280273]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 2.0, 3.0, 1.0, 3.0, 9.0, 6.0, 11.0, 13.0, 16.0, 16.0, 13.0, 13.0, 23.0, 21.0, 24.0, 29.0, 33.0, 23.0, 32.0, 30.0, 41.0, 40.0, 37.0, 40.0, 35.0, 33.0, 30.0, 33.0, 26.0, 31.0, 36.0, 33.0, 30.0, 24.0, 19.0, 18.0, 15.0, 22.0, 24.0, 12.0, 20.0, 10.0, 11.0, 17.0, 10.0, 10.0, 6.0, 3.0, 3.0, 8.0, 6.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-25.513824462890625, -24.693084716796875, -23.872344970703125, -23.051603317260742, -22.230863571166992, -21.410123825073242, -20.58938217163086, -19.76864242553711, -18.94790267944336, -18.12716293334961, -17.30642318725586, -16.485681533813477, -15.664941787719727, -14.844202041625977, -14.02346134185791, -13.202720642089844, -12.381980895996094, -11.561241149902344, -10.740500450134277, -9.919759750366211, -9.099020004272461, -8.278280258178711, -7.4575395584106445, -6.636799335479736, -5.816059112548828, -4.99531888961792, -4.174578666687012, -3.3538384437561035, -2.5330982208251953, -1.712357997894287, -0.8916177749633789, -0.0708775520324707, 0.7498626708984375, 1.5706028938293457, 2.391343116760254, 3.212083339691162, 4.03282356262207, 4.8535637855529785, 5.674304008483887, 6.495044231414795, 7.315784454345703, 8.136524200439453, 8.95726490020752, 9.778005599975586, 10.598745346069336, 11.419485092163086, 12.240225791931152, 13.060966491699219, 13.881706237792969, 14.702445983886719, 15.523186683654785, 16.34392738342285, 17.1646671295166, 17.98540687561035, 18.806148529052734, 19.626888275146484, 20.447628021240234, 21.268367767333984, 22.089107513427734, 22.909849166870117, 23.730588912963867, 24.551328659057617, 25.3720703125, 26.19281005859375, 27.0135498046875]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 7.0, 6.0, 19.0, 22.0, 57.0, 91.0, 169.0, 261.0, 447.0, 807.0, 1373.0, 2345.0, 3782.0, 6191.0, 10136.0, 16277.0, 24958.0, 38113.0, 56403.0, 82844.0, 115615.0, 157926.0, 204398.0, 257793.0, 308045.0, 345867.0, 371245.0, 376390.0, 360719.0, 327235.0, 281413.0, 230726.0, 179198.0, 135321.0, 97941.0, 68745.0, 46363.0, 31224.0, 20175.0, 12776.0, 8116.0, 5060.0, 3103.0, 1887.0, 1141.0, 689.0, 375.0, 213.0, 119.0, 81.0, 44.0, 18.0, 11.0, 5.0, 6.0, 1.0, 2.0], "bins": [-19.765625, -19.1884765625, -18.611328125, -18.0341796875, -17.45703125, -16.8798828125, -16.302734375, -15.7255859375, -15.1484375, -14.5712890625, -13.994140625, -13.4169921875, -12.83984375, -12.2626953125, -11.685546875, -11.1083984375, -10.53125, -9.9541015625, -9.376953125, -8.7998046875, -8.22265625, -7.6455078125, -7.068359375, -6.4912109375, -5.9140625, -5.3369140625, -4.759765625, -4.1826171875, -3.60546875, -3.0283203125, -2.451171875, -1.8740234375, -1.296875, -0.7197265625, -0.142578125, 0.4345703125, 1.01171875, 1.5888671875, 2.166015625, 2.7431640625, 3.3203125, 3.8974609375, 4.474609375, 5.0517578125, 5.62890625, 6.2060546875, 6.783203125, 7.3603515625, 7.9375, 8.5146484375, 9.091796875, 9.6689453125, 10.24609375, 10.8232421875, 11.400390625, 11.9775390625, 12.5546875, 13.1318359375, 13.708984375, 14.2861328125, 14.86328125, 15.4404296875, 16.017578125, 16.5947265625, 17.171875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 2.0, 3.0, 2.0, 2.0, 8.0, 11.0, 10.0, 8.0, 20.0, 12.0, 14.0, 17.0, 26.0, 23.0, 23.0, 32.0, 29.0, 24.0, 31.0, 36.0, 37.0, 32.0, 51.0, 33.0, 37.0, 33.0, 28.0, 36.0, 24.0, 33.0, 36.0, 33.0, 24.0, 22.0, 25.0, 17.0, 18.0, 17.0, 25.0, 15.0, 16.0, 10.0, 14.0, 14.0, 13.0, 5.0, 4.0, 5.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.0625, -22.318359375, -21.57421875, -20.830078125, -20.0859375, -19.341796875, -18.59765625, -17.853515625, -17.109375, -16.365234375, -15.62109375, -14.876953125, -14.1328125, -13.388671875, -12.64453125, -11.900390625, -11.15625, -10.412109375, -9.66796875, -8.923828125, -8.1796875, -7.435546875, -6.69140625, -5.947265625, -5.203125, -4.458984375, -3.71484375, -2.970703125, -2.2265625, -1.482421875, -0.73828125, 0.005859375, 0.75, 1.494140625, 2.23828125, 2.982421875, 3.7265625, 4.470703125, 5.21484375, 5.958984375, 6.703125, 7.447265625, 8.19140625, 8.935546875, 9.6796875, 10.423828125, 11.16796875, 11.912109375, 12.65625, 13.400390625, 14.14453125, 14.888671875, 15.6328125, 16.376953125, 17.12109375, 17.865234375, 18.609375, 19.353515625, 20.09765625, 20.841796875, 21.5859375, 22.330078125, 23.07421875, 23.818359375, 24.5625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 12.0, 13.0, 31.0, 67.0, 115.0, 204.0, 333.0, 628.0, 1095.0, 1754.0, 2913.0, 4962.0, 7712.0, 12628.0, 19230.0, 29786.0, 43778.0, 63287.0, 88294.0, 120366.0, 157450.0, 200036.0, 241186.0, 281130.0, 315641.0, 335689.0, 343982.0, 336412.0, 314481.0, 280986.0, 240469.0, 199299.0, 156623.0, 119218.0, 88065.0, 63079.0, 43249.0, 29103.0, 19175.0, 12266.0, 7747.0, 4821.0, 2906.0, 1759.0, 1001.0, 589.0, 316.0, 160.0, 93.0, 78.0, 42.0, 18.0, 7.0, 10.0, 2.0], "bins": [-20.828125, -20.2412109375, -19.654296875, -19.0673828125, -18.48046875, -17.8935546875, -17.306640625, -16.7197265625, -16.1328125, -15.5458984375, -14.958984375, -14.3720703125, -13.78515625, -13.1982421875, -12.611328125, -12.0244140625, -11.4375, -10.8505859375, -10.263671875, -9.6767578125, -9.08984375, -8.5029296875, -7.916015625, -7.3291015625, -6.7421875, -6.1552734375, -5.568359375, -4.9814453125, -4.39453125, -3.8076171875, -3.220703125, -2.6337890625, -2.046875, -1.4599609375, -0.873046875, -0.2861328125, 0.30078125, 0.8876953125, 1.474609375, 2.0615234375, 2.6484375, 3.2353515625, 3.822265625, 4.4091796875, 4.99609375, 5.5830078125, 6.169921875, 6.7568359375, 7.34375, 7.9306640625, 8.517578125, 9.1044921875, 9.69140625, 10.2783203125, 10.865234375, 11.4521484375, 12.0390625, 12.6259765625, 13.212890625, 13.7998046875, 14.38671875, 14.9736328125, 15.560546875, 16.1474609375, 16.734375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 9.0, 11.0, 15.0, 13.0, 21.0, 24.0, 28.0, 41.0, 40.0, 38.0, 64.0, 66.0, 86.0, 97.0, 107.0, 98.0, 127.0, 137.0, 156.0, 165.0, 179.0, 199.0, 173.0, 194.0, 191.0, 178.0, 164.0, 159.0, 138.0, 145.0, 143.0, 119.0, 98.0, 111.0, 91.0, 86.0, 63.0, 64.0, 46.0, 46.0, 32.0, 27.0, 17.0, 20.0, 10.0, 11.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0], "bins": [-10.28125, -9.9454345703125, -9.609619140625, -9.2738037109375, -8.93798828125, -8.6021728515625, -8.266357421875, -7.9305419921875, -7.5947265625, -7.2589111328125, -6.923095703125, -6.5872802734375, -6.25146484375, -5.9156494140625, -5.579833984375, -5.2440185546875, -4.908203125, -4.5723876953125, -4.236572265625, -3.9007568359375, -3.56494140625, -3.2291259765625, -2.893310546875, -2.5574951171875, -2.2216796875, -1.8858642578125, -1.550048828125, -1.2142333984375, -0.87841796875, -0.5426025390625, -0.206787109375, 0.1290283203125, 0.46484375, 0.8006591796875, 1.136474609375, 1.4722900390625, 1.80810546875, 2.1439208984375, 2.479736328125, 2.8155517578125, 3.1513671875, 3.4871826171875, 3.822998046875, 4.1588134765625, 4.49462890625, 4.8304443359375, 5.166259765625, 5.5020751953125, 5.837890625, 6.1737060546875, 6.509521484375, 6.8453369140625, 7.18115234375, 7.5169677734375, 7.852783203125, 8.1885986328125, 8.5244140625, 8.8602294921875, 9.196044921875, 9.5318603515625, 9.86767578125, 10.2034912109375, 10.539306640625, 10.8751220703125, 11.2109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 6.0, 2.0, 1.0, 6.0, 6.0, 1.0, 3.0, 8.0, 11.0, 9.0, 12.0, 13.0, 15.0, 4.0, 13.0, 19.0, 28.0, 26.0, 26.0, 23.0, 43.0, 39.0, 51.0, 43.0, 39.0, 31.0, 57.0, 42.0, 43.0, 32.0, 43.0, 29.0, 30.0, 30.0, 28.0, 26.0, 24.0, 15.0, 18.0, 14.0, 22.0, 15.0, 11.0, 13.0, 10.0, 6.0, 5.0, 11.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.492328643798828, -24.6621150970459, -23.83190155029297, -23.001686096191406, -22.171472549438477, -21.341259002685547, -20.511043548583984, -19.680830001831055, -18.850616455078125, -18.020402908325195, -17.190189361572266, -16.359973907470703, -15.529760360717773, -14.699546813964844, -13.869332313537598, -13.039117813110352, -12.208904266357422, -11.378690719604492, -10.548476219177246, -9.71826171875, -8.88804817199707, -8.05783462524414, -7.2276201248168945, -6.397406101226807, -5.567192077636719, -4.736978054046631, -3.906764030456543, -3.076550006866455, -2.246335983276367, -1.4161219596862793, -0.5859079360961914, 0.24430608749389648, 1.0745220184326172, 1.904736042022705, 2.734950065612793, 3.565164089202881, 4.395378112792969, 5.225592136383057, 6.0558061599731445, 6.886020183563232, 7.71623420715332, 8.54644775390625, 9.376662254333496, 10.206876754760742, 11.037090301513672, 11.867303848266602, 12.697518348693848, 13.527732849121094, 14.357946395874023, 15.188159942626953, 16.018375396728516, 16.848588943481445, 17.678802490234375, 18.509016036987305, 19.339229583740234, 20.169445037841797, 20.999658584594727, 21.829872131347656, 22.66008758544922, 23.49030113220215, 24.320514678955078, 25.150728225708008, 25.980941772460938, 26.8111572265625, 27.64137077331543]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 10.0, 2.0, 6.0, 7.0, 12.0, 13.0, 14.0, 11.0, 23.0, 24.0, 40.0, 25.0, 35.0, 33.0, 39.0, 42.0, 35.0, 31.0, 50.0, 36.0, 40.0, 31.0, 35.0, 35.0, 36.0, 34.0, 36.0, 37.0, 24.0, 27.0, 17.0, 18.0, 22.0, 24.0, 13.0, 11.0, 12.0, 23.0, 7.0, 11.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.15850067138672, -26.215932846069336, -25.273365020751953, -24.330799102783203, -23.38823127746582, -22.445663452148438, -21.503097534179688, -20.560529708862305, -19.617961883544922, -18.67539405822754, -17.732826232910156, -16.790260314941406, -15.847692489624023, -14.90512466430664, -13.962557792663574, -13.019990921020508, -12.077423095703125, -11.134855270385742, -10.192288398742676, -9.24972152709961, -8.307153701782227, -7.364586353302002, -6.422019004821777, -5.479451656341553, -4.536884307861328, -3.5943169593811035, -2.651749610900879, -1.7091822624206543, -0.7666149139404297, 0.17595243453979492, 1.1185197830200195, 2.061087131500244, 3.0036544799804688, 3.9462218284606934, 4.888789176940918, 5.831356525421143, 6.773923873901367, 7.716491222381592, 8.659058570861816, 9.601625442504883, 10.544193267822266, 11.486761093139648, 12.429327964782715, 13.371894836425781, 14.314462661743164, 15.257030487060547, 16.199596405029297, 17.14216423034668, 18.084732055664062, 19.027299880981445, 19.969867706298828, 20.912433624267578, 21.85500144958496, 22.797569274902344, 23.740135192871094, 24.682703018188477, 25.62527084350586, 26.567838668823242, 27.510406494140625, 28.452972412109375, 29.395540237426758, 30.33810806274414, 31.28067398071289, 32.223243713378906, 33.165809631347656]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 9.0, 24.0, 14.0, 34.0, 65.0, 59.0, 106.0, 164.0, 245.0, 416.0, 660.0, 1066.0, 1709.0, 3021.0, 5069.0, 8926.0, 16149.0, 28579.0, 50542.0, 88859.0, 140850.0, 183892.0, 182188.0, 137062.0, 86254.0, 49085.0, 27317.0, 15362.0, 8536.0, 4909.0, 2889.0, 1671.0, 1078.0, 613.0, 391.0, 247.0, 171.0, 106.0, 72.0, 41.0, 25.0, 21.0, 22.0, 14.0, 6.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7734375, -7.5140380859375, -7.254638671875, -6.9952392578125, -6.73583984375, -6.4764404296875, -6.217041015625, -5.9576416015625, -5.6982421875, -5.4388427734375, -5.179443359375, -4.9200439453125, -4.66064453125, -4.4012451171875, -4.141845703125, -3.8824462890625, -3.623046875, -3.3636474609375, -3.104248046875, -2.8448486328125, -2.58544921875, -2.3260498046875, -2.066650390625, -1.8072509765625, -1.5478515625, -1.2884521484375, -1.029052734375, -0.7696533203125, -0.51025390625, -0.2508544921875, 0.008544921875, 0.2679443359375, 0.52734375, 0.7867431640625, 1.046142578125, 1.3055419921875, 1.56494140625, 1.8243408203125, 2.083740234375, 2.3431396484375, 2.6025390625, 2.8619384765625, 3.121337890625, 3.3807373046875, 3.64013671875, 3.8995361328125, 4.158935546875, 4.4183349609375, 4.677734375, 4.9371337890625, 5.196533203125, 5.4559326171875, 5.71533203125, 5.9747314453125, 6.234130859375, 6.4935302734375, 6.7529296875, 7.0123291015625, 7.271728515625, 7.5311279296875, 7.79052734375, 8.0499267578125, 8.309326171875, 8.5687255859375, 8.828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 3.0, 6.0, 7.0, 11.0, 15.0, 14.0, 10.0, 21.0, 25.0, 37.0, 28.0, 35.0, 32.0, 40.0, 39.0, 38.0, 32.0, 47.0, 37.0, 43.0, 28.0, 34.0, 36.0, 37.0, 35.0, 33.0, 40.0, 22.0, 28.0, 15.0, 21.0, 22.0, 23.0, 12.0, 12.0, 12.0, 23.0, 8.0, 11.0, 8.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.078125, -26.136962890625, -25.19580078125, -24.254638671875, -23.3134765625, -22.372314453125, -21.43115234375, -20.489990234375, -19.548828125, -18.607666015625, -17.66650390625, -16.725341796875, -15.7841796875, -14.843017578125, -13.90185546875, -12.960693359375, -12.01953125, -11.078369140625, -10.13720703125, -9.196044921875, -8.2548828125, -7.313720703125, -6.37255859375, -5.431396484375, -4.490234375, -3.549072265625, -2.60791015625, -1.666748046875, -0.7255859375, 0.215576171875, 1.15673828125, 2.097900390625, 3.0390625, 3.980224609375, 4.92138671875, 5.862548828125, 6.8037109375, 7.744873046875, 8.68603515625, 9.627197265625, 10.568359375, 11.509521484375, 12.45068359375, 13.391845703125, 14.3330078125, 15.274169921875, 16.21533203125, 17.156494140625, 18.09765625, 19.038818359375, 19.97998046875, 20.921142578125, 21.8623046875, 22.803466796875, 23.74462890625, 24.685791015625, 25.626953125, 26.568115234375, 27.50927734375, 28.450439453125, 29.3916015625, 30.332763671875, 31.27392578125, 32.215087890625, 33.15625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 8.0, 9.0, 11.0, 18.0, 24.0, 33.0, 31.0, 53.0, 62.0, 91.0, 144.0, 218.0, 319.0, 511.0, 869.0, 1448.0, 2525.0, 4590.0, 9167.0, 20330.0, 51450.0, 142889.0, 331012.0, 291754.0, 113842.0, 42230.0, 17288.0, 7919.0, 4017.0, 2148.0, 1241.0, 764.0, 546.0, 298.0, 186.0, 162.0, 100.0, 72.0, 42.0, 42.0, 35.0, 15.0, 12.0, 12.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.734375, -12.358642578125, -11.98291015625, -11.607177734375, -11.2314453125, -10.855712890625, -10.47998046875, -10.104248046875, -9.728515625, -9.352783203125, -8.97705078125, -8.601318359375, -8.2255859375, -7.849853515625, -7.47412109375, -7.098388671875, -6.72265625, -6.346923828125, -5.97119140625, -5.595458984375, -5.2197265625, -4.843994140625, -4.46826171875, -4.092529296875, -3.716796875, -3.341064453125, -2.96533203125, -2.589599609375, -2.2138671875, -1.838134765625, -1.46240234375, -1.086669921875, -0.7109375, -0.335205078125, 0.04052734375, 0.416259765625, 0.7919921875, 1.167724609375, 1.54345703125, 1.919189453125, 2.294921875, 2.670654296875, 3.04638671875, 3.422119140625, 3.7978515625, 4.173583984375, 4.54931640625, 4.925048828125, 5.30078125, 5.676513671875, 6.05224609375, 6.427978515625, 6.8037109375, 7.179443359375, 7.55517578125, 7.930908203125, 8.306640625, 8.682373046875, 9.05810546875, 9.433837890625, 9.8095703125, 10.185302734375, 10.56103515625, 10.936767578125, 11.3125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 9.0, 7.0, 11.0, 5.0, 5.0, 13.0, 13.0, 10.0, 15.0, 14.0, 24.0, 24.0, 19.0, 29.0, 24.0, 27.0, 32.0, 36.0, 28.0, 52.0, 37.0, 35.0, 42.0, 40.0, 29.0, 23.0, 27.0, 35.0, 36.0, 31.0, 34.0, 25.0, 27.0, 28.0, 21.0, 17.0, 18.0, 14.0, 11.0, 12.0, 9.0, 9.0, 8.0, 10.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.359375, -16.790771484375, -16.22216796875, -15.653564453125, -15.0849609375, -14.516357421875, -13.94775390625, -13.379150390625, -12.810546875, -12.241943359375, -11.67333984375, -11.104736328125, -10.5361328125, -9.967529296875, -9.39892578125, -8.830322265625, -8.26171875, -7.693115234375, -7.12451171875, -6.555908203125, -5.9873046875, -5.418701171875, -4.85009765625, -4.281494140625, -3.712890625, -3.144287109375, -2.57568359375, -2.007080078125, -1.4384765625, -0.869873046875, -0.30126953125, 0.267333984375, 0.8359375, 1.404541015625, 1.97314453125, 2.541748046875, 3.1103515625, 3.678955078125, 4.24755859375, 4.816162109375, 5.384765625, 5.953369140625, 6.52197265625, 7.090576171875, 7.6591796875, 8.227783203125, 8.79638671875, 9.364990234375, 9.93359375, 10.502197265625, 11.07080078125, 11.639404296875, 12.2080078125, 12.776611328125, 13.34521484375, 13.913818359375, 14.482421875, 15.051025390625, 15.61962890625, 16.188232421875, 16.7568359375, 17.325439453125, 17.89404296875, 18.462646484375, 19.03125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 20.0, 37.0, 36.0, 75.0, 94.0, 124.0, 204.0, 332.0, 482.0, 771.0, 1202.0, 1921.0, 3021.0, 5232.0, 9545.0, 19685.0, 48123.0, 162631.0, 502884.0, 191200.0, 53938.0, 21759.0, 10518.0, 5722.0, 3306.0, 1964.0, 1244.0, 830.0, 530.0, 346.0, 245.0, 181.0, 111.0, 75.0, 53.0, 35.0, 23.0, 15.0, 4.0, 11.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0], "bins": [-8.375, -8.13262939453125, -7.8902587890625, -7.64788818359375, -7.405517578125, -7.16314697265625, -6.9207763671875, -6.67840576171875, -6.43603515625, -6.19366455078125, -5.9512939453125, -5.70892333984375, -5.466552734375, -5.22418212890625, -4.9818115234375, -4.73944091796875, -4.4970703125, -4.25469970703125, -4.0123291015625, -3.76995849609375, -3.527587890625, -3.28521728515625, -3.0428466796875, -2.80047607421875, -2.55810546875, -2.31573486328125, -2.0733642578125, -1.83099365234375, -1.588623046875, -1.34625244140625, -1.1038818359375, -0.86151123046875, -0.619140625, -0.37677001953125, -0.1343994140625, 0.10797119140625, 0.350341796875, 0.59271240234375, 0.8350830078125, 1.07745361328125, 1.31982421875, 1.56219482421875, 1.8045654296875, 2.04693603515625, 2.289306640625, 2.53167724609375, 2.7740478515625, 3.01641845703125, 3.2587890625, 3.50115966796875, 3.7435302734375, 3.98590087890625, 4.228271484375, 4.47064208984375, 4.7130126953125, 4.95538330078125, 5.19775390625, 5.44012451171875, 5.6824951171875, 5.92486572265625, 6.167236328125, 6.40960693359375, 6.6519775390625, 6.89434814453125, 7.13671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 8.0, 9.0, 13.0, 21.0, 36.0, 30.0, 36.0, 35.0, 74.0, 63.0, 77.0, 66.0, 62.0, 51.0, 67.0, 65.0, 50.0, 55.0, 40.0, 40.0, 22.0, 17.0, 15.0, 10.0, 13.0, 3.0, 6.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0004172325134277344, -0.00040591880679130554, -0.0003946051001548767, -0.0003832913935184479, -0.00037197768688201904, -0.0003606639802455902, -0.0003493502736091614, -0.00033803656697273254, -0.0003267228603363037, -0.0003154091536998749, -0.00030409544706344604, -0.0002927817404270172, -0.0002814680337905884, -0.00027015432715415955, -0.0002588406205177307, -0.0002475269138813019, -0.00023621320724487305, -0.00022489950060844421, -0.00021358579397201538, -0.00020227208733558655, -0.00019095838069915771, -0.00017964467406272888, -0.00016833096742630005, -0.00015701726078987122, -0.00014570355415344238, -0.00013438984751701355, -0.00012307614088058472, -0.00011176243424415588, -0.00010044872760772705, -8.913502097129822e-05, -7.782131433486938e-05, -6.650760769844055e-05, -5.519390106201172e-05, -4.3880194425582886e-05, -3.256648778915405e-05, -2.125278115272522e-05, -9.939074516296387e-06, 1.3746321201324463e-06, 1.268833875656128e-05, 2.4002045392990112e-05, 3.5315752029418945e-05, 4.662945866584778e-05, 5.794316530227661e-05, 6.925687193870544e-05, 8.057057857513428e-05, 9.188428521156311e-05, 0.00010319799184799194, 0.00011451169848442078, 0.0001258254051208496, 0.00013713911175727844, 0.00014845281839370728, 0.0001597665250301361, 0.00017108023166656494, 0.00018239393830299377, 0.0001937076449394226, 0.00020502135157585144, 0.00021633505821228027, 0.0002276487648487091, 0.00023896247148513794, 0.00025027617812156677, 0.0002615898847579956, 0.00027290359139442444, 0.00028421729803085327, 0.0002955310046672821, 0.00030684471130371094]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 4.0, 18.0, 28.0, 31.0, 57.0, 80.0, 100.0, 146.0, 216.0, 301.0, 537.0, 785.0, 1219.0, 1924.0, 3161.0, 5229.0, 8736.0, 15038.0, 26299.0, 47342.0, 83413.0, 141018.0, 197179.0, 193326.0, 136406.0, 80284.0, 44759.0, 24991.0, 14212.0, 8326.0, 5050.0, 3028.0, 1830.0, 1222.0, 749.0, 517.0, 322.0, 199.0, 139.0, 101.0, 70.0, 56.0, 24.0, 19.0, 18.0, 14.0, 14.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.53515625, -6.3170166015625, -6.098876953125, -5.8807373046875, -5.66259765625, -5.4444580078125, -5.226318359375, -5.0081787109375, -4.7900390625, -4.5718994140625, -4.353759765625, -4.1356201171875, -3.91748046875, -3.6993408203125, -3.481201171875, -3.2630615234375, -3.044921875, -2.8267822265625, -2.608642578125, -2.3905029296875, -2.17236328125, -1.9542236328125, -1.736083984375, -1.5179443359375, -1.2998046875, -1.0816650390625, -0.863525390625, -0.6453857421875, -0.42724609375, -0.2091064453125, 0.009033203125, 0.2271728515625, 0.4453125, 0.6634521484375, 0.881591796875, 1.0997314453125, 1.31787109375, 1.5360107421875, 1.754150390625, 1.9722900390625, 2.1904296875, 2.4085693359375, 2.626708984375, 2.8448486328125, 3.06298828125, 3.2811279296875, 3.499267578125, 3.7174072265625, 3.935546875, 4.1536865234375, 4.371826171875, 4.5899658203125, 4.80810546875, 5.0262451171875, 5.244384765625, 5.4625244140625, 5.6806640625, 5.8988037109375, 6.116943359375, 6.3350830078125, 6.55322265625, 6.7713623046875, 6.989501953125, 7.2076416015625, 7.42578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 4.0, 9.0, 14.0, 8.0, 25.0, 30.0, 33.0, 39.0, 58.0, 66.0, 101.0, 101.0, 100.0, 83.0, 69.0, 58.0, 46.0, 31.0, 31.0, 19.0, 20.0, 22.0, 8.0, 8.0, 8.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.76953125, -3.655364990234375, -3.54119873046875, -3.427032470703125, -3.3128662109375, -3.198699951171875, -3.08453369140625, -2.970367431640625, -2.856201171875, -2.742034912109375, -2.62786865234375, -2.513702392578125, -2.3995361328125, -2.285369873046875, -2.17120361328125, -2.057037353515625, -1.94287109375, -1.828704833984375, -1.71453857421875, -1.600372314453125, -1.4862060546875, -1.372039794921875, -1.25787353515625, -1.143707275390625, -1.029541015625, -0.915374755859375, -0.80120849609375, -0.687042236328125, -0.5728759765625, -0.458709716796875, -0.34454345703125, -0.230377197265625, -0.1162109375, -0.002044677734375, 0.11212158203125, 0.226287841796875, 0.3404541015625, 0.454620361328125, 0.56878662109375, 0.682952880859375, 0.797119140625, 0.911285400390625, 1.02545166015625, 1.139617919921875, 1.2537841796875, 1.367950439453125, 1.48211669921875, 1.596282958984375, 1.71044921875, 1.824615478515625, 1.93878173828125, 2.052947998046875, 2.1671142578125, 2.281280517578125, 2.39544677734375, 2.509613037109375, 2.623779296875, 2.737945556640625, 2.85211181640625, 2.966278076171875, 3.0804443359375, 3.194610595703125, 3.30877685546875, 3.422943115234375, 3.537109375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 4.0, 2.0, 6.0, 3.0, 6.0, 3.0, 4.0, 8.0, 7.0, 7.0, 12.0, 10.0, 14.0, 9.0, 8.0, 22.0, 30.0, 19.0, 29.0, 28.0, 23.0, 43.0, 41.0, 49.0, 36.0, 41.0, 40.0, 42.0, 46.0, 34.0, 39.0, 45.0, 32.0, 29.0, 30.0, 21.0, 28.0, 21.0, 13.0, 18.0, 16.0, 19.0, 15.0, 10.0, 10.0, 11.0, 8.0, 7.0, 4.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.700149536132812, -23.879846572875977, -23.059541702270508, -22.239238739013672, -21.418935775756836, -20.5986328125, -19.77832794189453, -18.958024978637695, -18.13772201538086, -17.317419052124023, -16.497114181518555, -15.676811218261719, -14.856508255004883, -14.03620433807373, -13.215900421142578, -12.395597457885742, -11.575292587280273, -10.754988670349121, -9.934685707092285, -9.114381790161133, -8.294078826904297, -7.4737749099731445, -6.653470993041992, -5.833167552947998, -5.012864112854004, -4.19256067276001, -3.3722569942474365, -2.5519533157348633, -1.7316498756408691, -0.911346435546875, -0.09104251861572266, 0.7292609214782715, 1.5495662689208984, 2.3698697090148926, 3.190173387527466, 4.010477066040039, 4.830780506134033, 5.651083946228027, 6.47138786315918, 7.291691303253174, 8.111994743347168, 8.93229866027832, 9.752601623535156, 10.572905540466309, 11.393209457397461, 12.213512420654297, 13.03381633758545, 13.854120254516602, 14.674423217773438, 15.49472713470459, 16.315031051635742, 17.135334014892578, 17.955636978149414, 18.77593994140625, 19.59624481201172, 20.416547775268555, 21.23685073852539, 22.057153701782227, 22.877458572387695, 23.69776153564453, 24.518064498901367, 25.338367462158203, 26.158672332763672, 26.978975296020508, 27.799280166625977]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 5.0, 8.0, 11.0, 16.0, 13.0, 11.0, 24.0, 27.0, 34.0, 34.0, 30.0, 34.0, 39.0, 39.0, 36.0, 32.0, 51.0, 31.0, 40.0, 33.0, 34.0, 38.0, 40.0, 28.0, 34.0, 39.0, 22.0, 26.0, 22.0, 23.0, 16.0, 19.0, 18.0, 10.0, 16.0, 17.0, 11.0, 8.0, 6.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.947019577026367, -26.005422592163086, -25.063825607299805, -24.122228622436523, -23.18062973022461, -22.239032745361328, -21.297435760498047, -20.355838775634766, -19.414241790771484, -18.472644805908203, -17.531047821044922, -16.58945083618164, -15.647852897644043, -14.706255912780762, -13.764657974243164, -12.823060989379883, -11.881464004516602, -10.93986701965332, -9.998270034790039, -9.056672096252441, -8.11507511138916, -7.173478126525879, -6.2318806648254395, -5.290283203125, -4.348686218261719, -3.4070889949798584, -2.465491771697998, -1.5238945484161377, -0.5822973251342773, 0.3592996597290039, 1.3008971214294434, 2.242494583129883, 3.184093475341797, 4.125690460205078, 5.067287921905518, 6.008885383605957, 6.950482368469238, 7.8920793533325195, 8.833677291870117, 9.775274276733398, 10.71687126159668, 11.658468246459961, 12.600065231323242, 13.54166316986084, 14.483260154724121, 15.424857139587402, 16.366455078125, 17.30805206298828, 18.249649047851562, 19.191246032714844, 20.132843017578125, 21.074440002441406, 22.016036987304688, 22.95763397216797, 23.899232864379883, 24.840829849243164, 25.782426834106445, 26.724023818969727, 27.665620803833008, 28.60721778869629, 29.548816680908203, 30.490413665771484, 31.432010650634766, 32.37360763549805, 33.31520462036133]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 8.0, 11.0, 29.0, 37.0, 75.0, 115.0, 195.0, 329.0, 519.0, 877.0, 1392.0, 2194.0, 3320.0, 5367.0, 7932.0, 11733.0, 16964.0, 23964.0, 32368.0, 43244.0, 54909.0, 66681.0, 76901.0, 84898.0, 89308.0, 89333.0, 85562.0, 76978.0, 66781.0, 55168.0, 43719.0, 32758.0, 24085.0, 16722.0, 11885.0, 7965.0, 5307.0, 3246.0, 2174.0, 1349.0, 849.0, 515.0, 306.0, 205.0, 105.0, 74.0, 44.0, 22.0, 18.0, 8.0, 8.0, 5.0, 5.0], "bins": [-17.734375, -17.2418212890625, -16.749267578125, -16.2567138671875, -15.76416015625, -15.2716064453125, -14.779052734375, -14.2864990234375, -13.7939453125, -13.3013916015625, -12.808837890625, -12.3162841796875, -11.82373046875, -11.3311767578125, -10.838623046875, -10.3460693359375, -9.853515625, -9.3609619140625, -8.868408203125, -8.3758544921875, -7.88330078125, -7.3907470703125, -6.898193359375, -6.4056396484375, -5.9130859375, -5.4205322265625, -4.927978515625, -4.4354248046875, -3.94287109375, -3.4503173828125, -2.957763671875, -2.4652099609375, -1.97265625, -1.4801025390625, -0.987548828125, -0.4949951171875, -0.00244140625, 0.4901123046875, 0.982666015625, 1.4752197265625, 1.9677734375, 2.4603271484375, 2.952880859375, 3.4454345703125, 3.93798828125, 4.4305419921875, 4.923095703125, 5.4156494140625, 5.908203125, 6.4007568359375, 6.893310546875, 7.3858642578125, 7.87841796875, 8.3709716796875, 8.863525390625, 9.3560791015625, 9.8486328125, 10.3411865234375, 10.833740234375, 11.3262939453125, 11.81884765625, 12.3114013671875, 12.803955078125, 13.2965087890625, 13.7890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 7.0, 8.0, 4.0, 9.0, 8.0, 16.0, 15.0, 9.0, 22.0, 25.0, 39.0, 30.0, 31.0, 38.0, 34.0, 37.0, 37.0, 35.0, 49.0, 36.0, 34.0, 35.0, 34.0, 42.0, 34.0, 31.0, 33.0, 39.0, 27.0, 24.0, 20.0, 25.0, 14.0, 19.0, 18.0, 13.0, 13.0, 21.0, 9.0, 10.0, 5.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.46875, -25.548828125, -24.62890625, -23.708984375, -22.7890625, -21.869140625, -20.94921875, -20.029296875, -19.109375, -18.189453125, -17.26953125, -16.349609375, -15.4296875, -14.509765625, -13.58984375, -12.669921875, -11.75, -10.830078125, -9.91015625, -8.990234375, -8.0703125, -7.150390625, -6.23046875, -5.310546875, -4.390625, -3.470703125, -2.55078125, -1.630859375, -0.7109375, 0.208984375, 1.12890625, 2.048828125, 2.96875, 3.888671875, 4.80859375, 5.728515625, 6.6484375, 7.568359375, 8.48828125, 9.408203125, 10.328125, 11.248046875, 12.16796875, 13.087890625, 14.0078125, 14.927734375, 15.84765625, 16.767578125, 17.6875, 18.607421875, 19.52734375, 20.447265625, 21.3671875, 22.287109375, 23.20703125, 24.126953125, 25.046875, 25.966796875, 26.88671875, 27.806640625, 28.7265625, 29.646484375, 30.56640625, 31.486328125, 32.40625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 10.0, 4.0, 27.0, 52.0, 63.0, 112.0, 190.0, 294.0, 558.0, 914.0, 1602.0, 2538.0, 4041.0, 6703.0, 10438.0, 15930.0, 23181.0, 33224.0, 45322.0, 59494.0, 73618.0, 87535.0, 96441.0, 100118.0, 97658.0, 89762.0, 77320.0, 63027.0, 48819.0, 35898.0, 25710.0, 17355.0, 11345.0, 7395.0, 4642.0, 2919.0, 1752.0, 1091.0, 626.0, 344.0, 193.0, 121.0, 83.0, 28.0, 30.0, 15.0, 8.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.65625, -17.114990234375, -16.57373046875, -16.032470703125, -15.4912109375, -14.949951171875, -14.40869140625, -13.867431640625, -13.326171875, -12.784912109375, -12.24365234375, -11.702392578125, -11.1611328125, -10.619873046875, -10.07861328125, -9.537353515625, -8.99609375, -8.454833984375, -7.91357421875, -7.372314453125, -6.8310546875, -6.289794921875, -5.74853515625, -5.207275390625, -4.666015625, -4.124755859375, -3.58349609375, -3.042236328125, -2.5009765625, -1.959716796875, -1.41845703125, -0.877197265625, -0.3359375, 0.205322265625, 0.74658203125, 1.287841796875, 1.8291015625, 2.370361328125, 2.91162109375, 3.452880859375, 3.994140625, 4.535400390625, 5.07666015625, 5.617919921875, 6.1591796875, 6.700439453125, 7.24169921875, 7.782958984375, 8.32421875, 8.865478515625, 9.40673828125, 9.947998046875, 10.4892578125, 11.030517578125, 11.57177734375, 12.113037109375, 12.654296875, 13.195556640625, 13.73681640625, 14.278076171875, 14.8193359375, 15.360595703125, 15.90185546875, 16.443115234375, 16.984375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 7.0, 7.0, 4.0, 6.0, 11.0, 14.0, 7.0, 18.0, 10.0, 15.0, 23.0, 24.0, 23.0, 26.0, 25.0, 30.0, 29.0, 34.0, 30.0, 31.0, 41.0, 45.0, 32.0, 47.0, 32.0, 29.0, 32.0, 40.0, 29.0, 34.0, 33.0, 25.0, 29.0, 27.0, 23.0, 18.0, 18.0, 17.0, 12.0, 15.0, 11.0, 9.0, 5.0, 3.0, 5.0, 6.0, 8.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-19.3125, -18.72705078125, -18.1416015625, -17.55615234375, -16.970703125, -16.38525390625, -15.7998046875, -15.21435546875, -14.62890625, -14.04345703125, -13.4580078125, -12.87255859375, -12.287109375, -11.70166015625, -11.1162109375, -10.53076171875, -9.9453125, -9.35986328125, -8.7744140625, -8.18896484375, -7.603515625, -7.01806640625, -6.4326171875, -5.84716796875, -5.26171875, -4.67626953125, -4.0908203125, -3.50537109375, -2.919921875, -2.33447265625, -1.7490234375, -1.16357421875, -0.578125, 0.00732421875, 0.5927734375, 1.17822265625, 1.763671875, 2.34912109375, 2.9345703125, 3.52001953125, 4.10546875, 4.69091796875, 5.2763671875, 5.86181640625, 6.447265625, 7.03271484375, 7.6181640625, 8.20361328125, 8.7890625, 9.37451171875, 9.9599609375, 10.54541015625, 11.130859375, 11.71630859375, 12.3017578125, 12.88720703125, 13.47265625, 14.05810546875, 14.6435546875, 15.22900390625, 15.814453125, 16.39990234375, 16.9853515625, 17.57080078125, 18.15625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 2.0, 4.0, 10.0, 19.0, 20.0, 34.0, 48.0, 95.0, 141.0, 184.0, 275.0, 434.0, 675.0, 1043.0, 1612.0, 2550.0, 4084.0, 6484.0, 10065.0, 15142.0, 22575.0, 32016.0, 44565.0, 58702.0, 73254.0, 86857.0, 97317.0, 101023.0, 98577.0, 90453.0, 78364.0, 63098.0, 48701.0, 35627.0, 25312.0, 17222.0, 11466.0, 7307.0, 4753.0, 3033.0, 1893.0, 1216.0, 777.0, 515.0, 345.0, 218.0, 161.0, 101.0, 63.0, 46.0, 29.0, 17.0, 8.0, 10.0, 3.0, 4.0, 5.0], "bins": [-8.6640625, -8.4140625, -8.1640625, -7.9140625, -7.6640625, -7.4140625, -7.1640625, -6.9140625, -6.6640625, -6.4140625, -6.1640625, -5.9140625, -5.6640625, -5.4140625, -5.1640625, -4.9140625, -4.6640625, -4.4140625, -4.1640625, -3.9140625, -3.6640625, -3.4140625, -3.1640625, -2.9140625, -2.6640625, -2.4140625, -2.1640625, -1.9140625, -1.6640625, -1.4140625, -1.1640625, -0.9140625, -0.6640625, -0.4140625, -0.1640625, 0.0859375, 0.3359375, 0.5859375, 0.8359375, 1.0859375, 1.3359375, 1.5859375, 1.8359375, 2.0859375, 2.3359375, 2.5859375, 2.8359375, 3.0859375, 3.3359375, 3.5859375, 3.8359375, 4.0859375, 4.3359375, 4.5859375, 4.8359375, 5.0859375, 5.3359375, 5.5859375, 5.8359375, 6.0859375, 6.3359375, 6.5859375, 6.8359375, 7.0859375, 7.3359375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 6.0, 5.0, 13.0, 17.0, 25.0, 23.0, 31.0, 28.0, 34.0, 46.0, 51.0, 56.0, 59.0, 56.0, 57.0, 51.0, 74.0, 61.0, 57.0, 36.0, 41.0, 24.0, 25.0, 23.0, 21.0, 16.0, 14.0, 14.0, 11.0, 12.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001415252685546875, -0.0013691335916519165, -0.001323014497756958, -0.0012768954038619995, -0.001230776309967041, -0.0011846572160720825, -0.001138538122177124, -0.0010924190282821655, -0.001046299934387207, -0.0010001808404922485, -0.00095406174659729, -0.0009079426527023315, -0.000861823558807373, -0.0008157044649124146, -0.0007695853710174561, -0.0007234662771224976, -0.0006773471832275391, -0.0006312280893325806, -0.0005851089954376221, -0.0005389899015426636, -0.0004928708076477051, -0.0004467517137527466, -0.0004006326198577881, -0.0003545135259628296, -0.0003083944320678711, -0.0002622753381729126, -0.0002161562442779541, -0.0001700371503829956, -0.0001239180564880371, -7.779896259307861e-05, -3.167986869812012e-05, 1.4439225196838379e-05, 6.0558319091796875e-05, 0.00010667741298675537, 0.00015279650688171387, 0.00019891560077667236, 0.00024503469467163086, 0.00029115378856658936, 0.00033727288246154785, 0.00038339197635650635, 0.00042951107025146484, 0.00047563016414642334, 0.0005217492580413818, 0.0005678683519363403, 0.0006139874458312988, 0.0006601065397262573, 0.0007062256336212158, 0.0007523447275161743, 0.0007984638214111328, 0.0008445829153060913, 0.0008907020092010498, 0.0009368211030960083, 0.0009829401969909668, 0.0010290592908859253, 0.0010751783847808838, 0.0011212974786758423, 0.0011674165725708008, 0.0012135356664657593, 0.0012596547603607178, 0.0013057738542556763, 0.0013518929481506348, 0.0013980120420455933, 0.0014441311359405518, 0.0014902502298355103, 0.0015363693237304688]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 10.0, 12.0, 28.0, 34.0, 57.0, 85.0, 116.0, 188.0, 225.0, 332.0, 463.0, 652.0, 1098.0, 1563.0, 2324.0, 3685.0, 5632.0, 8363.0, 12283.0, 17940.0, 25750.0, 35487.0, 47236.0, 60915.0, 74496.0, 85961.0, 93830.0, 96446.0, 93159.0, 85244.0, 73811.0, 60067.0, 46801.0, 35215.0, 25261.0, 17790.0, 12118.0, 8064.0, 5408.0, 3420.0, 2354.0, 1545.0, 1017.0, 650.0, 476.0, 302.0, 201.0, 134.0, 108.0, 61.0, 49.0, 27.0, 23.0, 18.0, 7.0, 5.0, 6.0, 6.0, 3.0, 2.0], "bins": [-8.8203125, -8.5400390625, -8.259765625, -7.9794921875, -7.69921875, -7.4189453125, -7.138671875, -6.8583984375, -6.578125, -6.2978515625, -6.017578125, -5.7373046875, -5.45703125, -5.1767578125, -4.896484375, -4.6162109375, -4.3359375, -4.0556640625, -3.775390625, -3.4951171875, -3.21484375, -2.9345703125, -2.654296875, -2.3740234375, -2.09375, -1.8134765625, -1.533203125, -1.2529296875, -0.97265625, -0.6923828125, -0.412109375, -0.1318359375, 0.1484375, 0.4287109375, 0.708984375, 0.9892578125, 1.26953125, 1.5498046875, 1.830078125, 2.1103515625, 2.390625, 2.6708984375, 2.951171875, 3.2314453125, 3.51171875, 3.7919921875, 4.072265625, 4.3525390625, 4.6328125, 4.9130859375, 5.193359375, 5.4736328125, 5.75390625, 6.0341796875, 6.314453125, 6.5947265625, 6.875, 7.1552734375, 7.435546875, 7.7158203125, 7.99609375, 8.2763671875, 8.556640625, 8.8369140625, 9.1171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 9.0, 5.0, 6.0, 7.0, 11.0, 24.0, 8.0, 15.0, 29.0, 32.0, 31.0, 39.0, 41.0, 42.0, 43.0, 43.0, 47.0, 57.0, 49.0, 34.0, 55.0, 44.0, 38.0, 35.0, 44.0, 36.0, 27.0, 19.0, 22.0, 19.0, 27.0, 18.0, 7.0, 8.0, 5.0, 7.0, 4.0, 4.0, 2.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -4.03021240234375, -3.8885498046875, -3.74688720703125, -3.605224609375, -3.46356201171875, -3.3218994140625, -3.18023681640625, -3.03857421875, -2.89691162109375, -2.7552490234375, -2.61358642578125, -2.471923828125, -2.33026123046875, -2.1885986328125, -2.04693603515625, -1.9052734375, -1.76361083984375, -1.6219482421875, -1.48028564453125, -1.338623046875, -1.19696044921875, -1.0552978515625, -0.91363525390625, -0.77197265625, -0.63031005859375, -0.4886474609375, -0.34698486328125, -0.205322265625, -0.06365966796875, 0.0780029296875, 0.21966552734375, 0.361328125, 0.50299072265625, 0.6446533203125, 0.78631591796875, 0.927978515625, 1.06964111328125, 1.2113037109375, 1.35296630859375, 1.49462890625, 1.63629150390625, 1.7779541015625, 1.91961669921875, 2.061279296875, 2.20294189453125, 2.3446044921875, 2.48626708984375, 2.6279296875, 2.76959228515625, 2.9112548828125, 3.05291748046875, 3.194580078125, 3.33624267578125, 3.4779052734375, 3.61956787109375, 3.76123046875, 3.90289306640625, 4.0445556640625, 4.18621826171875, 4.327880859375, 4.46954345703125, 4.6112060546875, 4.75286865234375, 4.89453125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 4.0, 4.0, 2.0, 8.0, 3.0, 16.0, 13.0, 10.0, 14.0, 24.0, 18.0, 22.0, 22.0, 27.0, 28.0, 26.0, 37.0, 38.0, 34.0, 44.0, 48.0, 41.0, 41.0, 44.0, 50.0, 54.0, 30.0, 42.0, 30.0, 30.0, 21.0, 20.0, 14.0, 19.0, 19.0, 16.0, 16.0, 15.0, 11.0, 10.0, 7.0, 5.0, 5.0, 2.0, 8.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.47711181640625, -24.631746292114258, -23.786380767822266, -22.941015243530273, -22.09564971923828, -21.25028419494629, -20.404918670654297, -19.559553146362305, -18.714187622070312, -17.86882209777832, -17.023456573486328, -16.178091049194336, -15.332725524902344, -14.487360000610352, -13.64199447631836, -12.796628952026367, -11.951263427734375, -11.105897903442383, -10.26053237915039, -9.415166854858398, -8.569801330566406, -7.724435806274414, -6.879070281982422, -6.03370475769043, -5.1883392333984375, -4.342973709106445, -3.497608184814453, -2.652242660522461, -1.8068771362304688, -0.9615116119384766, -0.11614608764648438, 0.7292194366455078, 1.5745868682861328, 2.419952392578125, 3.265317916870117, 4.110683441162109, 4.956048965454102, 5.801414489746094, 6.646780014038086, 7.492145538330078, 8.33751106262207, 9.182876586914062, 10.028242111206055, 10.873607635498047, 11.718973159790039, 12.564338684082031, 13.409704208374023, 14.255069732666016, 15.100435256958008, 15.94580078125, 16.791166305541992, 17.636531829833984, 18.481897354125977, 19.32726287841797, 20.17262840270996, 21.017993927001953, 21.863359451293945, 22.708724975585938, 23.55409049987793, 24.399456024169922, 25.244821548461914, 26.090187072753906, 26.9355525970459, 27.78091812133789, 28.626283645629883]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 3.0, 5.0, 7.0, 6.0, 7.0, 12.0, 12.0, 22.0, 32.0, 19.0, 17.0, 21.0, 25.0, 30.0, 31.0, 37.0, 32.0, 40.0, 33.0, 40.0, 34.0, 38.0, 42.0, 36.0, 41.0, 27.0, 36.0, 30.0, 31.0, 27.0, 22.0, 27.0, 21.0, 19.0, 20.0, 25.0, 19.0, 16.0, 7.0, 7.0, 11.0, 10.0, 8.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.2093505859375, -26.263307571411133, -25.317264556884766, -24.3712215423584, -23.42517852783203, -22.479137420654297, -21.533092498779297, -20.587051391601562, -19.641008377075195, -18.694965362548828, -17.74892234802246, -16.802879333496094, -15.856837272644043, -14.910794258117676, -13.964751243591309, -13.018709182739258, -12.072665214538574, -11.126622200012207, -10.18057918548584, -9.234537124633789, -8.288494110107422, -7.342451095581055, -6.3964080810546875, -5.4503655433654785, -4.504322528839111, -3.5582797527313232, -2.612236976623535, -1.666193962097168, -0.7201511859893799, 0.2258915901184082, 1.1719346046447754, 2.1179771423339844, 3.0640201568603516, 4.010063171386719, 4.956105709075928, 5.902148723602295, 6.848191261291504, 7.794234275817871, 8.740277290344238, 9.686319351196289, 10.632362365722656, 11.578405380249023, 12.52444839477539, 13.470491409301758, 14.416533470153809, 15.362576484680176, 16.30862045288086, 17.254661560058594, 18.200706481933594, 19.14674949645996, 20.092792510986328, 21.038835525512695, 21.984878540039062, 22.930919647216797, 23.876964569091797, 24.82300567626953, 25.7690486907959, 26.715091705322266, 27.661134719848633, 28.607177734375, 29.553220748901367, 30.499263763427734, 31.44530487060547, 32.39134979248047, 33.3373908996582]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 17.0, 29.0, 63.0, 90.0, 162.0, 315.0, 514.0, 872.0, 1549.0, 2684.0, 4715.0, 7637.0, 13199.0, 21054.0, 33542.0, 51775.0, 77574.0, 112133.0, 154459.0, 206580.0, 263657.0, 316930.0, 361472.0, 388105.0, 392939.0, 374847.0, 336170.0, 284669.0, 228972.0, 174911.0, 128207.0, 89383.0, 61171.0, 39719.0, 25367.0, 15724.0, 9480.0, 5797.0, 3335.0, 1971.0, 1067.0, 675.0, 347.0, 187.0, 113.0, 39.0, 36.0, 13.0, 7.0, 9.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.5625, -19.923828125, -19.28515625, -18.646484375, -18.0078125, -17.369140625, -16.73046875, -16.091796875, -15.453125, -14.814453125, -14.17578125, -13.537109375, -12.8984375, -12.259765625, -11.62109375, -10.982421875, -10.34375, -9.705078125, -9.06640625, -8.427734375, -7.7890625, -7.150390625, -6.51171875, -5.873046875, -5.234375, -4.595703125, -3.95703125, -3.318359375, -2.6796875, -2.041015625, -1.40234375, -0.763671875, -0.125, 0.513671875, 1.15234375, 1.791015625, 2.4296875, 3.068359375, 3.70703125, 4.345703125, 4.984375, 5.623046875, 6.26171875, 6.900390625, 7.5390625, 8.177734375, 8.81640625, 9.455078125, 10.09375, 10.732421875, 11.37109375, 12.009765625, 12.6484375, 13.287109375, 13.92578125, 14.564453125, 15.203125, 15.841796875, 16.48046875, 17.119140625, 17.7578125, 18.396484375, 19.03515625, 19.673828125, 20.3125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 4.0, 2.0, 6.0, 4.0, 8.0, 7.0, 11.0, 12.0, 18.0, 31.0, 23.0, 19.0, 16.0, 29.0, 31.0, 33.0, 32.0, 33.0, 40.0, 35.0, 35.0, 35.0, 34.0, 47.0, 32.0, 43.0, 31.0, 37.0, 25.0, 34.0, 27.0, 25.0, 28.0, 19.0, 20.0, 22.0, 21.0, 24.0, 11.0, 11.0, 8.0, 8.0, 13.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.0, -24.136474609375, -23.27294921875, -22.409423828125, -21.5458984375, -20.682373046875, -19.81884765625, -18.955322265625, -18.091796875, -17.228271484375, -16.36474609375, -15.501220703125, -14.6376953125, -13.774169921875, -12.91064453125, -12.047119140625, -11.18359375, -10.320068359375, -9.45654296875, -8.593017578125, -7.7294921875, -6.865966796875, -6.00244140625, -5.138916015625, -4.275390625, -3.411865234375, -2.54833984375, -1.684814453125, -0.8212890625, 0.042236328125, 0.90576171875, 1.769287109375, 2.6328125, 3.496337890625, 4.35986328125, 5.223388671875, 6.0869140625, 6.950439453125, 7.81396484375, 8.677490234375, 9.541015625, 10.404541015625, 11.26806640625, 12.131591796875, 12.9951171875, 13.858642578125, 14.72216796875, 15.585693359375, 16.44921875, 17.312744140625, 18.17626953125, 19.039794921875, 19.9033203125, 20.766845703125, 21.63037109375, 22.493896484375, 23.357421875, 24.220947265625, 25.08447265625, 25.947998046875, 26.8115234375, 27.675048828125, 28.53857421875, 29.402099609375, 30.265625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 6.0, 6.0, 15.0, 29.0, 28.0, 66.0, 106.0, 209.0, 386.0, 623.0, 1023.0, 1867.0, 3062.0, 4922.0, 8338.0, 12943.0, 20077.0, 30275.0, 44864.0, 63777.0, 89150.0, 119020.0, 156013.0, 194571.0, 237551.0, 275897.0, 308997.0, 329293.0, 337186.0, 331520.0, 311798.0, 280327.0, 243963.0, 201909.0, 162601.0, 124649.0, 93297.0, 67133.0, 47226.0, 32202.0, 21249.0, 13818.0, 8778.0, 5398.0, 3401.0, 1979.0, 1123.0, 673.0, 399.0, 243.0, 133.0, 91.0, 45.0, 18.0, 14.0, 8.0, 3.0, 0.0, 1.0, 1.0], "bins": [-19.4375, -18.8408203125, -18.244140625, -17.6474609375, -17.05078125, -16.4541015625, -15.857421875, -15.2607421875, -14.6640625, -14.0673828125, -13.470703125, -12.8740234375, -12.27734375, -11.6806640625, -11.083984375, -10.4873046875, -9.890625, -9.2939453125, -8.697265625, -8.1005859375, -7.50390625, -6.9072265625, -6.310546875, -5.7138671875, -5.1171875, -4.5205078125, -3.923828125, -3.3271484375, -2.73046875, -2.1337890625, -1.537109375, -0.9404296875, -0.34375, 0.2529296875, 0.849609375, 1.4462890625, 2.04296875, 2.6396484375, 3.236328125, 3.8330078125, 4.4296875, 5.0263671875, 5.623046875, 6.2197265625, 6.81640625, 7.4130859375, 8.009765625, 8.6064453125, 9.203125, 9.7998046875, 10.396484375, 10.9931640625, 11.58984375, 12.1865234375, 12.783203125, 13.3798828125, 13.9765625, 14.5732421875, 15.169921875, 15.7666015625, 16.36328125, 16.9599609375, 17.556640625, 18.1533203125, 18.75]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 9.0, 15.0, 20.0, 22.0, 21.0, 35.0, 39.0, 39.0, 51.0, 53.0, 70.0, 78.0, 81.0, 113.0, 103.0, 123.0, 142.0, 141.0, 139.0, 153.0, 161.0, 170.0, 155.0, 199.0, 163.0, 165.0, 160.0, 166.0, 148.0, 161.0, 125.0, 125.0, 118.0, 90.0, 80.0, 60.0, 52.0, 61.0, 30.0, 46.0, 39.0, 23.0, 32.0, 21.0, 19.0, 12.0, 8.0, 11.0, 10.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.5234375, -10.1771240234375, -9.830810546875, -9.4844970703125, -9.13818359375, -8.7918701171875, -8.445556640625, -8.0992431640625, -7.7529296875, -7.4066162109375, -7.060302734375, -6.7139892578125, -6.36767578125, -6.0213623046875, -5.675048828125, -5.3287353515625, -4.982421875, -4.6361083984375, -4.289794921875, -3.9434814453125, -3.59716796875, -3.2508544921875, -2.904541015625, -2.5582275390625, -2.2119140625, -1.8656005859375, -1.519287109375, -1.1729736328125, -0.82666015625, -0.4803466796875, -0.134033203125, 0.2122802734375, 0.55859375, 0.9049072265625, 1.251220703125, 1.5975341796875, 1.94384765625, 2.2901611328125, 2.636474609375, 2.9827880859375, 3.3291015625, 3.6754150390625, 4.021728515625, 4.3680419921875, 4.71435546875, 5.0606689453125, 5.406982421875, 5.7532958984375, 6.099609375, 6.4459228515625, 6.792236328125, 7.1385498046875, 7.48486328125, 7.8311767578125, 8.177490234375, 8.5238037109375, 8.8701171875, 9.2164306640625, 9.562744140625, 9.9090576171875, 10.25537109375, 10.6016845703125, 10.947998046875, 11.2943115234375, 11.640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 2.0, 4.0, 6.0, 3.0, 6.0, 7.0, 10.0, 11.0, 18.0, 18.0, 17.0, 20.0, 21.0, 20.0, 20.0, 31.0, 43.0, 33.0, 38.0, 54.0, 37.0, 38.0, 42.0, 48.0, 40.0, 62.0, 47.0, 44.0, 26.0, 31.0, 26.0, 20.0, 28.0, 22.0, 21.0, 15.0, 11.0, 12.0, 15.0, 3.0, 4.0, 12.0, 6.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-30.037424087524414, -29.118236541748047, -28.199047088623047, -27.279857635498047, -26.36067008972168, -25.441482543945312, -24.522293090820312, -23.603103637695312, -22.683916091918945, -21.764728546142578, -20.845539093017578, -19.926349639892578, -19.00716209411621, -18.087974548339844, -17.168785095214844, -16.249595642089844, -15.330408096313477, -14.411219596862793, -13.49203109741211, -12.572842597961426, -11.653654098510742, -10.734465599060059, -9.815277099609375, -8.896088600158691, -7.976900100708008, -7.057711601257324, -6.138523101806641, -5.219334602355957, -4.300146102905273, -3.38095760345459, -2.4617691040039062, -1.5425806045532227, -0.6233901977539062, 0.29579830169677734, 1.214986801147461, 2.1341753005981445, 3.053363800048828, 3.9725522994995117, 4.891740798950195, 5.810929298400879, 6.7301177978515625, 7.649306297302246, 8.56849479675293, 9.487683296203613, 10.406871795654297, 11.32606029510498, 12.245248794555664, 13.164437294006348, 14.083625793457031, 15.002814292907715, 15.922002792358398, 16.841190338134766, 17.760379791259766, 18.679569244384766, 19.598756790161133, 20.5179443359375, 21.4371337890625, 22.3563232421875, 23.275510787963867, 24.194698333740234, 25.113887786865234, 26.033077239990234, 26.9522647857666, 27.87145233154297, 28.79064178466797]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 4.0, 4.0, 6.0, 10.0, 5.0, 14.0, 5.0, 16.0, 14.0, 18.0, 24.0, 19.0, 28.0, 21.0, 29.0, 29.0, 31.0, 37.0, 39.0, 42.0, 37.0, 26.0, 38.0, 35.0, 38.0, 37.0, 28.0, 30.0, 31.0, 29.0, 31.0, 36.0, 32.0, 19.0, 26.0, 25.0, 19.0, 14.0, 13.0, 11.0, 16.0, 10.0, 8.0, 8.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-32.605098724365234, -31.65038299560547, -30.695667266845703, -29.740951538085938, -28.786235809326172, -27.831520080566406, -26.876802444458008, -25.922086715698242, -24.967370986938477, -24.01265525817871, -23.057939529418945, -22.10322380065918, -21.14850616455078, -20.193790435791016, -19.23907470703125, -18.284358978271484, -17.32964324951172, -16.374927520751953, -15.420211791992188, -14.465495109558105, -13.51077938079834, -12.556063652038574, -11.601346969604492, -10.646631240844727, -9.691915512084961, -8.737199783325195, -7.7824835777282715, -6.827767372131348, -5.873051643371582, -4.918335914611816, -3.9636197090148926, -3.0089035034179688, -2.0541858673095703, -1.0994699001312256, -0.14475393295288086, 0.8099620342254639, 1.7646780014038086, 2.719393730163574, 3.674109935760498, 4.628826141357422, 5.5835418701171875, 6.538257598876953, 7.492973804473877, 8.4476900100708, 9.402405738830566, 10.357121467590332, 11.311838150024414, 12.26655387878418, 13.221269607543945, 14.175985336303711, 15.130701065063477, 16.085416793823242, 17.04013442993164, 17.994850158691406, 18.949565887451172, 19.904281616210938, 20.858997344970703, 21.81371307373047, 22.768428802490234, 23.72314453125, 24.677860260009766, 25.63257598876953, 26.58729362487793, 27.542009353637695, 28.49672508239746]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 4.0, 9.0, 18.0, 17.0, 18.0, 23.0, 35.0, 47.0, 62.0, 85.0, 115.0, 160.0, 266.0, 348.0, 566.0, 931.0, 1587.0, 2956.0, 6046.0, 13141.0, 29937.0, 70081.0, 149794.0, 247288.0, 247141.0, 150861.0, 70225.0, 30147.0, 13193.0, 6000.0, 2998.0, 1599.0, 972.0, 585.0, 431.0, 233.0, 164.0, 130.0, 94.0, 83.0, 45.0, 30.0, 28.0, 23.0, 9.0, 7.0, 3.0, 7.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-11.6875, -11.3333740234375, -10.979248046875, -10.6251220703125, -10.27099609375, -9.9168701171875, -9.562744140625, -9.2086181640625, -8.8544921875, -8.5003662109375, -8.146240234375, -7.7921142578125, -7.43798828125, -7.0838623046875, -6.729736328125, -6.3756103515625, -6.021484375, -5.6673583984375, -5.313232421875, -4.9591064453125, -4.60498046875, -4.2508544921875, -3.896728515625, -3.5426025390625, -3.1884765625, -2.8343505859375, -2.480224609375, -2.1260986328125, -1.77197265625, -1.4178466796875, -1.063720703125, -0.7095947265625, -0.35546875, -0.0013427734375, 0.352783203125, 0.7069091796875, 1.06103515625, 1.4151611328125, 1.769287109375, 2.1234130859375, 2.4775390625, 2.8316650390625, 3.185791015625, 3.5399169921875, 3.89404296875, 4.2481689453125, 4.602294921875, 4.9564208984375, 5.310546875, 5.6646728515625, 6.018798828125, 6.3729248046875, 6.72705078125, 7.0811767578125, 7.435302734375, 7.7894287109375, 8.1435546875, 8.4976806640625, 8.851806640625, 9.2059326171875, 9.56005859375, 9.9141845703125, 10.268310546875, 10.6224365234375, 10.9765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 5.0, 5.0, 7.0, 9.0, 11.0, 7.0, 16.0, 13.0, 19.0, 22.0, 21.0, 27.0, 22.0, 27.0, 29.0, 30.0, 38.0, 40.0, 40.0, 39.0, 24.0, 39.0, 36.0, 36.0, 36.0, 30.0, 31.0, 27.0, 33.0, 29.0, 34.0, 38.0, 17.0, 27.0, 23.0, 19.0, 16.0, 12.0, 11.0, 17.0, 9.0, 9.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-32.59375, -31.6396484375, -30.685546875, -29.7314453125, -28.77734375, -27.8232421875, -26.869140625, -25.9150390625, -24.9609375, -24.0068359375, -23.052734375, -22.0986328125, -21.14453125, -20.1904296875, -19.236328125, -18.2822265625, -17.328125, -16.3740234375, -15.419921875, -14.4658203125, -13.51171875, -12.5576171875, -11.603515625, -10.6494140625, -9.6953125, -8.7412109375, -7.787109375, -6.8330078125, -5.87890625, -4.9248046875, -3.970703125, -3.0166015625, -2.0625, -1.1083984375, -0.154296875, 0.7998046875, 1.75390625, 2.7080078125, 3.662109375, 4.6162109375, 5.5703125, 6.5244140625, 7.478515625, 8.4326171875, 9.38671875, 10.3408203125, 11.294921875, 12.2490234375, 13.203125, 14.1572265625, 15.111328125, 16.0654296875, 17.01953125, 17.9736328125, 18.927734375, 19.8818359375, 20.8359375, 21.7900390625, 22.744140625, 23.6982421875, 24.65234375, 25.6064453125, 26.560546875, 27.5146484375, 28.46875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 9.0, 10.0, 7.0, 24.0, 15.0, 24.0, 40.0, 55.0, 65.0, 83.0, 111.0, 183.0, 288.0, 417.0, 732.0, 1406.0, 2889.0, 6814.0, 19228.0, 70743.0, 301135.0, 459803.0, 132757.0, 32667.0, 10317.0, 4103.0, 1909.0, 1004.0, 584.0, 350.0, 218.0, 144.0, 94.0, 83.0, 59.0, 47.0, 19.0, 29.0, 16.0, 12.0, 19.0, 13.0, 4.0, 11.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.109375, -16.561279296875, -16.01318359375, -15.465087890625, -14.9169921875, -14.368896484375, -13.82080078125, -13.272705078125, -12.724609375, -12.176513671875, -11.62841796875, -11.080322265625, -10.5322265625, -9.984130859375, -9.43603515625, -8.887939453125, -8.33984375, -7.791748046875, -7.24365234375, -6.695556640625, -6.1474609375, -5.599365234375, -5.05126953125, -4.503173828125, -3.955078125, -3.406982421875, -2.85888671875, -2.310791015625, -1.7626953125, -1.214599609375, -0.66650390625, -0.118408203125, 0.4296875, 0.977783203125, 1.52587890625, 2.073974609375, 2.6220703125, 3.170166015625, 3.71826171875, 4.266357421875, 4.814453125, 5.362548828125, 5.91064453125, 6.458740234375, 7.0068359375, 7.554931640625, 8.10302734375, 8.651123046875, 9.19921875, 9.747314453125, 10.29541015625, 10.843505859375, 11.3916015625, 11.939697265625, 12.48779296875, 13.035888671875, 13.583984375, 14.132080078125, 14.68017578125, 15.228271484375, 15.7763671875, 16.324462890625, 16.87255859375, 17.420654296875, 17.96875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 9.0, 8.0, 9.0, 10.0, 11.0, 16.0, 23.0, 25.0, 18.0, 23.0, 21.0, 28.0, 36.0, 35.0, 32.0, 47.0, 45.0, 45.0, 38.0, 39.0, 36.0, 37.0, 38.0, 45.0, 27.0, 31.0, 31.0, 29.0, 22.0, 25.0, 16.0, 25.0, 20.0, 16.0, 10.0, 17.0, 8.0, 10.0, 5.0, 9.0, 6.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-21.171875, -20.53076171875, -19.8896484375, -19.24853515625, -18.607421875, -17.96630859375, -17.3251953125, -16.68408203125, -16.04296875, -15.40185546875, -14.7607421875, -14.11962890625, -13.478515625, -12.83740234375, -12.1962890625, -11.55517578125, -10.9140625, -10.27294921875, -9.6318359375, -8.99072265625, -8.349609375, -7.70849609375, -7.0673828125, -6.42626953125, -5.78515625, -5.14404296875, -4.5029296875, -3.86181640625, -3.220703125, -2.57958984375, -1.9384765625, -1.29736328125, -0.65625, -0.01513671875, 0.6259765625, 1.26708984375, 1.908203125, 2.54931640625, 3.1904296875, 3.83154296875, 4.47265625, 5.11376953125, 5.7548828125, 6.39599609375, 7.037109375, 7.67822265625, 8.3193359375, 8.96044921875, 9.6015625, 10.24267578125, 10.8837890625, 11.52490234375, 12.166015625, 12.80712890625, 13.4482421875, 14.08935546875, 14.73046875, 15.37158203125, 16.0126953125, 16.65380859375, 17.294921875, 17.93603515625, 18.5771484375, 19.21826171875, 19.859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 22.0, 10.0, 21.0, 28.0, 57.0, 64.0, 98.0, 161.0, 218.0, 267.0, 394.0, 543.0, 775.0, 1130.0, 1731.0, 2531.0, 3991.0, 6490.0, 11164.0, 20895.0, 43776.0, 114835.0, 355173.0, 303842.0, 95643.0, 38593.0, 18797.0, 10109.0, 5994.0, 3661.0, 2386.0, 1559.0, 1085.0, 743.0, 501.0, 370.0, 261.0, 175.0, 123.0, 95.0, 61.0, 49.0, 39.0, 30.0, 23.0, 12.0, 3.0, 9.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.75, -5.5753173828125, -5.400634765625, -5.2259521484375, -5.05126953125, -4.8765869140625, -4.701904296875, -4.5272216796875, -4.3525390625, -4.1778564453125, -4.003173828125, -3.8284912109375, -3.65380859375, -3.4791259765625, -3.304443359375, -3.1297607421875, -2.955078125, -2.7803955078125, -2.605712890625, -2.4310302734375, -2.25634765625, -2.0816650390625, -1.906982421875, -1.7322998046875, -1.5576171875, -1.3829345703125, -1.208251953125, -1.0335693359375, -0.85888671875, -0.6842041015625, -0.509521484375, -0.3348388671875, -0.16015625, 0.0145263671875, 0.189208984375, 0.3638916015625, 0.53857421875, 0.7132568359375, 0.887939453125, 1.0626220703125, 1.2373046875, 1.4119873046875, 1.586669921875, 1.7613525390625, 1.93603515625, 2.1107177734375, 2.285400390625, 2.4600830078125, 2.634765625, 2.8094482421875, 2.984130859375, 3.1588134765625, 3.33349609375, 3.5081787109375, 3.682861328125, 3.8575439453125, 4.0322265625, 4.2069091796875, 4.381591796875, 4.5562744140625, 4.73095703125, 4.9056396484375, 5.080322265625, 5.2550048828125, 5.4296875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 5.0, 11.0, 16.0, 23.0, 26.0, 22.0, 19.0, 25.0, 32.0, 42.0, 58.0, 59.0, 57.0, 62.0, 54.0, 65.0, 50.0, 38.0, 50.0, 46.0, 30.0, 43.0, 29.0, 24.0, 20.0, 12.0, 18.0, 10.0, 6.0, 11.0, 6.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002586841583251953, -0.0002507306635379791, -0.00024277716875076294, -0.00023482367396354675, -0.00022687017917633057, -0.00021891668438911438, -0.0002109631896018982, -0.000203009694814682, -0.00019505620002746582, -0.00018710270524024963, -0.00017914921045303345, -0.00017119571566581726, -0.00016324222087860107, -0.0001552887260913849, -0.0001473352313041687, -0.00013938173651695251, -0.00013142824172973633, -0.00012347474694252014, -0.00011552125215530396, -0.00010756775736808777, -9.961426258087158e-05, -9.16607677936554e-05, -8.370727300643921e-05, -7.575377821922302e-05, -6.780028343200684e-05, -5.984678864479065e-05, -5.189329385757446e-05, -4.3939799070358276e-05, -3.598630428314209e-05, -2.8032809495925903e-05, -2.0079314708709717e-05, -1.212581992149353e-05, -4.172325134277344e-06, 3.7811696529388428e-06, 1.173466444015503e-05, 1.9688159227371216e-05, 2.7641654014587402e-05, 3.559514880180359e-05, 4.3548643589019775e-05, 5.150213837623596e-05, 5.945563316345215e-05, 6.740912795066833e-05, 7.536262273788452e-05, 8.331611752510071e-05, 9.12696123123169e-05, 9.922310709953308e-05, 0.00010717660188674927, 0.00011513009667396545, 0.00012308359146118164, 0.00013103708624839783, 0.00013899058103561401, 0.0001469440758228302, 0.0001548975706100464, 0.00016285106539726257, 0.00017080456018447876, 0.00017875805497169495, 0.00018671154975891113, 0.00019466504454612732, 0.0002026185393333435, 0.0002105720341205597, 0.00021852552890777588, 0.00022647902369499207, 0.00023443251848220825, 0.00024238601326942444, 0.0002503395080566406]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 7.0, 7.0, 18.0, 36.0, 52.0, 62.0, 115.0, 145.0, 238.0, 395.0, 580.0, 846.0, 1310.0, 1926.0, 3074.0, 5036.0, 7866.0, 13510.0, 23139.0, 40203.0, 71154.0, 123251.0, 184408.0, 201932.0, 151706.0, 92303.0, 51989.0, 29422.0, 16900.0, 10228.0, 6009.0, 3821.0, 2303.0, 1575.0, 1004.0, 691.0, 432.0, 315.0, 200.0, 131.0, 87.0, 58.0, 32.0, 19.0, 12.0, 4.0, 7.0, 4.0, 0.0, 1.0, 1.0], "bins": [-7.5546875, -7.34613037109375, -7.1375732421875, -6.92901611328125, -6.720458984375, -6.51190185546875, -6.3033447265625, -6.09478759765625, -5.88623046875, -5.67767333984375, -5.4691162109375, -5.26055908203125, -5.052001953125, -4.84344482421875, -4.6348876953125, -4.42633056640625, -4.2177734375, -4.00921630859375, -3.8006591796875, -3.59210205078125, -3.383544921875, -3.17498779296875, -2.9664306640625, -2.75787353515625, -2.54931640625, -2.34075927734375, -2.1322021484375, -1.92364501953125, -1.715087890625, -1.50653076171875, -1.2979736328125, -1.08941650390625, -0.880859375, -0.67230224609375, -0.4637451171875, -0.25518798828125, -0.046630859375, 0.16192626953125, 0.3704833984375, 0.57904052734375, 0.78759765625, 0.99615478515625, 1.2047119140625, 1.41326904296875, 1.621826171875, 1.83038330078125, 2.0389404296875, 2.24749755859375, 2.4560546875, 2.66461181640625, 2.8731689453125, 3.08172607421875, 3.290283203125, 3.49884033203125, 3.7073974609375, 3.91595458984375, 4.12451171875, 4.33306884765625, 4.5416259765625, 4.75018310546875, 4.958740234375, 5.16729736328125, 5.3758544921875, 5.58441162109375, 5.79296875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 8.0, 2.0, 7.0, 4.0, 8.0, 10.0, 13.0, 17.0, 23.0, 30.0, 20.0, 35.0, 29.0, 39.0, 44.0, 52.0, 75.0, 73.0, 81.0, 55.0, 54.0, 44.0, 39.0, 34.0, 26.0, 31.0, 21.0, 17.0, 26.0, 6.0, 16.0, 11.0, 8.0, 9.0, 7.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.611328125, -2.526397705078125, -2.44146728515625, -2.356536865234375, -2.2716064453125, -2.186676025390625, -2.10174560546875, -2.016815185546875, -1.931884765625, -1.846954345703125, -1.76202392578125, -1.677093505859375, -1.5921630859375, -1.507232666015625, -1.42230224609375, -1.337371826171875, -1.25244140625, -1.167510986328125, -1.08258056640625, -0.997650146484375, -0.9127197265625, -0.827789306640625, -0.74285888671875, -0.657928466796875, -0.572998046875, -0.488067626953125, -0.40313720703125, -0.318206787109375, -0.2332763671875, -0.148345947265625, -0.06341552734375, 0.021514892578125, 0.1064453125, 0.191375732421875, 0.27630615234375, 0.361236572265625, 0.4461669921875, 0.531097412109375, 0.61602783203125, 0.700958251953125, 0.785888671875, 0.870819091796875, 0.95574951171875, 1.040679931640625, 1.1256103515625, 1.210540771484375, 1.29547119140625, 1.380401611328125, 1.46533203125, 1.550262451171875, 1.63519287109375, 1.720123291015625, 1.8050537109375, 1.889984130859375, 1.97491455078125, 2.059844970703125, 2.144775390625, 2.229705810546875, 2.31463623046875, 2.399566650390625, 2.4844970703125, 2.569427490234375, 2.65435791015625, 2.739288330078125, 2.82421875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 6.0, 5.0, 6.0, 2.0, 7.0, 9.0, 7.0, 6.0, 21.0, 12.0, 15.0, 20.0, 17.0, 24.0, 24.0, 31.0, 44.0, 29.0, 39.0, 43.0, 43.0, 42.0, 40.0, 45.0, 37.0, 60.0, 55.0, 43.0, 37.0, 20.0, 24.0, 32.0, 23.0, 18.0, 27.0, 19.0, 13.0, 10.0, 11.0, 7.0, 4.0, 11.0, 5.0, 10.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-30.369731903076172, -29.448453903198242, -28.527175903320312, -27.605897903442383, -26.684619903564453, -25.763341903686523, -24.842063903808594, -23.920785903930664, -22.999507904052734, -22.078229904174805, -21.156951904296875, -20.235673904418945, -19.314395904541016, -18.393117904663086, -17.471839904785156, -16.550561904907227, -15.629283905029297, -14.708005905151367, -13.786727905273438, -12.865449905395508, -11.944171905517578, -11.022893905639648, -10.101615905761719, -9.180337905883789, -8.25905990600586, -7.33778190612793, -6.41650390625, -5.49522590637207, -4.573947906494141, -3.652669906616211, -2.7313919067382812, -1.8101139068603516, -0.8888339996337891, 0.032444000244140625, 0.9537220001220703, 1.875, 2.7962779998779297, 3.7175559997558594, 4.638833999633789, 5.560111999511719, 6.481389999389648, 7.402667999267578, 8.323945999145508, 9.245223999023438, 10.166501998901367, 11.087779998779297, 12.009057998657227, 12.930335998535156, 13.851613998413086, 14.772891998291016, 15.694169998168945, 16.615447998046875, 17.536725997924805, 18.458003997802734, 19.379281997680664, 20.300559997558594, 21.221837997436523, 22.143115997314453, 23.064393997192383, 23.985671997070312, 24.906949996948242, 25.828227996826172, 26.7495059967041, 27.67078399658203, 28.59206199645996]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 1.0, 6.0, 4.0, 8.0, 8.0, 11.0, 9.0, 11.0, 19.0, 16.0, 25.0, 19.0, 21.0, 24.0, 29.0, 31.0, 28.0, 38.0, 35.0, 37.0, 40.0, 34.0, 35.0, 40.0, 38.0, 33.0, 30.0, 33.0, 32.0, 28.0, 29.0, 36.0, 30.0, 29.0, 25.0, 17.0, 18.0, 18.0, 13.0, 17.0, 11.0, 9.0, 8.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-32.98612976074219, -32.0234260559082, -31.06072235107422, -30.098018646240234, -29.13531494140625, -28.172611236572266, -27.20990753173828, -26.247203826904297, -25.284500122070312, -24.321796417236328, -23.359092712402344, -22.39638900756836, -21.433685302734375, -20.47098159790039, -19.508277893066406, -18.545574188232422, -17.582870483398438, -16.620166778564453, -15.657463073730469, -14.694759368896484, -13.7320556640625, -12.769351959228516, -11.806648254394531, -10.843944549560547, -9.881240844726562, -8.918537139892578, -7.955833435058594, -6.993129730224609, -6.030426025390625, -5.067722320556641, -4.105018615722656, -3.142314910888672, -2.1796131134033203, -1.216909408569336, -0.25420570373535156, 0.7084980010986328, 1.6712017059326172, 2.6339054107666016, 3.596609115600586, 4.55931282043457, 5.522016525268555, 6.484720230102539, 7.447423934936523, 8.410127639770508, 9.372831344604492, 10.335535049438477, 11.298238754272461, 12.260942459106445, 13.22364616394043, 14.186349868774414, 15.149053573608398, 16.111757278442383, 17.074460983276367, 18.03716468811035, 18.999868392944336, 19.96257209777832, 20.925275802612305, 21.88797950744629, 22.850683212280273, 23.813386917114258, 24.776090621948242, 25.738794326782227, 26.70149803161621, 27.664201736450195, 28.62690544128418]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 10.0, 19.0, 43.0, 40.0, 74.0, 129.0, 179.0, 330.0, 514.0, 834.0, 1254.0, 1981.0, 3095.0, 4545.0, 6825.0, 9804.0, 13816.0, 19163.0, 26259.0, 34019.0, 43385.0, 53107.0, 62710.0, 71817.0, 77856.0, 82382.0, 82103.0, 79504.0, 73777.0, 65059.0, 55680.0, 45711.0, 36196.0, 27862.0, 21038.0, 15130.0, 10677.0, 7310.0, 5047.0, 3351.0, 2150.0, 1400.0, 907.0, 568.0, 354.0, 212.0, 130.0, 76.0, 48.0, 31.0, 19.0, 10.0, 8.0, 5.0, 2.0, 1.0, 2.0, 2.0], "bins": [-14.6484375, -14.1923828125, -13.736328125, -13.2802734375, -12.82421875, -12.3681640625, -11.912109375, -11.4560546875, -11.0, -10.5439453125, -10.087890625, -9.6318359375, -9.17578125, -8.7197265625, -8.263671875, -7.8076171875, -7.3515625, -6.8955078125, -6.439453125, -5.9833984375, -5.52734375, -5.0712890625, -4.615234375, -4.1591796875, -3.703125, -3.2470703125, -2.791015625, -2.3349609375, -1.87890625, -1.4228515625, -0.966796875, -0.5107421875, -0.0546875, 0.4013671875, 0.857421875, 1.3134765625, 1.76953125, 2.2255859375, 2.681640625, 3.1376953125, 3.59375, 4.0498046875, 4.505859375, 4.9619140625, 5.41796875, 5.8740234375, 6.330078125, 6.7861328125, 7.2421875, 7.6982421875, 8.154296875, 8.6103515625, 9.06640625, 9.5224609375, 9.978515625, 10.4345703125, 10.890625, 11.3466796875, 11.802734375, 12.2587890625, 12.71484375, 13.1708984375, 13.626953125, 14.0830078125, 14.5390625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 6.0, 15.0, 9.0, 9.0, 16.0, 19.0, 25.0, 20.0, 21.0, 25.0, 27.0, 30.0, 31.0, 36.0, 32.0, 41.0, 42.0, 31.0, 31.0, 38.0, 42.0, 34.0, 30.0, 35.0, 30.0, 27.0, 29.0, 36.0, 33.0, 29.0, 24.0, 19.0, 16.0, 18.0, 14.0, 15.0, 11.0, 11.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 1.0], "bins": [-32.15625, -31.217529296875, -30.27880859375, -29.340087890625, -28.4013671875, -27.462646484375, -26.52392578125, -25.585205078125, -24.646484375, -23.707763671875, -22.76904296875, -21.830322265625, -20.8916015625, -19.952880859375, -19.01416015625, -18.075439453125, -17.13671875, -16.197998046875, -15.25927734375, -14.320556640625, -13.3818359375, -12.443115234375, -11.50439453125, -10.565673828125, -9.626953125, -8.688232421875, -7.74951171875, -6.810791015625, -5.8720703125, -4.933349609375, -3.99462890625, -3.055908203125, -2.1171875, -1.178466796875, -0.23974609375, 0.698974609375, 1.6376953125, 2.576416015625, 3.51513671875, 4.453857421875, 5.392578125, 6.331298828125, 7.27001953125, 8.208740234375, 9.1474609375, 10.086181640625, 11.02490234375, 11.963623046875, 12.90234375, 13.841064453125, 14.77978515625, 15.718505859375, 16.6572265625, 17.595947265625, 18.53466796875, 19.473388671875, 20.412109375, 21.350830078125, 22.28955078125, 23.228271484375, 24.1669921875, 25.105712890625, 26.04443359375, 26.983154296875, 27.921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 8.0, 13.0, 10.0, 33.0, 47.0, 87.0, 129.0, 190.0, 305.0, 490.0, 769.0, 1211.0, 1883.0, 2959.0, 4413.0, 6742.0, 9946.0, 14315.0, 19932.0, 27051.0, 35716.0, 45832.0, 56271.0, 66001.0, 75554.0, 81996.0, 85612.0, 84474.0, 79874.0, 73234.0, 63591.0, 52885.0, 42770.0, 33212.0, 24315.0, 17983.0, 12538.0, 8918.0, 6018.0, 3951.0, 2605.0, 1769.0, 1078.0, 706.0, 426.0, 270.0, 189.0, 99.0, 56.0, 29.0, 25.0, 12.0, 14.0, 3.0, 4.0, 1.0, 2.0, 2.0], "bins": [-15.578125, -15.1038818359375, -14.629638671875, -14.1553955078125, -13.68115234375, -13.2069091796875, -12.732666015625, -12.2584228515625, -11.7841796875, -11.3099365234375, -10.835693359375, -10.3614501953125, -9.88720703125, -9.4129638671875, -8.938720703125, -8.4644775390625, -7.990234375, -7.5159912109375, -7.041748046875, -6.5675048828125, -6.09326171875, -5.6190185546875, -5.144775390625, -4.6705322265625, -4.1962890625, -3.7220458984375, -3.247802734375, -2.7735595703125, -2.29931640625, -1.8250732421875, -1.350830078125, -0.8765869140625, -0.40234375, 0.0718994140625, 0.546142578125, 1.0203857421875, 1.49462890625, 1.9688720703125, 2.443115234375, 2.9173583984375, 3.3916015625, 3.8658447265625, 4.340087890625, 4.8143310546875, 5.28857421875, 5.7628173828125, 6.237060546875, 6.7113037109375, 7.185546875, 7.6597900390625, 8.134033203125, 8.6082763671875, 9.08251953125, 9.5567626953125, 10.031005859375, 10.5052490234375, 10.9794921875, 11.4537353515625, 11.927978515625, 12.4022216796875, 12.87646484375, 13.3507080078125, 13.824951171875, 14.2991943359375, 14.7734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 13.0, 6.0, 7.0, 11.0, 17.0, 21.0, 18.0, 18.0, 20.0, 22.0, 21.0, 20.0, 29.0, 38.0, 28.0, 33.0, 36.0, 27.0, 35.0, 39.0, 33.0, 31.0, 36.0, 27.0, 34.0, 38.0, 29.0, 24.0, 28.0, 32.0, 27.0, 32.0, 26.0, 22.0, 21.0, 12.0, 18.0, 11.0, 7.0, 12.0, 5.0, 4.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0], "bins": [-19.328125, -18.720703125, -18.11328125, -17.505859375, -16.8984375, -16.291015625, -15.68359375, -15.076171875, -14.46875, -13.861328125, -13.25390625, -12.646484375, -12.0390625, -11.431640625, -10.82421875, -10.216796875, -9.609375, -9.001953125, -8.39453125, -7.787109375, -7.1796875, -6.572265625, -5.96484375, -5.357421875, -4.75, -4.142578125, -3.53515625, -2.927734375, -2.3203125, -1.712890625, -1.10546875, -0.498046875, 0.109375, 0.716796875, 1.32421875, 1.931640625, 2.5390625, 3.146484375, 3.75390625, 4.361328125, 4.96875, 5.576171875, 6.18359375, 6.791015625, 7.3984375, 8.005859375, 8.61328125, 9.220703125, 9.828125, 10.435546875, 11.04296875, 11.650390625, 12.2578125, 12.865234375, 13.47265625, 14.080078125, 14.6875, 15.294921875, 15.90234375, 16.509765625, 17.1171875, 17.724609375, 18.33203125, 18.939453125, 19.546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 12.0, 30.0, 24.0, 37.0, 74.0, 111.0, 165.0, 243.0, 337.0, 611.0, 998.0, 1639.0, 2580.0, 4186.0, 7130.0, 11096.0, 17135.0, 25858.0, 37386.0, 51830.0, 68444.0, 85018.0, 97881.0, 106351.0, 106656.0, 99120.0, 85714.0, 70044.0, 53789.0, 38756.0, 27067.0, 17843.0, 11480.0, 7167.0, 4543.0, 2717.0, 1645.0, 1011.0, 644.0, 432.0, 250.0, 183.0, 103.0, 72.0, 47.0, 32.0, 24.0, 13.0, 11.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.6640625, -8.385009765625, -8.10595703125, -7.826904296875, -7.5478515625, -7.268798828125, -6.98974609375, -6.710693359375, -6.431640625, -6.152587890625, -5.87353515625, -5.594482421875, -5.3154296875, -5.036376953125, -4.75732421875, -4.478271484375, -4.19921875, -3.920166015625, -3.64111328125, -3.362060546875, -3.0830078125, -2.803955078125, -2.52490234375, -2.245849609375, -1.966796875, -1.687744140625, -1.40869140625, -1.129638671875, -0.8505859375, -0.571533203125, -0.29248046875, -0.013427734375, 0.265625, 0.544677734375, 0.82373046875, 1.102783203125, 1.3818359375, 1.660888671875, 1.93994140625, 2.218994140625, 2.498046875, 2.777099609375, 3.05615234375, 3.335205078125, 3.6142578125, 3.893310546875, 4.17236328125, 4.451416015625, 4.73046875, 5.009521484375, 5.28857421875, 5.567626953125, 5.8466796875, 6.125732421875, 6.40478515625, 6.683837890625, 6.962890625, 7.241943359375, 7.52099609375, 7.800048828125, 8.0791015625, 8.358154296875, 8.63720703125, 8.916259765625, 9.1953125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 9.0, 12.0, 25.0, 23.0, 15.0, 20.0, 16.0, 49.0, 32.0, 37.0, 52.0, 37.0, 55.0, 50.0, 52.0, 57.0, 51.0, 42.0, 45.0, 56.0, 41.0, 34.0, 26.0, 35.0, 24.0, 22.0, 13.0, 15.0, 9.0, 11.0, 8.0, 9.0, 0.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009870529174804688, -0.0009476840496063232, -0.0009083151817321777, -0.0008689463138580322, -0.0008295774459838867, -0.0007902085781097412, -0.0007508397102355957, -0.0007114708423614502, -0.0006721019744873047, -0.0006327331066131592, -0.0005933642387390137, -0.0005539953708648682, -0.0005146265029907227, -0.00047525763511657715, -0.00043588876724243164, -0.00039651989936828613, -0.0003571510314941406, -0.0003177821636199951, -0.0002784132957458496, -0.0002390444278717041, -0.0001996755599975586, -0.00016030669212341309, -0.00012093782424926758, -8.156895637512207e-05, -4.220008850097656e-05, -2.8312206268310547e-06, 3.653764724731445e-05, 7.590651512145996e-05, 0.00011527538299560547, 0.00015464425086975098, 0.00019401311874389648, 0.000233381986618042, 0.0002727508544921875, 0.000312119722366333, 0.0003514885902404785, 0.000390857458114624, 0.00043022632598876953, 0.00046959519386291504, 0.0005089640617370605, 0.0005483329296112061, 0.0005877017974853516, 0.0006270706653594971, 0.0006664395332336426, 0.0007058084011077881, 0.0007451772689819336, 0.0007845461368560791, 0.0008239150047302246, 0.0008632838726043701, 0.0009026527404785156, 0.0009420216083526611, 0.0009813904762268066, 0.0010207593441009521, 0.0010601282119750977, 0.0010994970798492432, 0.0011388659477233887, 0.0011782348155975342, 0.0012176036834716797, 0.0012569725513458252, 0.0012963414192199707, 0.0013357102870941162, 0.0013750791549682617, 0.0014144480228424072, 0.0014538168907165527, 0.0014931857585906982, 0.0015325546264648438]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 9.0, 8.0, 13.0, 26.0, 32.0, 67.0, 103.0, 142.0, 218.0, 318.0, 519.0, 870.0, 1643.0, 2931.0, 5331.0, 9574.0, 17309.0, 29472.0, 48288.0, 73254.0, 100597.0, 125263.0, 138097.0, 134072.0, 114911.0, 89105.0, 61961.0, 39725.0, 23716.0, 13678.0, 7547.0, 4192.0, 2307.0, 1260.0, 750.0, 446.0, 292.0, 155.0, 113.0, 86.0, 49.0, 37.0, 26.0, 16.0, 11.0, 7.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-14.1484375, -13.729736328125, -13.31103515625, -12.892333984375, -12.4736328125, -12.054931640625, -11.63623046875, -11.217529296875, -10.798828125, -10.380126953125, -9.96142578125, -9.542724609375, -9.1240234375, -8.705322265625, -8.28662109375, -7.867919921875, -7.44921875, -7.030517578125, -6.61181640625, -6.193115234375, -5.7744140625, -5.355712890625, -4.93701171875, -4.518310546875, -4.099609375, -3.680908203125, -3.26220703125, -2.843505859375, -2.4248046875, -2.006103515625, -1.58740234375, -1.168701171875, -0.75, -0.331298828125, 0.08740234375, 0.506103515625, 0.9248046875, 1.343505859375, 1.76220703125, 2.180908203125, 2.599609375, 3.018310546875, 3.43701171875, 3.855712890625, 4.2744140625, 4.693115234375, 5.11181640625, 5.530517578125, 5.94921875, 6.367919921875, 6.78662109375, 7.205322265625, 7.6240234375, 8.042724609375, 8.46142578125, 8.880126953125, 9.298828125, 9.717529296875, 10.13623046875, 10.554931640625, 10.9736328125, 11.392333984375, 11.81103515625, 12.229736328125, 12.6484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 3.0, 6.0, 9.0, 11.0, 10.0, 11.0, 22.0, 17.0, 15.0, 27.0, 27.0, 38.0, 36.0, 49.0, 42.0, 50.0, 50.0, 48.0, 61.0, 41.0, 71.0, 58.0, 32.0, 40.0, 36.0, 37.0, 32.0, 20.0, 16.0, 17.0, 13.0, 9.0, 7.0, 4.0, 5.0, 3.0, 5.0, 6.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.171875, -5.00262451171875, -4.8333740234375, -4.66412353515625, -4.494873046875, -4.32562255859375, -4.1563720703125, -3.98712158203125, -3.81787109375, -3.64862060546875, -3.4793701171875, -3.31011962890625, -3.140869140625, -2.97161865234375, -2.8023681640625, -2.63311767578125, -2.4638671875, -2.29461669921875, -2.1253662109375, -1.95611572265625, -1.786865234375, -1.61761474609375, -1.4483642578125, -1.27911376953125, -1.10986328125, -0.94061279296875, -0.7713623046875, -0.60211181640625, -0.432861328125, -0.26361083984375, -0.0943603515625, 0.07489013671875, 0.244140625, 0.41339111328125, 0.5826416015625, 0.75189208984375, 0.921142578125, 1.09039306640625, 1.2596435546875, 1.42889404296875, 1.59814453125, 1.76739501953125, 1.9366455078125, 2.10589599609375, 2.275146484375, 2.44439697265625, 2.6136474609375, 2.78289794921875, 2.9521484375, 3.12139892578125, 3.2906494140625, 3.45989990234375, 3.629150390625, 3.79840087890625, 3.9676513671875, 4.13690185546875, 4.30615234375, 4.47540283203125, 4.6446533203125, 4.81390380859375, 4.983154296875, 5.15240478515625, 5.3216552734375, 5.49090576171875, 5.66015625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 6.0, 6.0, 10.0, 8.0, 8.0, 14.0, 22.0, 15.0, 27.0, 29.0, 22.0, 19.0, 38.0, 36.0, 40.0, 38.0, 33.0, 46.0, 47.0, 40.0, 40.0, 48.0, 34.0, 40.0, 36.0, 39.0, 39.0, 36.0, 19.0, 26.0, 15.0, 24.0, 14.0, 19.0, 15.0, 9.0, 6.0, 5.0, 8.0, 5.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-31.360553741455078, -30.456148147583008, -29.551740646362305, -28.647335052490234, -27.742929458618164, -26.838523864746094, -25.93411636352539, -25.02971076965332, -24.12530517578125, -23.22089958190918, -22.316492080688477, -21.412086486816406, -20.507680892944336, -19.603275299072266, -18.698867797851562, -17.794462203979492, -16.89005470275879, -15.985648155212402, -15.081242561340332, -14.176836013793945, -13.272430419921875, -12.368023872375488, -11.463617324829102, -10.559211730957031, -9.654805183410645, -8.750398635864258, -7.8459930419921875, -6.941586494445801, -6.037180423736572, -5.132774353027344, -4.228367805480957, -3.3239617347717285, -2.419557571411133, -1.5151513814926147, -0.6107451915740967, 0.29366111755371094, 1.1980671882629395, 2.102473258972168, 3.0068798065185547, 3.911285877227783, 4.815691947937012, 5.72009801864624, 6.624504089355469, 7.5289106369018555, 8.433317184448242, 9.337722778320312, 10.2421293258667, 11.146535873413086, 12.050941467285156, 12.955348014831543, 13.859753608703613, 14.76416015625, 15.66856575012207, 16.57297134399414, 17.477378845214844, 18.381784439086914, 19.286190032958984, 20.190595626831055, 21.095003128051758, 21.999408721923828, 22.9038143157959, 23.80821990966797, 24.712627410888672, 25.617033004760742, 26.521440505981445]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 10.0, 3.0, 7.0, 8.0, 7.0, 13.0, 16.0, 14.0, 17.0, 31.0, 19.0, 28.0, 25.0, 33.0, 31.0, 44.0, 29.0, 38.0, 29.0, 45.0, 40.0, 34.0, 37.0, 35.0, 29.0, 29.0, 31.0, 32.0, 28.0, 27.0, 35.0, 23.0, 18.0, 25.0, 15.0, 18.0, 13.0, 14.0, 22.0, 10.0, 4.0, 7.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.366943359375, -31.360740661621094, -30.354537963867188, -29.34833526611328, -28.342132568359375, -27.33592987060547, -26.329727172851562, -25.323524475097656, -24.31732177734375, -23.311119079589844, -22.304916381835938, -21.29871368408203, -20.292510986328125, -19.28630828857422, -18.280105590820312, -17.273902893066406, -16.267702102661133, -15.261499404907227, -14.25529670715332, -13.249094009399414, -12.242891311645508, -11.236688613891602, -10.230486869812012, -9.224284172058105, -8.2180814743042, -7.211878776550293, -6.205676078796387, -5.199473857879639, -4.193271160125732, -3.187068462371826, -2.180866241455078, -1.1746635437011719, -0.16846084594726562, 0.8377417325973511, 1.8439443111419678, 2.850146770477295, 3.856349468231201, 4.862552165985107, 5.8687543869018555, 6.874957084655762, 7.881159782409668, 8.887362480163574, 9.89356517791748, 10.89976692199707, 11.905969619750977, 12.912172317504883, 13.918375015258789, 14.924577713012695, 15.930780410766602, 16.936983108520508, 17.943185806274414, 18.94938850402832, 19.955591201782227, 20.961793899536133, 21.967994689941406, 22.974197387695312, 23.98040008544922, 24.986602783203125, 25.99280548095703, 26.999008178710938, 28.005210876464844, 29.01141357421875, 30.017616271972656, 31.023818969726562, 32.03002166748047]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 4.0, 5.0, 13.0, 25.0, 54.0, 70.0, 130.0, 225.0, 382.0, 629.0, 1130.0, 1879.0, 3054.0, 4963.0, 7859.0, 12500.0, 19175.0, 29254.0, 43055.0, 61719.0, 88056.0, 119850.0, 157499.0, 199586.0, 245223.0, 287276.0, 322134.0, 344399.0, 352326.0, 341685.0, 317450.0, 280198.0, 238100.0, 193598.0, 151161.0, 113562.0, 82726.0, 58390.0, 40613.0, 26978.0, 17633.0, 11365.0, 7194.0, 4412.0, 2787.0, 1599.0, 979.0, 576.0, 338.0, 191.0, 117.0, 79.0, 46.0, 18.0, 10.0, 12.0, 4.0, 2.0, 0.0, 1.0], "bins": [-19.609375, -19.00439453125, -18.3994140625, -17.79443359375, -17.189453125, -16.58447265625, -15.9794921875, -15.37451171875, -14.76953125, -14.16455078125, -13.5595703125, -12.95458984375, -12.349609375, -11.74462890625, -11.1396484375, -10.53466796875, -9.9296875, -9.32470703125, -8.7197265625, -8.11474609375, -7.509765625, -6.90478515625, -6.2998046875, -5.69482421875, -5.08984375, -4.48486328125, -3.8798828125, -3.27490234375, -2.669921875, -2.06494140625, -1.4599609375, -0.85498046875, -0.25, 0.35498046875, 0.9599609375, 1.56494140625, 2.169921875, 2.77490234375, 3.3798828125, 3.98486328125, 4.58984375, 5.19482421875, 5.7998046875, 6.40478515625, 7.009765625, 7.61474609375, 8.2197265625, 8.82470703125, 9.4296875, 10.03466796875, 10.6396484375, 11.24462890625, 11.849609375, 12.45458984375, 13.0595703125, 13.66455078125, 14.26953125, 14.87451171875, 15.4794921875, 16.08447265625, 16.689453125, 17.29443359375, 17.8994140625, 18.50439453125, 19.109375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 5.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 8.0, 3.0, 7.0, 6.0, 12.0, 15.0, 11.0, 14.0, 21.0, 23.0, 25.0, 30.0, 24.0, 32.0, 31.0, 39.0, 31.0, 42.0, 33.0, 41.0, 39.0, 34.0, 36.0, 33.0, 28.0, 35.0, 28.0, 34.0, 29.0, 29.0, 29.0, 21.0, 21.0, 26.0, 13.0, 22.0, 8.0, 16.0, 19.0, 12.0, 5.0, 5.0, 10.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.890625, -28.96533203125, -28.0400390625, -27.11474609375, -26.189453125, -25.26416015625, -24.3388671875, -23.41357421875, -22.48828125, -21.56298828125, -20.6376953125, -19.71240234375, -18.787109375, -17.86181640625, -16.9365234375, -16.01123046875, -15.0859375, -14.16064453125, -13.2353515625, -12.31005859375, -11.384765625, -10.45947265625, -9.5341796875, -8.60888671875, -7.68359375, -6.75830078125, -5.8330078125, -4.90771484375, -3.982421875, -3.05712890625, -2.1318359375, -1.20654296875, -0.28125, 0.64404296875, 1.5693359375, 2.49462890625, 3.419921875, 4.34521484375, 5.2705078125, 6.19580078125, 7.12109375, 8.04638671875, 8.9716796875, 9.89697265625, 10.822265625, 11.74755859375, 12.6728515625, 13.59814453125, 14.5234375, 15.44873046875, 16.3740234375, 17.29931640625, 18.224609375, 19.14990234375, 20.0751953125, 21.00048828125, 21.92578125, 22.85107421875, 23.7763671875, 24.70166015625, 25.626953125, 26.55224609375, 27.4775390625, 28.40283203125, 29.328125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 1.0, 4.0, 19.0, 25.0, 30.0, 63.0, 108.0, 213.0, 323.0, 652.0, 1078.0, 1775.0, 2996.0, 4799.0, 7789.0, 12119.0, 18539.0, 28270.0, 40800.0, 58281.0, 80828.0, 109984.0, 141509.0, 178531.0, 216736.0, 253286.0, 286204.0, 310522.0, 325027.0, 324355.0, 312154.0, 289187.0, 257978.0, 221069.0, 182704.0, 145413.0, 111827.0, 83991.0, 60233.0, 42811.0, 29035.0, 19502.0, 12756.0, 8069.0, 4948.0, 3139.0, 1953.0, 1121.0, 660.0, 366.0, 251.0, 111.0, 67.0, 37.0, 23.0, 10.0, 9.0, 3.0, 1.0, 1.0, 1.0], "bins": [-19.4375, -18.8310546875, -18.224609375, -17.6181640625, -17.01171875, -16.4052734375, -15.798828125, -15.1923828125, -14.5859375, -13.9794921875, -13.373046875, -12.7666015625, -12.16015625, -11.5537109375, -10.947265625, -10.3408203125, -9.734375, -9.1279296875, -8.521484375, -7.9150390625, -7.30859375, -6.7021484375, -6.095703125, -5.4892578125, -4.8828125, -4.2763671875, -3.669921875, -3.0634765625, -2.45703125, -1.8505859375, -1.244140625, -0.6376953125, -0.03125, 0.5751953125, 1.181640625, 1.7880859375, 2.39453125, 3.0009765625, 3.607421875, 4.2138671875, 4.8203125, 5.4267578125, 6.033203125, 6.6396484375, 7.24609375, 7.8525390625, 8.458984375, 9.0654296875, 9.671875, 10.2783203125, 10.884765625, 11.4912109375, 12.09765625, 12.7041015625, 13.310546875, 13.9169921875, 14.5234375, 15.1298828125, 15.736328125, 16.3427734375, 16.94921875, 17.5556640625, 18.162109375, 18.7685546875, 19.375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 3.0, 12.0, 12.0, 12.0, 16.0, 35.0, 39.0, 56.0, 49.0, 76.0, 85.0, 92.0, 90.0, 133.0, 156.0, 126.0, 163.0, 160.0, 172.0, 181.0, 201.0, 171.0, 171.0, 190.0, 202.0, 172.0, 184.0, 147.0, 153.0, 114.0, 101.0, 89.0, 91.0, 88.0, 57.0, 43.0, 39.0, 38.0, 34.0, 25.0, 30.0, 16.0, 14.0, 8.0, 4.0, 6.0, 4.0, 7.0, 2.0], "bins": [-15.53125, -15.111328125, -14.69140625, -14.271484375, -13.8515625, -13.431640625, -13.01171875, -12.591796875, -12.171875, -11.751953125, -11.33203125, -10.912109375, -10.4921875, -10.072265625, -9.65234375, -9.232421875, -8.8125, -8.392578125, -7.97265625, -7.552734375, -7.1328125, -6.712890625, -6.29296875, -5.873046875, -5.453125, -5.033203125, -4.61328125, -4.193359375, -3.7734375, -3.353515625, -2.93359375, -2.513671875, -2.09375, -1.673828125, -1.25390625, -0.833984375, -0.4140625, 0.005859375, 0.42578125, 0.845703125, 1.265625, 1.685546875, 2.10546875, 2.525390625, 2.9453125, 3.365234375, 3.78515625, 4.205078125, 4.625, 5.044921875, 5.46484375, 5.884765625, 6.3046875, 6.724609375, 7.14453125, 7.564453125, 7.984375, 8.404296875, 8.82421875, 9.244140625, 9.6640625, 10.083984375, 10.50390625, 10.923828125, 11.34375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 5.0, 6.0, 8.0, 15.0, 9.0, 23.0, 12.0, 18.0, 21.0, 28.0, 33.0, 30.0, 35.0, 41.0, 42.0, 30.0, 45.0, 42.0, 49.0, 46.0, 55.0, 48.0, 45.0, 33.0, 43.0, 33.0, 41.0, 27.0, 21.0, 19.0, 19.0, 17.0, 15.0, 8.0, 8.0, 5.0, 5.0, 5.0, 5.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-38.88132858276367, -37.82698440551758, -36.77263641357422, -35.718292236328125, -34.66394805908203, -33.60960388183594, -32.55525588989258, -31.500911712646484, -30.446565628051758, -29.39221954345703, -28.337875366210938, -27.28352928161621, -26.229183197021484, -25.17483901977539, -24.120492935180664, -23.066146850585938, -22.011802673339844, -20.957456588745117, -19.903112411499023, -18.848766326904297, -17.794422149658203, -16.740076065063477, -15.68572998046875, -14.63138484954834, -13.57703971862793, -12.52269458770752, -11.46834945678711, -10.414003372192383, -9.359658241271973, -8.305313110351562, -7.250967502593994, -6.196621894836426, -5.14227294921875, -4.08792781829834, -3.0335822105407715, -1.9792368412017822, -0.924891471862793, 0.1294536590576172, 1.1837992668151855, 2.238144874572754, 3.292490005493164, 4.346835136413574, 5.401180744171143, 6.455526351928711, 7.509871482849121, 8.564216613769531, 9.618562698364258, 10.672907829284668, 11.727252960205078, 12.781598091125488, 13.835943222045898, 14.890289306640625, 15.944634437561035, 16.998979568481445, 18.053325653076172, 19.107669830322266, 20.162015914916992, 21.21636199951172, 22.270706176757812, 23.32505226135254, 24.379398345947266, 25.43374252319336, 26.488088607788086, 27.542434692382812, 28.596778869628906]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 4.0, 7.0, 6.0, 7.0, 5.0, 10.0, 10.0, 13.0, 15.0, 14.0, 12.0, 18.0, 23.0, 24.0, 21.0, 33.0, 34.0, 24.0, 25.0, 34.0, 41.0, 41.0, 35.0, 37.0, 42.0, 39.0, 37.0, 31.0, 31.0, 36.0, 37.0, 32.0, 27.0, 16.0, 18.0, 22.0, 18.0, 19.0, 15.0, 18.0, 15.0, 17.0, 15.0, 8.0, 9.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-34.670753479003906, -33.59934616088867, -32.52793884277344, -31.45652961730957, -30.385122299194336, -29.3137149810791, -28.242305755615234, -27.1708984375, -26.099491119384766, -25.02808380126953, -23.956676483154297, -22.88526725769043, -21.813859939575195, -20.74245262145996, -19.671043395996094, -18.59963607788086, -17.528228759765625, -16.45682144165039, -15.38541316986084, -14.314004898071289, -13.242597579956055, -12.17119026184082, -11.09978199005127, -10.028373718261719, -8.956966400146484, -7.885558605194092, -6.814150810241699, -5.742743015289307, -4.671335220336914, -3.5999274253845215, -2.528519630432129, -1.4571118354797363, -0.3857002258300781, 0.6857075691223145, 1.757115364074707, 2.8285231590270996, 3.899930953979492, 4.971338748931885, 6.042746543884277, 7.11415433883667, 8.185562133789062, 9.256969451904297, 10.328377723693848, 11.399785995483398, 12.471193313598633, 13.542600631713867, 14.614008903503418, 15.685417175292969, 16.756824493408203, 17.828231811523438, 18.899639129638672, 19.97104835510254, 21.042455673217773, 22.113862991333008, 23.185272216796875, 24.25667953491211, 25.328086853027344, 26.399494171142578, 27.470901489257812, 28.54231071472168, 29.613718032836914, 30.68512535095215, 31.756534576416016, 32.82794189453125, 33.899349212646484]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 5.0, 11.0, 5.0, 8.0, 16.0, 12.0, 19.0, 28.0, 27.0, 46.0, 71.0, 105.0, 103.0, 197.0, 282.0, 374.0, 617.0, 1086.0, 1784.0, 3177.0, 6042.0, 12048.0, 25329.0, 54502.0, 111674.0, 197383.0, 244639.0, 187074.0, 104331.0, 49718.0, 23697.0, 11062.0, 5519.0, 2974.0, 1606.0, 989.0, 634.0, 382.0, 286.0, 204.0, 124.0, 111.0, 72.0, 51.0, 36.0, 34.0, 16.0, 16.0, 14.0, 11.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.265625, -9.9169921875, -9.568359375, -9.2197265625, -8.87109375, -8.5224609375, -8.173828125, -7.8251953125, -7.4765625, -7.1279296875, -6.779296875, -6.4306640625, -6.08203125, -5.7333984375, -5.384765625, -5.0361328125, -4.6875, -4.3388671875, -3.990234375, -3.6416015625, -3.29296875, -2.9443359375, -2.595703125, -2.2470703125, -1.8984375, -1.5498046875, -1.201171875, -0.8525390625, -0.50390625, -0.1552734375, 0.193359375, 0.5419921875, 0.890625, 1.2392578125, 1.587890625, 1.9365234375, 2.28515625, 2.6337890625, 2.982421875, 3.3310546875, 3.6796875, 4.0283203125, 4.376953125, 4.7255859375, 5.07421875, 5.4228515625, 5.771484375, 6.1201171875, 6.46875, 6.8173828125, 7.166015625, 7.5146484375, 7.86328125, 8.2119140625, 8.560546875, 8.9091796875, 9.2578125, 9.6064453125, 9.955078125, 10.3037109375, 10.65234375, 11.0009765625, 11.349609375, 11.6982421875, 12.046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 6.0, 7.0, 6.0, 9.0, 15.0, 8.0, 16.0, 13.0, 15.0, 17.0, 23.0, 23.0, 20.0, 36.0, 34.0, 23.0, 25.0, 34.0, 44.0, 39.0, 34.0, 39.0, 40.0, 39.0, 35.0, 32.0, 31.0, 38.0, 35.0, 33.0, 27.0, 17.0, 17.0, 21.0, 18.0, 18.0, 15.0, 18.0, 15.0, 17.0, 16.0, 7.0, 9.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-34.375, -33.30517578125, -32.2353515625, -31.16552734375, -30.095703125, -29.02587890625, -27.9560546875, -26.88623046875, -25.81640625, -24.74658203125, -23.6767578125, -22.60693359375, -21.537109375, -20.46728515625, -19.3974609375, -18.32763671875, -17.2578125, -16.18798828125, -15.1181640625, -14.04833984375, -12.978515625, -11.90869140625, -10.8388671875, -9.76904296875, -8.69921875, -7.62939453125, -6.5595703125, -5.48974609375, -4.419921875, -3.35009765625, -2.2802734375, -1.21044921875, -0.140625, 0.92919921875, 1.9990234375, 3.06884765625, 4.138671875, 5.20849609375, 6.2783203125, 7.34814453125, 8.41796875, 9.48779296875, 10.5576171875, 11.62744140625, 12.697265625, 13.76708984375, 14.8369140625, 15.90673828125, 16.9765625, 18.04638671875, 19.1162109375, 20.18603515625, 21.255859375, 22.32568359375, 23.3955078125, 24.46533203125, 25.53515625, 26.60498046875, 27.6748046875, 28.74462890625, 29.814453125, 30.88427734375, 31.9541015625, 33.02392578125, 34.09375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 7.0, 12.0, 15.0, 17.0, 22.0, 24.0, 35.0, 32.0, 50.0, 84.0, 104.0, 140.0, 185.0, 272.0, 339.0, 521.0, 768.0, 1057.0, 1745.0, 2785.0, 4860.0, 8583.0, 16334.0, 33626.0, 73573.0, 165705.0, 288017.0, 235352.0, 112219.0, 49894.0, 23451.0, 11844.0, 6509.0, 3704.0, 2224.0, 1417.0, 885.0, 605.0, 417.0, 293.0, 205.0, 156.0, 110.0, 71.0, 58.0, 68.0, 44.0, 22.0, 28.0, 25.0, 17.0, 11.0, 8.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0], "bins": [-10.6875, -10.3509521484375, -10.014404296875, -9.6778564453125, -9.34130859375, -9.0047607421875, -8.668212890625, -8.3316650390625, -7.9951171875, -7.6585693359375, -7.322021484375, -6.9854736328125, -6.64892578125, -6.3123779296875, -5.975830078125, -5.6392822265625, -5.302734375, -4.9661865234375, -4.629638671875, -4.2930908203125, -3.95654296875, -3.6199951171875, -3.283447265625, -2.9468994140625, -2.6103515625, -2.2738037109375, -1.937255859375, -1.6007080078125, -1.26416015625, -0.9276123046875, -0.591064453125, -0.2545166015625, 0.08203125, 0.4185791015625, 0.755126953125, 1.0916748046875, 1.42822265625, 1.7647705078125, 2.101318359375, 2.4378662109375, 2.7744140625, 3.1109619140625, 3.447509765625, 3.7840576171875, 4.12060546875, 4.4571533203125, 4.793701171875, 5.1302490234375, 5.466796875, 5.8033447265625, 6.139892578125, 6.4764404296875, 6.81298828125, 7.1495361328125, 7.486083984375, 7.8226318359375, 8.1591796875, 8.4957275390625, 8.832275390625, 9.1688232421875, 9.50537109375, 9.8419189453125, 10.178466796875, 10.5150146484375, 10.8515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 10.0, 5.0, 12.0, 8.0, 14.0, 23.0, 15.0, 26.0, 23.0, 20.0, 25.0, 28.0, 40.0, 19.0, 39.0, 35.0, 36.0, 37.0, 44.0, 40.0, 38.0, 45.0, 33.0, 41.0, 32.0, 39.0, 41.0, 37.0, 30.0, 26.0, 26.0, 24.0, 10.0, 15.0, 8.0, 16.0, 13.0, 12.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0], "bins": [-26.90625, -26.113037109375, -25.31982421875, -24.526611328125, -23.7333984375, -22.940185546875, -22.14697265625, -21.353759765625, -20.560546875, -19.767333984375, -18.97412109375, -18.180908203125, -17.3876953125, -16.594482421875, -15.80126953125, -15.008056640625, -14.21484375, -13.421630859375, -12.62841796875, -11.835205078125, -11.0419921875, -10.248779296875, -9.45556640625, -8.662353515625, -7.869140625, -7.075927734375, -6.28271484375, -5.489501953125, -4.6962890625, -3.903076171875, -3.10986328125, -2.316650390625, -1.5234375, -0.730224609375, 0.06298828125, 0.856201171875, 1.6494140625, 2.442626953125, 3.23583984375, 4.029052734375, 4.822265625, 5.615478515625, 6.40869140625, 7.201904296875, 7.9951171875, 8.788330078125, 9.58154296875, 10.374755859375, 11.16796875, 11.961181640625, 12.75439453125, 13.547607421875, 14.3408203125, 15.134033203125, 15.92724609375, 16.720458984375, 17.513671875, 18.306884765625, 19.10009765625, 19.893310546875, 20.6865234375, 21.479736328125, 22.27294921875, 23.066162109375, 23.859375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 9.0, 2.0, 6.0, 3.0, 4.0, 7.0, 6.0, 8.0, 13.0, 17.0, 21.0, 23.0, 43.0, 70.0, 85.0, 98.0, 165.0, 270.0, 435.0, 722.0, 1256.0, 2521.0, 5658.0, 15867.0, 57273.0, 390835.0, 475990.0, 67233.0, 17673.0, 6070.0, 2685.0, 1403.0, 736.0, 452.0, 285.0, 181.0, 113.0, 93.0, 56.0, 48.0, 32.0, 22.0, 16.0, 9.0, 14.0, 9.0, 4.0, 6.0, 3.0, 3.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-11.4140625, -11.0687255859375, -10.723388671875, -10.3780517578125, -10.03271484375, -9.6873779296875, -9.342041015625, -8.9967041015625, -8.6513671875, -8.3060302734375, -7.960693359375, -7.6153564453125, -7.27001953125, -6.9246826171875, -6.579345703125, -6.2340087890625, -5.888671875, -5.5433349609375, -5.197998046875, -4.8526611328125, -4.50732421875, -4.1619873046875, -3.816650390625, -3.4713134765625, -3.1259765625, -2.7806396484375, -2.435302734375, -2.0899658203125, -1.74462890625, -1.3992919921875, -1.053955078125, -0.7086181640625, -0.36328125, -0.0179443359375, 0.327392578125, 0.6727294921875, 1.01806640625, 1.3634033203125, 1.708740234375, 2.0540771484375, 2.3994140625, 2.7447509765625, 3.090087890625, 3.4354248046875, 3.78076171875, 4.1260986328125, 4.471435546875, 4.8167724609375, 5.162109375, 5.5074462890625, 5.852783203125, 6.1981201171875, 6.54345703125, 6.8887939453125, 7.234130859375, 7.5794677734375, 7.9248046875, 8.2701416015625, 8.615478515625, 8.9608154296875, 9.30615234375, 9.6514892578125, 9.996826171875, 10.3421630859375, 10.6875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 8.0, 5.0, 13.0, 17.0, 26.0, 21.0, 31.0, 38.0, 52.0, 55.0, 75.0, 40.0, 65.0, 74.0, 59.0, 69.0, 54.0, 51.0, 42.0, 34.0, 27.0, 33.0, 24.0, 21.0, 14.0, 10.0, 7.0, 4.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00029754638671875, -0.000288400799036026, -0.000279255211353302, -0.000270109623670578, -0.000260964035987854, -0.00025181844830513, -0.000242672860622406, -0.000233527272939682, -0.000224381685256958, -0.000215236097574234, -0.00020609050989151, -0.000196944922208786, -0.000187799334526062, -0.000178653746843338, -0.00016950815916061401, -0.00016036257147789001, -0.00015121698379516602, -0.00014207139611244202, -0.00013292580842971802, -0.00012378022074699402, -0.00011463463306427002, -0.00010548904538154602, -9.634345769882202e-05, -8.719787001609802e-05, -7.805228233337402e-05, -6.890669465065002e-05, -5.9761106967926025e-05, -5.0615519285202026e-05, -4.146993160247803e-05, -3.232434391975403e-05, -2.317875623703003e-05, -1.403316855430603e-05, -4.887580871582031e-06, 4.258006811141968e-06, 1.3403594493865967e-05, 2.2549182176589966e-05, 3.1694769859313965e-05, 4.0840357542037964e-05, 4.998594522476196e-05, 5.913153290748596e-05, 6.827712059020996e-05, 7.742270827293396e-05, 8.656829595565796e-05, 9.571388363838196e-05, 0.00010485947132110596, 0.00011400505900382996, 0.00012315064668655396, 0.00013229623436927795, 0.00014144182205200195, 0.00015058740973472595, 0.00015973299741744995, 0.00016887858510017395, 0.00017802417278289795, 0.00018716976046562195, 0.00019631534814834595, 0.00020546093583106995, 0.00021460652351379395, 0.00022375211119651794, 0.00023289769887924194, 0.00024204328656196594, 0.00025118887424468994, 0.00026033446192741394, 0.00026948004961013794, 0.00027862563729286194, 0.00028777122497558594]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 3.0, 12.0, 23.0, 24.0, 39.0, 55.0, 80.0, 112.0, 162.0, 234.0, 320.0, 510.0, 814.0, 1171.0, 1954.0, 3473.0, 6826.0, 14487.0, 34403.0, 87902.0, 213174.0, 325762.0, 208808.0, 85017.0, 33480.0, 14333.0, 6516.0, 3442.0, 1904.0, 1154.0, 739.0, 519.0, 352.0, 229.0, 177.0, 99.0, 80.0, 43.0, 34.0, 26.0, 22.0, 12.0, 8.0, 4.0, 8.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-11.65625, -11.3277587890625, -10.999267578125, -10.6707763671875, -10.34228515625, -10.0137939453125, -9.685302734375, -9.3568115234375, -9.0283203125, -8.6998291015625, -8.371337890625, -8.0428466796875, -7.71435546875, -7.3858642578125, -7.057373046875, -6.7288818359375, -6.400390625, -6.0718994140625, -5.743408203125, -5.4149169921875, -5.08642578125, -4.7579345703125, -4.429443359375, -4.1009521484375, -3.7724609375, -3.4439697265625, -3.115478515625, -2.7869873046875, -2.45849609375, -2.1300048828125, -1.801513671875, -1.4730224609375, -1.14453125, -0.8160400390625, -0.487548828125, -0.1590576171875, 0.16943359375, 0.4979248046875, 0.826416015625, 1.1549072265625, 1.4833984375, 1.8118896484375, 2.140380859375, 2.4688720703125, 2.79736328125, 3.1258544921875, 3.454345703125, 3.7828369140625, 4.111328125, 4.4398193359375, 4.768310546875, 5.0968017578125, 5.42529296875, 5.7537841796875, 6.082275390625, 6.4107666015625, 6.7392578125, 7.0677490234375, 7.396240234375, 7.7247314453125, 8.05322265625, 8.3817138671875, 8.710205078125, 9.0386962890625, 9.3671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 8.0, 5.0, 4.0, 10.0, 15.0, 16.0, 22.0, 17.0, 39.0, 49.0, 67.0, 85.0, 121.0, 107.0, 103.0, 85.0, 61.0, 41.0, 47.0, 19.0, 20.0, 12.0, 9.0, 9.0, 4.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.73046875, -4.596435546875, -4.46240234375, -4.328369140625, -4.1943359375, -4.060302734375, -3.92626953125, -3.792236328125, -3.658203125, -3.524169921875, -3.39013671875, -3.256103515625, -3.1220703125, -2.988037109375, -2.85400390625, -2.719970703125, -2.5859375, -2.451904296875, -2.31787109375, -2.183837890625, -2.0498046875, -1.915771484375, -1.78173828125, -1.647705078125, -1.513671875, -1.379638671875, -1.24560546875, -1.111572265625, -0.9775390625, -0.843505859375, -0.70947265625, -0.575439453125, -0.44140625, -0.307373046875, -0.17333984375, -0.039306640625, 0.0947265625, 0.228759765625, 0.36279296875, 0.496826171875, 0.630859375, 0.764892578125, 0.89892578125, 1.032958984375, 1.1669921875, 1.301025390625, 1.43505859375, 1.569091796875, 1.703125, 1.837158203125, 1.97119140625, 2.105224609375, 2.2392578125, 2.373291015625, 2.50732421875, 2.641357421875, 2.775390625, 2.909423828125, 3.04345703125, 3.177490234375, 3.3115234375, 3.445556640625, 3.57958984375, 3.713623046875, 3.84765625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 4.0, 5.0, 13.0, 12.0, 16.0, 13.0, 19.0, 23.0, 23.0, 23.0, 34.0, 41.0, 44.0, 29.0, 45.0, 43.0, 39.0, 51.0, 43.0, 48.0, 47.0, 47.0, 40.0, 38.0, 38.0, 36.0, 24.0, 34.0, 22.0, 21.0, 13.0, 17.0, 8.0, 9.0, 6.0, 2.0, 6.0, 6.0, 6.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-39.281368255615234, -38.222625732421875, -37.16388702392578, -36.10514831542969, -35.04640579223633, -33.98766326904297, -32.928924560546875, -31.87018394470215, -30.811443328857422, -29.752702713012695, -28.69396209716797, -27.635221481323242, -26.576480865478516, -25.51774024963379, -24.458999633789062, -23.400259017944336, -22.34151840209961, -21.282777786254883, -20.224037170410156, -19.16529655456543, -18.106555938720703, -17.047815322875977, -15.98907470703125, -14.930334091186523, -13.871593475341797, -12.81285285949707, -11.754112243652344, -10.695371627807617, -9.63663101196289, -8.577890396118164, -7.5191497802734375, -6.460409164428711, -5.401668548583984, -4.342927932739258, -3.2841873168945312, -2.2254467010498047, -1.1667060852050781, -0.10796546936035156, 0.950775146484375, 2.0095157623291016, 3.068256378173828, 4.126996994018555, 5.185737609863281, 6.244478225708008, 7.303218841552734, 8.361959457397461, 9.420700073242188, 10.479440689086914, 11.53818130493164, 12.596921920776367, 13.655662536621094, 14.71440315246582, 15.773143768310547, 16.831884384155273, 17.890625, 18.949365615844727, 20.008106231689453, 21.06684684753418, 22.125587463378906, 23.184328079223633, 24.24306869506836, 25.301809310913086, 26.360549926757812, 27.41929054260254, 28.478031158447266]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 8.0, 4.0, 9.0, 5.0, 15.0, 9.0, 16.0, 14.0, 14.0, 16.0, 19.0, 29.0, 21.0, 26.0, 31.0, 35.0, 22.0, 33.0, 30.0, 46.0, 39.0, 36.0, 37.0, 41.0, 29.0, 36.0, 37.0, 28.0, 46.0, 27.0, 27.0, 18.0, 18.0, 18.0, 18.0, 19.0, 18.0, 18.0, 17.0, 14.0, 21.0, 7.0, 6.0, 7.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-34.208221435546875, -33.152442932128906, -32.09666442871094, -31.04088592529297, -29.985107421875, -28.92932891845703, -27.873552322387695, -26.817773818969727, -25.761995315551758, -24.70621681213379, -23.65043830871582, -22.59465980529785, -21.538883209228516, -20.483104705810547, -19.427326202392578, -18.37154769897461, -17.31576919555664, -16.259990692138672, -15.204212188720703, -14.14843463897705, -13.092656135559082, -12.036877632141113, -10.981100082397461, -9.925321578979492, -8.869543075561523, -7.813764572143555, -6.757986545562744, -5.702208518981934, -4.646430015563965, -3.590651512145996, -2.5348734855651855, -1.479095458984375, -0.4233131408691406, 0.632465124130249, 1.6882433891296387, 2.7440216541290283, 3.799799919128418, 4.855578422546387, 5.911356449127197, 6.967134475708008, 8.022912979125977, 9.078691482543945, 10.134469985961914, 11.190247535705566, 12.246026039123535, 13.301804542541504, 14.357582092285156, 15.413360595703125, 16.469139099121094, 17.524917602539062, 18.58069610595703, 19.636474609375, 20.69225311279297, 21.748031616210938, 22.803808212280273, 23.859586715698242, 24.91536521911621, 25.97114372253418, 27.02692222595215, 28.082700729370117, 29.138477325439453, 30.194255828857422, 31.25003433227539, 32.30581283569336, 33.36159133911133]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 11.0, 19.0, 27.0, 40.0, 68.0, 145.0, 191.0, 299.0, 505.0, 810.0, 1343.0, 2000.0, 3086.0, 4709.0, 7181.0, 10364.0, 15014.0, 20369.0, 27517.0, 37032.0, 46177.0, 56106.0, 65925.0, 74100.0, 80820.0, 83589.0, 83040.0, 78993.0, 72491.0, 62822.0, 53254.0, 43006.0, 33588.0, 25091.0, 18557.0, 13334.0, 9268.0, 6113.0, 4195.0, 2729.0, 1757.0, 1093.0, 702.0, 403.0, 256.0, 157.0, 93.0, 85.0, 35.0, 24.0, 11.0, 8.0, 5.0, 3.0, 0.0, 2.0, 2.0], "bins": [-16.046875, -15.5582275390625, -15.069580078125, -14.5809326171875, -14.09228515625, -13.6036376953125, -13.114990234375, -12.6263427734375, -12.1376953125, -11.6490478515625, -11.160400390625, -10.6717529296875, -10.18310546875, -9.6944580078125, -9.205810546875, -8.7171630859375, -8.228515625, -7.7398681640625, -7.251220703125, -6.7625732421875, -6.27392578125, -5.7852783203125, -5.296630859375, -4.8079833984375, -4.3193359375, -3.8306884765625, -3.342041015625, -2.8533935546875, -2.36474609375, -1.8760986328125, -1.387451171875, -0.8988037109375, -0.41015625, 0.0784912109375, 0.567138671875, 1.0557861328125, 1.54443359375, 2.0330810546875, 2.521728515625, 3.0103759765625, 3.4990234375, 3.9876708984375, 4.476318359375, 4.9649658203125, 5.45361328125, 5.9422607421875, 6.430908203125, 6.9195556640625, 7.408203125, 7.8968505859375, 8.385498046875, 8.8741455078125, 9.36279296875, 9.8514404296875, 10.340087890625, 10.8287353515625, 11.3173828125, 11.8060302734375, 12.294677734375, 12.7833251953125, 13.27197265625, 13.7606201171875, 14.249267578125, 14.7379150390625, 15.2265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 8.0, 3.0, 9.0, 5.0, 19.0, 5.0, 18.0, 13.0, 15.0, 17.0, 24.0, 21.0, 25.0, 25.0, 31.0, 41.0, 18.0, 34.0, 32.0, 42.0, 40.0, 37.0, 41.0, 34.0, 32.0, 37.0, 33.0, 32.0, 43.0, 28.0, 25.0, 19.0, 18.0, 14.0, 21.0, 22.0, 12.0, 17.0, 20.0, 14.0, 19.0, 6.0, 8.0, 6.0, 1.0, 6.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.25, -32.2177734375, -31.185546875, -30.1533203125, -29.12109375, -28.0888671875, -27.056640625, -26.0244140625, -24.9921875, -23.9599609375, -22.927734375, -21.8955078125, -20.86328125, -19.8310546875, -18.798828125, -17.7666015625, -16.734375, -15.7021484375, -14.669921875, -13.6376953125, -12.60546875, -11.5732421875, -10.541015625, -9.5087890625, -8.4765625, -7.4443359375, -6.412109375, -5.3798828125, -4.34765625, -3.3154296875, -2.283203125, -1.2509765625, -0.21875, 0.8134765625, 1.845703125, 2.8779296875, 3.91015625, 4.9423828125, 5.974609375, 7.0068359375, 8.0390625, 9.0712890625, 10.103515625, 11.1357421875, 12.16796875, 13.2001953125, 14.232421875, 15.2646484375, 16.296875, 17.3291015625, 18.361328125, 19.3935546875, 20.42578125, 21.4580078125, 22.490234375, 23.5224609375, 24.5546875, 25.5869140625, 26.619140625, 27.6513671875, 28.68359375, 29.7158203125, 30.748046875, 31.7802734375, 32.8125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 12.0, 20.0, 39.0, 50.0, 68.0, 149.0, 227.0, 340.0, 579.0, 926.0, 1452.0, 2223.0, 3556.0, 5364.0, 8328.0, 12148.0, 17430.0, 24283.0, 33103.0, 43448.0, 55339.0, 66309.0, 77349.0, 85150.0, 89443.0, 88804.0, 84803.0, 76494.0, 65963.0, 54432.0, 42748.0, 32554.0, 23668.0, 17186.0, 11741.0, 8121.0, 5312.0, 3462.0, 2304.0, 1383.0, 828.0, 512.0, 337.0, 187.0, 140.0, 94.0, 68.0, 29.0, 19.0, 11.0, 5.0, 8.0, 2.0, 0.0, 2.0], "bins": [-18.078125, -17.5458984375, -17.013671875, -16.4814453125, -15.94921875, -15.4169921875, -14.884765625, -14.3525390625, -13.8203125, -13.2880859375, -12.755859375, -12.2236328125, -11.69140625, -11.1591796875, -10.626953125, -10.0947265625, -9.5625, -9.0302734375, -8.498046875, -7.9658203125, -7.43359375, -6.9013671875, -6.369140625, -5.8369140625, -5.3046875, -4.7724609375, -4.240234375, -3.7080078125, -3.17578125, -2.6435546875, -2.111328125, -1.5791015625, -1.046875, -0.5146484375, 0.017578125, 0.5498046875, 1.08203125, 1.6142578125, 2.146484375, 2.6787109375, 3.2109375, 3.7431640625, 4.275390625, 4.8076171875, 5.33984375, 5.8720703125, 6.404296875, 6.9365234375, 7.46875, 8.0009765625, 8.533203125, 9.0654296875, 9.59765625, 10.1298828125, 10.662109375, 11.1943359375, 11.7265625, 12.2587890625, 12.791015625, 13.3232421875, 13.85546875, 14.3876953125, 14.919921875, 15.4521484375, 15.984375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 1.0, 7.0, 8.0, 8.0, 10.0, 2.0, 7.0, 10.0, 16.0, 17.0, 20.0, 23.0, 14.0, 26.0, 31.0, 21.0, 29.0, 43.0, 38.0, 31.0, 43.0, 40.0, 38.0, 43.0, 36.0, 33.0, 32.0, 37.0, 40.0, 29.0, 35.0, 26.0, 27.0, 19.0, 27.0, 23.0, 16.0, 13.0, 8.0, 13.0, 17.0, 11.0, 9.0, 8.0, 2.0, 6.0, 7.0, 1.0, 1.0, 2.0, 2.0], "bins": [-26.296875, -25.57666015625, -24.8564453125, -24.13623046875, -23.416015625, -22.69580078125, -21.9755859375, -21.25537109375, -20.53515625, -19.81494140625, -19.0947265625, -18.37451171875, -17.654296875, -16.93408203125, -16.2138671875, -15.49365234375, -14.7734375, -14.05322265625, -13.3330078125, -12.61279296875, -11.892578125, -11.17236328125, -10.4521484375, -9.73193359375, -9.01171875, -8.29150390625, -7.5712890625, -6.85107421875, -6.130859375, -5.41064453125, -4.6904296875, -3.97021484375, -3.25, -2.52978515625, -1.8095703125, -1.08935546875, -0.369140625, 0.35107421875, 1.0712890625, 1.79150390625, 2.51171875, 3.23193359375, 3.9521484375, 4.67236328125, 5.392578125, 6.11279296875, 6.8330078125, 7.55322265625, 8.2734375, 8.99365234375, 9.7138671875, 10.43408203125, 11.154296875, 11.87451171875, 12.5947265625, 13.31494140625, 14.03515625, 14.75537109375, 15.4755859375, 16.19580078125, 16.916015625, 17.63623046875, 18.3564453125, 19.07666015625, 19.796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 12.0, 22.0, 20.0, 40.0, 61.0, 85.0, 123.0, 243.0, 339.0, 611.0, 1061.0, 1754.0, 2905.0, 4854.0, 7813.0, 12814.0, 19644.0, 29448.0, 42158.0, 57826.0, 74515.0, 90277.0, 102112.0, 107816.0, 105268.0, 95373.0, 81250.0, 65050.0, 48109.0, 34429.0, 22926.0, 15099.0, 9561.0, 5856.0, 3671.0, 2179.0, 1297.0, 781.0, 447.0, 228.0, 158.0, 107.0, 91.0, 42.0, 18.0, 15.0, 12.0, 11.0, 7.0, 4.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0], "bins": [-9.546875, -9.2457275390625, -8.944580078125, -8.6434326171875, -8.34228515625, -8.0411376953125, -7.739990234375, -7.4388427734375, -7.1376953125, -6.8365478515625, -6.535400390625, -6.2342529296875, -5.93310546875, -5.6319580078125, -5.330810546875, -5.0296630859375, -4.728515625, -4.4273681640625, -4.126220703125, -3.8250732421875, -3.52392578125, -3.2227783203125, -2.921630859375, -2.6204833984375, -2.3193359375, -2.0181884765625, -1.717041015625, -1.4158935546875, -1.11474609375, -0.8135986328125, -0.512451171875, -0.2113037109375, 0.08984375, 0.3909912109375, 0.692138671875, 0.9932861328125, 1.29443359375, 1.5955810546875, 1.896728515625, 2.1978759765625, 2.4990234375, 2.8001708984375, 3.101318359375, 3.4024658203125, 3.70361328125, 4.0047607421875, 4.305908203125, 4.6070556640625, 4.908203125, 5.2093505859375, 5.510498046875, 5.8116455078125, 6.11279296875, 6.4139404296875, 6.715087890625, 7.0162353515625, 7.3173828125, 7.6185302734375, 7.919677734375, 8.2208251953125, 8.52197265625, 8.8231201171875, 9.124267578125, 9.4254150390625, 9.7265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 7.0, 10.0, 11.0, 8.0, 17.0, 12.0, 19.0, 21.0, 26.0, 35.0, 20.0, 31.0, 32.0, 43.0, 39.0, 44.0, 31.0, 50.0, 44.0, 45.0, 42.0, 44.0, 28.0, 45.0, 34.0, 33.0, 26.0, 30.0, 22.0, 16.0, 19.0, 12.0, 19.0, 11.0, 13.0, 16.0, 7.0, 11.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0010995864868164062, -0.0010648220777511597, -0.001030057668685913, -0.0009952932596206665, -0.0009605288505554199, -0.0009257644414901733, -0.0008910000324249268, -0.0008562356233596802, -0.0008214712142944336, -0.000786706805229187, -0.0007519423961639404, -0.0007171779870986938, -0.0006824135780334473, -0.0006476491689682007, -0.0006128847599029541, -0.0005781203508377075, -0.0005433559417724609, -0.0005085915327072144, -0.0004738271236419678, -0.0004390627145767212, -0.0004042983055114746, -0.00036953389644622803, -0.00033476948738098145, -0.00030000507831573486, -0.0002652406692504883, -0.0002304762601852417, -0.00019571185111999512, -0.00016094744205474854, -0.00012618303298950195, -9.141862392425537e-05, -5.665421485900879e-05, -2.1889805793762207e-05, 1.2874603271484375e-05, 4.763901233673096e-05, 8.240342140197754e-05, 0.00011716783046722412, 0.0001519322395324707, 0.00018669664859771729, 0.00022146105766296387, 0.00025622546672821045, 0.00029098987579345703, 0.0003257542848587036, 0.0003605186939239502, 0.0003952831029891968, 0.00043004751205444336, 0.00046481192111968994, 0.0004995763301849365, 0.0005343407392501831, 0.0005691051483154297, 0.0006038695573806763, 0.0006386339664459229, 0.0006733983755111694, 0.000708162784576416, 0.0007429271936416626, 0.0007776916027069092, 0.0008124560117721558, 0.0008472204208374023, 0.0008819848299026489, 0.0009167492389678955, 0.0009515136480331421, 0.0009862780570983887, 0.0010210424661636353, 0.0010558068752288818, 0.0010905712842941284, 0.001125335693359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 8.0, 11.0, 29.0, 42.0, 66.0, 97.0, 134.0, 258.0, 498.0, 735.0, 1463.0, 2608.0, 4569.0, 7996.0, 13761.0, 22364.0, 35200.0, 52111.0, 72650.0, 93393.0, 110428.0, 120366.0, 118899.0, 107268.0, 89025.0, 66905.0, 47745.0, 31734.0, 19962.0, 11986.0, 7128.0, 4009.0, 2216.0, 1217.0, 727.0, 369.0, 218.0, 137.0, 81.0, 44.0, 34.0, 23.0, 15.0, 13.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.2734375, -11.888427734375, -11.50341796875, -11.118408203125, -10.7333984375, -10.348388671875, -9.96337890625, -9.578369140625, -9.193359375, -8.808349609375, -8.42333984375, -8.038330078125, -7.6533203125, -7.268310546875, -6.88330078125, -6.498291015625, -6.11328125, -5.728271484375, -5.34326171875, -4.958251953125, -4.5732421875, -4.188232421875, -3.80322265625, -3.418212890625, -3.033203125, -2.648193359375, -2.26318359375, -1.878173828125, -1.4931640625, -1.108154296875, -0.72314453125, -0.338134765625, 0.046875, 0.431884765625, 0.81689453125, 1.201904296875, 1.5869140625, 1.971923828125, 2.35693359375, 2.741943359375, 3.126953125, 3.511962890625, 3.89697265625, 4.281982421875, 4.6669921875, 5.052001953125, 5.43701171875, 5.822021484375, 6.20703125, 6.592041015625, 6.97705078125, 7.362060546875, 7.7470703125, 8.132080078125, 8.51708984375, 8.902099609375, 9.287109375, 9.672119140625, 10.05712890625, 10.442138671875, 10.8271484375, 11.212158203125, 11.59716796875, 11.982177734375, 12.3671875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 3.0, 6.0, 5.0, 2.0, 9.0, 10.0, 17.0, 19.0, 17.0, 18.0, 13.0, 22.0, 22.0, 32.0, 36.0, 36.0, 32.0, 37.0, 28.0, 47.0, 34.0, 30.0, 47.0, 40.0, 44.0, 39.0, 46.0, 25.0, 27.0, 30.0, 19.0, 23.0, 22.0, 25.0, 27.0, 24.0, 15.0, 16.0, 6.0, 10.0, 10.0, 9.0, 2.0, 6.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0], "bins": [-4.9296875, -4.79071044921875, -4.6517333984375, -4.51275634765625, -4.373779296875, -4.23480224609375, -4.0958251953125, -3.95684814453125, -3.81787109375, -3.67889404296875, -3.5399169921875, -3.40093994140625, -3.261962890625, -3.12298583984375, -2.9840087890625, -2.84503173828125, -2.7060546875, -2.56707763671875, -2.4281005859375, -2.28912353515625, -2.150146484375, -2.01116943359375, -1.8721923828125, -1.73321533203125, -1.59423828125, -1.45526123046875, -1.3162841796875, -1.17730712890625, -1.038330078125, -0.89935302734375, -0.7603759765625, -0.62139892578125, -0.482421875, -0.34344482421875, -0.2044677734375, -0.06549072265625, 0.073486328125, 0.21246337890625, 0.3514404296875, 0.49041748046875, 0.62939453125, 0.76837158203125, 0.9073486328125, 1.04632568359375, 1.185302734375, 1.32427978515625, 1.4632568359375, 1.60223388671875, 1.7412109375, 1.88018798828125, 2.0191650390625, 2.15814208984375, 2.297119140625, 2.43609619140625, 2.5750732421875, 2.71405029296875, 2.85302734375, 2.99200439453125, 3.1309814453125, 3.26995849609375, 3.408935546875, 3.54791259765625, 3.6868896484375, 3.82586669921875, 3.96484375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 12.0, 7.0, 15.0, 11.0, 9.0, 18.0, 17.0, 30.0, 27.0, 26.0, 41.0, 39.0, 39.0, 30.0, 41.0, 41.0, 43.0, 43.0, 46.0, 45.0, 41.0, 39.0, 39.0, 44.0, 46.0, 35.0, 22.0, 16.0, 25.0, 13.0, 12.0, 26.0, 11.0, 14.0, 8.0, 7.0, 9.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-37.66508483886719, -36.61985778808594, -35.57462692260742, -34.52939987182617, -33.484169006347656, -32.438941955566406, -31.393714904785156, -30.348485946655273, -29.30325698852539, -28.258028030395508, -27.212799072265625, -26.167572021484375, -25.122343063354492, -24.07711410522461, -23.03188705444336, -21.986658096313477, -20.941429138183594, -19.89620018005371, -18.850971221923828, -17.805744171142578, -16.760515213012695, -15.715286254882812, -14.670058250427246, -13.62483024597168, -12.579601287841797, -11.534372329711914, -10.489144325256348, -9.443916320800781, -8.398687362670898, -7.353458881378174, -6.308230400085449, -5.263001918792725, -4.217769622802734, -3.1725411415100098, -2.127312660217285, -1.0820841789245605, -0.03685569763183594, 1.0083727836608887, 2.0536012649536133, 3.098829746246338, 4.1440582275390625, 5.189286708831787, 6.234515190124512, 7.279743671417236, 8.324972152709961, 9.370201110839844, 10.41542911529541, 11.460657119750977, 12.50588607788086, 13.551115036010742, 14.596343040466309, 15.641571044921875, 16.686800003051758, 17.73202896118164, 18.77725601196289, 19.822484970092773, 20.867713928222656, 21.91294288635254, 22.958171844482422, 24.003398895263672, 25.048627853393555, 26.093856811523438, 27.139083862304688, 28.18431282043457, 29.229541778564453]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 2.0, 10.0, 6.0, 5.0, 13.0, 2.0, 21.0, 11.0, 15.0, 20.0, 20.0, 15.0, 31.0, 25.0, 31.0, 39.0, 23.0, 39.0, 33.0, 42.0, 38.0, 37.0, 44.0, 23.0, 40.0, 45.0, 36.0, 44.0, 39.0, 22.0, 24.0, 24.0, 25.0, 24.0, 18.0, 29.0, 17.0, 14.0, 11.0, 9.0, 8.0, 9.0, 5.0, 11.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.61280822753906, -36.38051223754883, -35.14822006225586, -33.915924072265625, -32.683631896972656, -31.451335906982422, -30.219039916992188, -28.986745834350586, -27.754451751708984, -26.522157669067383, -25.28986358642578, -24.057567596435547, -22.825273513793945, -21.592979431152344, -20.36068344116211, -19.128389358520508, -17.896095275878906, -16.663801193237305, -15.431506156921387, -14.199211120605469, -12.966917037963867, -11.734622955322266, -10.502327919006348, -9.27003288269043, -8.037738800048828, -6.805444240570068, -5.573149681091309, -4.340855121612549, -3.108560562133789, -1.8762660026550293, -0.6439714431762695, 0.5883235931396484, 1.8206138610839844, 3.052908420562744, 4.285202980041504, 5.517497539520264, 6.749792098999023, 7.982086658477783, 9.214381217956543, 10.446676254272461, 11.678970336914062, 12.911264419555664, 14.143559455871582, 15.3758544921875, 16.6081485748291, 17.840442657470703, 19.072738647460938, 20.30503273010254, 21.53732681274414, 22.769620895385742, 24.001914978027344, 25.234210968017578, 26.46650505065918, 27.69879913330078, 28.931095123291016, 30.163389205932617, 31.39568328857422, 32.62797927856445, 33.86027145385742, 35.092567443847656, 36.324859619140625, 37.55715560913086, 38.789451599121094, 40.02174377441406, 41.2540397644043]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 8.0, 6.0, 19.0, 36.0, 65.0, 109.0, 191.0, 329.0, 527.0, 899.0, 1464.0, 2440.0, 4275.0, 6642.0, 10497.0, 16416.0, 25349.0, 38101.0, 55740.0, 78862.0, 111336.0, 148101.0, 192300.0, 238431.0, 285618.0, 324179.0, 351223.0, 361037.0, 353355.0, 328087.0, 290213.0, 245805.0, 199533.0, 153574.0, 115137.0, 83657.0, 58633.0, 39715.0, 26386.0, 17049.0, 11327.0, 7012.0, 4236.0, 2574.0, 1596.0, 903.0, 536.0, 305.0, 206.0, 104.0, 67.0, 37.0, 18.0, 6.0, 10.0, 6.0, 5.0, 1.0, 0.0, 2.0], "bins": [-21.46875, -20.78857421875, -20.1083984375, -19.42822265625, -18.748046875, -18.06787109375, -17.3876953125, -16.70751953125, -16.02734375, -15.34716796875, -14.6669921875, -13.98681640625, -13.306640625, -12.62646484375, -11.9462890625, -11.26611328125, -10.5859375, -9.90576171875, -9.2255859375, -8.54541015625, -7.865234375, -7.18505859375, -6.5048828125, -5.82470703125, -5.14453125, -4.46435546875, -3.7841796875, -3.10400390625, -2.423828125, -1.74365234375, -1.0634765625, -0.38330078125, 0.296875, 0.97705078125, 1.6572265625, 2.33740234375, 3.017578125, 3.69775390625, 4.3779296875, 5.05810546875, 5.73828125, 6.41845703125, 7.0986328125, 7.77880859375, 8.458984375, 9.13916015625, 9.8193359375, 10.49951171875, 11.1796875, 11.85986328125, 12.5400390625, 13.22021484375, 13.900390625, 14.58056640625, 15.2607421875, 15.94091796875, 16.62109375, 17.30126953125, 17.9814453125, 18.66162109375, 19.341796875, 20.02197265625, 20.7021484375, 21.38232421875, 22.0625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 10.0, 6.0, 5.0, 12.0, 3.0, 19.0, 12.0, 16.0, 17.0, 21.0, 15.0, 32.0, 26.0, 27.0, 38.0, 28.0, 34.0, 36.0, 39.0, 40.0, 31.0, 46.0, 30.0, 34.0, 48.0, 36.0, 41.0, 41.0, 20.0, 25.0, 27.0, 24.0, 25.0, 18.0, 26.0, 19.0, 16.0, 8.0, 12.0, 5.0, 12.0, 6.0, 7.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.09375, -34.91162109375, -33.7294921875, -32.54736328125, -31.365234375, -30.18310546875, -29.0009765625, -27.81884765625, -26.63671875, -25.45458984375, -24.2724609375, -23.09033203125, -21.908203125, -20.72607421875, -19.5439453125, -18.36181640625, -17.1796875, -15.99755859375, -14.8154296875, -13.63330078125, -12.451171875, -11.26904296875, -10.0869140625, -8.90478515625, -7.72265625, -6.54052734375, -5.3583984375, -4.17626953125, -2.994140625, -1.81201171875, -0.6298828125, 0.55224609375, 1.734375, 2.91650390625, 4.0986328125, 5.28076171875, 6.462890625, 7.64501953125, 8.8271484375, 10.00927734375, 11.19140625, 12.37353515625, 13.5556640625, 14.73779296875, 15.919921875, 17.10205078125, 18.2841796875, 19.46630859375, 20.6484375, 21.83056640625, 23.0126953125, 24.19482421875, 25.376953125, 26.55908203125, 27.7412109375, 28.92333984375, 30.10546875, 31.28759765625, 32.4697265625, 33.65185546875, 34.833984375, 36.01611328125, 37.1982421875, 38.38037109375, 39.5625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 8.0, 16.0, 40.0, 62.0, 141.0, 241.0, 398.0, 790.0, 1403.0, 2440.0, 4201.0, 7216.0, 12081.0, 19407.0, 31095.0, 47924.0, 71636.0, 101957.0, 139510.0, 184938.0, 233933.0, 282746.0, 323201.0, 353413.0, 368351.0, 362999.0, 340274.0, 304128.0, 259400.0, 209995.0, 162829.0, 120230.0, 86491.0, 59116.0, 38853.0, 25289.0, 15309.0, 9313.0, 5554.0, 3196.0, 1888.0, 1012.0, 571.0, 315.0, 191.0, 92.0, 45.0, 23.0, 15.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-25.359375, -24.608154296875, -23.85693359375, -23.105712890625, -22.3544921875, -21.603271484375, -20.85205078125, -20.100830078125, -19.349609375, -18.598388671875, -17.84716796875, -17.095947265625, -16.3447265625, -15.593505859375, -14.84228515625, -14.091064453125, -13.33984375, -12.588623046875, -11.83740234375, -11.086181640625, -10.3349609375, -9.583740234375, -8.83251953125, -8.081298828125, -7.330078125, -6.578857421875, -5.82763671875, -5.076416015625, -4.3251953125, -3.573974609375, -2.82275390625, -2.071533203125, -1.3203125, -0.569091796875, 0.18212890625, 0.933349609375, 1.6845703125, 2.435791015625, 3.18701171875, 3.938232421875, 4.689453125, 5.440673828125, 6.19189453125, 6.943115234375, 7.6943359375, 8.445556640625, 9.19677734375, 9.947998046875, 10.69921875, 11.450439453125, 12.20166015625, 12.952880859375, 13.7041015625, 14.455322265625, 15.20654296875, 15.957763671875, 16.708984375, 17.460205078125, 18.21142578125, 18.962646484375, 19.7138671875, 20.465087890625, 21.21630859375, 21.967529296875, 22.71875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 5.0, 7.0, 15.0, 15.0, 27.0, 24.0, 35.0, 47.0, 34.0, 55.0, 67.0, 77.0, 88.0, 113.0, 104.0, 117.0, 154.0, 183.0, 171.0, 169.0, 187.0, 218.0, 191.0, 202.0, 160.0, 184.0, 172.0, 159.0, 133.0, 145.0, 107.0, 109.0, 104.0, 95.0, 82.0, 69.0, 34.0, 51.0, 38.0, 28.0, 29.0, 16.0, 9.0, 16.0, 7.0, 8.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-15.640625, -15.1466064453125, -14.652587890625, -14.1585693359375, -13.66455078125, -13.1705322265625, -12.676513671875, -12.1824951171875, -11.6884765625, -11.1944580078125, -10.700439453125, -10.2064208984375, -9.71240234375, -9.2183837890625, -8.724365234375, -8.2303466796875, -7.736328125, -7.2423095703125, -6.748291015625, -6.2542724609375, -5.76025390625, -5.2662353515625, -4.772216796875, -4.2781982421875, -3.7841796875, -3.2901611328125, -2.796142578125, -2.3021240234375, -1.80810546875, -1.3140869140625, -0.820068359375, -0.3260498046875, 0.16796875, 0.6619873046875, 1.156005859375, 1.6500244140625, 2.14404296875, 2.6380615234375, 3.132080078125, 3.6260986328125, 4.1201171875, 4.6141357421875, 5.108154296875, 5.6021728515625, 6.09619140625, 6.5902099609375, 7.084228515625, 7.5782470703125, 8.072265625, 8.5662841796875, 9.060302734375, 9.5543212890625, 10.04833984375, 10.5423583984375, 11.036376953125, 11.5303955078125, 12.0244140625, 12.5184326171875, 13.012451171875, 13.5064697265625, 14.00048828125, 14.4945068359375, 14.988525390625, 15.4825439453125, 15.9765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 7.0, 3.0, 1.0, 3.0, 4.0, 6.0, 10.0, 11.0, 13.0, 15.0, 19.0, 22.0, 19.0, 25.0, 31.0, 32.0, 25.0, 33.0, 36.0, 33.0, 36.0, 40.0, 37.0, 37.0, 44.0, 37.0, 34.0, 43.0, 34.0, 45.0, 31.0, 31.0, 28.0, 18.0, 38.0, 24.0, 13.0, 12.0, 15.0, 12.0, 11.0, 7.0, 5.0, 9.0, 8.0, 3.0, 4.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-34.408935546875, -33.33503723144531, -32.261138916015625, -31.187240600585938, -30.11334228515625, -29.039443969726562, -27.965545654296875, -26.891647338867188, -25.8177490234375, -24.743850708007812, -23.669952392578125, -22.596054077148438, -21.52215576171875, -20.448257446289062, -19.374359130859375, -18.300460815429688, -17.226564407348633, -16.152666091918945, -15.078767776489258, -14.00486946105957, -12.930971145629883, -11.857072830200195, -10.783175468444824, -9.709277153015137, -8.63537883758545, -7.561480522155762, -6.487582206726074, -5.413684368133545, -4.339786052703857, -3.26588773727417, -2.1919898986816406, -1.1180915832519531, -0.044193267822265625, 1.0297049283981323, 2.1036031246185303, 3.1775012016296387, 4.251399517059326, 5.325297832489014, 6.399195671081543, 7.4730939865112305, 8.546992301940918, 9.620890617370605, 10.694788932800293, 11.768686294555664, 12.842584609985352, 13.916482925415039, 14.990381240844727, 16.064279556274414, 17.1381778717041, 18.21207618713379, 19.285974502563477, 20.359872817993164, 21.43377113342285, 22.50766944885254, 23.581565856933594, 24.65546417236328, 25.72936248779297, 26.803260803222656, 27.877159118652344, 28.95105743408203, 30.02495574951172, 31.098854064941406, 32.172752380371094, 33.24665069580078, 34.32054901123047]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 3.0, 6.0, 13.0, 5.0, 11.0, 7.0, 12.0, 18.0, 17.0, 18.0, 21.0, 22.0, 20.0, 25.0, 25.0, 34.0, 33.0, 31.0, 24.0, 37.0, 37.0, 44.0, 33.0, 38.0, 30.0, 33.0, 26.0, 41.0, 28.0, 35.0, 27.0, 30.0, 18.0, 37.0, 30.0, 21.0, 16.0, 9.0, 16.0, 12.0, 4.0, 11.0, 14.0, 9.0, 5.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0], "bins": [-41.06578063964844, -39.782291412353516, -38.498802185058594, -37.21531677246094, -35.931827545166016, -34.648338317871094, -33.36484909057617, -32.08135986328125, -30.797870635986328, -29.514381408691406, -28.230894088745117, -26.947404861450195, -25.663915634155273, -24.380428314208984, -23.096939086914062, -21.81344985961914, -20.52996253967285, -19.24647331237793, -17.96298599243164, -16.67949676513672, -15.396007537841797, -14.112519264221191, -12.829030990600586, -11.545541763305664, -10.262053489685059, -8.978565216064453, -7.695075988769531, -6.411587715148926, -5.128098964691162, -3.8446102142333984, -2.561121940612793, -1.277632713317871, 0.005855560302734375, 1.2893441915512085, 2.5728328227996826, 3.856321334838867, 5.139810085296631, 6.4232988357543945, 7.706787109375, 8.990276336669922, 10.273764610290527, 11.557252883911133, 12.840742111206055, 14.12423038482666, 15.407718658447266, 16.691207885742188, 17.97469711303711, 19.25818634033203, 20.54167366027832, 21.825162887573242, 23.10865020751953, 24.392139434814453, 25.675628662109375, 26.959117889404297, 28.242605209350586, 29.526094436645508, 30.809581756591797, 32.09307098388672, 33.37656021118164, 34.66004943847656, 35.94353485107422, 37.22702407836914, 38.51051330566406, 39.794002532958984, 41.077491760253906]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 9.0, 17.0, 14.0, 34.0, 56.0, 84.0, 115.0, 172.0, 252.0, 424.0, 625.0, 964.0, 1549.0, 2307.0, 3825.0, 5936.0, 9627.0, 15507.0, 24961.0, 39333.0, 60329.0, 88980.0, 119982.0, 142558.0, 143776.0, 122241.0, 91663.0, 62859.0, 41383.0, 25782.0, 16089.0, 10099.0, 6266.0, 3878.0, 2423.0, 1598.0, 987.0, 613.0, 371.0, 288.0, 189.0, 126.0, 94.0, 53.0, 44.0, 26.0, 11.0, 10.0, 11.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.69140625, -6.46868896484375, -6.2459716796875, -6.02325439453125, -5.800537109375, -5.57781982421875, -5.3551025390625, -5.13238525390625, -4.90966796875, -4.68695068359375, -4.4642333984375, -4.24151611328125, -4.018798828125, -3.79608154296875, -3.5733642578125, -3.35064697265625, -3.1279296875, -2.90521240234375, -2.6824951171875, -2.45977783203125, -2.237060546875, -2.01434326171875, -1.7916259765625, -1.56890869140625, -1.34619140625, -1.12347412109375, -0.9007568359375, -0.67803955078125, -0.455322265625, -0.23260498046875, -0.0098876953125, 0.21282958984375, 0.435546875, 0.65826416015625, 0.8809814453125, 1.10369873046875, 1.326416015625, 1.54913330078125, 1.7718505859375, 1.99456787109375, 2.21728515625, 2.44000244140625, 2.6627197265625, 2.88543701171875, 3.108154296875, 3.33087158203125, 3.5535888671875, 3.77630615234375, 3.9990234375, 4.22174072265625, 4.4444580078125, 4.66717529296875, 4.889892578125, 5.11260986328125, 5.3353271484375, 5.55804443359375, 5.78076171875, 6.00347900390625, 6.2261962890625, 6.44891357421875, 6.671630859375, 6.89434814453125, 7.1170654296875, 7.33978271484375, 7.5625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 3.0, 7.0, 12.0, 5.0, 10.0, 8.0, 14.0, 17.0, 17.0, 20.0, 20.0, 21.0, 24.0, 22.0, 26.0, 34.0, 34.0, 29.0, 27.0, 34.0, 36.0, 43.0, 37.0, 36.0, 30.0, 34.0, 28.0, 39.0, 31.0, 31.0, 29.0, 28.0, 20.0, 36.0, 28.0, 20.0, 16.0, 13.0, 14.0, 10.0, 5.0, 10.0, 17.0, 7.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-41.34375, -40.0556640625, -38.767578125, -37.4794921875, -36.19140625, -34.9033203125, -33.615234375, -32.3271484375, -31.0390625, -29.7509765625, -28.462890625, -27.1748046875, -25.88671875, -24.5986328125, -23.310546875, -22.0224609375, -20.734375, -19.4462890625, -18.158203125, -16.8701171875, -15.58203125, -14.2939453125, -13.005859375, -11.7177734375, -10.4296875, -9.1416015625, -7.853515625, -6.5654296875, -5.27734375, -3.9892578125, -2.701171875, -1.4130859375, -0.125, 1.1630859375, 2.451171875, 3.7392578125, 5.02734375, 6.3154296875, 7.603515625, 8.8916015625, 10.1796875, 11.4677734375, 12.755859375, 14.0439453125, 15.33203125, 16.6201171875, 17.908203125, 19.1962890625, 20.484375, 21.7724609375, 23.060546875, 24.3486328125, 25.63671875, 26.9248046875, 28.212890625, 29.5009765625, 30.7890625, 32.0771484375, 33.365234375, 34.6533203125, 35.94140625, 37.2294921875, 38.517578125, 39.8056640625, 41.09375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 9.0, 11.0, 14.0, 20.0, 35.0, 48.0, 70.0, 92.0, 113.0, 136.0, 226.0, 327.0, 469.0, 719.0, 1104.0, 1689.0, 2720.0, 4418.0, 7503.0, 13524.0, 24735.0, 47445.0, 92556.0, 171863.0, 240855.0, 199268.0, 112398.0, 57337.0, 30041.0, 16060.0, 9021.0, 5074.0, 3019.0, 1844.0, 1242.0, 819.0, 556.0, 378.0, 239.0, 154.0, 120.0, 88.0, 72.0, 34.0, 21.0, 24.0, 15.0, 11.0, 12.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.5, -9.1998291015625, -8.899658203125, -8.5994873046875, -8.29931640625, -7.9991455078125, -7.698974609375, -7.3988037109375, -7.0986328125, -6.7984619140625, -6.498291015625, -6.1981201171875, -5.89794921875, -5.5977783203125, -5.297607421875, -4.9974365234375, -4.697265625, -4.3970947265625, -4.096923828125, -3.7967529296875, -3.49658203125, -3.1964111328125, -2.896240234375, -2.5960693359375, -2.2958984375, -1.9957275390625, -1.695556640625, -1.3953857421875, -1.09521484375, -0.7950439453125, -0.494873046875, -0.1947021484375, 0.10546875, 0.4056396484375, 0.705810546875, 1.0059814453125, 1.30615234375, 1.6063232421875, 1.906494140625, 2.2066650390625, 2.5068359375, 2.8070068359375, 3.107177734375, 3.4073486328125, 3.70751953125, 4.0076904296875, 4.307861328125, 4.6080322265625, 4.908203125, 5.2083740234375, 5.508544921875, 5.8087158203125, 6.10888671875, 6.4090576171875, 6.709228515625, 7.0093994140625, 7.3095703125, 7.6097412109375, 7.909912109375, 8.2100830078125, 8.51025390625, 8.8104248046875, 9.110595703125, 9.4107666015625, 9.7109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 1.0, 4.0, 6.0, 8.0, 8.0, 5.0, 7.0, 23.0, 9.0, 14.0, 15.0, 27.0, 22.0, 33.0, 34.0, 26.0, 33.0, 52.0, 38.0, 34.0, 37.0, 32.0, 44.0, 51.0, 33.0, 40.0, 23.0, 31.0, 34.0, 34.0, 26.0, 41.0, 30.0, 31.0, 23.0, 20.0, 20.0, 6.0, 4.0, 6.0, 10.0, 4.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.84375, -26.9091796875, -25.974609375, -25.0400390625, -24.10546875, -23.1708984375, -22.236328125, -21.3017578125, -20.3671875, -19.4326171875, -18.498046875, -17.5634765625, -16.62890625, -15.6943359375, -14.759765625, -13.8251953125, -12.890625, -11.9560546875, -11.021484375, -10.0869140625, -9.15234375, -8.2177734375, -7.283203125, -6.3486328125, -5.4140625, -4.4794921875, -3.544921875, -2.6103515625, -1.67578125, -0.7412109375, 0.193359375, 1.1279296875, 2.0625, 2.9970703125, 3.931640625, 4.8662109375, 5.80078125, 6.7353515625, 7.669921875, 8.6044921875, 9.5390625, 10.4736328125, 11.408203125, 12.3427734375, 13.27734375, 14.2119140625, 15.146484375, 16.0810546875, 17.015625, 17.9501953125, 18.884765625, 19.8193359375, 20.75390625, 21.6884765625, 22.623046875, 23.5576171875, 24.4921875, 25.4267578125, 26.361328125, 27.2958984375, 28.23046875, 29.1650390625, 30.099609375, 31.0341796875, 31.96875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 3.0, 4.0, 5.0, 7.0, 18.0, 16.0, 20.0, 35.0, 58.0, 63.0, 118.0, 162.0, 249.0, 311.0, 465.0, 675.0, 1066.0, 1686.0, 2753.0, 4769.0, 8941.0, 17970.0, 40205.0, 109703.0, 357445.0, 327583.0, 100095.0, 37073.0, 16675.0, 8448.0, 4492.0, 2611.0, 1591.0, 1084.0, 673.0, 476.0, 310.0, 205.0, 139.0, 120.0, 63.0, 63.0, 35.0, 18.0, 17.0, 15.0, 7.0, 6.0, 7.0, 5.0, 2.0, 0.0, 2.0, 3.0], "bins": [-7.0234375, -6.822509765625, -6.62158203125, -6.420654296875, -6.2197265625, -6.018798828125, -5.81787109375, -5.616943359375, -5.416015625, -5.215087890625, -5.01416015625, -4.813232421875, -4.6123046875, -4.411376953125, -4.21044921875, -4.009521484375, -3.80859375, -3.607666015625, -3.40673828125, -3.205810546875, -3.0048828125, -2.803955078125, -2.60302734375, -2.402099609375, -2.201171875, -2.000244140625, -1.79931640625, -1.598388671875, -1.3974609375, -1.196533203125, -0.99560546875, -0.794677734375, -0.59375, -0.392822265625, -0.19189453125, 0.009033203125, 0.2099609375, 0.410888671875, 0.61181640625, 0.812744140625, 1.013671875, 1.214599609375, 1.41552734375, 1.616455078125, 1.8173828125, 2.018310546875, 2.21923828125, 2.420166015625, 2.62109375, 2.822021484375, 3.02294921875, 3.223876953125, 3.4248046875, 3.625732421875, 3.82666015625, 4.027587890625, 4.228515625, 4.429443359375, 4.63037109375, 4.831298828125, 5.0322265625, 5.233154296875, 5.43408203125, 5.635009765625, 5.8359375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 10.0, 11.0, 11.0, 27.0, 39.0, 40.0, 41.0, 60.0, 81.0, 96.0, 95.0, 70.0, 81.0, 76.0, 78.0, 54.0, 43.0, 29.0, 23.0, 12.0, 7.0, 6.0, 6.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003726482391357422, -0.0003587491810321808, -0.0003448501229286194, -0.000330951064825058, -0.0003170520067214966, -0.0003031529486179352, -0.0002892538905143738, -0.0002753548324108124, -0.000261455774307251, -0.0002475567162036896, -0.00023365765810012817, -0.00021975859999656677, -0.00020585954189300537, -0.00019196048378944397, -0.00017806142568588257, -0.00016416236758232117, -0.00015026330947875977, -0.00013636425137519836, -0.00012246519327163696, -0.00010856613516807556, -9.466707706451416e-05, -8.076801896095276e-05, -6.686896085739136e-05, -5.2969902753829956e-05, -3.9070844650268555e-05, -2.5171786546707153e-05, -1.1272728443145752e-05, 2.6263296604156494e-06, 1.652538776397705e-05, 3.0424445867538452e-05, 4.4323503971099854e-05, 5.8222562074661255e-05, 7.212162017822266e-05, 8.602067828178406e-05, 9.991973638534546e-05, 0.00011381879448890686, 0.00012771785259246826, 0.00014161691069602966, 0.00015551596879959106, 0.00016941502690315247, 0.00018331408500671387, 0.00019721314311027527, 0.00021111220121383667, 0.00022501125931739807, 0.00023891031742095947, 0.0002528093755245209, 0.0002667084336280823, 0.0002806074917316437, 0.0002945065498352051, 0.0003084056079387665, 0.0003223046660423279, 0.0003362037241458893, 0.0003501027822494507, 0.0003640018403530121, 0.0003779008984565735, 0.0003917999565601349, 0.0004056990146636963, 0.0004195980727672577, 0.0004334971308708191, 0.0004473961889743805, 0.0004612952470779419, 0.0004751943051815033, 0.0004890933632850647, 0.0005029924213886261, 0.0005168914794921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 2.0, 7.0, 4.0, 8.0, 8.0, 18.0, 22.0, 47.0, 56.0, 89.0, 145.0, 189.0, 314.0, 464.0, 692.0, 1075.0, 1731.0, 2733.0, 4568.0, 7400.0, 12581.0, 21568.0, 37297.0, 64173.0, 105932.0, 156922.0, 186595.0, 163548.0, 112362.0, 69430.0, 40699.0, 23305.0, 13695.0, 8020.0, 4767.0, 2889.0, 1846.0, 1173.0, 735.0, 498.0, 334.0, 207.0, 143.0, 91.0, 60.0, 39.0, 26.0, 15.0, 20.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.13671875, -4.9630126953125, -4.789306640625, -4.6156005859375, -4.44189453125, -4.2681884765625, -4.094482421875, -3.9207763671875, -3.7470703125, -3.5733642578125, -3.399658203125, -3.2259521484375, -3.05224609375, -2.8785400390625, -2.704833984375, -2.5311279296875, -2.357421875, -2.1837158203125, -2.010009765625, -1.8363037109375, -1.66259765625, -1.4888916015625, -1.315185546875, -1.1414794921875, -0.9677734375, -0.7940673828125, -0.620361328125, -0.4466552734375, -0.27294921875, -0.0992431640625, 0.074462890625, 0.2481689453125, 0.421875, 0.5955810546875, 0.769287109375, 0.9429931640625, 1.11669921875, 1.2904052734375, 1.464111328125, 1.6378173828125, 1.8115234375, 1.9852294921875, 2.158935546875, 2.3326416015625, 2.50634765625, 2.6800537109375, 2.853759765625, 3.0274658203125, 3.201171875, 3.3748779296875, 3.548583984375, 3.7222900390625, 3.89599609375, 4.0697021484375, 4.243408203125, 4.4171142578125, 4.5908203125, 4.7645263671875, 4.938232421875, 5.1119384765625, 5.28564453125, 5.4593505859375, 5.633056640625, 5.8067626953125, 5.98046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 2.0, 5.0, 6.0, 4.0, 7.0, 16.0, 14.0, 16.0, 19.0, 21.0, 37.0, 40.0, 49.0, 55.0, 71.0, 67.0, 65.0, 69.0, 69.0, 52.0, 54.0, 55.0, 49.0, 34.0, 26.0, 15.0, 13.0, 21.0, 9.0, 9.0, 6.0, 7.0, 7.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.958984375, -2.876739501953125, -2.79449462890625, -2.712249755859375, -2.6300048828125, -2.547760009765625, -2.46551513671875, -2.383270263671875, -2.301025390625, -2.218780517578125, -2.13653564453125, -2.054290771484375, -1.9720458984375, -1.889801025390625, -1.80755615234375, -1.725311279296875, -1.64306640625, -1.560821533203125, -1.47857666015625, -1.396331787109375, -1.3140869140625, -1.231842041015625, -1.14959716796875, -1.067352294921875, -0.985107421875, -0.902862548828125, -0.82061767578125, -0.738372802734375, -0.6561279296875, -0.573883056640625, -0.49163818359375, -0.409393310546875, -0.3271484375, -0.244903564453125, -0.16265869140625, -0.080413818359375, 0.0018310546875, 0.084075927734375, 0.16632080078125, 0.248565673828125, 0.330810546875, 0.413055419921875, 0.49530029296875, 0.577545166015625, 0.6597900390625, 0.742034912109375, 0.82427978515625, 0.906524658203125, 0.98876953125, 1.071014404296875, 1.15325927734375, 1.235504150390625, 1.3177490234375, 1.399993896484375, 1.48223876953125, 1.564483642578125, 1.646728515625, 1.728973388671875, 1.81121826171875, 1.893463134765625, 1.9757080078125, 2.057952880859375, 2.14019775390625, 2.222442626953125, 2.3046875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 6.0, 10.0, 3.0, 11.0, 18.0, 12.0, 25.0, 21.0, 22.0, 35.0, 24.0, 32.0, 24.0, 33.0, 35.0, 34.0, 40.0, 37.0, 42.0, 44.0, 37.0, 36.0, 41.0, 40.0, 34.0, 35.0, 32.0, 32.0, 23.0, 30.0, 25.0, 18.0, 12.0, 17.0, 13.0, 13.0, 7.0, 5.0, 9.0, 9.0, 4.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-35.025413513183594, -33.94660186767578, -32.867794036865234, -31.788982391357422, -30.710172653198242, -29.631362915039062, -28.55255126953125, -27.47374153137207, -26.39493179321289, -25.31612205505371, -24.23731231689453, -23.15850067138672, -22.07969093322754, -21.00088119506836, -19.922069549560547, -18.843259811401367, -17.764450073242188, -16.685640335083008, -15.606829643249512, -14.528018951416016, -13.449209213256836, -12.370399475097656, -11.29158878326416, -10.212778091430664, -9.133968353271484, -8.055158615112305, -6.976347923278809, -5.897537708282471, -4.818727493286133, -3.739917278289795, -2.661107063293457, -1.5822968482971191, -0.5034904479980469, 0.575319766998291, 1.654129981994629, 2.732940196990967, 3.8117504119873047, 4.890560626983643, 5.9693708419799805, 7.048181056976318, 8.126991271972656, 9.205801010131836, 10.284611701965332, 11.363422393798828, 12.442232131958008, 13.521041870117188, 14.599852561950684, 15.67866325378418, 16.75747299194336, 17.83628273010254, 18.91509246826172, 19.99390411376953, 21.07271385192871, 22.15152359008789, 23.230335235595703, 24.309144973754883, 25.387954711914062, 26.466764450073242, 27.545574188232422, 28.624385833740234, 29.703195571899414, 30.782005310058594, 31.860816955566406, 32.93962478637695, 34.018436431884766]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 7.0, 10.0, 5.0, 11.0, 13.0, 7.0, 15.0, 20.0, 20.0, 21.0, 24.0, 13.0, 30.0, 25.0, 32.0, 28.0, 31.0, 27.0, 38.0, 37.0, 38.0, 39.0, 34.0, 31.0, 30.0, 27.0, 36.0, 36.0, 28.0, 35.0, 28.0, 16.0, 32.0, 37.0, 20.0, 19.0, 9.0, 15.0, 11.0, 8.0, 6.0, 14.0, 13.0, 4.0, 5.0, 2.0, 5.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0], "bins": [-41.17984390258789, -39.9048957824707, -38.629947662353516, -37.35499954223633, -36.08005142211914, -34.80510330200195, -33.530155181884766, -32.25520706176758, -30.98025894165039, -29.705310821533203, -28.430362701416016, -27.155414581298828, -25.88046646118164, -24.605518341064453, -23.330570220947266, -22.055622100830078, -20.78067398071289, -19.505725860595703, -18.230777740478516, -16.955829620361328, -15.68088150024414, -14.405933380126953, -13.130985260009766, -11.856037139892578, -10.58108901977539, -9.306140899658203, -8.031192779541016, -6.756244659423828, -5.481296539306641, -4.206348419189453, -2.9314002990722656, -1.6564521789550781, -0.38150787353515625, 0.8934402465820312, 2.1683883666992188, 3.4433364868164062, 4.718284606933594, 5.993232727050781, 7.268180847167969, 8.543128967285156, 9.818077087402344, 11.093025207519531, 12.367973327636719, 13.642921447753906, 14.917869567871094, 16.19281768798828, 17.46776580810547, 18.742713928222656, 20.017662048339844, 21.29261016845703, 22.56755828857422, 23.842506408691406, 25.117454528808594, 26.39240264892578, 27.66735076904297, 28.942298889160156, 30.217247009277344, 31.49219512939453, 32.76714324951172, 34.042091369628906, 35.317039489746094, 36.59198760986328, 37.86693572998047, 39.141883850097656, 40.416831970214844]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 7.0, 11.0, 19.0, 16.0, 30.0, 51.0, 81.0, 123.0, 145.0, 250.0, 350.0, 522.0, 794.0, 1207.0, 2025.0, 3220.0, 5357.0, 9076.0, 15222.0, 24350.0, 37914.0, 55152.0, 75852.0, 96470.0, 112710.0, 120434.0, 116856.0, 103638.0, 84543.0, 62838.0, 43726.0, 28808.0, 18279.0, 11141.0, 6780.0, 3955.0, 2411.0, 1435.0, 910.0, 601.0, 406.0, 261.0, 169.0, 119.0, 98.0, 66.0, 52.0, 22.0, 13.0, 8.0, 13.0, 8.0, 3.0, 7.0, 3.0, 4.0], "bins": [-26.90625, -26.107666015625, -25.30908203125, -24.510498046875, -23.7119140625, -22.913330078125, -22.11474609375, -21.316162109375, -20.517578125, -19.718994140625, -18.92041015625, -18.121826171875, -17.3232421875, -16.524658203125, -15.72607421875, -14.927490234375, -14.12890625, -13.330322265625, -12.53173828125, -11.733154296875, -10.9345703125, -10.135986328125, -9.33740234375, -8.538818359375, -7.740234375, -6.941650390625, -6.14306640625, -5.344482421875, -4.5458984375, -3.747314453125, -2.94873046875, -2.150146484375, -1.3515625, -0.552978515625, 0.24560546875, 1.044189453125, 1.8427734375, 2.641357421875, 3.43994140625, 4.238525390625, 5.037109375, 5.835693359375, 6.63427734375, 7.432861328125, 8.2314453125, 9.030029296875, 9.82861328125, 10.627197265625, 11.42578125, 12.224365234375, 13.02294921875, 13.821533203125, 14.6201171875, 15.418701171875, 16.21728515625, 17.015869140625, 17.814453125, 18.613037109375, 19.41162109375, 20.210205078125, 21.0087890625, 21.807373046875, 22.60595703125, 23.404541015625, 24.203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 10.0, 6.0, 10.0, 12.0, 8.0, 16.0, 22.0, 21.0, 17.0, 23.0, 16.0, 30.0, 25.0, 34.0, 28.0, 29.0, 29.0, 35.0, 42.0, 37.0, 35.0, 36.0, 31.0, 30.0, 27.0, 41.0, 31.0, 33.0, 29.0, 26.0, 18.0, 39.0, 28.0, 22.0, 17.0, 9.0, 17.0, 8.0, 8.0, 9.0, 15.0, 9.0, 5.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0], "bins": [-41.0625, -39.7861328125, -38.509765625, -37.2333984375, -35.95703125, -34.6806640625, -33.404296875, -32.1279296875, -30.8515625, -29.5751953125, -28.298828125, -27.0224609375, -25.74609375, -24.4697265625, -23.193359375, -21.9169921875, -20.640625, -19.3642578125, -18.087890625, -16.8115234375, -15.53515625, -14.2587890625, -12.982421875, -11.7060546875, -10.4296875, -9.1533203125, -7.876953125, -6.6005859375, -5.32421875, -4.0478515625, -2.771484375, -1.4951171875, -0.21875, 1.0576171875, 2.333984375, 3.6103515625, 4.88671875, 6.1630859375, 7.439453125, 8.7158203125, 9.9921875, 11.2685546875, 12.544921875, 13.8212890625, 15.09765625, 16.3740234375, 17.650390625, 18.9267578125, 20.203125, 21.4794921875, 22.755859375, 24.0322265625, 25.30859375, 26.5849609375, 27.861328125, 29.1376953125, 30.4140625, 31.6904296875, 32.966796875, 34.2431640625, 35.51953125, 36.7958984375, 38.072265625, 39.3486328125, 40.625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 10.0, 29.0, 30.0, 47.0, 72.0, 112.0, 152.0, 269.0, 385.0, 567.0, 879.0, 1353.0, 2018.0, 2944.0, 4559.0, 7159.0, 10608.0, 16441.0, 24031.0, 34674.0, 48446.0, 64300.0, 80471.0, 95313.0, 104052.0, 106019.0, 100590.0, 87805.0, 71866.0, 55723.0, 40743.0, 28790.0, 19735.0, 13167.0, 8661.0, 5679.0, 3775.0, 2456.0, 1549.0, 1066.0, 684.0, 463.0, 302.0, 215.0, 115.0, 84.0, 50.0, 35.0, 24.0, 13.0, 11.0, 10.0, 4.0, 2.0, 3.0], "bins": [-28.5625, -27.728271484375, -26.89404296875, -26.059814453125, -25.2255859375, -24.391357421875, -23.55712890625, -22.722900390625, -21.888671875, -21.054443359375, -20.22021484375, -19.385986328125, -18.5517578125, -17.717529296875, -16.88330078125, -16.049072265625, -15.21484375, -14.380615234375, -13.54638671875, -12.712158203125, -11.8779296875, -11.043701171875, -10.20947265625, -9.375244140625, -8.541015625, -7.706787109375, -6.87255859375, -6.038330078125, -5.2041015625, -4.369873046875, -3.53564453125, -2.701416015625, -1.8671875, -1.032958984375, -0.19873046875, 0.635498046875, 1.4697265625, 2.303955078125, 3.13818359375, 3.972412109375, 4.806640625, 5.640869140625, 6.47509765625, 7.309326171875, 8.1435546875, 8.977783203125, 9.81201171875, 10.646240234375, 11.48046875, 12.314697265625, 13.14892578125, 13.983154296875, 14.8173828125, 15.651611328125, 16.48583984375, 17.320068359375, 18.154296875, 18.988525390625, 19.82275390625, 20.656982421875, 21.4912109375, 22.325439453125, 23.15966796875, 23.993896484375, 24.828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 9.0, 3.0, 6.0, 7.0, 9.0, 17.0, 15.0, 18.0, 19.0, 25.0, 24.0, 34.0, 30.0, 34.0, 38.0, 37.0, 32.0, 49.0, 32.0, 29.0, 39.0, 40.0, 37.0, 35.0, 44.0, 41.0, 32.0, 26.0, 28.0, 24.0, 36.0, 19.0, 12.0, 19.0, 11.0, 15.0, 15.0, 8.0, 8.0, 9.0, 5.0, 10.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0], "bins": [-32.46875, -31.539306640625, -30.60986328125, -29.680419921875, -28.7509765625, -27.821533203125, -26.89208984375, -25.962646484375, -25.033203125, -24.103759765625, -23.17431640625, -22.244873046875, -21.3154296875, -20.385986328125, -19.45654296875, -18.527099609375, -17.59765625, -16.668212890625, -15.73876953125, -14.809326171875, -13.8798828125, -12.950439453125, -12.02099609375, -11.091552734375, -10.162109375, -9.232666015625, -8.30322265625, -7.373779296875, -6.4443359375, -5.514892578125, -4.58544921875, -3.656005859375, -2.7265625, -1.797119140625, -0.86767578125, 0.061767578125, 0.9912109375, 1.920654296875, 2.85009765625, 3.779541015625, 4.708984375, 5.638427734375, 6.56787109375, 7.497314453125, 8.4267578125, 9.356201171875, 10.28564453125, 11.215087890625, 12.14453125, 13.073974609375, 14.00341796875, 14.932861328125, 15.8623046875, 16.791748046875, 17.72119140625, 18.650634765625, 19.580078125, 20.509521484375, 21.43896484375, 22.368408203125, 23.2978515625, 24.227294921875, 25.15673828125, 26.086181640625, 27.015625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 12.0, 17.0, 25.0, 30.0, 48.0, 84.0, 98.0, 178.0, 265.0, 372.0, 595.0, 928.0, 1427.0, 2159.0, 3602.0, 5655.0, 9022.0, 14010.0, 21581.0, 32217.0, 46460.0, 63651.0, 81026.0, 97646.0, 108389.0, 111123.0, 105261.0, 92111.0, 74404.0, 56747.0, 40681.0, 27479.0, 18561.0, 11997.0, 7580.0, 4740.0, 3003.0, 1921.0, 1174.0, 782.0, 485.0, 335.0, 231.0, 153.0, 104.0, 61.0, 54.0, 31.0, 14.0, 8.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0], "bins": [-10.9140625, -10.58642578125, -10.2587890625, -9.93115234375, -9.603515625, -9.27587890625, -8.9482421875, -8.62060546875, -8.29296875, -7.96533203125, -7.6376953125, -7.31005859375, -6.982421875, -6.65478515625, -6.3271484375, -5.99951171875, -5.671875, -5.34423828125, -5.0166015625, -4.68896484375, -4.361328125, -4.03369140625, -3.7060546875, -3.37841796875, -3.05078125, -2.72314453125, -2.3955078125, -2.06787109375, -1.740234375, -1.41259765625, -1.0849609375, -0.75732421875, -0.4296875, -0.10205078125, 0.2255859375, 0.55322265625, 0.880859375, 1.20849609375, 1.5361328125, 1.86376953125, 2.19140625, 2.51904296875, 2.8466796875, 3.17431640625, 3.501953125, 3.82958984375, 4.1572265625, 4.48486328125, 4.8125, 5.14013671875, 5.4677734375, 5.79541015625, 6.123046875, 6.45068359375, 6.7783203125, 7.10595703125, 7.43359375, 7.76123046875, 8.0888671875, 8.41650390625, 8.744140625, 9.07177734375, 9.3994140625, 9.72705078125, 10.0546875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 5.0, 5.0, 4.0, 14.0, 20.0, 21.0, 25.0, 29.0, 35.0, 43.0, 33.0, 71.0, 57.0, 61.0, 64.0, 79.0, 53.0, 46.0, 56.0, 51.0, 40.0, 39.0, 32.0, 24.0, 21.0, 13.0, 11.0, 11.0, 9.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018558502197265625, -0.0018012374639511108, -0.0017466247081756592, -0.0016920119524002075, -0.0016373991966247559, -0.0015827864408493042, -0.0015281736850738525, -0.0014735609292984009, -0.0014189481735229492, -0.0013643354177474976, -0.001309722661972046, -0.0012551099061965942, -0.0012004971504211426, -0.001145884394645691, -0.0010912716388702393, -0.0010366588830947876, -0.000982046127319336, -0.0009274333715438843, -0.0008728206157684326, -0.000818207859992981, -0.0007635951042175293, -0.0007089823484420776, -0.000654369592666626, -0.0005997568368911743, -0.0005451440811157227, -0.000490531325340271, -0.00043591856956481934, -0.0003813058137893677, -0.000326693058013916, -0.00027208030223846436, -0.0002174675464630127, -0.00016285479068756104, -0.00010824203491210938, -5.3629279136657715e-05, 9.834766387939453e-07, 5.5596232414245605e-05, 0.00011020898818969727, 0.00016482174396514893, 0.00021943449974060059, 0.00027404725551605225, 0.0003286600112915039, 0.00038327276706695557, 0.0004378855228424072, 0.0004924982786178589, 0.0005471110343933105, 0.0006017237901687622, 0.0006563365459442139, 0.0007109493017196655, 0.0007655620574951172, 0.0008201748132705688, 0.0008747875690460205, 0.0009294003248214722, 0.0009840130805969238, 0.0010386258363723755, 0.0010932385921478271, 0.0011478513479232788, 0.0012024641036987305, 0.0012570768594741821, 0.0013116896152496338, 0.0013663023710250854, 0.0014209151268005371, 0.0014755278825759888, 0.0015301406383514404, 0.001584753394126892, 0.0016393661499023438]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 7.0, 7.0, 7.0, 13.0, 21.0, 23.0, 49.0, 60.0, 98.0, 157.0, 223.0, 351.0, 559.0, 893.0, 1326.0, 1948.0, 3080.0, 4747.0, 7059.0, 10700.0, 15733.0, 22366.0, 31288.0, 41565.0, 54064.0, 67139.0, 78725.0, 87663.0, 93768.0, 93576.0, 88087.0, 79285.0, 66791.0, 54242.0, 41939.0, 31169.0, 22434.0, 15712.0, 10662.0, 7081.0, 4926.0, 3158.0, 2022.0, 1327.0, 921.0, 536.0, 374.0, 256.0, 151.0, 97.0, 68.0, 37.0, 35.0, 16.0, 14.0, 7.0, 1.0, 6.0, 1.0], "bins": [-9.9921875, -9.6983642578125, -9.404541015625, -9.1107177734375, -8.81689453125, -8.5230712890625, -8.229248046875, -7.9354248046875, -7.6416015625, -7.3477783203125, -7.053955078125, -6.7601318359375, -6.46630859375, -6.1724853515625, -5.878662109375, -5.5848388671875, -5.291015625, -4.9971923828125, -4.703369140625, -4.4095458984375, -4.11572265625, -3.8218994140625, -3.528076171875, -3.2342529296875, -2.9404296875, -2.6466064453125, -2.352783203125, -2.0589599609375, -1.76513671875, -1.4713134765625, -1.177490234375, -0.8836669921875, -0.58984375, -0.2960205078125, -0.002197265625, 0.2916259765625, 0.58544921875, 0.8792724609375, 1.173095703125, 1.4669189453125, 1.7607421875, 2.0545654296875, 2.348388671875, 2.6422119140625, 2.93603515625, 3.2298583984375, 3.523681640625, 3.8175048828125, 4.111328125, 4.4051513671875, 4.698974609375, 4.9927978515625, 5.28662109375, 5.5804443359375, 5.874267578125, 6.1680908203125, 6.4619140625, 6.7557373046875, 7.049560546875, 7.3433837890625, 7.63720703125, 7.9310302734375, 8.224853515625, 8.5186767578125, 8.8125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 5.0, 3.0, 5.0, 13.0, 5.0, 22.0, 14.0, 21.0, 21.0, 32.0, 27.0, 47.0, 36.0, 36.0, 42.0, 46.0, 60.0, 43.0, 47.0, 53.0, 41.0, 39.0, 51.0, 43.0, 32.0, 22.0, 31.0, 21.0, 32.0, 24.0, 19.0, 15.0, 8.0, 11.0, 8.0, 7.0, 12.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.16796875, -6.976318359375, -6.78466796875, -6.593017578125, -6.4013671875, -6.209716796875, -6.01806640625, -5.826416015625, -5.634765625, -5.443115234375, -5.25146484375, -5.059814453125, -4.8681640625, -4.676513671875, -4.48486328125, -4.293212890625, -4.1015625, -3.909912109375, -3.71826171875, -3.526611328125, -3.3349609375, -3.143310546875, -2.95166015625, -2.760009765625, -2.568359375, -2.376708984375, -2.18505859375, -1.993408203125, -1.8017578125, -1.610107421875, -1.41845703125, -1.226806640625, -1.03515625, -0.843505859375, -0.65185546875, -0.460205078125, -0.2685546875, -0.076904296875, 0.11474609375, 0.306396484375, 0.498046875, 0.689697265625, 0.88134765625, 1.072998046875, 1.2646484375, 1.456298828125, 1.64794921875, 1.839599609375, 2.03125, 2.222900390625, 2.41455078125, 2.606201171875, 2.7978515625, 2.989501953125, 3.18115234375, 3.372802734375, 3.564453125, 3.756103515625, 3.94775390625, 4.139404296875, 4.3310546875, 4.522705078125, 4.71435546875, 4.906005859375, 5.09765625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 7.0, 1.0, 2.0, 6.0, 8.0, 8.0, 15.0, 10.0, 13.0, 19.0, 25.0, 22.0, 27.0, 29.0, 29.0, 24.0, 29.0, 32.0, 33.0, 37.0, 32.0, 37.0, 47.0, 37.0, 45.0, 33.0, 37.0, 39.0, 33.0, 34.0, 30.0, 24.0, 24.0, 26.0, 29.0, 21.0, 21.0, 14.0, 11.0, 10.0, 10.0, 6.0, 8.0, 7.0, 8.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.17542266845703, -32.05216598510742, -30.928911209106445, -29.805654525756836, -28.682397842407227, -27.55914306640625, -26.43588638305664, -25.31262969970703, -24.189373016357422, -23.066116333007812, -21.942861557006836, -20.819604873657227, -19.696348190307617, -18.57309341430664, -17.44983673095703, -16.326580047607422, -15.203325271606445, -14.080069541931152, -12.956812858581543, -11.83355712890625, -10.71030044555664, -9.587044715881348, -8.463788986206055, -7.3405327796936035, -6.217276573181152, -5.094020366668701, -3.970764398574829, -2.847508430480957, -1.7242522239685059, -0.6009960174560547, 0.5222597122192383, 1.6455159187316895, 2.7687721252441406, 3.892028331756592, 5.015284538269043, 6.138540267944336, 7.261796474456787, 8.385052680969238, 9.508308410644531, 10.63156509399414, 11.754820823669434, 12.878076553344727, 14.001333236694336, 15.124588966369629, 16.247844696044922, 17.37110137939453, 18.49435806274414, 19.617612838745117, 20.740869522094727, 21.864126205444336, 22.987380981445312, 24.110637664794922, 25.23389434814453, 26.35715103149414, 27.480405807495117, 28.603662490844727, 29.726917266845703, 30.850173950195312, 31.97342872619629, 33.09668731689453, 34.219940185546875, 35.343196868896484, 36.466453552246094, 37.5897102355957, 38.71296691894531]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 4.0, 11.0, 13.0, 12.0, 8.0, 12.0, 13.0, 21.0, 17.0, 13.0, 27.0, 23.0, 24.0, 27.0, 31.0, 33.0, 32.0, 34.0, 40.0, 30.0, 45.0, 39.0, 35.0, 33.0, 42.0, 27.0, 47.0, 28.0, 31.0, 35.0, 36.0, 20.0, 31.0, 19.0, 18.0, 13.0, 18.0, 8.0, 11.0, 8.0, 7.0, 9.0, 5.0, 2.0, 2.0, 8.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-55.858551025390625, -54.249752044677734, -52.640953063964844, -51.03215408325195, -49.42335510253906, -47.81455612182617, -46.20575714111328, -44.59695816040039, -42.9881591796875, -41.37936019897461, -39.77056121826172, -38.16176223754883, -36.55296325683594, -34.94416427612305, -33.335365295410156, -31.726566314697266, -30.117769241333008, -28.508970260620117, -26.900171279907227, -25.291372299194336, -23.682573318481445, -22.073776245117188, -20.464977264404297, -18.856178283691406, -17.247379302978516, -15.638580322265625, -14.029781341552734, -12.420982360839844, -10.812183380126953, -9.203385353088379, -7.594586372375488, -5.985787391662598, -4.376987457275391, -2.7681884765625, -1.1593897342681885, 0.44940900802612305, 2.0582079887390137, 3.667006492614746, 5.275805473327637, 6.884604454040527, 8.493403434753418, 10.102202415466309, 11.7110013961792, 13.319799423217773, 14.928598403930664, 16.537397384643555, 18.146196365356445, 19.754995346069336, 21.363794326782227, 22.972593307495117, 24.581392288208008, 26.1901912689209, 27.79899024963379, 29.407787322998047, 31.016586303710938, 32.62538528442383, 34.23418426513672, 35.84298324584961, 37.4517822265625, 39.06058120727539, 40.66938018798828, 42.27817916870117, 43.88697814941406, 45.49577713012695, 47.104576110839844]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 1.0, 5.0, 4.0, 13.0, 16.0, 22.0, 25.0, 35.0, 62.0, 91.0, 137.0, 180.0, 281.0, 428.0, 581.0, 888.0, 1265.0, 1782.0, 2328.0, 2962.0, 3683.0, 4707.0, 6506.0, 1002653.0, 5365.0, 4163.0, 3232.0, 2610.0, 1941.0, 1426.0, 946.0, 712.0, 490.0, 316.0, 225.0, 172.0, 95.0, 74.0, 56.0, 39.0, 24.0, 18.0, 16.0, 10.0, 7.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-350.62738037109375, -339.39031982421875, -328.15325927734375, -316.91619873046875, -305.67913818359375, -294.44207763671875, -283.20501708984375, -271.96795654296875, -260.73089599609375, -249.49383544921875, -238.25677490234375, -227.01971435546875, -215.78265380859375, -204.54559326171875, -193.30853271484375, -182.07147216796875, -170.8344268798828, -159.5973663330078, -148.3603057861328, -137.1232452392578, -125.88618469238281, -114.64912414550781, -103.41207122802734, -92.17501068115234, -80.93795013427734, -69.70088958740234, -58.463829040527344, -47.22677230834961, -35.98971176147461, -24.75265121459961, -13.515594482421875, -2.278533935546875, 8.958526611328125, 20.195587158203125, 31.432645797729492, 42.66970443725586, 53.90676498413086, 65.14382934570312, 76.3808822631836, 87.6179428100586, 98.8550033569336, 110.0920639038086, 121.3291244506836, 132.56617736816406, 143.80323791503906, 155.04029846191406, 166.27735900878906, 177.51441955566406, 188.75148010253906, 199.98854064941406, 211.22560119628906, 222.46266174316406, 233.69972229003906, 244.93678283691406, 256.173828125, 267.410888671875, 278.64794921875, 289.885009765625, 301.1220703125, 312.359130859375, 323.59619140625, 334.833251953125, 346.0703125, 357.307373046875, 368.54443359375]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 6.0, 9.0, 18.0, 21.0, 23.0, 27.0, 52.0, 84.0, 124.0, 182.0, 285.0, 486.0, 869.0, 1516.0, 2660.0, 4889.0, 8977.0, 16412.0, 27901.0, 51772.0, 51267556.0, 36338.0, 22557.0, 13006.0, 6814.0, 3788.0, 2001.0, 1172.0, 676.0, 391.0, 254.0, 164.0, 99.0, 65.0, 42.0, 25.0, 17.0, 8.0, 12.0, 14.0, 6.0, 6.0, 3.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-351.46112060546875, -341.21087646484375, -330.9606628417969, -320.7104187011719, -310.4601745605469, -300.2099609375, -289.959716796875, -279.70947265625, -269.459228515625, -259.208984375, -248.95875549316406, -238.70852661132812, -228.45828247070312, -218.2080535888672, -207.95782470703125, -197.70758056640625, -187.45736694335938, -177.20713806152344, -166.95689392089844, -156.7066650390625, -146.4564208984375, -136.20619201660156, -125.95596313476562, -115.70572662353516, -105.45549011230469, -95.20525360107422, -84.95501708984375, -74.70478820800781, -64.45455169677734, -54.204315185546875, -43.95408248901367, -33.70384979248047, -23.453643798828125, -13.203409194946289, -2.953174591064453, 7.297060012817383, 17.54729461669922, 27.797531127929688, 38.04776382446289, 48.297996520996094, 58.54823303222656, 68.79846954345703, 79.0487060546875, 89.29893493652344, 99.5491714477539, 109.79940795898438, 120.04963684082031, 130.29986572265625, 140.55010986328125, 150.8003387451172, 161.0505828857422, 171.30081176757812, 181.55105590820312, 191.80128479003906, 202.051513671875, 212.3017578125, 222.55198669433594, 232.80221557617188, 243.05245971679688, 253.3026885986328, 263.55291748046875, 273.80316162109375, 284.05340576171875, 294.3036193847656, 304.5538635253906]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 8.0, 12.0, 10.0, 22.0, 23.0, 37.0, 54.0, 91.0, 154.0, 227.0, 354.0, 578.0, 892.0, 1449.0, 2466.0, 4133.0, 7253.0, 13437.0, 26828.0, 58162.0, 146052.0, 440805.0, 1844792.0, 2769601.0, 631666.0, 197253.0, 75066.0, 33076.0, 16347.0, 8630.0, 4698.0, 2776.0, 1732.0, 1037.0, 620.0, 398.0, 257.0, 153.0, 94.0, 67.0, 33.0, 29.0, 19.0, 18.0, 9.0, 11.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.0, -27.155029296875, -26.31005859375, -25.465087890625, -24.6201171875, -23.775146484375, -22.93017578125, -22.085205078125, -21.240234375, -20.395263671875, -19.55029296875, -18.705322265625, -17.8603515625, -17.015380859375, -16.17041015625, -15.325439453125, -14.48046875, -13.635498046875, -12.79052734375, -11.945556640625, -11.1005859375, -10.255615234375, -9.41064453125, -8.565673828125, -7.720703125, -6.875732421875, -6.03076171875, -5.185791015625, -4.3408203125, -3.495849609375, -2.65087890625, -1.805908203125, -0.9609375, -0.115966796875, 0.72900390625, 1.573974609375, 2.4189453125, 3.263916015625, 4.10888671875, 4.953857421875, 5.798828125, 6.643798828125, 7.48876953125, 8.333740234375, 9.1787109375, 10.023681640625, 10.86865234375, 11.713623046875, 12.55859375, 13.403564453125, 14.24853515625, 15.093505859375, 15.9384765625, 16.783447265625, 17.62841796875, 18.473388671875, 19.318359375, 20.163330078125, 21.00830078125, 21.853271484375, 22.6982421875, 23.543212890625, 24.38818359375, 25.233154296875, 26.078125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 1.0, 3.0, 9.0, 12.0, 11.0, 18.0, 19.0, 19.0, 19.0, 33.0, 32.0, 44.0, 35.0, 41.0, 48.0, 64.0, 107.0, 275.0, 550.0, 222.0, 87.0, 43.0, 36.0, 34.0, 32.0, 27.0, 35.0, 27.0, 21.0, 27.0, 22.0, 10.0, 10.0, 12.0, 10.0, 11.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.9375, -36.7392578125, -35.541015625, -34.3427734375, -33.14453125, -31.9462890625, -30.748046875, -29.5498046875, -28.3515625, -27.1533203125, -25.955078125, -24.7568359375, -23.55859375, -22.3603515625, -21.162109375, -19.9638671875, -18.765625, -17.5673828125, -16.369140625, -15.1708984375, -13.97265625, -12.7744140625, -11.576171875, -10.3779296875, -9.1796875, -7.9814453125, -6.783203125, -5.5849609375, -4.38671875, -3.1884765625, -1.990234375, -0.7919921875, 0.40625, 1.6044921875, 2.802734375, 4.0009765625, 5.19921875, 6.3974609375, 7.595703125, 8.7939453125, 9.9921875, 11.1904296875, 12.388671875, 13.5869140625, 14.78515625, 15.9833984375, 17.181640625, 18.3798828125, 19.578125, 20.7763671875, 21.974609375, 23.1728515625, 24.37109375, 25.5693359375, 26.767578125, 27.9658203125, 29.1640625, 30.3623046875, 31.560546875, 32.7587890625, 33.95703125, 35.1552734375, 36.353515625, 37.5517578125, 38.75]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 4.0, 5.0, 4.0, 24.0, 23.0, 36.0, 42.0, 62.0, 101.0, 166.0, 236.0, 381.0, 578.0, 989.0, 1647.0, 2598.0, 4592.0, 7944.0, 14399.0, 27209.0, 53753.0, 109829.0, 234572.0, 541636.0, 2383466.0, 1984640.0, 493519.0, 216953.0, 102664.0, 50446.0, 26291.0, 13826.0, 7809.0, 4359.0, 2608.0, 1506.0, 917.0, 577.0, 371.0, 214.0, 151.0, 100.0, 60.0, 42.0, 39.0, 15.0, 6.0, 7.0, 9.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.96875, -12.5498046875, -12.130859375, -11.7119140625, -11.29296875, -10.8740234375, -10.455078125, -10.0361328125, -9.6171875, -9.1982421875, -8.779296875, -8.3603515625, -7.94140625, -7.5224609375, -7.103515625, -6.6845703125, -6.265625, -5.8466796875, -5.427734375, -5.0087890625, -4.58984375, -4.1708984375, -3.751953125, -3.3330078125, -2.9140625, -2.4951171875, -2.076171875, -1.6572265625, -1.23828125, -0.8193359375, -0.400390625, 0.0185546875, 0.4375, 0.8564453125, 1.275390625, 1.6943359375, 2.11328125, 2.5322265625, 2.951171875, 3.3701171875, 3.7890625, 4.2080078125, 4.626953125, 5.0458984375, 5.46484375, 5.8837890625, 6.302734375, 6.7216796875, 7.140625, 7.5595703125, 7.978515625, 8.3974609375, 8.81640625, 9.2353515625, 9.654296875, 10.0732421875, 10.4921875, 10.9111328125, 11.330078125, 11.7490234375, 12.16796875, 12.5869140625, 13.005859375, 13.4248046875, 13.84375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 7.0, 8.0, 7.0, 15.0, 20.0, 29.0, 32.0, 30.0, 27.0, 46.0, 53.0, 65.0, 122.0, 469.0, 550.0, 109.0, 68.0, 45.0, 51.0, 37.0, 47.0, 42.0, 26.0, 23.0, 13.0, 20.0, 6.0, 9.0, 8.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.625, -39.322265625, -38.01953125, -36.716796875, -35.4140625, -34.111328125, -32.80859375, -31.505859375, -30.203125, -28.900390625, -27.59765625, -26.294921875, -24.9921875, -23.689453125, -22.38671875, -21.083984375, -19.78125, -18.478515625, -17.17578125, -15.873046875, -14.5703125, -13.267578125, -11.96484375, -10.662109375, -9.359375, -8.056640625, -6.75390625, -5.451171875, -4.1484375, -2.845703125, -1.54296875, -0.240234375, 1.0625, 2.365234375, 3.66796875, 4.970703125, 6.2734375, 7.576171875, 8.87890625, 10.181640625, 11.484375, 12.787109375, 14.08984375, 15.392578125, 16.6953125, 17.998046875, 19.30078125, 20.603515625, 21.90625, 23.208984375, 24.51171875, 25.814453125, 27.1171875, 28.419921875, 29.72265625, 31.025390625, 32.328125, 33.630859375, 34.93359375, 36.236328125, 37.5390625, 38.841796875, 40.14453125, 41.447265625, 42.75]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 9.0, 5.0, 5.0, 3.0, 5.0, 4.0, 14.0, 16.0, 28.0, 23.0, 47.0, 63.0, 77.0, 69.0, 98.0, 129.0, 168.0, 240.0, 328.0, 449.0, 636.0, 876.0, 1510.0, 2655.0, 4479.0, 9783.0, 24320.0, 94634.0, 5985274.0, 115574.0, 26953.0, 10141.0, 4866.0, 2738.0, 1608.0, 1061.0, 743.0, 443.0, 362.0, 262.0, 205.0, 104.0, 69.0, 80.0, 92.0, 56.0, 38.0, 28.0, 27.0, 11.0, 7.0, 4.0, 4.0, 6.0, 7.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-112.3125, -108.751953125, -105.19140625, -101.630859375, -98.0703125, -94.509765625, -90.94921875, -87.388671875, -83.828125, -80.267578125, -76.70703125, -73.146484375, -69.5859375, -66.025390625, -62.46484375, -58.904296875, -55.34375, -51.783203125, -48.22265625, -44.662109375, -41.1015625, -37.541015625, -33.98046875, -30.419921875, -26.859375, -23.298828125, -19.73828125, -16.177734375, -12.6171875, -9.056640625, -5.49609375, -1.935546875, 1.625, 5.185546875, 8.74609375, 12.306640625, 15.8671875, 19.427734375, 22.98828125, 26.548828125, 30.109375, 33.669921875, 37.23046875, 40.791015625, 44.3515625, 47.912109375, 51.47265625, 55.033203125, 58.59375, 62.154296875, 65.71484375, 69.275390625, 72.8359375, 76.396484375, 79.95703125, 83.517578125, 87.078125, 90.638671875, 94.19921875, 97.759765625, 101.3203125, 104.880859375, 108.44140625, 112.001953125, 115.5625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 9.0, 4.0, 6.0, 9.0, 14.0, 14.0, 12.0, 15.0, 17.0, 25.0, 28.0, 38.0, 35.0, 47.0, 49.0, 74.0, 126.0, 560.0, 485.0, 77.0, 55.0, 58.0, 36.0, 39.0, 28.0, 25.0, 20.0, 18.0, 19.0, 7.0, 12.0, 10.0, 6.0, 3.0, 10.0, 2.0, 6.0, 10.0, 4.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.15625, -47.46630859375, -45.7763671875, -44.08642578125, -42.396484375, -40.70654296875, -39.0166015625, -37.32666015625, -35.63671875, -33.94677734375, -32.2568359375, -30.56689453125, -28.876953125, -27.18701171875, -25.4970703125, -23.80712890625, -22.1171875, -20.42724609375, -18.7373046875, -17.04736328125, -15.357421875, -13.66748046875, -11.9775390625, -10.28759765625, -8.59765625, -6.90771484375, -5.2177734375, -3.52783203125, -1.837890625, -0.14794921875, 1.5419921875, 3.23193359375, 4.921875, 6.61181640625, 8.3017578125, 9.99169921875, 11.681640625, 13.37158203125, 15.0615234375, 16.75146484375, 18.44140625, 20.13134765625, 21.8212890625, 23.51123046875, 25.201171875, 26.89111328125, 28.5810546875, 30.27099609375, 31.9609375, 33.65087890625, 35.3408203125, 37.03076171875, 38.720703125, 40.41064453125, 42.1005859375, 43.79052734375, 45.48046875, 47.17041015625, 48.8603515625, 50.55029296875, 52.240234375, 53.93017578125, 55.6201171875, 57.31005859375, 59.0]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 15.0, 30.0, 92.0, 679.0, 119.0, 28.0, 14.0, 5.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1535.124755859375, -1502.946533203125, -1470.768310546875, -1438.590087890625, -1406.411865234375, -1374.233642578125, -1342.055419921875, -1309.8773193359375, -1277.6990966796875, -1245.5208740234375, -1213.3426513671875, -1181.1644287109375, -1148.9862060546875, -1116.80810546875, -1084.6298828125, -1052.45166015625, -1020.2733764648438, -988.0951538085938, -955.9169311523438, -923.73876953125, -891.560546875, -859.38232421875, -827.2041015625, -795.02587890625, -762.84765625, -730.66943359375, -698.4912109375, -666.31298828125, -634.1348266601562, -601.9566040039062, -569.7783813476562, -537.6001586914062, -505.42193603515625, -473.24371337890625, -441.0655212402344, -408.8872985839844, -376.7091064453125, -344.5308837890625, -312.3526611328125, -280.1744384765625, -247.99624633789062, -215.8180389404297, -183.63983154296875, -151.46160888671875, -119.28340148925781, -87.10519409179688, -54.926971435546875, -22.748764038085938, 9.429443359375, 41.6076545715332, 73.7858657836914, 105.96408081054688, 138.1422882080078, 170.32049560546875, 202.49871826171875, 234.6769256591797, 266.8551330566406, 299.0333557128906, 331.2115478515625, 363.3897705078125, 395.5679931640625, 427.7461853027344, 459.9244079589844, 492.10260009765625, 524.2808227539062]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 8.0, 5.0, 6.0, 8.0, 6.0, 12.0, 33.0, 60.0, 612.0, 137.0, 40.0, 22.0, 9.0, 8.0, 4.0, 6.0, 5.0, 3.0, 5.0, 1.0, 0.0, 7.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1853.9193115234375, -1803.4644775390625, -1753.0096435546875, -1702.5546875, -1652.099853515625, -1601.64501953125, -1551.190185546875, -1500.7353515625, -1450.2803955078125, -1399.8255615234375, -1349.3707275390625, -1298.915771484375, -1248.4609375, -1198.006103515625, -1147.55126953125, -1097.096435546875, -1046.6416015625, -996.186767578125, -945.7318725585938, -895.2770385742188, -844.8221435546875, -794.3673095703125, -743.9124755859375, -693.4575805664062, -643.002685546875, -592.5478515625, -542.0929565429688, -491.63812255859375, -441.1832275390625, -390.7283935546875, -340.2735290527344, -289.81866455078125, -239.36376953125, -188.90890502929688, -138.45404052734375, -87.99919128417969, -37.54432678222656, 12.910537719726562, 63.365386962890625, 113.82025146484375, 164.27511596679688, 214.72998046875, 265.1848449707031, 315.63970947265625, 366.09454345703125, 416.5494384765625, 467.0042724609375, 517.4591064453125, 567.9140014648438, 618.3688354492188, 668.82373046875, 719.278564453125, 769.7334594726562, 820.1882934570312, 870.6431884765625, 921.0980224609375, 971.5528564453125, 1022.0076904296875, 1072.4625244140625, 1122.91748046875, 1173.372314453125, 1223.8271484375, 1274.281982421875, 1324.73681640625, 1375.1917724609375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 8.0, 9.0, 10.0, 16.0, 18.0, 12.0, 42.0, 55.0, 65.0, 86.0, 113.0, 191.0, 208.0, 309.0, 432.0, 649.0, 1035.0, 1582.0, 3056.0, 6078.0, 13127.0, 34586.0, 123474.0, 3404402.0, 511747.0, 56217.0, 18821.0, 8390.0, 4056.0, 2151.0, 1219.0, 744.0, 478.0, 296.0, 185.0, 127.0, 97.0, 58.0, 43.0, 22.0, 16.0, 16.0, 11.0, 7.0, 7.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.76171875, -4.61181640625, -4.4619140625, -4.31201171875, -4.162109375, -4.01220703125, -3.8623046875, -3.71240234375, -3.5625, -3.41259765625, -3.2626953125, -3.11279296875, -2.962890625, -2.81298828125, -2.6630859375, -2.51318359375, -2.36328125, -2.21337890625, -2.0634765625, -1.91357421875, -1.763671875, -1.61376953125, -1.4638671875, -1.31396484375, -1.1640625, -1.01416015625, -0.8642578125, -0.71435546875, -0.564453125, -0.41455078125, -0.2646484375, -0.11474609375, 0.03515625, 0.18505859375, 0.3349609375, 0.48486328125, 0.634765625, 0.78466796875, 0.9345703125, 1.08447265625, 1.234375, 1.38427734375, 1.5341796875, 1.68408203125, 1.833984375, 1.98388671875, 2.1337890625, 2.28369140625, 2.43359375, 2.58349609375, 2.7333984375, 2.88330078125, 3.033203125, 3.18310546875, 3.3330078125, 3.48291015625, 3.6328125, 3.78271484375, 3.9326171875, 4.08251953125, 4.232421875, 4.38232421875, 4.5322265625, 4.68212890625, 4.83203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 13.0, 17.0, 17.0, 32.0, 144.0, 453.0, 209.0, 41.0, 23.0, 20.0, 4.0, 1.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69970703125, -0.6782073974609375, -0.656707763671875, -0.6352081298828125, -0.61370849609375, -0.5922088623046875, -0.570709228515625, -0.5492095947265625, -0.5277099609375, -0.5062103271484375, -0.484710693359375, -0.4632110595703125, -0.44171142578125, -0.4202117919921875, -0.398712158203125, -0.3772125244140625, -0.355712890625, -0.3342132568359375, -0.312713623046875, -0.2912139892578125, -0.26971435546875, -0.2482147216796875, -0.226715087890625, -0.2052154541015625, -0.1837158203125, -0.1622161865234375, -0.140716552734375, -0.1192169189453125, -0.09771728515625, -0.0762176513671875, -0.054718017578125, -0.0332183837890625, -0.01171875, 0.0097808837890625, 0.031280517578125, 0.0527801513671875, 0.07427978515625, 0.0957794189453125, 0.117279052734375, 0.1387786865234375, 0.1602783203125, 0.1817779541015625, 0.203277587890625, 0.2247772216796875, 0.24627685546875, 0.2677764892578125, 0.289276123046875, 0.3107757568359375, 0.332275390625, 0.3537750244140625, 0.375274658203125, 0.3967742919921875, 0.41827392578125, 0.4397735595703125, 0.461273193359375, 0.4827728271484375, 0.5042724609375, 0.5257720947265625, 0.547271728515625, 0.5687713623046875, 0.59027099609375, 0.6117706298828125, 0.633270263671875, 0.6547698974609375, 0.67626953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 8.0, 4.0, 6.0, 18.0, 14.0, 25.0, 34.0, 37.0, 71.0, 113.0, 189.0, 296.0, 558.0, 1144.0, 2502.0, 6618.0, 22889.0, 124147.0, 1392822.0, 2416322.0, 182407.0, 29932.0, 8266.0, 2997.0, 1301.0, 619.0, 348.0, 182.0, 129.0, 78.0, 56.0, 40.0, 24.0, 20.0, 16.0, 10.0, 9.0, 12.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.12890625, -4.00030517578125, -3.8717041015625, -3.74310302734375, -3.614501953125, -3.48590087890625, -3.3572998046875, -3.22869873046875, -3.10009765625, -2.97149658203125, -2.8428955078125, -2.71429443359375, -2.585693359375, -2.45709228515625, -2.3284912109375, -2.19989013671875, -2.0712890625, -1.94268798828125, -1.8140869140625, -1.68548583984375, -1.556884765625, -1.42828369140625, -1.2996826171875, -1.17108154296875, -1.04248046875, -0.91387939453125, -0.7852783203125, -0.65667724609375, -0.528076171875, -0.39947509765625, -0.2708740234375, -0.14227294921875, -0.013671875, 0.11492919921875, 0.2435302734375, 0.37213134765625, 0.500732421875, 0.62933349609375, 0.7579345703125, 0.88653564453125, 1.01513671875, 1.14373779296875, 1.2723388671875, 1.40093994140625, 1.529541015625, 1.65814208984375, 1.7867431640625, 1.91534423828125, 2.0439453125, 2.17254638671875, 2.3011474609375, 2.42974853515625, 2.558349609375, 2.68695068359375, 2.8155517578125, 2.94415283203125, 3.07275390625, 3.20135498046875, 3.3299560546875, 3.45855712890625, 3.587158203125, 3.71575927734375, 3.8443603515625, 3.97296142578125, 4.1015625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 13.0, 13.0, 10.0, 20.0, 17.0, 32.0, 26.0, 37.0, 37.0, 67.0, 64.0, 92.0, 110.0, 135.0, 169.0, 205.0, 246.0, 264.0, 310.0, 404.0, 371.0, 302.0, 222.0, 198.0, 149.0, 128.0, 116.0, 68.0, 52.0, 41.0, 39.0, 23.0, 17.0, 16.0, 14.0, 9.0, 11.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.69287109375, -0.673431396484375, -0.65399169921875, -0.634552001953125, -0.6151123046875, -0.595672607421875, -0.57623291015625, -0.556793212890625, -0.537353515625, -0.517913818359375, -0.49847412109375, -0.479034423828125, -0.4595947265625, -0.440155029296875, -0.42071533203125, -0.401275634765625, -0.3818359375, -0.362396240234375, -0.34295654296875, -0.323516845703125, -0.3040771484375, -0.284637451171875, -0.26519775390625, -0.245758056640625, -0.226318359375, -0.206878662109375, -0.18743896484375, -0.167999267578125, -0.1485595703125, -0.129119873046875, -0.10968017578125, -0.090240478515625, -0.07080078125, -0.051361083984375, -0.03192138671875, -0.012481689453125, 0.0069580078125, 0.026397705078125, 0.04583740234375, 0.065277099609375, 0.084716796875, 0.104156494140625, 0.12359619140625, 0.143035888671875, 0.1624755859375, 0.181915283203125, 0.20135498046875, 0.220794677734375, 0.240234375, 0.259674072265625, 0.27911376953125, 0.298553466796875, 0.3179931640625, 0.337432861328125, 0.35687255859375, 0.376312255859375, 0.395751953125, 0.415191650390625, 0.43463134765625, 0.454071044921875, 0.4735107421875, 0.492950439453125, 0.51239013671875, 0.531829833984375, 0.55126953125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 9.0, 33.0, 69.0, 143.0, 316.0, 289.0, 90.0, 28.0, 14.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.354766845703125, -35.63087844848633, -34.90699005126953, -34.183101654052734, -33.45921325683594, -32.735328674316406, -32.01144027709961, -31.287551879882812, -30.563663482666016, -29.83977508544922, -29.115886688232422, -28.392000198364258, -27.66811180114746, -26.944223403930664, -26.2203369140625, -25.496448516845703, -24.772560119628906, -24.04867172241211, -23.324783325195312, -22.60089683532715, -21.87700843811035, -21.153120040893555, -20.42923355102539, -19.705345153808594, -18.981456756591797, -18.257568359375, -17.533679962158203, -16.80979347229004, -16.085905075073242, -15.362016677856445, -14.638129234313965, -13.914241790771484, -13.190354347229004, -12.466466903686523, -11.742578506469727, -11.01869010925293, -10.29480266571045, -9.570915222167969, -8.847026824951172, -8.123138427734375, -7.3992509841918945, -6.675363063812256, -5.951475143432617, -5.2275872230529785, -4.50369930267334, -3.779811382293701, -3.0559234619140625, -2.332035541534424, -1.6081476211547852, -0.8842597007751465, -0.1603717803955078, 0.5635161399841309, 1.2874040603637695, 2.011291980743408, 2.735179901123047, 3.4590678215026855, 4.182955741882324, 4.906843662261963, 5.630731582641602, 6.35461950302124, 7.078507423400879, 7.802395343780518, 8.526283264160156, 9.250171661376953, 9.974059104919434]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 9.0, 3.0, 4.0, 7.0, 7.0, 13.0, 16.0, 22.0, 25.0, 33.0, 47.0, 36.0, 40.0, 58.0, 59.0, 56.0, 65.0, 58.0, 59.0, 57.0, 53.0, 40.0, 45.0, 29.0, 33.0, 26.0, 29.0, 18.0, 15.0, 13.0, 11.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.024668216705322, -6.797572612762451, -6.570477485656738, -6.343381881713867, -6.116286277770996, -5.889191150665283, -5.662095546722412, -5.435000419616699, -5.207904815673828, -4.980809211730957, -4.753714084625244, -4.526618480682373, -4.29952335357666, -4.072427749633789, -3.845332145690918, -3.618236780166626, -3.391141414642334, -3.164046049118042, -2.93695068359375, -2.709855079650879, -2.482759714126587, -2.255664348602295, -2.028568744659424, -1.8014733791351318, -1.5743780136108398, -1.3472826480865479, -1.1201871633529663, -0.8930917382240295, -0.6659963130950928, -0.4389009475708008, -0.21180546283721924, 0.015290021896362305, 0.2423858642578125, 0.46948128938674927, 0.696576714515686, 0.9236721396446228, 1.1507675647735596, 1.3778629302978516, 1.604958415031433, 1.8320538997650146, 2.0591492652893066, 2.2862446308135986, 2.5133399963378906, 2.7404356002807617, 2.9675309658050537, 3.1946263313293457, 3.421721935272217, 3.648817300796509, 3.875912666320801, 4.103008270263672, 4.330103397369385, 4.557199001312256, 4.784294128417969, 5.01138973236084, 5.238485336303711, 5.465580940246582, 5.692676067352295, 5.919771671295166, 6.146866798400879, 6.37396240234375, 6.601058006286621, 6.828153133392334, 7.055248737335205, 7.282343864440918, 7.509439468383789]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 4.0, 14.0, 14.0, 18.0, 20.0, 35.0, 37.0, 47.0, 87.0, 125.0, 165.0, 268.0, 450.0, 710.0, 1251.0, 2464.0, 5679.0, 17087.0, 106324.0, 807249.0, 81151.0, 14780.0, 5184.0, 2283.0, 1211.0, 640.0, 405.0, 274.0, 155.0, 108.0, 97.0, 43.0, 36.0, 30.0, 27.0, 19.0, 16.0, 10.0, 5.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.78125, -4.62921142578125, -4.4771728515625, -4.32513427734375, -4.173095703125, -4.02105712890625, -3.8690185546875, -3.71697998046875, -3.56494140625, -3.41290283203125, -3.2608642578125, -3.10882568359375, -2.956787109375, -2.80474853515625, -2.6527099609375, -2.50067138671875, -2.3486328125, -2.19659423828125, -2.0445556640625, -1.89251708984375, -1.740478515625, -1.58843994140625, -1.4364013671875, -1.28436279296875, -1.13232421875, -0.98028564453125, -0.8282470703125, -0.67620849609375, -0.524169921875, -0.37213134765625, -0.2200927734375, -0.06805419921875, 0.083984375, 0.23602294921875, 0.3880615234375, 0.54010009765625, 0.692138671875, 0.84417724609375, 0.9962158203125, 1.14825439453125, 1.30029296875, 1.45233154296875, 1.6043701171875, 1.75640869140625, 1.908447265625, 2.06048583984375, 2.2125244140625, 2.36456298828125, 2.5166015625, 2.66864013671875, 2.8206787109375, 2.97271728515625, 3.124755859375, 3.27679443359375, 3.4288330078125, 3.58087158203125, 3.73291015625, 3.88494873046875, 4.0369873046875, 4.18902587890625, 4.341064453125, 4.49310302734375, 4.6451416015625, 4.79718017578125, 4.94921875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 4.0, 6.0, 14.0, 10.0, 20.0, 33.0, 55.0, 127.0, 167.0, 159.0, 160.0, 101.0, 63.0, 17.0, 11.0, 11.0, 11.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.56689453125, -0.5516586303710938, -0.5364227294921875, -0.5211868286132812, -0.505950927734375, -0.49071502685546875, -0.4754791259765625, -0.46024322509765625, -0.44500732421875, -0.42977142333984375, -0.4145355224609375, -0.39929962158203125, -0.384063720703125, -0.36882781982421875, -0.3535919189453125, -0.33835601806640625, -0.3231201171875, -0.30788421630859375, -0.2926483154296875, -0.27741241455078125, -0.262176513671875, -0.24694061279296875, -0.2317047119140625, -0.21646881103515625, -0.20123291015625, -0.18599700927734375, -0.1707611083984375, -0.15552520751953125, -0.140289306640625, -0.12505340576171875, -0.1098175048828125, -0.09458160400390625, -0.079345703125, -0.06410980224609375, -0.0488739013671875, -0.03363800048828125, -0.018402099609375, -0.00316619873046875, 0.0120697021484375, 0.02730560302734375, 0.04254150390625, 0.05777740478515625, 0.0730133056640625, 0.08824920654296875, 0.103485107421875, 0.11872100830078125, 0.1339569091796875, 0.14919281005859375, 0.1644287109375, 0.17966461181640625, 0.1949005126953125, 0.21013641357421875, 0.225372314453125, 0.24060821533203125, 0.2558441162109375, 0.27108001708984375, 0.28631591796875, 0.30155181884765625, 0.3167877197265625, 0.33202362060546875, 0.347259521484375, 0.36249542236328125, 0.3777313232421875, 0.39296722412109375, 0.408203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 11.0, 9.0, 12.0, 18.0, 31.0, 20.0, 34.0, 53.0, 53.0, 88.0, 152.0, 253.0, 416.0, 825.0, 1702.0, 4464.0, 14333.0, 103457.0, 826069.0, 76762.0, 12366.0, 4014.0, 1531.0, 717.0, 411.0, 222.0, 140.0, 144.0, 70.0, 56.0, 40.0, 18.0, 17.0, 14.0, 7.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.3203125, -5.151123046875, -4.98193359375, -4.812744140625, -4.6435546875, -4.474365234375, -4.30517578125, -4.135986328125, -3.966796875, -3.797607421875, -3.62841796875, -3.459228515625, -3.2900390625, -3.120849609375, -2.95166015625, -2.782470703125, -2.61328125, -2.444091796875, -2.27490234375, -2.105712890625, -1.9365234375, -1.767333984375, -1.59814453125, -1.428955078125, -1.259765625, -1.090576171875, -0.92138671875, -0.752197265625, -0.5830078125, -0.413818359375, -0.24462890625, -0.075439453125, 0.09375, 0.262939453125, 0.43212890625, 0.601318359375, 0.7705078125, 0.939697265625, 1.10888671875, 1.278076171875, 1.447265625, 1.616455078125, 1.78564453125, 1.954833984375, 2.1240234375, 2.293212890625, 2.46240234375, 2.631591796875, 2.80078125, 2.969970703125, 3.13916015625, 3.308349609375, 3.4775390625, 3.646728515625, 3.81591796875, 3.985107421875, 4.154296875, 4.323486328125, 4.49267578125, 4.661865234375, 4.8310546875, 5.000244140625, 5.16943359375, 5.338623046875, 5.5078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 4.0, 7.0, 8.0, 17.0, 15.0, 14.0, 15.0, 16.0, 18.0, 31.0, 22.0, 17.0, 26.0, 28.0, 31.0, 39.0, 40.0, 36.0, 31.0, 30.0, 38.0, 45.0, 45.0, 35.0, 27.0, 38.0, 39.0, 28.0, 28.0, 32.0, 26.0, 29.0, 22.0, 16.0, 11.0, 18.0, 12.0, 14.0, 10.0, 9.0, 6.0, 5.0, 3.0, 6.0, 6.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-1.3828125, -1.3380889892578125, -1.293365478515625, -1.2486419677734375, -1.20391845703125, -1.1591949462890625, -1.114471435546875, -1.0697479248046875, -1.0250244140625, -0.9803009033203125, -0.935577392578125, -0.8908538818359375, -0.84613037109375, -0.8014068603515625, -0.756683349609375, -0.7119598388671875, -0.667236328125, -0.6225128173828125, -0.577789306640625, -0.5330657958984375, -0.48834228515625, -0.4436187744140625, -0.398895263671875, -0.3541717529296875, -0.3094482421875, -0.2647247314453125, -0.220001220703125, -0.1752777099609375, -0.13055419921875, -0.0858306884765625, -0.041107177734375, 0.0036163330078125, 0.04833984375, 0.0930633544921875, 0.137786865234375, 0.1825103759765625, 0.22723388671875, 0.2719573974609375, 0.316680908203125, 0.3614044189453125, 0.4061279296875, 0.4508514404296875, 0.495574951171875, 0.5402984619140625, 0.58502197265625, 0.6297454833984375, 0.674468994140625, 0.7191925048828125, 0.763916015625, 0.8086395263671875, 0.853363037109375, 0.8980865478515625, 0.94281005859375, 0.9875335693359375, 1.032257080078125, 1.0769805908203125, 1.1217041015625, 1.1664276123046875, 1.211151123046875, 1.2558746337890625, 1.30059814453125, 1.3453216552734375, 1.390045166015625, 1.4347686767578125, 1.4794921875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 7.0, 8.0, 14.0, 11.0, 10.0, 15.0, 23.0, 29.0, 45.0, 66.0, 91.0, 147.0, 173.0, 281.0, 503.0, 998.0, 2060.0, 5653.0, 26249.0, 727129.0, 260539.0, 16590.0, 4232.0, 1604.0, 815.0, 397.0, 301.0, 154.0, 97.0, 91.0, 46.0, 49.0, 31.0, 16.0, 13.0, 16.0, 9.0, 8.0, 7.0, 7.0, 6.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.859375, -7.62030029296875, -7.3812255859375, -7.14215087890625, -6.903076171875, -6.66400146484375, -6.4249267578125, -6.18585205078125, -5.94677734375, -5.70770263671875, -5.4686279296875, -5.22955322265625, -4.990478515625, -4.75140380859375, -4.5123291015625, -4.27325439453125, -4.0341796875, -3.79510498046875, -3.5560302734375, -3.31695556640625, -3.077880859375, -2.83880615234375, -2.5997314453125, -2.36065673828125, -2.12158203125, -1.88250732421875, -1.6434326171875, -1.40435791015625, -1.165283203125, -0.92620849609375, -0.6871337890625, -0.44805908203125, -0.208984375, 0.03009033203125, 0.2691650390625, 0.50823974609375, 0.747314453125, 0.98638916015625, 1.2254638671875, 1.46453857421875, 1.70361328125, 1.94268798828125, 2.1817626953125, 2.42083740234375, 2.659912109375, 2.89898681640625, 3.1380615234375, 3.37713623046875, 3.6162109375, 3.85528564453125, 4.0943603515625, 4.33343505859375, 4.572509765625, 4.81158447265625, 5.0506591796875, 5.28973388671875, 5.52880859375, 5.76788330078125, 6.0069580078125, 6.24603271484375, 6.485107421875, 6.72418212890625, 6.9632568359375, 7.20233154296875, 7.44140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 3.0, 4.0, 0.0, 4.0, 3.0, 5.0, 3.0, 8.0, 3.0, 4.0, 6.0, 12.0, 11.0, 20.0, 25.0, 24.0, 25.0, 43.0, 60.0, 89.0, 124.0, 107.0, 111.0, 67.0, 44.0, 33.0, 31.0, 14.0, 18.0, 16.0, 12.0, 15.0, 15.0, 6.0, 5.0, 10.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003960132598876953, -0.0003804527223110199, -0.0003648921847343445, -0.00034933164715766907, -0.00033377110958099365, -0.00031821057200431824, -0.0003026500344276428, -0.0002870894968509674, -0.000271528959274292, -0.0002559684216976166, -0.00024040788412094116, -0.00022484734654426575, -0.00020928680896759033, -0.00019372627139091492, -0.0001781657338142395, -0.0001626051962375641, -0.00014704465866088867, -0.00013148412108421326, -0.00011592358350753784, -0.00010036304593086243, -8.480250835418701e-05, -6.92419707775116e-05, -5.368143320083618e-05, -3.8120895624160767e-05, -2.256035804748535e-05, -6.9998204708099365e-06, 8.560717105865479e-06, 2.4121254682540894e-05, 3.968179225921631e-05, 5.5242329835891724e-05, 7.080286741256714e-05, 8.636340498924255e-05, 0.00010192394256591797, 0.00011748448014259338, 0.0001330450177192688, 0.00014860555529594421, 0.00016416609287261963, 0.00017972663044929504, 0.00019528716802597046, 0.00021084770560264587, 0.0002264082431793213, 0.0002419687807559967, 0.0002575293183326721, 0.00027308985590934753, 0.00028865039348602295, 0.00030421093106269836, 0.0003197714686393738, 0.0003353320062160492, 0.0003508925437927246, 0.0003664530813694, 0.00038201361894607544, 0.00039757415652275085, 0.00041313469409942627, 0.0004286952316761017, 0.0004442557692527771, 0.0004598163068294525, 0.00047537684440612793, 0.0004909373819828033, 0.0005064979195594788, 0.0005220584571361542, 0.0005376189947128296, 0.000553179532289505, 0.0005687400698661804, 0.0005843006074428558, 0.0005998611450195312]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 4.0, 3.0, 4.0, 15.0, 11.0, 27.0, 45.0, 54.0, 88.0, 129.0, 269.0, 467.0, 960.0, 2192.0, 6252.0, 29043.0, 730750.0, 252650.0, 17598.0, 4596.0, 1687.0, 804.0, 382.0, 208.0, 108.0, 74.0, 43.0, 29.0, 18.0, 17.0, 10.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0, -7.7489013671875, -7.497802734375, -7.2467041015625, -6.99560546875, -6.7445068359375, -6.493408203125, -6.2423095703125, -5.9912109375, -5.7401123046875, -5.489013671875, -5.2379150390625, -4.98681640625, -4.7357177734375, -4.484619140625, -4.2335205078125, -3.982421875, -3.7313232421875, -3.480224609375, -3.2291259765625, -2.97802734375, -2.7269287109375, -2.475830078125, -2.2247314453125, -1.9736328125, -1.7225341796875, -1.471435546875, -1.2203369140625, -0.96923828125, -0.7181396484375, -0.467041015625, -0.2159423828125, 0.03515625, 0.2862548828125, 0.537353515625, 0.7884521484375, 1.03955078125, 1.2906494140625, 1.541748046875, 1.7928466796875, 2.0439453125, 2.2950439453125, 2.546142578125, 2.7972412109375, 3.04833984375, 3.2994384765625, 3.550537109375, 3.8016357421875, 4.052734375, 4.3038330078125, 4.554931640625, 4.8060302734375, 5.05712890625, 5.3082275390625, 5.559326171875, 5.8104248046875, 6.0615234375, 6.3126220703125, 6.563720703125, 6.8148193359375, 7.06591796875, 7.3170166015625, 7.568115234375, 7.8192138671875, 8.0703125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 7.0, 3.0, 4.0, 5.0, 4.0, 15.0, 6.0, 11.0, 11.0, 22.0, 41.0, 48.0, 73.0, 99.0, 124.0, 116.0, 119.0, 88.0, 63.0, 40.0, 24.0, 20.0, 16.0, 15.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.201171875, -3.088165283203125, -2.97515869140625, -2.862152099609375, -2.7491455078125, -2.636138916015625, -2.52313232421875, -2.410125732421875, -2.297119140625, -2.184112548828125, -2.07110595703125, -1.958099365234375, -1.8450927734375, -1.732086181640625, -1.61907958984375, -1.506072998046875, -1.39306640625, -1.280059814453125, -1.16705322265625, -1.054046630859375, -0.9410400390625, -0.828033447265625, -0.71502685546875, -0.602020263671875, -0.489013671875, -0.376007080078125, -0.26300048828125, -0.149993896484375, -0.0369873046875, 0.076019287109375, 0.18902587890625, 0.302032470703125, 0.4150390625, 0.528045654296875, 0.64105224609375, 0.754058837890625, 0.8670654296875, 0.980072021484375, 1.09307861328125, 1.206085205078125, 1.319091796875, 1.432098388671875, 1.54510498046875, 1.658111572265625, 1.7711181640625, 1.884124755859375, 1.99713134765625, 2.110137939453125, 2.22314453125, 2.336151123046875, 2.44915771484375, 2.562164306640625, 2.6751708984375, 2.788177490234375, 2.90118408203125, 3.014190673828125, 3.127197265625, 3.240203857421875, 3.35321044921875, 3.466217041015625, 3.5792236328125, 3.692230224609375, 3.80523681640625, 3.918243408203125, 4.03125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 7.0, 6.0, 14.0, 9.0, 20.0, 49.0, 102.0, 240.0, 346.0, 129.0, 43.0, 9.0, 9.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.63504028320312, -67.18753814697266, -65.74003601074219, -64.29254150390625, -62.845035552978516, -61.39753723144531, -59.950035095214844, -58.502532958984375, -57.055030822753906, -55.60752868652344, -54.160030364990234, -52.712528228759766, -51.2650260925293, -49.817527770996094, -48.370025634765625, -46.922523498535156, -45.47502517700195, -44.027523040771484, -42.58002471923828, -41.13252258300781, -39.685020446777344, -38.237518310546875, -36.79001998901367, -35.3425178527832, -33.89501953125, -32.44751739501953, -31.000017166137695, -29.55251693725586, -28.10501480102539, -26.657514572143555, -25.21001434326172, -23.76251220703125, -22.31501007080078, -20.867509841918945, -19.420007705688477, -17.97250747680664, -16.525005340576172, -15.077505111694336, -13.6300048828125, -12.182503700256348, -10.735002517700195, -9.287501335144043, -7.840000629425049, -6.392499923706055, -4.944998741149902, -3.49749755859375, -2.049997329711914, -0.6024961471557617, 0.8450050354003906, 2.292505979537964, 3.740006923675537, 5.187507629394531, 6.635008811950684, 8.082509994506836, 9.530010223388672, 10.977511405944824, 12.425012588500977, 13.872513771057129, 15.320014953613281, 16.767515182495117, 18.215015411376953, 19.662517547607422, 21.110017776489258, 22.557518005371094, 24.005020141601562]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 1.0, 9.0, 6.0, 15.0, 14.0, 31.0, 42.0, 46.0, 89.0, 116.0, 128.0, 133.0, 101.0, 69.0, 65.0, 40.0, 30.0, 17.0, 12.0, 9.0, 2.0, 7.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.842880249023438, -27.773225784301758, -26.703571319580078, -25.6339168548584, -24.56426239013672, -23.494609832763672, -22.424955368041992, -21.355300903320312, -20.285646438598633, -19.215991973876953, -18.146337509155273, -17.076683044433594, -16.007030487060547, -14.93737506866455, -13.867721557617188, -12.798067092895508, -11.728412628173828, -10.658758163452148, -9.589103698730469, -8.519450187683105, -7.449795722961426, -6.380141258239746, -5.310487270355225, -4.240833282470703, -3.1711788177490234, -2.101524591445923, -1.0318703651428223, 0.03778386116027832, 1.107438087463379, 2.1770925521850586, 3.24674654006958, 4.316400527954102, 5.386051177978516, 6.455705642700195, 7.525359630584717, 8.595013618469238, 9.664668083190918, 10.734322547912598, 11.803976058959961, 12.87363052368164, 13.94328498840332, 15.012939453125, 16.08259391784668, 17.15224838256836, 18.221900939941406, 19.29155731201172, 20.361209869384766, 21.430864334106445, 22.500518798828125, 23.570173263549805, 24.639827728271484, 25.709482192993164, 26.779136657714844, 27.84878921508789, 28.91844367980957, 29.98809814453125, 31.05775260925293, 32.12740707397461, 33.197059631347656, 34.26671600341797, 35.336368560791016, 36.40602493286133, 37.475677490234375, 38.54533386230469, 39.614986419677734]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 11.0, 8.0, 14.0, 25.0, 42.0, 113.0, 729.0, 141389.0, 4050070.0, 1506.0, 224.0, 63.0, 33.0, 17.0, 14.0, 11.0, 4.0, 1.0, 4.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.78125, -33.41259765625, -31.0439453125, -28.67529296875, -26.306640625, -23.93798828125, -21.5693359375, -19.20068359375, -16.83203125, -14.46337890625, -12.0947265625, -9.72607421875, -7.357421875, -4.98876953125, -2.6201171875, -0.25146484375, 2.1171875, 4.48583984375, 6.8544921875, 9.22314453125, 11.591796875, 13.96044921875, 16.3291015625, 18.69775390625, 21.06640625, 23.43505859375, 25.8037109375, 28.17236328125, 30.541015625, 32.90966796875, 35.2783203125, 37.64697265625, 40.015625, 42.38427734375, 44.7529296875, 47.12158203125, 49.490234375, 51.85888671875, 54.2275390625, 56.59619140625, 58.96484375, 61.33349609375, 63.7021484375, 66.07080078125, 68.439453125, 70.80810546875, 73.1767578125, 75.54541015625, 77.9140625, 80.28271484375, 82.6513671875, 85.02001953125, 87.388671875, 89.75732421875, 92.1259765625, 94.49462890625, 96.86328125, 99.23193359375, 101.6005859375, 103.96923828125, 106.337890625, 108.70654296875, 111.0751953125, 113.44384765625, 115.8125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 2.0, 5.0, 7.0, 10.0, 13.0, 18.0, 19.0, 25.0, 41.0, 74.0, 114.0, 145.0, 126.0, 113.0, 90.0, 60.0, 45.0, 30.0, 15.0, 13.0, 8.0, 3.0, 3.0, 2.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5048828125, -0.49160003662109375, -0.4783172607421875, -0.46503448486328125, -0.451751708984375, -0.43846893310546875, -0.4251861572265625, -0.41190338134765625, -0.39862060546875, -0.38533782958984375, -0.3720550537109375, -0.35877227783203125, -0.345489501953125, -0.33220672607421875, -0.3189239501953125, -0.30564117431640625, -0.2923583984375, -0.27907562255859375, -0.2657928466796875, -0.25251007080078125, -0.239227294921875, -0.22594451904296875, -0.2126617431640625, -0.19937896728515625, -0.18609619140625, -0.17281341552734375, -0.1595306396484375, -0.14624786376953125, -0.132965087890625, -0.11968231201171875, -0.1063995361328125, -0.09311676025390625, -0.079833984375, -0.06655120849609375, -0.0532684326171875, -0.03998565673828125, -0.026702880859375, -0.01342010498046875, -0.0001373291015625, 0.01314544677734375, 0.02642822265625, 0.03971099853515625, 0.0529937744140625, 0.06627655029296875, 0.079559326171875, 0.09284210205078125, 0.1061248779296875, 0.11940765380859375, 0.1326904296875, 0.14597320556640625, 0.1592559814453125, 0.17253875732421875, 0.185821533203125, 0.19910430908203125, 0.2123870849609375, 0.22566986083984375, 0.23895263671875, 0.25223541259765625, 0.2655181884765625, 0.27880096435546875, 0.292083740234375, 0.30536651611328125, 0.3186492919921875, 0.33193206787109375, 0.34521484375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 14.0, 9.0, 28.0, 37.0, 43.0, 65.0, 101.0, 114.0, 251.0, 641.0, 2508.0, 19503.0, 666305.0, 3462243.0, 37552.0, 3661.0, 705.0, 223.0, 94.0, 61.0, 38.0, 24.0, 24.0, 7.0, 9.0, 3.0, 3.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.453125, -20.94384765625, -20.4345703125, -19.92529296875, -19.416015625, -18.90673828125, -18.3974609375, -17.88818359375, -17.37890625, -16.86962890625, -16.3603515625, -15.85107421875, -15.341796875, -14.83251953125, -14.3232421875, -13.81396484375, -13.3046875, -12.79541015625, -12.2861328125, -11.77685546875, -11.267578125, -10.75830078125, -10.2490234375, -9.73974609375, -9.23046875, -8.72119140625, -8.2119140625, -7.70263671875, -7.193359375, -6.68408203125, -6.1748046875, -5.66552734375, -5.15625, -4.64697265625, -4.1376953125, -3.62841796875, -3.119140625, -2.60986328125, -2.1005859375, -1.59130859375, -1.08203125, -0.57275390625, -0.0634765625, 0.44580078125, 0.955078125, 1.46435546875, 1.9736328125, 2.48291015625, 2.9921875, 3.50146484375, 4.0107421875, 4.52001953125, 5.029296875, 5.53857421875, 6.0478515625, 6.55712890625, 7.06640625, 7.57568359375, 8.0849609375, 8.59423828125, 9.103515625, 9.61279296875, 10.1220703125, 10.63134765625, 11.140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 9.0, 14.0, 10.0, 11.0, 14.0, 21.0, 25.0, 30.0, 50.0, 49.0, 57.0, 69.0, 103.0, 123.0, 191.0, 297.0, 563.0, 1046.0, 514.0, 238.0, 148.0, 84.0, 90.0, 55.0, 62.0, 33.0, 37.0, 20.0, 19.0, 14.0, 15.0, 6.0, 11.0, 12.0, 4.0, 9.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6357421875, -0.6168594360351562, -0.5979766845703125, -0.5790939331054688, -0.560211181640625, -0.5413284301757812, -0.5224456787109375, -0.5035629272460938, -0.48468017578125, -0.46579742431640625, -0.4469146728515625, -0.42803192138671875, -0.409149169921875, -0.39026641845703125, -0.3713836669921875, -0.35250091552734375, -0.3336181640625, -0.31473541259765625, -0.2958526611328125, -0.27696990966796875, -0.258087158203125, -0.23920440673828125, -0.2203216552734375, -0.20143890380859375, -0.18255615234375, -0.16367340087890625, -0.1447906494140625, -0.12590789794921875, -0.107025146484375, -0.08814239501953125, -0.0692596435546875, -0.05037689208984375, -0.031494140625, -0.01261138916015625, 0.0062713623046875, 0.02515411376953125, 0.044036865234375, 0.06291961669921875, 0.0818023681640625, 0.10068511962890625, 0.11956787109375, 0.13845062255859375, 0.1573333740234375, 0.17621612548828125, 0.195098876953125, 0.21398162841796875, 0.2328643798828125, 0.25174713134765625, 0.2706298828125, 0.28951263427734375, 0.3083953857421875, 0.32727813720703125, 0.346160888671875, 0.36504364013671875, 0.3839263916015625, 0.40280914306640625, 0.42169189453125, 0.44057464599609375, 0.4594573974609375, 0.47834014892578125, 0.497222900390625, 0.5161056518554688, 0.5349884033203125, 0.5538711547851562, 0.57275390625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 35.0, 267.0, 669.0, 33.0, 3.0, 5.0], "bins": [-118.1395034790039, -116.18077850341797, -114.22205352783203, -112.26333618164062, -110.30461120605469, -108.34588623046875, -106.38716125488281, -104.42843627929688, -102.46971893310547, -100.51099395751953, -98.5522689819336, -96.59355163574219, -94.63482666015625, -92.67610168457031, -90.71737670898438, -88.75865173339844, -86.7999267578125, -84.84120178222656, -82.88247680664062, -80.92375946044922, -78.96503448486328, -77.00630950927734, -75.0475845336914, -73.0888671875, -71.13014221191406, -69.17141723632812, -67.21269226074219, -65.25397491455078, -63.295249938964844, -61.336524963378906, -59.37779998779297, -57.4190788269043, -55.46035385131836, -53.50162887573242, -51.54290771484375, -49.58418273925781, -47.62546157836914, -45.6667366027832, -43.70801544189453, -41.749290466308594, -39.79056930541992, -37.831844329833984, -35.87312316894531, -33.914398193359375, -31.955677032470703, -29.996952056884766, -28.03822898864746, -26.079505920410156, -24.12078094482422, -22.162057876586914, -20.20333480834961, -18.244609832763672, -16.285888671875, -14.327164649963379, -12.368440628051758, -10.409717559814453, -8.450995445251465, -6.49227237701416, -4.533548831939697, -2.5748252868652344, -0.6161022186279297, 1.342620849609375, 3.301344871520996, 5.260067939758301, 7.2187910079956055]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 6.0, 5.0, 7.0, 8.0, 6.0, 16.0, 12.0, 11.0, 27.0, 27.0, 27.0, 28.0, 40.0, 52.0, 67.0, 45.0, 42.0, 66.0, 57.0, 59.0, 62.0, 45.0, 38.0, 46.0, 28.0, 29.0, 22.0, 19.0, 17.0, 23.0, 14.0, 13.0, 8.0, 9.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.362530708312988, -4.1781206130981445, -3.993710994720459, -3.8093011379241943, -3.6248912811279297, -3.440481424331665, -3.2560715675354004, -3.0716614723205566, -2.887251853942871, -2.7028419971466064, -2.518432140350342, -2.334022283554077, -2.1496124267578125, -1.9652025699615479, -1.7807925939559937, -1.596382737159729, -1.4119727611541748, -1.2275629043579102, -1.0431530475616455, -0.8587431311607361, -0.6743332743644714, -0.4899234175682068, -0.30551350116729736, -0.12110364437103271, 0.06330621242523193, 0.24771608412265778, 0.4321259558200836, 0.6165358424186707, 0.8009456992149353, 0.9853555560112, 1.1697654724121094, 1.354175329208374, 1.5385851860046387, 1.7229950428009033, 1.907404899597168, 2.0918147563934326, 2.2762246131896973, 2.460634469985962, 2.6450443267822266, 2.8294544219970703, 3.013864040374756, 3.1982738971710205, 3.382683753967285, 3.56709361076355, 3.7515034675598145, 3.935913324356079, 4.120323181152344, 4.3047332763671875, 4.489143371582031, 4.673553466796875, 4.8579630851745605, 5.042373180389404, 5.22678279876709, 5.411192893981934, 5.595602512359619, 5.780012607574463, 5.964422225952148, 6.148832321166992, 6.333241939544678, 6.5176520347595215, 6.702061653137207, 6.886471748352051, 7.070881366729736, 7.25529146194458, 7.439701080322266]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 7.0, 11.0, 10.0, 11.0, 18.0, 23.0, 32.0, 45.0, 58.0, 136.0, 179.0, 370.0, 713.0, 1673.0, 4945.0, 19049.0, 134894.0, 760238.0, 102757.0, 16048.0, 4225.0, 1645.0, 672.0, 309.0, 151.0, 94.0, 56.0, 47.0, 43.0, 24.0, 17.0, 14.0, 7.0, 9.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-11.6953125, -11.3743896484375, -11.053466796875, -10.7325439453125, -10.41162109375, -10.0906982421875, -9.769775390625, -9.4488525390625, -9.1279296875, -8.8070068359375, -8.486083984375, -8.1651611328125, -7.84423828125, -7.5233154296875, -7.202392578125, -6.8814697265625, -6.560546875, -6.2396240234375, -5.918701171875, -5.5977783203125, -5.27685546875, -4.9559326171875, -4.635009765625, -4.3140869140625, -3.9931640625, -3.6722412109375, -3.351318359375, -3.0303955078125, -2.70947265625, -2.3885498046875, -2.067626953125, -1.7467041015625, -1.42578125, -1.1048583984375, -0.783935546875, -0.4630126953125, -0.14208984375, 0.1788330078125, 0.499755859375, 0.8206787109375, 1.1416015625, 1.4625244140625, 1.783447265625, 2.1043701171875, 2.42529296875, 2.7462158203125, 3.067138671875, 3.3880615234375, 3.708984375, 4.0299072265625, 4.350830078125, 4.6717529296875, 4.99267578125, 5.3135986328125, 5.634521484375, 5.9554443359375, 6.2763671875, 6.5972900390625, 6.918212890625, 7.2391357421875, 7.56005859375, 7.8809814453125, 8.201904296875, 8.5228271484375, 8.84375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 7.0, 16.0, 30.0, 31.0, 67.0, 89.0, 125.0, 150.0, 136.0, 128.0, 89.0, 54.0, 30.0, 24.0, 12.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5322265625, -0.5089340209960938, -0.4856414794921875, -0.46234893798828125, -0.439056396484375, -0.41576385498046875, -0.3924713134765625, -0.36917877197265625, -0.34588623046875, -0.32259368896484375, -0.2993011474609375, -0.27600860595703125, -0.252716064453125, -0.22942352294921875, -0.2061309814453125, -0.18283843994140625, -0.1595458984375, -0.13625335693359375, -0.1129608154296875, -0.08966827392578125, -0.066375732421875, -0.04308319091796875, -0.0197906494140625, 0.00350189208984375, 0.02679443359375, 0.05008697509765625, 0.0733795166015625, 0.09667205810546875, 0.119964599609375, 0.14325714111328125, 0.1665496826171875, 0.18984222412109375, 0.213134765625, 0.23642730712890625, 0.2597198486328125, 0.28301239013671875, 0.306304931640625, 0.32959747314453125, 0.3528900146484375, 0.37618255615234375, 0.39947509765625, 0.42276763916015625, 0.4460601806640625, 0.46935272216796875, 0.492645263671875, 0.5159378051757812, 0.5392303466796875, 0.5625228881835938, 0.5858154296875, 0.6091079711914062, 0.6324005126953125, 0.6556930541992188, 0.678985595703125, 0.7022781372070312, 0.7255706787109375, 0.7488632202148438, 0.77215576171875, 0.7954483032226562, 0.8187408447265625, 0.8420333862304688, 0.865325927734375, 0.8886184692382812, 0.9119110107421875, 0.9352035522460938, 0.95849609375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 6.0, 3.0, 8.0, 12.0, 13.0, 29.0, 38.0, 65.0, 152.0, 1333.0, 533037.0, 512022.0, 1405.0, 192.0, 71.0, 50.0, 27.0, 16.0, 14.0, 11.0, 7.0, 8.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.875, -21.9951171875, -21.115234375, -20.2353515625, -19.35546875, -18.4755859375, -17.595703125, -16.7158203125, -15.8359375, -14.9560546875, -14.076171875, -13.1962890625, -12.31640625, -11.4365234375, -10.556640625, -9.6767578125, -8.796875, -7.9169921875, -7.037109375, -6.1572265625, -5.27734375, -4.3974609375, -3.517578125, -2.6376953125, -1.7578125, -0.8779296875, 0.001953125, 0.8818359375, 1.76171875, 2.6416015625, 3.521484375, 4.4013671875, 5.28125, 6.1611328125, 7.041015625, 7.9208984375, 8.80078125, 9.6806640625, 10.560546875, 11.4404296875, 12.3203125, 13.2001953125, 14.080078125, 14.9599609375, 15.83984375, 16.7197265625, 17.599609375, 18.4794921875, 19.359375, 20.2392578125, 21.119140625, 21.9990234375, 22.87890625, 23.7587890625, 24.638671875, 25.5185546875, 26.3984375, 27.2783203125, 28.158203125, 29.0380859375, 29.91796875, 30.7978515625, 31.677734375, 32.5576171875, 33.4375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 10.0, 4.0, 6.0, 6.0, 10.0, 11.0, 12.0, 14.0, 19.0, 20.0, 17.0, 28.0, 23.0, 37.0, 27.0, 47.0, 37.0, 44.0, 41.0, 45.0, 39.0, 47.0, 35.0, 50.0, 36.0, 39.0, 33.0, 35.0, 29.0, 19.0, 27.0, 32.0, 14.0, 24.0, 14.0, 12.0, 9.0, 5.0, 8.0, 12.0, 4.0, 8.0, 3.0, 3.0, 5.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21875, -1.172760009765625, -1.12677001953125, -1.080780029296875, -1.0347900390625, -0.988800048828125, -0.94281005859375, -0.896820068359375, -0.850830078125, -0.804840087890625, -0.75885009765625, -0.712860107421875, -0.6668701171875, -0.620880126953125, -0.57489013671875, -0.528900146484375, -0.48291015625, -0.436920166015625, -0.39093017578125, -0.344940185546875, -0.2989501953125, -0.252960205078125, -0.20697021484375, -0.160980224609375, -0.114990234375, -0.069000244140625, -0.02301025390625, 0.022979736328125, 0.0689697265625, 0.114959716796875, 0.16094970703125, 0.206939697265625, 0.2529296875, 0.298919677734375, 0.34490966796875, 0.390899658203125, 0.4368896484375, 0.482879638671875, 0.52886962890625, 0.574859619140625, 0.620849609375, 0.666839599609375, 0.71282958984375, 0.758819580078125, 0.8048095703125, 0.850799560546875, 0.89678955078125, 0.942779541015625, 0.98876953125, 1.034759521484375, 1.08074951171875, 1.126739501953125, 1.1727294921875, 1.218719482421875, 1.26470947265625, 1.310699462890625, 1.356689453125, 1.402679443359375, 1.44866943359375, 1.494659423828125, 1.5406494140625, 1.586639404296875, 1.63262939453125, 1.678619384765625, 1.724609375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 5.0, 8.0, 13.0, 15.0, 30.0, 40.0, 104.0, 313.0, 5239.0, 1037895.0, 4343.0, 316.0, 81.0, 54.0, 23.0, 18.0, 12.0, 11.0, 5.0, 3.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.375, -48.72216796875, -47.0693359375, -45.41650390625, -43.763671875, -42.11083984375, -40.4580078125, -38.80517578125, -37.15234375, -35.49951171875, -33.8466796875, -32.19384765625, -30.541015625, -28.88818359375, -27.2353515625, -25.58251953125, -23.9296875, -22.27685546875, -20.6240234375, -18.97119140625, -17.318359375, -15.66552734375, -14.0126953125, -12.35986328125, -10.70703125, -9.05419921875, -7.4013671875, -5.74853515625, -4.095703125, -2.44287109375, -0.7900390625, 0.86279296875, 2.515625, 4.16845703125, 5.8212890625, 7.47412109375, 9.126953125, 10.77978515625, 12.4326171875, 14.08544921875, 15.73828125, 17.39111328125, 19.0439453125, 20.69677734375, 22.349609375, 24.00244140625, 25.6552734375, 27.30810546875, 28.9609375, 30.61376953125, 32.2666015625, 33.91943359375, 35.572265625, 37.22509765625, 38.8779296875, 40.53076171875, 42.18359375, 43.83642578125, 45.4892578125, 47.14208984375, 48.794921875, 50.44775390625, 52.1005859375, 53.75341796875, 55.40625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 9.0, 4.0, 4.0, 7.0, 12.0, 14.0, 25.0, 21.0, 43.0, 69.0, 142.0, 319.0, 141.0, 50.0, 43.0, 17.0, 21.0, 15.0, 8.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005359649658203125, -0.0051773786544799805, -0.004995107650756836, -0.004812836647033691, -0.004630565643310547, -0.004448294639587402, -0.004266023635864258, -0.004083752632141113, -0.0039014816284179688, -0.0037192106246948242, -0.0035369396209716797, -0.003354668617248535, -0.0031723976135253906, -0.002990126609802246, -0.0028078556060791016, -0.002625584602355957, -0.0024433135986328125, -0.002261042594909668, -0.0020787715911865234, -0.001896500587463379, -0.0017142295837402344, -0.0015319585800170898, -0.0013496875762939453, -0.0011674165725708008, -0.0009851455688476562, -0.0008028745651245117, -0.0006206035614013672, -0.00043833255767822266, -0.0002560615539550781, -7.37905502319336e-05, 0.00010848045349121094, 0.00029075145721435547, 0.0004730224609375, 0.0006552934646606445, 0.0008375644683837891, 0.0010198354721069336, 0.0012021064758300781, 0.0013843774795532227, 0.0015666484832763672, 0.0017489194869995117, 0.0019311904907226562, 0.0021134614944458008, 0.0022957324981689453, 0.00247800350189209, 0.0026602745056152344, 0.002842545509338379, 0.0030248165130615234, 0.003207087516784668, 0.0033893585205078125, 0.003571629524230957, 0.0037539005279541016, 0.003936171531677246, 0.004118442535400391, 0.004300713539123535, 0.00448298454284668, 0.004665255546569824, 0.004847526550292969, 0.005029797554016113, 0.005212068557739258, 0.005394339561462402, 0.005576610565185547, 0.005758881568908691, 0.005941152572631836, 0.0061234235763549805, 0.006305694580078125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 9.0, 21.0, 23.0, 32.0, 32.0, 50.0, 97.0, 139.0, 210.0, 365.0, 566.0, 984.0, 1738.0, 3095.0, 6194.0, 13839.0, 38792.0, 181097.0, 646111.0, 106079.0, 27771.0, 10383.0, 4876.0, 2503.0, 1448.0, 772.0, 458.0, 307.0, 187.0, 109.0, 80.0, 56.0, 33.0, 25.0, 16.0, 14.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.765625, -9.48944091796875, -9.2132568359375, -8.93707275390625, -8.660888671875, -8.38470458984375, -8.1085205078125, -7.83233642578125, -7.55615234375, -7.27996826171875, -7.0037841796875, -6.72760009765625, -6.451416015625, -6.17523193359375, -5.8990478515625, -5.62286376953125, -5.3466796875, -5.07049560546875, -4.7943115234375, -4.51812744140625, -4.241943359375, -3.96575927734375, -3.6895751953125, -3.41339111328125, -3.13720703125, -2.86102294921875, -2.5848388671875, -2.30865478515625, -2.032470703125, -1.75628662109375, -1.4801025390625, -1.20391845703125, -0.927734375, -0.65155029296875, -0.3753662109375, -0.09918212890625, 0.177001953125, 0.45318603515625, 0.7293701171875, 1.00555419921875, 1.28173828125, 1.55792236328125, 1.8341064453125, 2.11029052734375, 2.386474609375, 2.66265869140625, 2.9388427734375, 3.21502685546875, 3.4912109375, 3.76739501953125, 4.0435791015625, 4.31976318359375, 4.595947265625, 4.87213134765625, 5.1483154296875, 5.42449951171875, 5.70068359375, 5.97686767578125, 6.2530517578125, 6.52923583984375, 6.805419921875, 7.08160400390625, 7.3577880859375, 7.63397216796875, 7.91015625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 7.0, 2.0, 12.0, 15.0, 23.0, 28.0, 35.0, 36.0, 45.0, 76.0, 102.0, 156.0, 132.0, 97.0, 54.0, 30.0, 33.0, 21.0, 23.0, 12.0, 13.0, 8.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3828125, -5.2359619140625, -5.089111328125, -4.9422607421875, -4.79541015625, -4.6485595703125, -4.501708984375, -4.3548583984375, -4.2080078125, -4.0611572265625, -3.914306640625, -3.7674560546875, -3.62060546875, -3.4737548828125, -3.326904296875, -3.1800537109375, -3.033203125, -2.8863525390625, -2.739501953125, -2.5926513671875, -2.44580078125, -2.2989501953125, -2.152099609375, -2.0052490234375, -1.8583984375, -1.7115478515625, -1.564697265625, -1.4178466796875, -1.27099609375, -1.1241455078125, -0.977294921875, -0.8304443359375, -0.68359375, -0.5367431640625, -0.389892578125, -0.2430419921875, -0.09619140625, 0.0506591796875, 0.197509765625, 0.3443603515625, 0.4912109375, 0.6380615234375, 0.784912109375, 0.9317626953125, 1.07861328125, 1.2254638671875, 1.372314453125, 1.5191650390625, 1.666015625, 1.8128662109375, 1.959716796875, 2.1065673828125, 2.25341796875, 2.4002685546875, 2.547119140625, 2.6939697265625, 2.8408203125, 2.9876708984375, 3.134521484375, 3.2813720703125, 3.42822265625, 3.5750732421875, 3.721923828125, 3.8687744140625, 4.015625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 9.0, 16.0, 28.0, 52.0, 125.0, 220.0, 251.0, 145.0, 90.0, 34.0, 11.0, 6.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.79340362548828, -38.62612533569336, -37.45884704589844, -36.29157257080078, -35.12429428100586, -33.95701599121094, -32.789737701416016, -31.622459411621094, -30.455183029174805, -29.287904739379883, -28.120628356933594, -26.953350067138672, -25.78607177734375, -24.61879539489746, -23.45151710510254, -22.28424072265625, -21.116962432861328, -19.949684143066406, -18.782407760620117, -17.615129470825195, -16.447853088378906, -15.280574798583984, -14.113296508789062, -12.946019172668457, -11.778741836547852, -10.611464500427246, -9.44418716430664, -8.276908874511719, -7.109631538391113, -5.942354202270508, -4.775076389312744, -3.6077985763549805, -2.440521240234375, -1.2732436656951904, -0.10596609115600586, 1.0613114833831787, 2.2285890579223633, 3.3958663940429688, 4.563144207000732, 5.730422019958496, 6.897699356079102, 8.064976692199707, 9.232254028320312, 10.399532318115234, 11.56680965423584, 12.734086990356445, 13.901365280151367, 15.068642616271973, 16.235919952392578, 17.4031982421875, 18.57047462463379, 19.73775291442871, 20.905029296875, 22.072307586669922, 23.239585876464844, 24.406864166259766, 25.574140548706055, 26.741418838500977, 27.908695220947266, 29.075973510742188, 30.24325180053711, 31.4105281829834, 32.57780456542969, 33.74508285522461, 34.91236114501953]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 10.0, 6.0, 12.0, 14.0, 17.0, 19.0, 45.0, 38.0, 55.0, 58.0, 54.0, 64.0, 67.0, 68.0, 62.0, 73.0, 68.0, 38.0, 37.0, 38.0, 44.0, 27.0, 18.0, 16.0, 12.0, 7.0, 9.0, 5.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-18.703041076660156, -18.215940475463867, -17.728839874267578, -17.24173927307129, -16.754638671875, -16.26753807067871, -15.780437469482422, -15.293335914611816, -14.806235313415527, -14.319134712219238, -13.83203411102295, -13.34493350982666, -12.857832908630371, -12.370731353759766, -11.883630752563477, -11.396530151367188, -10.909429550170898, -10.42232894897461, -9.93522834777832, -9.448127746582031, -8.961027145385742, -8.473926544189453, -7.986825466156006, -7.499724388122559, -7.012624740600586, -6.525524139404297, -6.038423538208008, -5.551322937011719, -5.0642218589782715, -4.577121257781982, -4.090020656585693, -3.602919816970825, -3.115818977355957, -2.628718376159668, -2.1416175365448, -1.6545169353485107, -1.1674162149429321, -0.6803154945373535, -0.19321489334106445, 0.2938859462738037, 0.7809865474700928, 1.2680872678756714, 1.75518798828125, 2.242288589477539, 2.729389190673828, 3.2164900302886963, 3.7035906314849854, 4.1906914710998535, 4.677792072296143, 5.164892673492432, 5.651993274688721, 6.139094352722168, 6.626194953918457, 7.113295555114746, 7.600396156311035, 8.087496757507324, 8.574597358703613, 9.061697959899902, 9.548798561096191, 10.03589916229248, 10.52299976348877, 11.010101318359375, 11.497201919555664, 11.984302520751953, 12.471403121948242]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0, 8.0, 6.0, 8.0, 10.0, 10.0, 10.0, 16.0, 23.0, 45.0, 67.0, 112.0, 198.0, 532.0, 1586.0, 7268.0, 77299.0, 3961116.0, 133725.0, 9162.0, 1744.0, 504.0, 235.0, 140.0, 109.0, 63.0, 43.0, 46.0, 32.0, 27.0, 25.0, 27.0, 16.0, 14.0, 10.0, 9.0, 12.0, 3.0, 7.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7578125, -14.1319580078125, -13.506103515625, -12.8802490234375, -12.25439453125, -11.6285400390625, -11.002685546875, -10.3768310546875, -9.7509765625, -9.1251220703125, -8.499267578125, -7.8734130859375, -7.24755859375, -6.6217041015625, -5.995849609375, -5.3699951171875, -4.744140625, -4.1182861328125, -3.492431640625, -2.8665771484375, -2.24072265625, -1.6148681640625, -0.989013671875, -0.3631591796875, 0.2626953125, 0.8885498046875, 1.514404296875, 2.1402587890625, 2.76611328125, 3.3919677734375, 4.017822265625, 4.6436767578125, 5.26953125, 5.8953857421875, 6.521240234375, 7.1470947265625, 7.77294921875, 8.3988037109375, 9.024658203125, 9.6505126953125, 10.2763671875, 10.9022216796875, 11.528076171875, 12.1539306640625, 12.77978515625, 13.4056396484375, 14.031494140625, 14.6573486328125, 15.283203125, 15.9090576171875, 16.534912109375, 17.1607666015625, 17.78662109375, 18.4124755859375, 19.038330078125, 19.6641845703125, 20.2900390625, 20.9158935546875, 21.541748046875, 22.1676025390625, 22.79345703125, 23.4193115234375, 24.045166015625, 24.6710205078125, 25.296875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 10.0, 10.0, 38.0, 68.0, 120.0, 172.0, 186.0, 189.0, 83.0, 72.0, 36.0, 14.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5703125, -0.5393524169921875, -0.508392333984375, -0.4774322509765625, -0.44647216796875, -0.4155120849609375, -0.384552001953125, -0.3535919189453125, -0.3226318359375, -0.2916717529296875, -0.260711669921875, -0.2297515869140625, -0.19879150390625, -0.1678314208984375, -0.136871337890625, -0.1059112548828125, -0.074951171875, -0.0439910888671875, -0.013031005859375, 0.0179290771484375, 0.04888916015625, 0.0798492431640625, 0.110809326171875, 0.1417694091796875, 0.1727294921875, 0.2036895751953125, 0.234649658203125, 0.2656097412109375, 0.29656982421875, 0.3275299072265625, 0.358489990234375, 0.3894500732421875, 0.42041015625, 0.4513702392578125, 0.482330322265625, 0.5132904052734375, 0.54425048828125, 0.5752105712890625, 0.606170654296875, 0.6371307373046875, 0.6680908203125, 0.6990509033203125, 0.730010986328125, 0.7609710693359375, 0.79193115234375, 0.8228912353515625, 0.853851318359375, 0.8848114013671875, 0.915771484375, 0.9467315673828125, 0.977691650390625, 1.0086517333984375, 1.03961181640625, 1.0705718994140625, 1.101531982421875, 1.1324920654296875, 1.1634521484375, 1.1944122314453125, 1.225372314453125, 1.2563323974609375, 1.28729248046875, 1.3182525634765625, 1.349212646484375, 1.3801727294921875, 1.4111328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 10.0, 17.0, 20.0, 34.0, 42.0, 99.0, 227.0, 1659.0, 3809754.0, 380951.0, 1072.0, 181.0, 77.0, 52.0, 37.0, 19.0, 17.0, 9.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.96875, -35.28173828125, -33.5947265625, -31.90771484375, -30.220703125, -28.53369140625, -26.8466796875, -25.15966796875, -23.47265625, -21.78564453125, -20.0986328125, -18.41162109375, -16.724609375, -15.03759765625, -13.3505859375, -11.66357421875, -9.9765625, -8.28955078125, -6.6025390625, -4.91552734375, -3.228515625, -1.54150390625, 0.1455078125, 1.83251953125, 3.51953125, 5.20654296875, 6.8935546875, 8.58056640625, 10.267578125, 11.95458984375, 13.6416015625, 15.32861328125, 17.015625, 18.70263671875, 20.3896484375, 22.07666015625, 23.763671875, 25.45068359375, 27.1376953125, 28.82470703125, 30.51171875, 32.19873046875, 33.8857421875, 35.57275390625, 37.259765625, 38.94677734375, 40.6337890625, 42.32080078125, 44.0078125, 45.69482421875, 47.3818359375, 49.06884765625, 50.755859375, 52.44287109375, 54.1298828125, 55.81689453125, 57.50390625, 59.19091796875, 60.8779296875, 62.56494140625, 64.251953125, 65.93896484375, 67.6259765625, 69.31298828125, 71.0]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 9.0, 8.0, 16.0, 23.0, 34.0, 54.0, 71.0, 124.0, 185.0, 419.0, 1213.0, 1010.0, 358.0, 196.0, 137.0, 65.0, 47.0, 29.0, 22.0, 12.0, 13.0, 5.0, 5.0, 10.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1220703125, -1.0787353515625, -1.035400390625, -0.9920654296875, -0.94873046875, -0.9053955078125, -0.862060546875, -0.8187255859375, -0.775390625, -0.7320556640625, -0.688720703125, -0.6453857421875, -0.60205078125, -0.5587158203125, -0.515380859375, -0.4720458984375, -0.4287109375, -0.3853759765625, -0.342041015625, -0.2987060546875, -0.25537109375, -0.2120361328125, -0.168701171875, -0.1253662109375, -0.08203125, -0.0386962890625, 0.004638671875, 0.0479736328125, 0.09130859375, 0.1346435546875, 0.177978515625, 0.2213134765625, 0.2646484375, 0.3079833984375, 0.351318359375, 0.3946533203125, 0.43798828125, 0.4813232421875, 0.524658203125, 0.5679931640625, 0.611328125, 0.6546630859375, 0.697998046875, 0.7413330078125, 0.78466796875, 0.8280029296875, 0.871337890625, 0.9146728515625, 0.9580078125, 1.0013427734375, 1.044677734375, 1.0880126953125, 1.13134765625, 1.1746826171875, 1.218017578125, 1.2613525390625, 1.3046875, 1.3480224609375, 1.391357421875, 1.4346923828125, 1.47802734375, 1.5213623046875, 1.564697265625, 1.6080322265625, 1.6513671875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 22.0, 699.0, 281.0, 13.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.898273468017578, -23.83354377746582, -20.768814086914062, -17.704084396362305, -14.639354705810547, -11.574625015258789, -8.509895324707031, -5.445165634155273, -2.3804359436035156, 0.6842937469482422, 3.7490234375, 6.813753128051758, 9.878482818603516, 12.943212509155273, 16.00794219970703, 19.07267189025879, 22.137401580810547, 25.202131271362305, 28.266860961914062, 31.33159065246582, 34.39632034301758, 37.46105194091797, 40.525779724121094, 43.59050750732422, 46.65523910522461, 49.719970703125, 52.784698486328125, 55.84942626953125, 58.91415786743164, 61.97888946533203, 65.04361724853516, 68.10834503173828, 71.17308044433594, 74.23780822753906, 77.30253601074219, 80.36727142333984, 83.43199920654297, 86.4967269897461, 89.56146240234375, 92.62619018554688, 95.69091796875, 98.75564575195312, 101.82037353515625, 104.8851089477539, 107.94983673095703, 111.01456451416016, 114.07929992675781, 117.14402770996094, 120.20875549316406, 123.27348327636719, 126.33821105957031, 129.40293884277344, 132.46768188476562, 135.53240966796875, 138.59713745117188, 141.661865234375, 144.72659301757812, 147.79132080078125, 150.85604858398438, 153.9207763671875, 156.98550415039062, 160.0502471923828, 163.11497497558594, 166.17970275878906, 169.2444305419922]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 8.0, 8.0, 20.0, 38.0, 46.0, 120.0, 127.0, 146.0, 157.0, 136.0, 84.0, 57.0, 35.0, 17.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.236019134521484, -16.62786102294922, -16.019704818725586, -15.41154670715332, -14.803389549255371, -14.195232391357422, -13.587075233459473, -12.978918075561523, -12.370759963989258, -11.762602806091309, -11.15444564819336, -10.546287536621094, -9.938130378723145, -9.329973220825195, -8.721816062927246, -8.113658905029297, -7.505501747131348, -6.897344589233398, -6.289186954498291, -5.681029796600342, -5.072872161865234, -4.464715003967285, -3.856557846069336, -3.2484002113342285, -2.6402430534362793, -2.032085657119751, -1.4239283800125122, -0.8157711029052734, -0.20761370658874512, 0.4005436897277832, 1.0087008476257324, 1.6168584823608398, 2.225015640258789, 2.8331730365753174, 3.4413304328918457, 4.049487590789795, 4.657645225524902, 5.265802383422852, 5.873959541320801, 6.482117176055908, 7.090274333953857, 7.698431491851807, 8.306589126586914, 8.914746284484863, 9.522903442382812, 10.131061553955078, 10.739217758178711, 11.347375869750977, 11.955533027648926, 12.563690185546875, 13.171847343444824, 13.780004501342773, 14.388162612915039, 14.996319770812988, 15.604476928710938, 16.212635040283203, 16.820791244506836, 17.4289493560791, 18.037105560302734, 18.645263671875, 19.253419876098633, 19.8615779876709, 20.46973419189453, 21.077892303466797, 21.686050415039062]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 6.0, 7.0, 6.0, 9.0, 23.0, 15.0, 18.0, 16.0, 18.0, 39.0, 37.0, 33.0, 48.0, 58.0, 100.0, 951.0, 742633.0, 303593.0, 524.0, 67.0, 50.0, 53.0, 38.0, 36.0, 46.0, 35.0, 19.0, 21.0, 13.0, 11.0, 9.0, 5.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.359375, -30.46142578125, -29.5634765625, -28.66552734375, -27.767578125, -26.86962890625, -25.9716796875, -25.07373046875, -24.17578125, -23.27783203125, -22.3798828125, -21.48193359375, -20.583984375, -19.68603515625, -18.7880859375, -17.89013671875, -16.9921875, -16.09423828125, -15.1962890625, -14.29833984375, -13.400390625, -12.50244140625, -11.6044921875, -10.70654296875, -9.80859375, -8.91064453125, -8.0126953125, -7.11474609375, -6.216796875, -5.31884765625, -4.4208984375, -3.52294921875, -2.625, -1.72705078125, -0.8291015625, 0.06884765625, 0.966796875, 1.86474609375, 2.7626953125, 3.66064453125, 4.55859375, 5.45654296875, 6.3544921875, 7.25244140625, 8.150390625, 9.04833984375, 9.9462890625, 10.84423828125, 11.7421875, 12.64013671875, 13.5380859375, 14.43603515625, 15.333984375, 16.23193359375, 17.1298828125, 18.02783203125, 18.92578125, 19.82373046875, 20.7216796875, 21.61962890625, 22.517578125, 23.41552734375, 24.3134765625, 25.21142578125, 26.109375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 9.0, 82.0, 278.0, 446.0, 181.0, 21.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.556640625, -0.468719482421875, -0.38079833984375, -0.292877197265625, -0.2049560546875, -0.117034912109375, -0.02911376953125, 0.058807373046875, 0.146728515625, 0.234649658203125, 0.32257080078125, 0.410491943359375, 0.4984130859375, 0.586334228515625, 0.67425537109375, 0.762176513671875, 0.85009765625, 0.938018798828125, 1.02593994140625, 1.113861083984375, 1.2017822265625, 1.289703369140625, 1.37762451171875, 1.465545654296875, 1.553466796875, 1.641387939453125, 1.72930908203125, 1.817230224609375, 1.9051513671875, 1.993072509765625, 2.08099365234375, 2.168914794921875, 2.2568359375, 2.344757080078125, 2.43267822265625, 2.520599365234375, 2.6085205078125, 2.696441650390625, 2.78436279296875, 2.872283935546875, 2.960205078125, 3.048126220703125, 3.13604736328125, 3.223968505859375, 3.3118896484375, 3.399810791015625, 3.48773193359375, 3.575653076171875, 3.66357421875, 3.751495361328125, 3.83941650390625, 3.927337646484375, 4.0152587890625, 4.103179931640625, 4.19110107421875, 4.279022216796875, 4.366943359375, 4.454864501953125, 4.54278564453125, 4.630706787109375, 4.7186279296875, 4.806549072265625, 4.89447021484375, 4.982391357421875, 5.0703125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 14.0, 14.0, 21.0, 48.0, 84.0, 137.0, 335.0, 738.0, 2112.0, 7190.0, 35950.0, 245726.0, 596862.0, 131414.0, 20473.0, 4785.0, 1562.0, 578.0, 261.0, 105.0, 59.0, 31.0, 21.0, 10.0, 5.0, 3.0, 8.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.828125, -9.55767822265625, -9.2872314453125, -9.01678466796875, -8.746337890625, -8.47589111328125, -8.2054443359375, -7.93499755859375, -7.66455078125, -7.39410400390625, -7.1236572265625, -6.85321044921875, -6.582763671875, -6.31231689453125, -6.0418701171875, -5.77142333984375, -5.5009765625, -5.23052978515625, -4.9600830078125, -4.68963623046875, -4.419189453125, -4.14874267578125, -3.8782958984375, -3.60784912109375, -3.33740234375, -3.06695556640625, -2.7965087890625, -2.52606201171875, -2.255615234375, -1.98516845703125, -1.7147216796875, -1.44427490234375, -1.173828125, -0.90338134765625, -0.6329345703125, -0.36248779296875, -0.092041015625, 0.17840576171875, 0.4488525390625, 0.71929931640625, 0.98974609375, 1.26019287109375, 1.5306396484375, 1.80108642578125, 2.071533203125, 2.34197998046875, 2.6124267578125, 2.88287353515625, 3.1533203125, 3.42376708984375, 3.6942138671875, 3.96466064453125, 4.235107421875, 4.50555419921875, 4.7760009765625, 5.04644775390625, 5.31689453125, 5.58734130859375, 5.8577880859375, 6.12823486328125, 6.398681640625, 6.66912841796875, 6.9395751953125, 7.21002197265625, 7.48046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 8.0, 3.0, 10.0, 8.0, 12.0, 16.0, 26.0, 34.0, 48.0, 40.0, 43.0, 52.0, 57.0, 60.0, 53.0, 57.0, 56.0, 48.0, 57.0, 58.0, 53.0, 34.0, 32.0, 24.0, 24.0, 23.0, 18.0, 11.0, 10.0, 9.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.1015625, -4.96270751953125, -4.8238525390625, -4.68499755859375, -4.546142578125, -4.40728759765625, -4.2684326171875, -4.12957763671875, -3.99072265625, -3.85186767578125, -3.7130126953125, -3.57415771484375, -3.435302734375, -3.29644775390625, -3.1575927734375, -3.01873779296875, -2.8798828125, -2.74102783203125, -2.6021728515625, -2.46331787109375, -2.324462890625, -2.18560791015625, -2.0467529296875, -1.90789794921875, -1.76904296875, -1.63018798828125, -1.4913330078125, -1.35247802734375, -1.213623046875, -1.07476806640625, -0.9359130859375, -0.79705810546875, -0.658203125, -0.51934814453125, -0.3804931640625, -0.24163818359375, -0.102783203125, 0.03607177734375, 0.1749267578125, 0.31378173828125, 0.45263671875, 0.59149169921875, 0.7303466796875, 0.86920166015625, 1.008056640625, 1.14691162109375, 1.2857666015625, 1.42462158203125, 1.5634765625, 1.70233154296875, 1.8411865234375, 1.98004150390625, 2.118896484375, 2.25775146484375, 2.3966064453125, 2.53546142578125, 2.67431640625, 2.81317138671875, 2.9520263671875, 3.09088134765625, 3.229736328125, 3.36859130859375, 3.5074462890625, 3.64630126953125, 3.78515625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 15.0, 10.0, 25.0, 23.0, 25.0, 55.0, 107.0, 161.0, 272.0, 479.0, 1001.0, 2476.0, 7277.0, 29003.0, 197433.0, 640235.0, 137404.0, 22569.0, 5897.0, 2064.0, 918.0, 458.0, 231.0, 120.0, 93.0, 59.0, 34.0, 26.0, 18.0, 17.0, 12.0, 7.0, 7.0, 7.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.70703125, -5.48248291015625, -5.2579345703125, -5.03338623046875, -4.808837890625, -4.58428955078125, -4.3597412109375, -4.13519287109375, -3.91064453125, -3.68609619140625, -3.4615478515625, -3.23699951171875, -3.012451171875, -2.78790283203125, -2.5633544921875, -2.33880615234375, -2.1142578125, -1.88970947265625, -1.6651611328125, -1.44061279296875, -1.216064453125, -0.99151611328125, -0.7669677734375, -0.54241943359375, -0.31787109375, -0.09332275390625, 0.1312255859375, 0.35577392578125, 0.580322265625, 0.80487060546875, 1.0294189453125, 1.25396728515625, 1.478515625, 1.70306396484375, 1.9276123046875, 2.15216064453125, 2.376708984375, 2.60125732421875, 2.8258056640625, 3.05035400390625, 3.27490234375, 3.49945068359375, 3.7239990234375, 3.94854736328125, 4.173095703125, 4.39764404296875, 4.6221923828125, 4.84674072265625, 5.0712890625, 5.29583740234375, 5.5203857421875, 5.74493408203125, 5.969482421875, 6.19403076171875, 6.4185791015625, 6.64312744140625, 6.86767578125, 7.09222412109375, 7.3167724609375, 7.54132080078125, 7.765869140625, 7.99041748046875, 8.2149658203125, 8.43951416015625, 8.6640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 9.0, 10.0, 19.0, 13.0, 23.0, 22.0, 44.0, 60.0, 85.0, 123.0, 144.0, 121.0, 91.0, 70.0, 37.0, 30.0, 28.0, 17.0, 5.0, 11.0, 9.0, 5.0, 7.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001102447509765625, -0.0010695457458496094, -0.0010366439819335938, -0.0010037422180175781, -0.0009708404541015625, -0.0009379386901855469, -0.0009050369262695312, -0.0008721351623535156, -0.0008392333984375, -0.0008063316345214844, -0.0007734298706054688, -0.0007405281066894531, -0.0007076263427734375, -0.0006747245788574219, -0.0006418228149414062, -0.0006089210510253906, -0.000576019287109375, -0.0005431175231933594, -0.0005102157592773438, -0.0004773139953613281, -0.0004444122314453125, -0.0004115104675292969, -0.00037860870361328125, -0.0003457069396972656, -0.00031280517578125, -0.0002799034118652344, -0.00024700164794921875, -0.00021409988403320312, -0.0001811981201171875, -0.00014829635620117188, -0.00011539459228515625, -8.249282836914062e-05, -4.9591064453125e-05, -1.6689300537109375e-05, 1.621246337890625e-05, 4.9114227294921875e-05, 8.20159912109375e-05, 0.00011491775512695312, 0.00014781951904296875, 0.00018072128295898438, 0.000213623046875, 0.0002465248107910156, 0.00027942657470703125, 0.0003123283386230469, 0.0003452301025390625, 0.0003781318664550781, 0.00041103363037109375, 0.0004439353942871094, 0.000476837158203125, 0.0005097389221191406, 0.0005426406860351562, 0.0005755424499511719, 0.0006084442138671875, 0.0006413459777832031, 0.0006742477416992188, 0.0007071495056152344, 0.00074005126953125, 0.0007729530334472656, 0.0008058547973632812, 0.0008387565612792969, 0.0008716583251953125, 0.0009045600891113281, 0.0009374618530273438, 0.0009703636169433594, 0.001003265380859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 4.0, 8.0, 10.0, 17.0, 34.0, 43.0, 76.0, 110.0, 207.0, 384.0, 782.0, 1676.0, 4311.0, 14225.0, 65470.0, 417968.0, 449022.0, 71079.0, 15159.0, 4557.0, 1710.0, 776.0, 394.0, 210.0, 104.0, 77.0, 42.0, 36.0, 16.0, 11.0, 13.0, 9.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.578125, -6.3660888671875, -6.154052734375, -5.9420166015625, -5.72998046875, -5.5179443359375, -5.305908203125, -5.0938720703125, -4.8818359375, -4.6697998046875, -4.457763671875, -4.2457275390625, -4.03369140625, -3.8216552734375, -3.609619140625, -3.3975830078125, -3.185546875, -2.9735107421875, -2.761474609375, -2.5494384765625, -2.33740234375, -2.1253662109375, -1.913330078125, -1.7012939453125, -1.4892578125, -1.2772216796875, -1.065185546875, -0.8531494140625, -0.64111328125, -0.4290771484375, -0.217041015625, -0.0050048828125, 0.20703125, 0.4190673828125, 0.631103515625, 0.8431396484375, 1.05517578125, 1.2672119140625, 1.479248046875, 1.6912841796875, 1.9033203125, 2.1153564453125, 2.327392578125, 2.5394287109375, 2.75146484375, 2.9635009765625, 3.175537109375, 3.3875732421875, 3.599609375, 3.8116455078125, 4.023681640625, 4.2357177734375, 4.44775390625, 4.6597900390625, 4.871826171875, 5.0838623046875, 5.2958984375, 5.5079345703125, 5.719970703125, 5.9320068359375, 6.14404296875, 6.3560791015625, 6.568115234375, 6.7801513671875, 6.9921875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 8.0, 3.0, 8.0, 10.0, 6.0, 24.0, 23.0, 26.0, 31.0, 35.0, 50.0, 71.0, 78.0, 103.0, 91.0, 96.0, 74.0, 58.0, 49.0, 33.0, 33.0, 24.0, 26.0, 11.0, 11.0, 7.0, 7.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3359375, -3.229095458984375, -3.12225341796875, -3.015411376953125, -2.9085693359375, -2.801727294921875, -2.69488525390625, -2.588043212890625, -2.481201171875, -2.374359130859375, -2.26751708984375, -2.160675048828125, -2.0538330078125, -1.946990966796875, -1.84014892578125, -1.733306884765625, -1.62646484375, -1.519622802734375, -1.41278076171875, -1.305938720703125, -1.1990966796875, -1.092254638671875, -0.98541259765625, -0.878570556640625, -0.771728515625, -0.664886474609375, -0.55804443359375, -0.451202392578125, -0.3443603515625, -0.237518310546875, -0.13067626953125, -0.023834228515625, 0.0830078125, 0.189849853515625, 0.29669189453125, 0.403533935546875, 0.5103759765625, 0.617218017578125, 0.72406005859375, 0.830902099609375, 0.937744140625, 1.044586181640625, 1.15142822265625, 1.258270263671875, 1.3651123046875, 1.471954345703125, 1.57879638671875, 1.685638427734375, 1.79248046875, 1.899322509765625, 2.00616455078125, 2.113006591796875, 2.2198486328125, 2.326690673828125, 2.43353271484375, 2.540374755859375, 2.647216796875, 2.754058837890625, 2.86090087890625, 2.967742919921875, 3.0745849609375, 3.181427001953125, 3.28826904296875, 3.395111083984375, 3.501953125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 5.0, 10.0, 43.0, 490.0, 422.0, 44.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.52777862548828, -40.722900390625, -34.91802215576172, -29.113140106201172, -23.30826187133789, -17.50338363647461, -11.698501586914062, -5.893623352050781, -0.0887451171875, 5.716134071350098, 11.521013259887695, 17.32589340209961, 23.13077163696289, 28.935649871826172, 34.74053192138672, 40.54541015625, 46.35028839111328, 52.15516662597656, 57.960044860839844, 63.76492691040039, 69.56980895996094, 75.37467956542969, 81.1795654296875, 86.98444366455078, 92.78932189941406, 98.59420013427734, 104.39907836914062, 110.20396423339844, 116.00883483886719, 121.813720703125, 127.61859893798828, 133.42347717285156, 139.22836303710938, 145.0332489013672, 150.83811950683594, 156.64300537109375, 162.4478759765625, 168.2527618408203, 174.05764770507812, 179.86251831054688, 185.66738891601562, 191.47227478027344, 197.2771453857422, 203.08203125, 208.88690185546875, 214.69178771972656, 220.49667358398438, 226.30154418945312, 232.10643005371094, 237.91131591796875, 243.7161865234375, 249.5210723876953, 255.32594299316406, 261.1308288574219, 266.9356994628906, 272.7406005859375, 278.54547119140625, 284.350341796875, 290.1552429199219, 295.9601135253906, 301.7649841308594, 307.5698547363281, 313.374755859375, 319.17962646484375, 324.9844970703125]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 7.0, 5.0, 8.0, 18.0, 8.0, 21.0, 23.0, 26.0, 30.0, 43.0, 23.0, 51.0, 48.0, 48.0, 43.0, 51.0, 49.0, 48.0, 46.0, 56.0, 43.0, 41.0, 30.0, 35.0, 26.0, 32.0, 27.0, 23.0, 18.0, 17.0, 16.0, 7.0, 14.0, 2.0, 2.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.02764320373535, -21.275657653808594, -20.52367401123047, -19.77168846130371, -19.019702911376953, -18.267719268798828, -17.51573371887207, -16.763748168945312, -16.011764526367188, -15.259779930114746, -14.507794380187988, -13.755809783935547, -13.003824234008789, -12.251839637756348, -11.499855041503906, -10.747869491577148, -9.99588394165039, -9.24389934539795, -8.491913795471191, -7.73992919921875, -6.98794412612915, -6.235959053039551, -5.483974456787109, -4.73198938369751, -3.98000431060791, -3.2280192375183105, -2.47603440284729, -1.7240495681762695, -0.9720644950866699, -0.2200794219970703, 0.5319051742553711, 1.2838902473449707, 2.0358734130859375, 2.787858486175537, 3.5398433208465576, 4.291828155517578, 5.043813228607178, 5.795798301696777, 6.547782897949219, 7.299767971038818, 8.051753044128418, 8.80373764038086, 9.555723190307617, 10.307707786560059, 11.0596923828125, 11.811677932739258, 12.5636625289917, 13.31564712524414, 14.067632675170898, 14.81961727142334, 15.571602821350098, 16.32358741760254, 17.075572967529297, 17.827556610107422, 18.57954216003418, 19.331527709960938, 20.083511352539062, 20.83549690246582, 21.587480545043945, 22.339466094970703, 23.09145164489746, 23.84343719482422, 24.595420837402344, 25.3474063873291, 26.09939193725586]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 25.0, 176.0, 2026.0, 4185633.0, 5762.0, 348.0, 148.0, 80.0, 39.0, 27.0, 17.0, 6.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.59375, -22.22119140625, -18.8486328125, -15.47607421875, -12.103515625, -8.73095703125, -5.3583984375, -1.98583984375, 1.38671875, 4.75927734375, 8.1318359375, 11.50439453125, 14.876953125, 18.24951171875, 21.6220703125, 24.99462890625, 28.3671875, 31.73974609375, 35.1123046875, 38.48486328125, 41.857421875, 45.22998046875, 48.6025390625, 51.97509765625, 55.34765625, 58.72021484375, 62.0927734375, 65.46533203125, 68.837890625, 72.21044921875, 75.5830078125, 78.95556640625, 82.328125, 85.70068359375, 89.0732421875, 92.44580078125, 95.818359375, 99.19091796875, 102.5634765625, 105.93603515625, 109.30859375, 112.68115234375, 116.0537109375, 119.42626953125, 122.798828125, 126.17138671875, 129.5439453125, 132.91650390625, 136.2890625, 139.66162109375, 143.0341796875, 146.40673828125, 149.779296875, 153.15185546875, 156.5244140625, 159.89697265625, 163.26953125, 166.64208984375, 170.0146484375, 173.38720703125, 176.759765625, 180.13232421875, 183.5048828125, 186.87744140625, 190.25]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 5.0, 30.0, 113.0, 267.0, 294.0, 210.0, 74.0, 17.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8115234375, -0.7143707275390625, -0.617218017578125, -0.5200653076171875, -0.42291259765625, -0.3257598876953125, -0.228607177734375, -0.1314544677734375, -0.0343017578125, 0.0628509521484375, 0.160003662109375, 0.2571563720703125, 0.35430908203125, 0.4514617919921875, 0.548614501953125, 0.6457672119140625, 0.742919921875, 0.8400726318359375, 0.937225341796875, 1.0343780517578125, 1.13153076171875, 1.2286834716796875, 1.325836181640625, 1.4229888916015625, 1.5201416015625, 1.6172943115234375, 1.714447021484375, 1.8115997314453125, 1.90875244140625, 2.0059051513671875, 2.103057861328125, 2.2002105712890625, 2.29736328125, 2.3945159912109375, 2.491668701171875, 2.5888214111328125, 2.68597412109375, 2.7831268310546875, 2.880279541015625, 2.9774322509765625, 3.0745849609375, 3.1717376708984375, 3.268890380859375, 3.3660430908203125, 3.46319580078125, 3.5603485107421875, 3.657501220703125, 3.7546539306640625, 3.851806640625, 3.9489593505859375, 4.046112060546875, 4.1432647705078125, 4.24041748046875, 4.3375701904296875, 4.434722900390625, 4.5318756103515625, 4.6290283203125, 4.7261810302734375, 4.823333740234375, 4.9204864501953125, 5.01763916015625, 5.1147918701171875, 5.211944580078125, 5.3090972900390625, 5.40625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 8.0, 16.0, 42.0, 69.0, 129.0, 231.0, 1449.0, 4190834.0, 781.0, 283.0, 193.0, 128.0, 64.0, 38.0, 14.0, 4.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.625, -79.32421875, -75.0234375, -70.72265625, -66.421875, -62.12109375, -57.8203125, -53.51953125, -49.21875, -44.91796875, -40.6171875, -36.31640625, -32.015625, -27.71484375, -23.4140625, -19.11328125, -14.8125, -10.51171875, -6.2109375, -1.91015625, 2.390625, 6.69140625, 10.9921875, 15.29296875, 19.59375, 23.89453125, 28.1953125, 32.49609375, 36.796875, 41.09765625, 45.3984375, 49.69921875, 54.0, 58.30078125, 62.6015625, 66.90234375, 71.203125, 75.50390625, 79.8046875, 84.10546875, 88.40625, 92.70703125, 97.0078125, 101.30859375, 105.609375, 109.91015625, 114.2109375, 118.51171875, 122.8125, 127.11328125, 131.4140625, 135.71484375, 140.015625, 144.31640625, 148.6171875, 152.91796875, 157.21875, 161.51953125, 165.8203125, 170.12109375, 174.421875, 178.72265625, 183.0234375, 187.32421875, 191.625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 11.0, 33.0, 229.0, 3576.0, 221.0, 15.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -3.76409912109375, -3.3211669921875, -2.87823486328125, -2.435302734375, -1.99237060546875, -1.5494384765625, -1.10650634765625, -0.66357421875, -0.22064208984375, 0.2222900390625, 0.66522216796875, 1.108154296875, 1.55108642578125, 1.9940185546875, 2.43695068359375, 2.8798828125, 3.32281494140625, 3.7657470703125, 4.20867919921875, 4.651611328125, 5.09454345703125, 5.5374755859375, 5.98040771484375, 6.42333984375, 6.86627197265625, 7.3092041015625, 7.75213623046875, 8.195068359375, 8.63800048828125, 9.0809326171875, 9.52386474609375, 9.966796875, 10.40972900390625, 10.8526611328125, 11.29559326171875, 11.738525390625, 12.18145751953125, 12.6243896484375, 13.06732177734375, 13.51025390625, 13.95318603515625, 14.3961181640625, 14.83905029296875, 15.281982421875, 15.72491455078125, 16.1678466796875, 16.61077880859375, 17.0537109375, 17.49664306640625, 17.9395751953125, 18.38250732421875, 18.825439453125, 19.26837158203125, 19.7113037109375, 20.15423583984375, 20.59716796875, 21.04010009765625, 21.4830322265625, 21.92596435546875, 22.368896484375, 22.81182861328125, 23.2547607421875, 23.69769287109375, 24.140625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 8.0, 14.0, 87.0, 578.0, 266.0, 41.0, 12.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.8748836517334, -22.5186710357666, -19.162460327148438, -15.80624771118164, -12.450035095214844, -9.093822479248047, -5.737611770629883, -2.381399154663086, 0.9748134613037109, 4.33102560043335, 7.687237739562988, 11.043449401855469, 14.399662017822266, 17.755874633789062, 21.112085342407227, 24.468297958374023, 27.82451057434082, 31.180723190307617, 34.53693389892578, 37.89314651489258, 41.249359130859375, 44.60557174682617, 47.96178436279297, 51.3179931640625, 54.67420959472656, 58.03042221069336, 61.386634826660156, 64.74284362792969, 68.09906005859375, 71.45526885986328, 74.81147766113281, 78.16769409179688, 81.52391052246094, 84.88011932373047, 88.23633575439453, 91.59254455566406, 94.94876098632812, 98.30496978759766, 101.66117858886719, 105.01739501953125, 108.37361145019531, 111.72982025146484, 115.0860366821289, 118.44224548339844, 121.7984619140625, 125.15467071533203, 128.51087951660156, 131.86709594726562, 135.22329711914062, 138.5795135498047, 141.9357147216797, 145.29193115234375, 148.6481475830078, 152.00436401367188, 155.36056518554688, 158.71678161621094, 162.072998046875, 165.42921447753906, 168.78541564941406, 172.14163208007812, 175.4978485107422, 178.85406494140625, 182.21026611328125, 185.5664825439453, 188.92269897460938]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 13.0, 39.0, 53.0, 86.0, 111.0, 170.0, 161.0, 142.0, 103.0, 51.0, 33.0, 18.0, 11.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.68478393554688, -71.40959167480469, -69.13440704345703, -66.85921478271484, -64.58403015136719, -62.308841705322266, -60.033653259277344, -57.758460998535156, -55.4832763671875, -53.20808792114258, -50.932899475097656, -48.657711029052734, -46.38252258300781, -44.10733413696289, -41.83214569091797, -39.55695343017578, -37.28176498413086, -35.00657653808594, -32.731388092041016, -30.456199645996094, -28.181011199951172, -25.90582275390625, -23.630632400512695, -21.355443954467773, -19.08025550842285, -16.80506706237793, -14.529878616333008, -12.25468921661377, -9.979500770568848, -7.704312324523926, -5.4291229248046875, -3.1539344787597656, -0.8787460327148438, 1.3964426517486572, 3.671631336212158, 5.946820259094238, 8.22200870513916, 10.497197151184082, 12.77238655090332, 15.047574996948242, 17.322763442993164, 19.597951889038086, 21.873140335083008, 24.148330688476562, 26.423519134521484, 28.698707580566406, 30.973896026611328, 33.24908447265625, 35.52427291870117, 37.799461364746094, 40.074649810791016, 42.34983825683594, 44.62502670288086, 46.90021514892578, 49.17540740966797, 51.450592041015625, 53.72578430175781, 56.000972747802734, 58.276161193847656, 60.55134963989258, 62.8265380859375, 65.10173034667969, 67.37691497802734, 69.65210723876953, 71.92729187011719]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 9.0, 11.0, 15.0, 29.0, 28.0, 49.0, 92.0, 154.0, 474.0, 2033.0, 30500.0, 972370.0, 39542.0, 2309.0, 523.0, 155.0, 89.0, 58.0, 31.0, 28.0, 16.0, 14.0, 7.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.1875, -37.98291015625, -36.7783203125, -35.57373046875, -34.369140625, -33.16455078125, -31.9599609375, -30.75537109375, -29.55078125, -28.34619140625, -27.1416015625, -25.93701171875, -24.732421875, -23.52783203125, -22.3232421875, -21.11865234375, -19.9140625, -18.70947265625, -17.5048828125, -16.30029296875, -15.095703125, -13.89111328125, -12.6865234375, -11.48193359375, -10.27734375, -9.07275390625, -7.8681640625, -6.66357421875, -5.458984375, -4.25439453125, -3.0498046875, -1.84521484375, -0.640625, 0.56396484375, 1.7685546875, 2.97314453125, 4.177734375, 5.38232421875, 6.5869140625, 7.79150390625, 8.99609375, 10.20068359375, 11.4052734375, 12.60986328125, 13.814453125, 15.01904296875, 16.2236328125, 17.42822265625, 18.6328125, 19.83740234375, 21.0419921875, 22.24658203125, 23.451171875, 24.65576171875, 25.8603515625, 27.06494140625, 28.26953125, 29.47412109375, 30.6787109375, 31.88330078125, 33.087890625, 34.29248046875, 35.4970703125, 36.70166015625, 37.90625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 27.0, 45.0, 87.0, 147.0, 187.0, 194.0, 145.0, 94.0, 50.0, 15.0, 9.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.314453125, -2.170623779296875, -2.02679443359375, -1.882965087890625, -1.7391357421875, -1.595306396484375, -1.45147705078125, -1.307647705078125, -1.163818359375, -1.019989013671875, -0.87615966796875, -0.732330322265625, -0.5885009765625, -0.444671630859375, -0.30084228515625, -0.157012939453125, -0.01318359375, 0.130645751953125, 0.27447509765625, 0.418304443359375, 0.5621337890625, 0.705963134765625, 0.84979248046875, 0.993621826171875, 1.137451171875, 1.281280517578125, 1.42510986328125, 1.568939208984375, 1.7127685546875, 1.856597900390625, 2.00042724609375, 2.144256591796875, 2.2880859375, 2.431915283203125, 2.57574462890625, 2.719573974609375, 2.8634033203125, 3.007232666015625, 3.15106201171875, 3.294891357421875, 3.438720703125, 3.582550048828125, 3.72637939453125, 3.870208740234375, 4.0140380859375, 4.157867431640625, 4.30169677734375, 4.445526123046875, 4.58935546875, 4.733184814453125, 4.87701416015625, 5.020843505859375, 5.1646728515625, 5.308502197265625, 5.45233154296875, 5.596160888671875, 5.739990234375, 5.883819580078125, 6.02764892578125, 6.171478271484375, 6.3153076171875, 6.459136962890625, 6.60296630859375, 6.746795654296875, 6.890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 7.0, 17.0, 12.0, 12.0, 21.0, 27.0, 37.0, 69.0, 113.0, 284.0, 687.0, 2523.0, 16488.0, 309360.0, 674590.0, 38334.0, 4246.0, 1008.0, 307.0, 147.0, 81.0, 44.0, 30.0, 32.0, 15.0, 16.0, 13.0, 9.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9296875, -13.4520263671875, -12.974365234375, -12.4967041015625, -12.01904296875, -11.5413818359375, -11.063720703125, -10.5860595703125, -10.1083984375, -9.6307373046875, -9.153076171875, -8.6754150390625, -8.19775390625, -7.7200927734375, -7.242431640625, -6.7647705078125, -6.287109375, -5.8094482421875, -5.331787109375, -4.8541259765625, -4.37646484375, -3.8988037109375, -3.421142578125, -2.9434814453125, -2.4658203125, -1.9881591796875, -1.510498046875, -1.0328369140625, -0.55517578125, -0.0775146484375, 0.400146484375, 0.8778076171875, 1.35546875, 1.8331298828125, 2.310791015625, 2.7884521484375, 3.26611328125, 3.7437744140625, 4.221435546875, 4.6990966796875, 5.1767578125, 5.6544189453125, 6.132080078125, 6.6097412109375, 7.08740234375, 7.5650634765625, 8.042724609375, 8.5203857421875, 8.998046875, 9.4757080078125, 9.953369140625, 10.4310302734375, 10.90869140625, 11.3863525390625, 11.864013671875, 12.3416748046875, 12.8193359375, 13.2969970703125, 13.774658203125, 14.2523193359375, 14.72998046875, 15.2076416015625, 15.685302734375, 16.1629638671875, 16.640625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 8.0, 13.0, 13.0, 17.0, 12.0, 27.0, 23.0, 36.0, 35.0, 46.0, 49.0, 60.0, 79.0, 69.0, 47.0, 59.0, 55.0, 50.0, 48.0, 42.0, 38.0, 31.0, 27.0, 29.0, 21.0, 19.0, 8.0, 10.0, 5.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.546875, -6.3143310546875, -6.081787109375, -5.8492431640625, -5.61669921875, -5.3841552734375, -5.151611328125, -4.9190673828125, -4.6865234375, -4.4539794921875, -4.221435546875, -3.9888916015625, -3.75634765625, -3.5238037109375, -3.291259765625, -3.0587158203125, -2.826171875, -2.5936279296875, -2.361083984375, -2.1285400390625, -1.89599609375, -1.6634521484375, -1.430908203125, -1.1983642578125, -0.9658203125, -0.7332763671875, -0.500732421875, -0.2681884765625, -0.03564453125, 0.1968994140625, 0.429443359375, 0.6619873046875, 0.89453125, 1.1270751953125, 1.359619140625, 1.5921630859375, 1.82470703125, 2.0572509765625, 2.289794921875, 2.5223388671875, 2.7548828125, 2.9874267578125, 3.219970703125, 3.4525146484375, 3.68505859375, 3.9176025390625, 4.150146484375, 4.3826904296875, 4.615234375, 4.8477783203125, 5.080322265625, 5.3128662109375, 5.54541015625, 5.7779541015625, 6.010498046875, 6.2430419921875, 6.4755859375, 6.7081298828125, 6.940673828125, 7.1732177734375, 7.40576171875, 7.6383056640625, 7.870849609375, 8.1033935546875, 8.3359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 5.0, 13.0, 17.0, 16.0, 48.0, 76.0, 166.0, 350.0, 866.0, 2495.0, 14111.0, 247329.0, 729246.0, 46152.0, 5315.0, 1332.0, 473.0, 229.0, 124.0, 73.0, 36.0, 15.0, 16.0, 13.0, 7.0, 8.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.390625, -10.0469970703125, -9.703369140625, -9.3597412109375, -9.01611328125, -8.6724853515625, -8.328857421875, -7.9852294921875, -7.6416015625, -7.2979736328125, -6.954345703125, -6.6107177734375, -6.26708984375, -5.9234619140625, -5.579833984375, -5.2362060546875, -4.892578125, -4.5489501953125, -4.205322265625, -3.8616943359375, -3.51806640625, -3.1744384765625, -2.830810546875, -2.4871826171875, -2.1435546875, -1.7999267578125, -1.456298828125, -1.1126708984375, -0.76904296875, -0.4254150390625, -0.081787109375, 0.2618408203125, 0.60546875, 0.9490966796875, 1.292724609375, 1.6363525390625, 1.97998046875, 2.3236083984375, 2.667236328125, 3.0108642578125, 3.3544921875, 3.6981201171875, 4.041748046875, 4.3853759765625, 4.72900390625, 5.0726318359375, 5.416259765625, 5.7598876953125, 6.103515625, 6.4471435546875, 6.790771484375, 7.1343994140625, 7.47802734375, 7.8216552734375, 8.165283203125, 8.5089111328125, 8.8525390625, 9.1961669921875, 9.539794921875, 9.8834228515625, 10.22705078125, 10.5706787109375, 10.914306640625, 11.2579345703125, 11.6015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 8.0, 0.0, 5.0, 10.0, 10.0, 14.0, 11.0, 32.0, 29.0, 23.0, 35.0, 50.0, 50.0, 72.0, 86.0, 76.0, 80.0, 100.0, 66.0, 51.0, 45.0, 33.0, 32.0, 19.0, 11.0, 10.0, 12.0, 8.0, 8.0, 4.0, 5.0, 2.0, 7.0, 1.0], "bins": [-0.0008153915405273438, -0.0007974803447723389, -0.000779569149017334, -0.0007616579532623291, -0.0007437467575073242, -0.0007258355617523193, -0.0007079243659973145, -0.0006900131702423096, -0.0006721019744873047, -0.0006541907787322998, -0.0006362795829772949, -0.00061836838722229, -0.0006004571914672852, -0.0005825459957122803, -0.0005646347999572754, -0.0005467236042022705, -0.0005288124084472656, -0.0005109012126922607, -0.0004929900169372559, -0.000475078821182251, -0.0004571676254272461, -0.0004392564296722412, -0.00042134523391723633, -0.00040343403816223145, -0.00038552284240722656, -0.0003676116466522217, -0.0003497004508972168, -0.0003317892551422119, -0.00031387805938720703, -0.00029596686363220215, -0.00027805566787719727, -0.0002601444721221924, -0.0002422332763671875, -0.00022432208061218262, -0.00020641088485717773, -0.00018849968910217285, -0.00017058849334716797, -0.00015267729759216309, -0.0001347661018371582, -0.00011685490608215332, -9.894371032714844e-05, -8.103251457214355e-05, -6.312131881713867e-05, -4.521012306213379e-05, -2.7298927307128906e-05, -9.387731552124023e-06, 8.52346420288086e-06, 2.6434659957885742e-05, 4.4345855712890625e-05, 6.225705146789551e-05, 8.016824722290039e-05, 9.807944297790527e-05, 0.00011599063873291016, 0.00013390183448791504, 0.00015181303024291992, 0.0001697242259979248, 0.0001876354217529297, 0.00020554661750793457, 0.00022345781326293945, 0.00024136900901794434, 0.0002592802047729492, 0.0002771914005279541, 0.000295102596282959, 0.00031301379203796387, 0.00033092498779296875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 10.0, 27.0, 28.0, 90.0, 306.0, 2179.0, 96436.0, 934246.0, 13927.0, 905.0, 220.0, 96.0, 35.0, 18.0, 9.0, 7.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3125, -13.670654296875, -13.02880859375, -12.386962890625, -11.7451171875, -11.103271484375, -10.46142578125, -9.819580078125, -9.177734375, -8.535888671875, -7.89404296875, -7.252197265625, -6.6103515625, -5.968505859375, -5.32666015625, -4.684814453125, -4.04296875, -3.401123046875, -2.75927734375, -2.117431640625, -1.4755859375, -0.833740234375, -0.19189453125, 0.449951171875, 1.091796875, 1.733642578125, 2.37548828125, 3.017333984375, 3.6591796875, 4.301025390625, 4.94287109375, 5.584716796875, 6.2265625, 6.868408203125, 7.51025390625, 8.152099609375, 8.7939453125, 9.435791015625, 10.07763671875, 10.719482421875, 11.361328125, 12.003173828125, 12.64501953125, 13.286865234375, 13.9287109375, 14.570556640625, 15.21240234375, 15.854248046875, 16.49609375, 17.137939453125, 17.77978515625, 18.421630859375, 19.0634765625, 19.705322265625, 20.34716796875, 20.989013671875, 21.630859375, 22.272705078125, 22.91455078125, 23.556396484375, 24.1982421875, 24.840087890625, 25.48193359375, 26.123779296875, 26.765625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 7.0, 3.0, 4.0, 9.0, 5.0, 19.0, 48.0, 89.0, 129.0, 211.0, 180.0, 141.0, 99.0, 26.0, 14.0, 10.0, 6.0, 6.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3046875, -3.0489501953125, -2.793212890625, -2.5374755859375, -2.28173828125, -2.0260009765625, -1.770263671875, -1.5145263671875, -1.2587890625, -1.0030517578125, -0.747314453125, -0.4915771484375, -0.23583984375, 0.0198974609375, 0.275634765625, 0.5313720703125, 0.787109375, 1.0428466796875, 1.298583984375, 1.5543212890625, 1.81005859375, 2.0657958984375, 2.321533203125, 2.5772705078125, 2.8330078125, 3.0887451171875, 3.344482421875, 3.6002197265625, 3.85595703125, 4.1116943359375, 4.367431640625, 4.6231689453125, 4.87890625, 5.1346435546875, 5.390380859375, 5.6461181640625, 5.90185546875, 6.1575927734375, 6.413330078125, 6.6690673828125, 6.9248046875, 7.1805419921875, 7.436279296875, 7.6920166015625, 7.94775390625, 8.2034912109375, 8.459228515625, 8.7149658203125, 8.970703125, 9.2264404296875, 9.482177734375, 9.7379150390625, 9.99365234375, 10.2493896484375, 10.505126953125, 10.7608642578125, 11.0166015625, 11.2723388671875, 11.528076171875, 11.7838134765625, 12.03955078125, 12.2952880859375, 12.551025390625, 12.8067626953125, 13.0625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 13.0, 64.0, 414.0, 430.0, 79.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-269.1070861816406, -263.6266174316406, -258.14617919921875, -252.66571044921875, -247.18524169921875, -241.7047882080078, -236.22433471679688, -230.74386596679688, -225.26339721679688, -219.78294372558594, -214.30247497558594, -208.822021484375, -203.341552734375, -197.86109924316406, -192.38064575195312, -186.90017700195312, -181.4197235107422, -175.93927001953125, -170.45880126953125, -164.9783477783203, -159.4978790283203, -154.01742553710938, -148.53695678710938, -143.05650329589844, -137.5760498046875, -132.09559631347656, -126.61512756347656, -121.13467407226562, -115.65420532226562, -110.17375183105469, -104.69329071044922, -99.21282958984375, -93.73236846923828, -88.25190734863281, -82.77144622802734, -77.29098510742188, -71.81053161621094, -66.33006286621094, -60.849609375, -55.36914825439453, -49.88868713378906, -44.408226013183594, -38.927764892578125, -33.44730758666992, -27.966846466064453, -22.486385345458984, -17.00592803955078, -11.525466918945312, -6.045005798339844, -0.5645456314086914, 4.915914535522461, 10.396373748779297, 15.876834869384766, 21.357295989990234, 26.837753295898438, 32.318214416503906, 37.798675537109375, 43.279136657714844, 48.75959777832031, 54.240055084228516, 59.720516204833984, 65.20097351074219, 70.68143463134766, 76.16189575195312, 81.6423568725586]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 7.0, 5.0, 14.0, 12.0, 18.0, 29.0, 30.0, 37.0, 40.0, 44.0, 56.0, 50.0, 67.0, 56.0, 70.0, 62.0, 65.0, 61.0, 42.0, 46.0, 39.0, 36.0, 22.0, 23.0, 15.0, 13.0, 11.0, 8.0, 4.0, 6.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.801605224609375, -37.35639572143555, -35.91118621826172, -34.46597671508789, -33.02076721191406, -31.5755558013916, -30.130346298217773, -28.685134887695312, -27.239925384521484, -25.794715881347656, -24.349506378173828, -22.904296875, -21.45908546447754, -20.01387596130371, -18.568666458129883, -17.123455047607422, -15.678247451782227, -14.233037948608398, -12.787827491760254, -11.342617988586426, -9.897407531738281, -8.452198028564453, -7.006988525390625, -5.5617780685424805, -4.116568565368652, -2.671358585357666, -1.2261488437652588, 0.21906089782714844, 1.6642708778381348, 3.109480857849121, 4.554690361022949, 5.999900817871094, 7.445110321044922, 8.89031982421875, 10.335530281066895, 11.780739784240723, 13.225950241088867, 14.671159744262695, 16.116369247436523, 17.561580657958984, 19.006790161132812, 20.45199966430664, 21.89720916748047, 23.342418670654297, 24.787630081176758, 26.232839584350586, 27.678049087524414, 29.123260498046875, 30.56846809387207, 32.01367950439453, 33.45888900756836, 34.90409851074219, 36.349308013916016, 37.794517517089844, 39.23972702026367, 40.6849365234375, 42.13014602661133, 43.575355529785156, 45.020565032958984, 46.46577453613281, 47.91098403930664, 49.35619354248047, 50.80140686035156, 52.24661636352539, 53.69182586669922]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 20.0, 38.0, 77.0, 184.0, 415.0, 1346.0, 7000.0, 100349.0, 4029062.0, 48748.0, 4812.0, 1165.0, 439.0, 228.0, 101.0, 83.0, 53.0, 35.0, 25.0, 16.0, 15.0, 18.0, 10.0, 10.0, 4.0, 10.0, 3.0, 6.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.875, -11.98095703125, -11.0869140625, -10.19287109375, -9.298828125, -8.40478515625, -7.5107421875, -6.61669921875, -5.72265625, -4.82861328125, -3.9345703125, -3.04052734375, -2.146484375, -1.25244140625, -0.3583984375, 0.53564453125, 1.4296875, 2.32373046875, 3.2177734375, 4.11181640625, 5.005859375, 5.89990234375, 6.7939453125, 7.68798828125, 8.58203125, 9.47607421875, 10.3701171875, 11.26416015625, 12.158203125, 13.05224609375, 13.9462890625, 14.84033203125, 15.734375, 16.62841796875, 17.5224609375, 18.41650390625, 19.310546875, 20.20458984375, 21.0986328125, 21.99267578125, 22.88671875, 23.78076171875, 24.6748046875, 25.56884765625, 26.462890625, 27.35693359375, 28.2509765625, 29.14501953125, 30.0390625, 30.93310546875, 31.8271484375, 32.72119140625, 33.615234375, 34.50927734375, 35.4033203125, 36.29736328125, 37.19140625, 38.08544921875, 38.9794921875, 39.87353515625, 40.767578125, 41.66162109375, 42.5556640625, 43.44970703125, 44.34375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 8.0, 9.0, 26.0, 41.0, 74.0, 151.0, 163.0, 178.0, 144.0, 99.0, 72.0, 28.0, 10.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.71875, -1.588623046875, -1.45849609375, -1.328369140625, -1.1982421875, -1.068115234375, -0.93798828125, -0.807861328125, -0.677734375, -0.547607421875, -0.41748046875, -0.287353515625, -0.1572265625, -0.027099609375, 0.10302734375, 0.233154296875, 0.36328125, 0.493408203125, 0.62353515625, 0.753662109375, 0.8837890625, 1.013916015625, 1.14404296875, 1.274169921875, 1.404296875, 1.534423828125, 1.66455078125, 1.794677734375, 1.9248046875, 2.054931640625, 2.18505859375, 2.315185546875, 2.4453125, 2.575439453125, 2.70556640625, 2.835693359375, 2.9658203125, 3.095947265625, 3.22607421875, 3.356201171875, 3.486328125, 3.616455078125, 3.74658203125, 3.876708984375, 4.0068359375, 4.136962890625, 4.26708984375, 4.397216796875, 4.52734375, 4.657470703125, 4.78759765625, 4.917724609375, 5.0478515625, 5.177978515625, 5.30810546875, 5.438232421875, 5.568359375, 5.698486328125, 5.82861328125, 5.958740234375, 6.0888671875, 6.218994140625, 6.34912109375, 6.479248046875, 6.609375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 10.0, 15.0, 27.0, 96.0, 397.0, 4178157.0, 15017.0, 290.0, 154.0, 74.0, 31.0, 10.0, 9.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.90625, -42.93505859375, -38.9638671875, -34.99267578125, -31.021484375, -27.05029296875, -23.0791015625, -19.10791015625, -15.13671875, -11.16552734375, -7.1943359375, -3.22314453125, 0.748046875, 4.71923828125, 8.6904296875, 12.66162109375, 16.6328125, 20.60400390625, 24.5751953125, 28.54638671875, 32.517578125, 36.48876953125, 40.4599609375, 44.43115234375, 48.40234375, 52.37353515625, 56.3447265625, 60.31591796875, 64.287109375, 68.25830078125, 72.2294921875, 76.20068359375, 80.171875, 84.14306640625, 88.1142578125, 92.08544921875, 96.056640625, 100.02783203125, 103.9990234375, 107.97021484375, 111.94140625, 115.91259765625, 119.8837890625, 123.85498046875, 127.826171875, 131.79736328125, 135.7685546875, 139.73974609375, 143.7109375, 147.68212890625, 151.6533203125, 155.62451171875, 159.595703125, 163.56689453125, 167.5380859375, 171.50927734375, 175.48046875, 179.45166015625, 183.4228515625, 187.39404296875, 191.365234375, 195.33642578125, 199.3076171875, 203.27880859375, 207.25]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 11.0, 66.0, 838.0, 2986.0, 137.0, 24.0, 10.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.474609375, -2.072418212890625, -1.67022705078125, -1.268035888671875, -0.8658447265625, -0.463653564453125, -0.06146240234375, 0.340728759765625, 0.742919921875, 1.145111083984375, 1.54730224609375, 1.949493408203125, 2.3516845703125, 2.753875732421875, 3.15606689453125, 3.558258056640625, 3.96044921875, 4.362640380859375, 4.76483154296875, 5.167022705078125, 5.5692138671875, 5.971405029296875, 6.37359619140625, 6.775787353515625, 7.177978515625, 7.580169677734375, 7.98236083984375, 8.384552001953125, 8.7867431640625, 9.188934326171875, 9.59112548828125, 9.993316650390625, 10.3955078125, 10.797698974609375, 11.19989013671875, 11.602081298828125, 12.0042724609375, 12.406463623046875, 12.80865478515625, 13.210845947265625, 13.613037109375, 14.015228271484375, 14.41741943359375, 14.819610595703125, 15.2218017578125, 15.623992919921875, 16.02618408203125, 16.428375244140625, 16.83056640625, 17.232757568359375, 17.63494873046875, 18.037139892578125, 18.4393310546875, 18.841522216796875, 19.24371337890625, 19.645904541015625, 20.048095703125, 20.450286865234375, 20.85247802734375, 21.254669189453125, 21.6568603515625, 22.059051513671875, 22.46124267578125, 22.863433837890625, 23.265625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 18.0, 25.0, 75.0, 203.0, 291.0, 224.0, 80.0, 42.0, 11.0, 10.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.61898422241211, -20.555347442626953, -19.49171257019043, -18.428075790405273, -17.36444091796875, -16.300804138183594, -15.237167358398438, -14.173531532287598, -13.109895706176758, -12.046259880065918, -10.982624053955078, -9.918987274169922, -8.855351448059082, -7.791715621948242, -6.728079319000244, -5.664443016052246, -4.600807189941406, -3.5371711254119873, -2.4735350608825684, -1.4098989963531494, -0.34626293182373047, 0.7173728942871094, 1.7810091972351074, 2.8446455001831055, 3.9082813262939453, 4.971917152404785, 6.035553455352783, 7.099189758300781, 8.162825584411621, 9.226461410522461, 10.290098190307617, 11.353734016418457, 12.417373657226562, 13.481009483337402, 14.544645309448242, 15.608282089233398, 16.671916961669922, 17.735553741455078, 18.799190521240234, 19.86282730102539, 20.926462173461914, 21.99009895324707, 23.053733825683594, 24.11737060546875, 25.181007385253906, 26.24464225769043, 27.308279037475586, 28.37191390991211, 29.435550689697266, 30.499187469482422, 31.562822341918945, 32.62645721435547, 33.690093994140625, 34.75373077392578, 35.81736755371094, 36.881004333496094, 37.94464111328125, 39.008277893066406, 40.07191467285156, 41.13554763793945, 42.19918441772461, 43.262821197509766, 44.32645797729492, 45.39009475708008, 46.45372772216797]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 7.0, 10.0, 22.0, 26.0, 44.0, 61.0, 88.0, 111.0, 118.0, 102.0, 122.0, 93.0, 67.0, 40.0, 32.0, 27.0, 16.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.74936294555664, -34.500579833984375, -33.251800537109375, -32.00301742553711, -30.754234313964844, -29.505451202392578, -28.256669998168945, -27.007888793945312, -25.759105682373047, -24.51032257080078, -23.26154136657715, -22.012760162353516, -20.76397705078125, -19.515193939208984, -18.26641273498535, -17.01763153076172, -15.768848419189453, -14.520066261291504, -13.271284103393555, -12.022501945495605, -10.773719787597656, -9.524937629699707, -8.276155471801758, -7.027373313903809, -5.778591156005859, -4.52980899810791, -3.281026840209961, -2.0322446823120117, -0.7834625244140625, 0.4653196334838867, 1.714101791381836, 2.962883949279785, 4.211666107177734, 5.460448265075684, 6.709230422973633, 7.958012580871582, 9.206794738769531, 10.45557689666748, 11.70435905456543, 12.953141212463379, 14.201923370361328, 15.450705528259277, 16.699487686157227, 17.94826889038086, 19.197052001953125, 20.44583511352539, 21.694616317749023, 22.943397521972656, 24.192180633544922, 25.440963745117188, 26.68974494934082, 27.938526153564453, 29.18730926513672, 30.436092376708984, 31.684873580932617, 32.93365478515625, 34.182437896728516, 35.43122100830078, 36.68000030517578, 37.92878341674805, 39.17756652832031, 40.42634963989258, 41.675132751464844, 42.923912048339844, 44.17269515991211]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 12.0, 9.0, 8.0, 8.0, 21.0, 20.0, 31.0, 31.0, 50.0, 76.0, 92.0, 149.0, 240.0, 413.0, 766.0, 2195.0, 9103.0, 56223.0, 539186.0, 389590.0, 39751.0, 6985.0, 1874.0, 704.0, 359.0, 193.0, 123.0, 84.0, 62.0, 58.0, 29.0, 28.0, 16.0, 11.0, 8.0, 8.0, 1.0, 9.0, 7.0, 4.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-14.6015625, -14.183349609375, -13.76513671875, -13.346923828125, -12.9287109375, -12.510498046875, -12.09228515625, -11.674072265625, -11.255859375, -10.837646484375, -10.41943359375, -10.001220703125, -9.5830078125, -9.164794921875, -8.74658203125, -8.328369140625, -7.91015625, -7.491943359375, -7.07373046875, -6.655517578125, -6.2373046875, -5.819091796875, -5.40087890625, -4.982666015625, -4.564453125, -4.146240234375, -3.72802734375, -3.309814453125, -2.8916015625, -2.473388671875, -2.05517578125, -1.636962890625, -1.21875, -0.800537109375, -0.38232421875, 0.035888671875, 0.4541015625, 0.872314453125, 1.29052734375, 1.708740234375, 2.126953125, 2.545166015625, 2.96337890625, 3.381591796875, 3.7998046875, 4.218017578125, 4.63623046875, 5.054443359375, 5.47265625, 5.890869140625, 6.30908203125, 6.727294921875, 7.1455078125, 7.563720703125, 7.98193359375, 8.400146484375, 8.818359375, 9.236572265625, 9.65478515625, 10.072998046875, 10.4912109375, 10.909423828125, 11.32763671875, 11.745849609375, 12.1640625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 9.0, 23.0, 26.0, 53.0, 86.0, 129.0, 141.0, 117.0, 131.0, 116.0, 60.0, 58.0, 24.0, 20.0, 8.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.34185791015625, -2.1993408203125, -2.05682373046875, -1.914306640625, -1.77178955078125, -1.6292724609375, -1.48675537109375, -1.34423828125, -1.20172119140625, -1.0592041015625, -0.91668701171875, -0.774169921875, -0.63165283203125, -0.4891357421875, -0.34661865234375, -0.2041015625, -0.06158447265625, 0.0809326171875, 0.22344970703125, 0.365966796875, 0.50848388671875, 0.6510009765625, 0.79351806640625, 0.93603515625, 1.07855224609375, 1.2210693359375, 1.36358642578125, 1.506103515625, 1.64862060546875, 1.7911376953125, 1.93365478515625, 2.076171875, 2.21868896484375, 2.3612060546875, 2.50372314453125, 2.646240234375, 2.78875732421875, 2.9312744140625, 3.07379150390625, 3.21630859375, 3.35882568359375, 3.5013427734375, 3.64385986328125, 3.786376953125, 3.92889404296875, 4.0714111328125, 4.21392822265625, 4.3564453125, 4.49896240234375, 4.6414794921875, 4.78399658203125, 4.926513671875, 5.06903076171875, 5.2115478515625, 5.35406494140625, 5.49658203125, 5.63909912109375, 5.7816162109375, 5.92413330078125, 6.066650390625, 6.20916748046875, 6.3516845703125, 6.49420166015625, 6.63671875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 3.0, 8.0, 12.0, 15.0, 26.0, 49.0, 49.0, 84.0, 153.0, 286.0, 610.0, 1627.0, 5275.0, 27120.0, 288505.0, 645218.0, 65264.0, 9809.0, 2632.0, 913.0, 370.0, 185.0, 108.0, 68.0, 49.0, 28.0, 27.0, 13.0, 18.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.46875, -11.1234130859375, -10.778076171875, -10.4327392578125, -10.08740234375, -9.7420654296875, -9.396728515625, -9.0513916015625, -8.7060546875, -8.3607177734375, -8.015380859375, -7.6700439453125, -7.32470703125, -6.9793701171875, -6.634033203125, -6.2886962890625, -5.943359375, -5.5980224609375, -5.252685546875, -4.9073486328125, -4.56201171875, -4.2166748046875, -3.871337890625, -3.5260009765625, -3.1806640625, -2.8353271484375, -2.489990234375, -2.1446533203125, -1.79931640625, -1.4539794921875, -1.108642578125, -0.7633056640625, -0.41796875, -0.0726318359375, 0.272705078125, 0.6180419921875, 0.96337890625, 1.3087158203125, 1.654052734375, 1.9993896484375, 2.3447265625, 2.6900634765625, 3.035400390625, 3.3807373046875, 3.72607421875, 4.0714111328125, 4.416748046875, 4.7620849609375, 5.107421875, 5.4527587890625, 5.798095703125, 6.1434326171875, 6.48876953125, 6.8341064453125, 7.179443359375, 7.5247802734375, 7.8701171875, 8.2154541015625, 8.560791015625, 8.9061279296875, 9.25146484375, 9.5968017578125, 9.942138671875, 10.2874755859375, 10.6328125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 6.0, 11.0, 16.0, 17.0, 18.0, 14.0, 32.0, 38.0, 42.0, 43.0, 44.0, 60.0, 56.0, 48.0, 74.0, 50.0, 55.0, 54.0, 42.0, 41.0, 46.0, 35.0, 31.0, 21.0, 21.0, 13.0, 18.0, 9.0, 7.0, 7.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9765625, -8.7020263671875, -8.427490234375, -8.1529541015625, -7.87841796875, -7.6038818359375, -7.329345703125, -7.0548095703125, -6.7802734375, -6.5057373046875, -6.231201171875, -5.9566650390625, -5.68212890625, -5.4075927734375, -5.133056640625, -4.8585205078125, -4.583984375, -4.3094482421875, -4.034912109375, -3.7603759765625, -3.48583984375, -3.2113037109375, -2.936767578125, -2.6622314453125, -2.3876953125, -2.1131591796875, -1.838623046875, -1.5640869140625, -1.28955078125, -1.0150146484375, -0.740478515625, -0.4659423828125, -0.19140625, 0.0831298828125, 0.357666015625, 0.6322021484375, 0.90673828125, 1.1812744140625, 1.455810546875, 1.7303466796875, 2.0048828125, 2.2794189453125, 2.553955078125, 2.8284912109375, 3.10302734375, 3.3775634765625, 3.652099609375, 3.9266357421875, 4.201171875, 4.4757080078125, 4.750244140625, 5.0247802734375, 5.29931640625, 5.5738525390625, 5.848388671875, 6.1229248046875, 6.3974609375, 6.6719970703125, 6.946533203125, 7.2210693359375, 7.49560546875, 7.7701416015625, 8.044677734375, 8.3192138671875, 8.59375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 5.0, 7.0, 16.0, 25.0, 50.0, 122.0, 321.0, 1249.0, 8457.0, 228050.0, 777919.0, 28857.0, 2578.0, 561.0, 180.0, 73.0, 34.0, 20.0, 7.0, 9.0, 5.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.02734375, -4.76580810546875, -4.5042724609375, -4.24273681640625, -3.981201171875, -3.71966552734375, -3.4581298828125, -3.19659423828125, -2.93505859375, -2.67352294921875, -2.4119873046875, -2.15045166015625, -1.888916015625, -1.62738037109375, -1.3658447265625, -1.10430908203125, -0.8427734375, -0.58123779296875, -0.3197021484375, -0.05816650390625, 0.203369140625, 0.46490478515625, 0.7264404296875, 0.98797607421875, 1.24951171875, 1.51104736328125, 1.7725830078125, 2.03411865234375, 2.295654296875, 2.55718994140625, 2.8187255859375, 3.08026123046875, 3.341796875, 3.60333251953125, 3.8648681640625, 4.12640380859375, 4.387939453125, 4.64947509765625, 4.9110107421875, 5.17254638671875, 5.43408203125, 5.69561767578125, 5.9571533203125, 6.21868896484375, 6.480224609375, 6.74176025390625, 7.0032958984375, 7.26483154296875, 7.5263671875, 7.78790283203125, 8.0494384765625, 8.31097412109375, 8.572509765625, 8.83404541015625, 9.0955810546875, 9.35711669921875, 9.61865234375, 9.88018798828125, 10.1417236328125, 10.40325927734375, 10.664794921875, 10.92633056640625, 11.1878662109375, 11.44940185546875, 11.7109375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 7.0, 6.0, 7.0, 6.0, 9.0, 18.0, 12.0, 17.0, 22.0, 27.0, 35.0, 36.0, 50.0, 64.0, 53.0, 93.0, 88.0, 82.0, 71.0, 42.0, 47.0, 31.0, 32.0, 27.0, 28.0, 23.0, 13.0, 15.0, 11.0, 8.0, 3.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00024330615997314453, -0.00023275427520275116, -0.0002222023904323578, -0.00021165050566196442, -0.00020109862089157104, -0.00019054673612117767, -0.0001799948513507843, -0.00016944296658039093, -0.00015889108180999756, -0.0001483391970396042, -0.00013778731226921082, -0.00012723542749881744, -0.00011668354272842407, -0.0001061316579580307, -9.557977318763733e-05, -8.502788841724396e-05, -7.447600364685059e-05, -6.392411887645721e-05, -5.337223410606384e-05, -4.282034933567047e-05, -3.22684645652771e-05, -2.1716579794883728e-05, -1.1164695024490356e-05, -6.128102540969849e-07, 9.939074516296387e-06, 2.0490959286689758e-05, 3.104284405708313e-05, 4.15947288274765e-05, 5.214661359786987e-05, 6.269849836826324e-05, 7.325038313865662e-05, 8.380226790904999e-05, 9.435415267944336e-05, 0.00010490603744983673, 0.0001154579222202301, 0.00012600980699062347, 0.00013656169176101685, 0.00014711357653141022, 0.0001576654613018036, 0.00016821734607219696, 0.00017876923084259033, 0.0001893211156129837, 0.00019987300038337708, 0.00021042488515377045, 0.00022097676992416382, 0.0002315286546945572, 0.00024208053946495056, 0.00025263242423534393, 0.0002631843090057373, 0.0002737361937761307, 0.00028428807854652405, 0.0002948399633169174, 0.0003053918480873108, 0.00031594373285770416, 0.00032649561762809753, 0.0003370475023984909, 0.0003475993871688843, 0.00035815127193927765, 0.000368703156709671, 0.0003792550414800644, 0.00038980692625045776, 0.00040035881102085114, 0.0004109106957912445, 0.0004214625805616379, 0.00043201446533203125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 13.0, 12.0, 23.0, 30.0, 51.0, 101.0, 149.0, 348.0, 903.0, 2819.0, 13827.0, 107644.0, 626773.0, 259484.0, 29070.0, 4935.0, 1406.0, 487.0, 228.0, 103.0, 58.0, 31.0, 14.0, 12.0, 12.0, 13.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.59375, -5.449188232421875, -5.30462646484375, -5.160064697265625, -5.0155029296875, -4.870941162109375, -4.72637939453125, -4.581817626953125, -4.437255859375, -4.292694091796875, -4.14813232421875, -4.003570556640625, -3.8590087890625, -3.714447021484375, -3.56988525390625, -3.425323486328125, -3.28076171875, -3.136199951171875, -2.99163818359375, -2.847076416015625, -2.7025146484375, -2.557952880859375, -2.41339111328125, -2.268829345703125, -2.124267578125, -1.979705810546875, -1.83514404296875, -1.690582275390625, -1.5460205078125, -1.401458740234375, -1.25689697265625, -1.112335205078125, -0.9677734375, -0.823211669921875, -0.67864990234375, -0.534088134765625, -0.3895263671875, -0.244964599609375, -0.10040283203125, 0.044158935546875, 0.188720703125, 0.333282470703125, 0.47784423828125, 0.622406005859375, 0.7669677734375, 0.911529541015625, 1.05609130859375, 1.200653076171875, 1.34521484375, 1.489776611328125, 1.63433837890625, 1.778900146484375, 1.9234619140625, 2.068023681640625, 2.21258544921875, 2.357147216796875, 2.501708984375, 2.646270751953125, 2.79083251953125, 2.935394287109375, 3.0799560546875, 3.224517822265625, 3.36907958984375, 3.513641357421875, 3.658203125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 1.0, 6.0, 8.0, 11.0, 13.0, 21.0, 32.0, 41.0, 66.0, 78.0, 102.0, 117.0, 111.0, 109.0, 76.0, 66.0, 41.0, 29.0, 20.0, 14.0, 10.0, 4.0, 6.0, 9.0, 2.0, 5.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.7578125, -4.641357421875, -4.52490234375, -4.408447265625, -4.2919921875, -4.175537109375, -4.05908203125, -3.942626953125, -3.826171875, -3.709716796875, -3.59326171875, -3.476806640625, -3.3603515625, -3.243896484375, -3.12744140625, -3.010986328125, -2.89453125, -2.778076171875, -2.66162109375, -2.545166015625, -2.4287109375, -2.312255859375, -2.19580078125, -2.079345703125, -1.962890625, -1.846435546875, -1.72998046875, -1.613525390625, -1.4970703125, -1.380615234375, -1.26416015625, -1.147705078125, -1.03125, -0.914794921875, -0.79833984375, -0.681884765625, -0.5654296875, -0.448974609375, -0.33251953125, -0.216064453125, -0.099609375, 0.016845703125, 0.13330078125, 0.249755859375, 0.3662109375, 0.482666015625, 0.59912109375, 0.715576171875, 0.83203125, 0.948486328125, 1.06494140625, 1.181396484375, 1.2978515625, 1.414306640625, 1.53076171875, 1.647216796875, 1.763671875, 1.880126953125, 1.99658203125, 2.113037109375, 2.2294921875, 2.345947265625, 2.46240234375, 2.578857421875, 2.6953125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 0.0, 2.0, 15.0, 19.0, 20.0, 38.0, 61.0, 108.0, 156.0, 178.0, 162.0, 108.0, 61.0, 28.0, 15.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-44.219566345214844, -42.832008361816406, -41.44445037841797, -40.05689239501953, -38.669334411621094, -37.281776428222656, -35.89421844482422, -34.50666046142578, -33.119102478027344, -31.731544494628906, -30.34398651123047, -28.95642852783203, -27.568870544433594, -26.181312561035156, -24.79375648498535, -23.406198501586914, -22.01864242553711, -20.631084442138672, -19.243526458740234, -17.855968475341797, -16.46841049194336, -15.080853462219238, -13.693296432495117, -12.30573844909668, -10.918180465698242, -9.530622482299805, -8.143064498901367, -6.755507469177246, -5.367949485778809, -3.980391502380371, -2.59283447265625, -1.2052764892578125, 0.18228530883789062, 1.569843053817749, 2.9574007987976074, 4.344958305358887, 5.732516288757324, 7.120074272155762, 8.507631301879883, 9.89518928527832, 11.282747268676758, 12.670305252075195, 14.057863235473633, 15.445420265197754, 16.832977294921875, 18.220535278320312, 19.60809326171875, 20.995651245117188, 22.383209228515625, 23.770767211914062, 25.1583251953125, 26.545883178710938, 27.933441162109375, 29.320999145507812, 30.708555221557617, 32.09611511230469, 33.483673095703125, 34.87123107910156, 36.2587890625, 37.64634704589844, 39.033905029296875, 40.42146301269531, 41.80902099609375, 43.19657897949219, 44.58413314819336]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 8.0, 5.0, 6.0, 5.0, 6.0, 6.0, 9.0, 15.0, 14.0, 24.0, 24.0, 25.0, 24.0, 22.0, 42.0, 37.0, 37.0, 53.0, 51.0, 54.0, 48.0, 50.0, 52.0, 41.0, 37.0, 32.0, 35.0, 26.0, 34.0, 41.0, 20.0, 15.0, 20.0, 17.0, 13.0, 10.0, 13.0, 10.0, 5.0, 3.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-38.81150817871094, -37.59115219116211, -36.370792388916016, -35.15043640136719, -33.93008041381836, -32.709720611572266, -31.489364624023438, -30.269006729125977, -29.048648834228516, -27.828290939331055, -26.607934951782227, -25.387577056884766, -24.167219161987305, -22.946861267089844, -21.726505279541016, -20.506147384643555, -19.285791397094727, -18.065433502197266, -16.845077514648438, -15.624719619750977, -14.404361724853516, -13.184004783630371, -11.963647842407227, -10.743289947509766, -9.522933006286621, -8.302576065063477, -7.082218170166016, -5.861861228942871, -4.641503810882568, -3.4211463928222656, -2.200789451599121, -0.9804315567016602, 0.23992538452148438, 1.4602826833724976, 2.6806399822235107, 3.9009971618652344, 5.121354579925537, 6.34171199798584, 7.562068939208984, 8.782426834106445, 10.00278377532959, 11.223140716552734, 12.443498611450195, 13.66385555267334, 14.884212493896484, 16.104570388793945, 17.324928283691406, 18.545284271240234, 19.765642166137695, 20.986000061035156, 22.206356048583984, 23.426713943481445, 24.647071838378906, 25.867427825927734, 27.087785720825195, 28.308143615722656, 29.528499603271484, 30.748857498168945, 31.969213485717773, 33.189571380615234, 34.40992736816406, 35.630287170410156, 36.850643157958984, 38.07099914550781, 39.291358947753906]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 8.0, 21.0, 20.0, 40.0, 69.0, 136.0, 292.0, 708.0, 2086.0, 7728.0, 54580.0, 3849582.0, 256205.0, 16335.0, 3839.0, 1269.0, 587.0, 269.0, 153.0, 88.0, 61.0, 41.0, 40.0, 21.0, 19.0, 21.0, 9.0, 12.0, 13.0, 4.0, 8.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.15625, -8.6396484375, -8.123046875, -7.6064453125, -7.08984375, -6.5732421875, -6.056640625, -5.5400390625, -5.0234375, -4.5068359375, -3.990234375, -3.4736328125, -2.95703125, -2.4404296875, -1.923828125, -1.4072265625, -0.890625, -0.3740234375, 0.142578125, 0.6591796875, 1.17578125, 1.6923828125, 2.208984375, 2.7255859375, 3.2421875, 3.7587890625, 4.275390625, 4.7919921875, 5.30859375, 5.8251953125, 6.341796875, 6.8583984375, 7.375, 7.8916015625, 8.408203125, 8.9248046875, 9.44140625, 9.9580078125, 10.474609375, 10.9912109375, 11.5078125, 12.0244140625, 12.541015625, 13.0576171875, 13.57421875, 14.0908203125, 14.607421875, 15.1240234375, 15.640625, 16.1572265625, 16.673828125, 17.1904296875, 17.70703125, 18.2236328125, 18.740234375, 19.2568359375, 19.7734375, 20.2900390625, 20.806640625, 21.3232421875, 21.83984375, 22.3564453125, 22.873046875, 23.3896484375, 23.90625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 17.0, 28.0, 47.0, 73.0, 115.0, 133.0, 134.0, 134.0, 102.0, 84.0, 58.0, 30.0, 28.0, 9.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53515625, -2.39215087890625, -2.2491455078125, -2.10614013671875, -1.963134765625, -1.82012939453125, -1.6771240234375, -1.53411865234375, -1.39111328125, -1.24810791015625, -1.1051025390625, -0.96209716796875, -0.819091796875, -0.67608642578125, -0.5330810546875, -0.39007568359375, -0.2470703125, -0.10406494140625, 0.0389404296875, 0.18194580078125, 0.324951171875, 0.46795654296875, 0.6109619140625, 0.75396728515625, 0.89697265625, 1.03997802734375, 1.1829833984375, 1.32598876953125, 1.468994140625, 1.61199951171875, 1.7550048828125, 1.89801025390625, 2.041015625, 2.18402099609375, 2.3270263671875, 2.47003173828125, 2.613037109375, 2.75604248046875, 2.8990478515625, 3.04205322265625, 3.18505859375, 3.32806396484375, 3.4710693359375, 3.61407470703125, 3.757080078125, 3.90008544921875, 4.0430908203125, 4.18609619140625, 4.3291015625, 4.47210693359375, 4.6151123046875, 4.75811767578125, 4.901123046875, 5.04412841796875, 5.1871337890625, 5.33013916015625, 5.47314453125, 5.61614990234375, 5.7591552734375, 5.90216064453125, 6.045166015625, 6.18817138671875, 6.3311767578125, 6.47418212890625, 6.6171875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 10.0, 24.0, 29.0, 48.0, 77.0, 94.0, 90.0, 217.0, 18203.0, 4175010.0, 245.0, 87.0, 55.0, 38.0, 26.0, 11.0, 6.0, 7.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.125, -162.6005859375, -159.076171875, -155.5517578125, -152.02734375, -148.5029296875, -144.978515625, -141.4541015625, -137.9296875, -134.4052734375, -130.880859375, -127.3564453125, -123.83203125, -120.3076171875, -116.783203125, -113.2587890625, -109.734375, -106.2099609375, -102.685546875, -99.1611328125, -95.63671875, -92.1123046875, -88.587890625, -85.0634765625, -81.5390625, -78.0146484375, -74.490234375, -70.9658203125, -67.44140625, -63.9169921875, -60.392578125, -56.8681640625, -53.34375, -49.8193359375, -46.294921875, -42.7705078125, -39.24609375, -35.7216796875, -32.197265625, -28.6728515625, -25.1484375, -21.6240234375, -18.099609375, -14.5751953125, -11.05078125, -7.5263671875, -4.001953125, -0.4775390625, 3.046875, 6.5712890625, 10.095703125, 13.6201171875, 17.14453125, 20.6689453125, 24.193359375, 27.7177734375, 31.2421875, 34.7666015625, 38.291015625, 41.8154296875, 45.33984375, 48.8642578125, 52.388671875, 55.9130859375, 59.4375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 27.0, 2179.0, 1848.0, 21.0, 6.0, 2.0, 0.0, 1.0], "bins": [-37.46875, -36.82257080078125, -36.1763916015625, -35.53021240234375, -34.884033203125, -34.23785400390625, -33.5916748046875, -32.94549560546875, -32.29931640625, -31.65313720703125, -31.0069580078125, -30.36077880859375, -29.714599609375, -29.06842041015625, -28.4222412109375, -27.77606201171875, -27.1298828125, -26.48370361328125, -25.8375244140625, -25.19134521484375, -24.545166015625, -23.89898681640625, -23.2528076171875, -22.60662841796875, -21.96044921875, -21.31427001953125, -20.6680908203125, -20.02191162109375, -19.375732421875, -18.72955322265625, -18.0833740234375, -17.43719482421875, -16.791015625, -16.14483642578125, -15.4986572265625, -14.85247802734375, -14.206298828125, -13.56011962890625, -12.9139404296875, -12.26776123046875, -11.62158203125, -10.97540283203125, -10.3292236328125, -9.68304443359375, -9.036865234375, -8.39068603515625, -7.7445068359375, -7.09832763671875, -6.4521484375, -5.80596923828125, -5.1597900390625, -4.51361083984375, -3.867431640625, -3.22125244140625, -2.5750732421875, -1.92889404296875, -1.28271484375, -0.63653564453125, 0.0096435546875, 0.65582275390625, 1.302001953125, 1.94818115234375, 2.5943603515625, 3.24053955078125, 3.88671875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 124.0, 752.0, 110.0, 12.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.0479736328125, -134.33514404296875, -131.62229919433594, -128.9094696044922, -126.19664001464844, -123.48380279541016, -120.77096557617188, -118.05813598632812, -115.34529876708984, -112.63246154785156, -109.91963195800781, -107.20679473876953, -104.49396514892578, -101.7811279296875, -99.06829833984375, -96.35546112060547, -93.64262390136719, -90.9297866821289, -88.21695709228516, -85.50411987304688, -82.79129028320312, -80.07845306396484, -77.36561584472656, -74.65278625488281, -71.93995666503906, -69.22711944580078, -66.51428985595703, -63.80145263671875, -61.088619232177734, -58.37578582763672, -55.6629524230957, -52.95011901855469, -50.237281799316406, -47.52444839477539, -44.811614990234375, -42.098777770996094, -39.38594436645508, -36.67311096191406, -33.96027755737305, -31.2474422454834, -28.534608840942383, -25.821775436401367, -23.10894012451172, -20.396106719970703, -17.683273315429688, -14.970438003540039, -12.257604598999023, -9.544769287109375, -6.831935882568359, -4.119101524353027, -1.4062676429748535, 1.3065662384033203, 4.019400596618652, 6.732234954833984, 9.445068359375, 12.157903671264648, 14.870737075805664, 17.58357048034668, 20.296405792236328, 23.009239196777344, 25.72207260131836, 28.434907913208008, 31.147741317749023, 33.86057662963867, 36.57341003417969]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 11.0, 27.0, 50.0, 77.0, 149.0, 191.0, 189.0, 159.0, 75.0, 46.0, 27.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-44.57796859741211, -43.03083801269531, -41.48371124267578, -39.936580657958984, -38.38945007324219, -36.84231948852539, -35.295188903808594, -33.74806213378906, -32.200931549072266, -30.65380096435547, -29.106672286987305, -27.55954360961914, -26.012413024902344, -24.465282440185547, -22.918153762817383, -21.37102508544922, -19.823894500732422, -18.276763916015625, -16.72963523864746, -15.18250560760498, -13.6353759765625, -12.08824634552002, -10.541116714477539, -8.993987083435059, -7.446857452392578, -5.899727821350098, -4.352598190307617, -2.8054685592651367, -1.2583389282226562, 0.2887907028198242, 1.8359203338623047, 3.383049964904785, 4.930183410644531, 6.477313041687012, 8.024442672729492, 9.571572303771973, 11.118701934814453, 12.665831565856934, 14.212961196899414, 15.760090827941895, 17.307220458984375, 18.854351043701172, 20.401479721069336, 21.9486083984375, 23.495738983154297, 25.042869567871094, 26.589998245239258, 28.137126922607422, 29.68425750732422, 31.231388092041016, 32.77851867675781, 34.325645446777344, 35.87277603149414, 37.41990661621094, 38.96703338623047, 40.514163970947266, 42.06129455566406, 43.60842514038086, 45.155555725097656, 46.70268249511719, 48.249813079833984, 49.79694366455078, 51.34407043457031, 52.89120101928711, 54.438331604003906]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 6.0, 3.0, 4.0, 6.0, 11.0, 9.0, 15.0, 18.0, 34.0, 31.0, 52.0, 81.0, 136.0, 234.0, 501.0, 1116.0, 3334.0, 12865.0, 74845.0, 480679.0, 400755.0, 58414.0, 10387.0, 2884.0, 1038.0, 483.0, 206.0, 124.0, 73.0, 45.0, 40.0, 26.0, 30.0, 29.0, 9.0, 9.0, 8.0, 4.0, 6.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.5859375, -7.29345703125, -7.0009765625, -6.70849609375, -6.416015625, -6.12353515625, -5.8310546875, -5.53857421875, -5.24609375, -4.95361328125, -4.6611328125, -4.36865234375, -4.076171875, -3.78369140625, -3.4912109375, -3.19873046875, -2.90625, -2.61376953125, -2.3212890625, -2.02880859375, -1.736328125, -1.44384765625, -1.1513671875, -0.85888671875, -0.56640625, -0.27392578125, 0.0185546875, 0.31103515625, 0.603515625, 0.89599609375, 1.1884765625, 1.48095703125, 1.7734375, 2.06591796875, 2.3583984375, 2.65087890625, 2.943359375, 3.23583984375, 3.5283203125, 3.82080078125, 4.11328125, 4.40576171875, 4.6982421875, 4.99072265625, 5.283203125, 5.57568359375, 5.8681640625, 6.16064453125, 6.453125, 6.74560546875, 7.0380859375, 7.33056640625, 7.623046875, 7.91552734375, 8.2080078125, 8.50048828125, 8.79296875, 9.08544921875, 9.3779296875, 9.67041015625, 9.962890625, 10.25537109375, 10.5478515625, 10.84033203125, 11.1328125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 11.0, 9.0, 25.0, 29.0, 53.0, 78.0, 78.0, 95.0, 113.0, 114.0, 109.0, 82.0, 64.0, 46.0, 44.0, 17.0, 21.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.546875, -1.4443359375, -1.341796875, -1.2392578125, -1.13671875, -1.0341796875, -0.931640625, -0.8291015625, -0.7265625, -0.6240234375, -0.521484375, -0.4189453125, -0.31640625, -0.2138671875, -0.111328125, -0.0087890625, 0.09375, 0.1962890625, 0.298828125, 0.4013671875, 0.50390625, 0.6064453125, 0.708984375, 0.8115234375, 0.9140625, 1.0166015625, 1.119140625, 1.2216796875, 1.32421875, 1.4267578125, 1.529296875, 1.6318359375, 1.734375, 1.8369140625, 1.939453125, 2.0419921875, 2.14453125, 2.2470703125, 2.349609375, 2.4521484375, 2.5546875, 2.6572265625, 2.759765625, 2.8623046875, 2.96484375, 3.0673828125, 3.169921875, 3.2724609375, 3.375, 3.4775390625, 3.580078125, 3.6826171875, 3.78515625, 3.8876953125, 3.990234375, 4.0927734375, 4.1953125, 4.2978515625, 4.400390625, 4.5029296875, 4.60546875, 4.7080078125, 4.810546875, 4.9130859375, 5.015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 7.0, 9.0, 12.0, 16.0, 23.0, 29.0, 36.0, 60.0, 88.0, 204.0, 394.0, 914.0, 2347.0, 7838.0, 45392.0, 450950.0, 479302.0, 48358.0, 8360.0, 2408.0, 858.0, 403.0, 228.0, 101.0, 76.0, 46.0, 27.0, 21.0, 12.0, 5.0, 6.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5546875, -8.238037109375, -7.92138671875, -7.604736328125, -7.2880859375, -6.971435546875, -6.65478515625, -6.338134765625, -6.021484375, -5.704833984375, -5.38818359375, -5.071533203125, -4.7548828125, -4.438232421875, -4.12158203125, -3.804931640625, -3.48828125, -3.171630859375, -2.85498046875, -2.538330078125, -2.2216796875, -1.905029296875, -1.58837890625, -1.271728515625, -0.955078125, -0.638427734375, -0.32177734375, -0.005126953125, 0.3115234375, 0.628173828125, 0.94482421875, 1.261474609375, 1.578125, 1.894775390625, 2.21142578125, 2.528076171875, 2.8447265625, 3.161376953125, 3.47802734375, 3.794677734375, 4.111328125, 4.427978515625, 4.74462890625, 5.061279296875, 5.3779296875, 5.694580078125, 6.01123046875, 6.327880859375, 6.64453125, 6.961181640625, 7.27783203125, 7.594482421875, 7.9111328125, 8.227783203125, 8.54443359375, 8.861083984375, 9.177734375, 9.494384765625, 9.81103515625, 10.127685546875, 10.4443359375, 10.760986328125, 11.07763671875, 11.394287109375, 11.7109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 10.0, 6.0, 25.0, 13.0, 18.0, 25.0, 27.0, 45.0, 44.0, 58.0, 55.0, 44.0, 61.0, 66.0, 54.0, 66.0, 70.0, 55.0, 50.0, 43.0, 37.0, 19.0, 24.0, 19.0, 15.0, 14.0, 10.0, 3.0, 6.0, 3.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.0078125, -7.7100830078125, -7.412353515625, -7.1146240234375, -6.81689453125, -6.5191650390625, -6.221435546875, -5.9237060546875, -5.6259765625, -5.3282470703125, -5.030517578125, -4.7327880859375, -4.43505859375, -4.1373291015625, -3.839599609375, -3.5418701171875, -3.244140625, -2.9464111328125, -2.648681640625, -2.3509521484375, -2.05322265625, -1.7554931640625, -1.457763671875, -1.1600341796875, -0.8623046875, -0.5645751953125, -0.266845703125, 0.0308837890625, 0.32861328125, 0.6263427734375, 0.924072265625, 1.2218017578125, 1.51953125, 1.8172607421875, 2.114990234375, 2.4127197265625, 2.71044921875, 3.0081787109375, 3.305908203125, 3.6036376953125, 3.9013671875, 4.1990966796875, 4.496826171875, 4.7945556640625, 5.09228515625, 5.3900146484375, 5.687744140625, 5.9854736328125, 6.283203125, 6.5809326171875, 6.878662109375, 7.1763916015625, 7.47412109375, 7.7718505859375, 8.069580078125, 8.3673095703125, 8.6650390625, 8.9627685546875, 9.260498046875, 9.5582275390625, 9.85595703125, 10.1536865234375, 10.451416015625, 10.7491455078125, 11.046875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 7.0, 11.0, 16.0, 17.0, 34.0, 60.0, 94.0, 159.0, 272.0, 620.0, 1545.0, 4409.0, 20787.0, 187981.0, 701608.0, 110634.0, 14368.0, 3536.0, 1259.0, 538.0, 217.0, 157.0, 85.0, 42.0, 38.0, 17.0, 13.0, 5.0, 8.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0546875, -3.90667724609375, -3.7586669921875, -3.61065673828125, -3.462646484375, -3.31463623046875, -3.1666259765625, -3.01861572265625, -2.87060546875, -2.72259521484375, -2.5745849609375, -2.42657470703125, -2.278564453125, -2.13055419921875, -1.9825439453125, -1.83453369140625, -1.6865234375, -1.53851318359375, -1.3905029296875, -1.24249267578125, -1.094482421875, -0.94647216796875, -0.7984619140625, -0.65045166015625, -0.50244140625, -0.35443115234375, -0.2064208984375, -0.05841064453125, 0.089599609375, 0.23760986328125, 0.3856201171875, 0.53363037109375, 0.681640625, 0.82965087890625, 0.9776611328125, 1.12567138671875, 1.273681640625, 1.42169189453125, 1.5697021484375, 1.71771240234375, 1.86572265625, 2.01373291015625, 2.1617431640625, 2.30975341796875, 2.457763671875, 2.60577392578125, 2.7537841796875, 2.90179443359375, 3.0498046875, 3.19781494140625, 3.3458251953125, 3.49383544921875, 3.641845703125, 3.78985595703125, 3.9378662109375, 4.08587646484375, 4.23388671875, 4.38189697265625, 4.5299072265625, 4.67791748046875, 4.825927734375, 4.97393798828125, 5.1219482421875, 5.26995849609375, 5.41796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 12.0, 11.0, 11.0, 14.0, 26.0, 30.0, 45.0, 72.0, 96.0, 121.0, 150.0, 125.0, 95.0, 65.0, 42.0, 24.0, 13.0, 9.0, 10.0, 5.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00043964385986328125, -0.00042353570461273193, -0.0004074275493621826, -0.0003913193941116333, -0.000375211238861084, -0.00035910308361053467, -0.00034299492835998535, -0.00032688677310943604, -0.0003107786178588867, -0.0002946704626083374, -0.0002785623073577881, -0.00026245415210723877, -0.00024634599685668945, -0.00023023784160614014, -0.00021412968635559082, -0.0001980215311050415, -0.0001819133758544922, -0.00016580522060394287, -0.00014969706535339355, -0.00013358891010284424, -0.00011748075485229492, -0.0001013725996017456, -8.526444435119629e-05, -6.915628910064697e-05, -5.3048133850097656e-05, -3.693997859954834e-05, -2.0831823348999023e-05, -4.723668098449707e-06, 1.138448715209961e-05, 2.7492642402648926e-05, 4.360079765319824e-05, 5.970895290374756e-05, 7.581710815429688e-05, 9.192526340484619e-05, 0.00010803341865539551, 0.00012414157390594482, 0.00014024972915649414, 0.00015635788440704346, 0.00017246603965759277, 0.0001885741949081421, 0.0002046823501586914, 0.00022079050540924072, 0.00023689866065979004, 0.00025300681591033936, 0.00026911497116088867, 0.000285223126411438, 0.0003013312816619873, 0.0003174394369125366, 0.00033354759216308594, 0.00034965574741363525, 0.00036576390266418457, 0.0003818720579147339, 0.0003979802131652832, 0.0004140883684158325, 0.00043019652366638184, 0.00044630467891693115, 0.00046241283416748047, 0.0004785209894180298, 0.0004946291446685791, 0.0005107372999191284, 0.0005268454551696777, 0.000542953610420227, 0.0005590617656707764, 0.0005751699209213257, 0.000591278076171875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 9.0, 15.0, 16.0, 33.0, 45.0, 90.0, 163.0, 402.0, 1075.0, 3485.0, 18357.0, 201912.0, 720057.0, 88974.0, 10221.0, 2283.0, 779.0, 310.0, 138.0, 76.0, 50.0, 19.0, 20.0, 13.0, 10.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.109375, -5.9541015625, -5.798828125, -5.6435546875, -5.48828125, -5.3330078125, -5.177734375, -5.0224609375, -4.8671875, -4.7119140625, -4.556640625, -4.4013671875, -4.24609375, -4.0908203125, -3.935546875, -3.7802734375, -3.625, -3.4697265625, -3.314453125, -3.1591796875, -3.00390625, -2.8486328125, -2.693359375, -2.5380859375, -2.3828125, -2.2275390625, -2.072265625, -1.9169921875, -1.76171875, -1.6064453125, -1.451171875, -1.2958984375, -1.140625, -0.9853515625, -0.830078125, -0.6748046875, -0.51953125, -0.3642578125, -0.208984375, -0.0537109375, 0.1015625, 0.2568359375, 0.412109375, 0.5673828125, 0.72265625, 0.8779296875, 1.033203125, 1.1884765625, 1.34375, 1.4990234375, 1.654296875, 1.8095703125, 1.96484375, 2.1201171875, 2.275390625, 2.4306640625, 2.5859375, 2.7412109375, 2.896484375, 3.0517578125, 3.20703125, 3.3623046875, 3.517578125, 3.6728515625, 3.828125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 4.0, 8.0, 6.0, 8.0, 16.0, 21.0, 32.0, 47.0, 62.0, 89.0, 128.0, 129.0, 129.0, 97.0, 83.0, 42.0, 34.0, 18.0, 12.0, 9.0, 8.0, 8.0, 5.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2265625, -5.094696044921875, -4.96282958984375, -4.830963134765625, -4.6990966796875, -4.567230224609375, -4.43536376953125, -4.303497314453125, -4.171630859375, -4.039764404296875, -3.90789794921875, -3.776031494140625, -3.6441650390625, -3.512298583984375, -3.38043212890625, -3.248565673828125, -3.11669921875, -2.984832763671875, -2.85296630859375, -2.721099853515625, -2.5892333984375, -2.457366943359375, -2.32550048828125, -2.193634033203125, -2.061767578125, -1.929901123046875, -1.79803466796875, -1.666168212890625, -1.5343017578125, -1.402435302734375, -1.27056884765625, -1.138702392578125, -1.0068359375, -0.874969482421875, -0.74310302734375, -0.611236572265625, -0.4793701171875, -0.347503662109375, -0.21563720703125, -0.083770751953125, 0.048095703125, 0.179962158203125, 0.31182861328125, 0.443695068359375, 0.5755615234375, 0.707427978515625, 0.83929443359375, 0.971160888671875, 1.10302734375, 1.234893798828125, 1.36676025390625, 1.498626708984375, 1.6304931640625, 1.762359619140625, 1.89422607421875, 2.026092529296875, 2.157958984375, 2.289825439453125, 2.42169189453125, 2.553558349609375, 2.6854248046875, 2.817291259765625, 2.94915771484375, 3.081024169921875, 3.212890625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 12.0, 12.0, 41.0, 83.0, 168.0, 283.0, 237.0, 85.0, 50.0, 14.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.802215576171875, -37.279502868652344, -34.75679397583008, -32.23408508300781, -29.71137237548828, -27.188661575317383, -24.665950775146484, -22.143239974975586, -19.620529174804688, -17.09781837463379, -14.57510757446289, -12.052396774291992, -9.529685974121094, -7.006975173950195, -4.484264373779297, -1.9615535736083984, 0.5611572265625, 3.0838680267333984, 5.606578826904297, 8.129289627075195, 10.652000427246094, 13.174711227416992, 15.69742202758789, 18.22013282775879, 20.742843627929688, 23.265554428100586, 25.788265228271484, 28.310976028442383, 30.83368682861328, 33.35639953613281, 35.87910842895508, 38.401817321777344, 40.924530029296875, 43.447242736816406, 45.96995162963867, 48.49266052246094, 51.01537322998047, 53.5380859375, 56.060794830322266, 58.58350372314453, 61.10621643066406, 63.628929138183594, 66.15164184570312, 68.67434692382812, 71.19705963134766, 73.71977233886719, 76.24247741699219, 78.76519012451172, 81.28790283203125, 83.81061553955078, 86.33332824707031, 88.85603332519531, 91.37874603271484, 93.90145874023438, 96.42416381835938, 98.9468765258789, 101.46958923339844, 103.99230194091797, 106.5150146484375, 109.0377197265625, 111.56043243408203, 114.08314514160156, 116.60585021972656, 119.1285629272461, 121.65127563476562]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 7.0, 8.0, 5.0, 11.0, 11.0, 16.0, 14.0, 12.0, 22.0, 21.0, 46.0, 37.0, 43.0, 38.0, 52.0, 45.0, 61.0, 51.0, 61.0, 53.0, 50.0, 54.0, 46.0, 41.0, 44.0, 29.0, 25.0, 20.0, 17.0, 13.0, 11.0, 6.0, 4.0, 8.0, 7.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-53.054412841796875, -51.47208023071289, -49.889747619628906, -48.30741882324219, -46.7250862121582, -45.14275360107422, -43.560420989990234, -41.97808837890625, -40.395755767822266, -38.81342315673828, -37.2310905456543, -35.64875793457031, -34.066429138183594, -32.48409652709961, -30.901763916015625, -29.31943130493164, -27.73710060119629, -26.154767990112305, -24.572437286376953, -22.99010467529297, -21.407772064208984, -19.825439453125, -18.24310874938965, -16.660776138305664, -15.078444480895996, -13.496112823486328, -11.913780212402344, -10.331448554992676, -8.749116897583008, -7.166784286499023, -5.5844526290893555, -4.002120018005371, -2.419788360595703, -0.8374563455581665, 0.7448756694793701, 2.327207565307617, 3.9095396995544434, 5.4918718338012695, 7.0742034912109375, 8.656536102294922, 10.23886775970459, 11.821199417114258, 13.403532028198242, 14.98586368560791, 16.568195343017578, 18.150527954101562, 19.732860565185547, 21.31519317626953, 22.897523880004883, 24.479856491088867, 26.06218719482422, 27.644519805908203, 29.226852416992188, 30.809185028076172, 32.391517639160156, 33.973846435546875, 35.55617904663086, 37.138511657714844, 38.72084426879883, 40.30317687988281, 41.88550567626953, 43.467838287353516, 45.0501708984375, 46.632503509521484, 48.21483612060547]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 11.0, 10.0, 22.0, 43.0, 83.0, 199.0, 385.0, 1078.0, 3607.0, 20110.0, 999201.0, 3136049.0, 26729.0, 4391.0, 1261.0, 519.0, 242.0, 127.0, 68.0, 46.0, 26.0, 22.0, 14.0, 8.0, 2.0, 8.0, 4.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3046875, -7.6690673828125, -7.033447265625, -6.3978271484375, -5.76220703125, -5.1265869140625, -4.490966796875, -3.8553466796875, -3.2197265625, -2.5841064453125, -1.948486328125, -1.3128662109375, -0.67724609375, -0.0416259765625, 0.593994140625, 1.2296142578125, 1.865234375, 2.5008544921875, 3.136474609375, 3.7720947265625, 4.40771484375, 5.0433349609375, 5.678955078125, 6.3145751953125, 6.9501953125, 7.5858154296875, 8.221435546875, 8.8570556640625, 9.49267578125, 10.1282958984375, 10.763916015625, 11.3995361328125, 12.03515625, 12.6707763671875, 13.306396484375, 13.9420166015625, 14.57763671875, 15.2132568359375, 15.848876953125, 16.4844970703125, 17.1201171875, 17.7557373046875, 18.391357421875, 19.0269775390625, 19.66259765625, 20.2982177734375, 20.933837890625, 21.5694580078125, 22.205078125, 22.8406982421875, 23.476318359375, 24.1119384765625, 24.74755859375, 25.3831787109375, 26.018798828125, 26.6544189453125, 27.2900390625, 27.9256591796875, 28.561279296875, 29.1968994140625, 29.83251953125, 30.4681396484375, 31.103759765625, 31.7393798828125, 32.375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 5.0, 10.0, 15.0, 32.0, 37.0, 49.0, 68.0, 95.0, 94.0, 129.0, 100.0, 111.0, 73.0, 63.0, 45.0, 33.0, 22.0, 12.0, 12.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3154296875, -1.2125396728515625, -1.109649658203125, -1.0067596435546875, -0.90386962890625, -0.8009796142578125, -0.698089599609375, -0.5951995849609375, -0.4923095703125, -0.3894195556640625, -0.286529541015625, -0.1836395263671875, -0.08074951171875, 0.0221405029296875, 0.125030517578125, 0.2279205322265625, 0.330810546875, 0.4337005615234375, 0.536590576171875, 0.6394805908203125, 0.74237060546875, 0.8452606201171875, 0.948150634765625, 1.0510406494140625, 1.1539306640625, 1.2568206787109375, 1.359710693359375, 1.4626007080078125, 1.56549072265625, 1.6683807373046875, 1.771270751953125, 1.8741607666015625, 1.97705078125, 2.0799407958984375, 2.182830810546875, 2.2857208251953125, 2.38861083984375, 2.4915008544921875, 2.594390869140625, 2.6972808837890625, 2.8001708984375, 2.9030609130859375, 3.005950927734375, 3.1088409423828125, 3.21173095703125, 3.3146209716796875, 3.417510986328125, 3.5204010009765625, 3.623291015625, 3.7261810302734375, 3.829071044921875, 3.9319610595703125, 4.03485107421875, 4.1377410888671875, 4.240631103515625, 4.3435211181640625, 4.4464111328125, 4.5493011474609375, 4.652191162109375, 4.7550811767578125, 4.85797119140625, 4.9608612060546875, 5.063751220703125, 5.1666412353515625, 5.26953125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 11.0, 19.0, 33.0, 48.0, 79.0, 151.0, 335.0, 819.0, 3084.0, 24857.0, 4118008.0, 40466.0, 4113.0, 1234.0, 461.0, 212.0, 122.0, 72.0, 52.0, 40.0, 18.0, 14.0, 8.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.09375, -23.219482421875, -22.34521484375, -21.470947265625, -20.5966796875, -19.722412109375, -18.84814453125, -17.973876953125, -17.099609375, -16.225341796875, -15.35107421875, -14.476806640625, -13.6025390625, -12.728271484375, -11.85400390625, -10.979736328125, -10.10546875, -9.231201171875, -8.35693359375, -7.482666015625, -6.6083984375, -5.734130859375, -4.85986328125, -3.985595703125, -3.111328125, -2.237060546875, -1.36279296875, -0.488525390625, 0.3857421875, 1.260009765625, 2.13427734375, 3.008544921875, 3.8828125, 4.757080078125, 5.63134765625, 6.505615234375, 7.3798828125, 8.254150390625, 9.12841796875, 10.002685546875, 10.876953125, 11.751220703125, 12.62548828125, 13.499755859375, 14.3740234375, 15.248291015625, 16.12255859375, 16.996826171875, 17.87109375, 18.745361328125, 19.61962890625, 20.493896484375, 21.3681640625, 22.242431640625, 23.11669921875, 23.990966796875, 24.865234375, 25.739501953125, 26.61376953125, 27.488037109375, 28.3623046875, 29.236572265625, 30.11083984375, 30.985107421875, 31.859375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 8.0, 21.0, 82.0, 448.0, 2748.0, 595.0, 101.0, 30.0, 7.0, 9.0, 2.0, 3.0, 1.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.609375, -6.253662109375, -5.89794921875, -5.542236328125, -5.1865234375, -4.830810546875, -4.47509765625, -4.119384765625, -3.763671875, -3.407958984375, -3.05224609375, -2.696533203125, -2.3408203125, -1.985107421875, -1.62939453125, -1.273681640625, -0.91796875, -0.562255859375, -0.20654296875, 0.149169921875, 0.5048828125, 0.860595703125, 1.21630859375, 1.572021484375, 1.927734375, 2.283447265625, 2.63916015625, 2.994873046875, 3.3505859375, 3.706298828125, 4.06201171875, 4.417724609375, 4.7734375, 5.129150390625, 5.48486328125, 5.840576171875, 6.1962890625, 6.552001953125, 6.90771484375, 7.263427734375, 7.619140625, 7.974853515625, 8.33056640625, 8.686279296875, 9.0419921875, 9.397705078125, 9.75341796875, 10.109130859375, 10.46484375, 10.820556640625, 11.17626953125, 11.531982421875, 11.8876953125, 12.243408203125, 12.59912109375, 12.954833984375, 13.310546875, 13.666259765625, 14.02197265625, 14.377685546875, 14.7333984375, 15.089111328125, 15.44482421875, 15.800537109375, 16.15625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 8.0, 37.0, 125.0, 289.0, 303.0, 149.0, 40.0, 30.0, 8.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.252349853515625, -34.68742752075195, -33.12250518798828, -31.557580947875977, -29.992656707763672, -28.427734375, -26.862812042236328, -25.297889709472656, -23.73296546936035, -22.16804313659668, -20.603118896484375, -19.038196563720703, -17.47327423095703, -15.908349990844727, -14.343427658081055, -12.778504371643066, -11.213581085205078, -9.64865779876709, -8.083734512329102, -6.51881217956543, -4.953888893127441, -3.388965606689453, -1.8240432739257812, -0.25911998748779297, 1.3058032989501953, 2.8707263469696045, 4.435649394989014, 6.000572204589844, 7.565495491027832, 9.13041877746582, 10.695341110229492, 12.26026439666748, 13.825187683105469, 15.390110969543457, 16.955034255981445, 18.519956588745117, 20.084880828857422, 21.649803161621094, 23.214725494384766, 24.779647827148438, 26.344572067260742, 27.909494400024414, 29.47441864013672, 31.03934097290039, 32.60426330566406, 34.169189453125, 35.734107971191406, 37.299034118652344, 38.863956451416016, 40.42887878417969, 41.99380111694336, 43.55872344970703, 45.12364959716797, 46.68857192993164, 48.25349426269531, 49.818416595458984, 51.383338928222656, 52.94826126098633, 54.51318359375, 56.07810974121094, 57.64303207397461, 59.20795440673828, 60.77287673950195, 62.337799072265625, 63.90272521972656]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 10.0, 17.0, 23.0, 34.0, 50.0, 61.0, 90.0, 103.0, 87.0, 95.0, 90.0, 82.0, 70.0, 74.0, 36.0, 32.0, 19.0, 10.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.65022659301758, -31.66196632385254, -30.673707962036133, -29.685447692871094, -28.697187423706055, -27.70892906188965, -26.72066879272461, -25.732410430908203, -24.744150161743164, -23.755889892578125, -22.76763153076172, -21.77937126159668, -20.79111099243164, -19.802852630615234, -18.814592361450195, -17.826332092285156, -16.83807373046875, -15.849814414978027, -14.861554145812988, -13.873294830322266, -12.885035514831543, -11.89677619934082, -10.908515930175781, -9.920256614685059, -8.931995391845703, -7.943735599517822, -6.9554762840271, -5.967216491699219, -4.978957176208496, -3.9906973838806152, -3.0024375915527344, -2.0141782760620117, -1.025918960571289, -0.03765934705734253, 0.950600266456604, 1.9388599395751953, 2.927119493484497, 3.915379047393799, 4.90363883972168, 5.891898155212402, 6.880157947540283, 7.868417739868164, 8.856677055358887, 9.84493637084961, 10.833196640014648, 11.821455955505371, 12.809715270996094, 13.797975540161133, 14.786234855651855, 15.774494171142578, 16.762754440307617, 17.751014709472656, 18.739273071289062, 19.7275333404541, 20.71579360961914, 21.704051971435547, 22.692312240600586, 23.680572509765625, 24.66883087158203, 25.65709114074707, 26.64535140991211, 27.633609771728516, 28.621870040893555, 29.610130310058594, 30.598388671875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 3.0, 6.0, 13.0, 15.0, 19.0, 40.0, 60.0, 122.0, 222.0, 427.0, 1053.0, 3326.0, 16149.0, 133759.0, 703992.0, 164368.0, 19095.0, 3668.0, 1121.0, 511.0, 252.0, 150.0, 75.0, 37.0, 24.0, 23.0, 11.0, 9.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4375, -13.0594482421875, -12.681396484375, -12.3033447265625, -11.92529296875, -11.5472412109375, -11.169189453125, -10.7911376953125, -10.4130859375, -10.0350341796875, -9.656982421875, -9.2789306640625, -8.90087890625, -8.5228271484375, -8.144775390625, -7.7667236328125, -7.388671875, -7.0106201171875, -6.632568359375, -6.2545166015625, -5.87646484375, -5.4984130859375, -5.120361328125, -4.7423095703125, -4.3642578125, -3.9862060546875, -3.608154296875, -3.2301025390625, -2.85205078125, -2.4739990234375, -2.095947265625, -1.7178955078125, -1.33984375, -0.9617919921875, -0.583740234375, -0.2056884765625, 0.17236328125, 0.5504150390625, 0.928466796875, 1.3065185546875, 1.6845703125, 2.0626220703125, 2.440673828125, 2.8187255859375, 3.19677734375, 3.5748291015625, 3.952880859375, 4.3309326171875, 4.708984375, 5.0870361328125, 5.465087890625, 5.8431396484375, 6.22119140625, 6.5992431640625, 6.977294921875, 7.3553466796875, 7.7333984375, 8.1114501953125, 8.489501953125, 8.8675537109375, 9.24560546875, 9.6236572265625, 10.001708984375, 10.3797607421875, 10.7578125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 3.0, 6.0, 12.0, 14.0, 23.0, 32.0, 37.0, 46.0, 59.0, 89.0, 75.0, 107.0, 79.0, 93.0, 70.0, 56.0, 46.0, 54.0, 32.0, 22.0, 22.0, 14.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4833984375, -1.4015960693359375, -1.319793701171875, -1.2379913330078125, -1.15618896484375, -1.0743865966796875, -0.992584228515625, -0.9107818603515625, -0.8289794921875, -0.7471771240234375, -0.665374755859375, -0.5835723876953125, -0.50177001953125, -0.4199676513671875, -0.338165283203125, -0.2563629150390625, -0.174560546875, -0.0927581787109375, -0.010955810546875, 0.0708465576171875, 0.15264892578125, 0.2344512939453125, 0.316253662109375, 0.3980560302734375, 0.4798583984375, 0.5616607666015625, 0.643463134765625, 0.7252655029296875, 0.80706787109375, 0.8888702392578125, 0.970672607421875, 1.0524749755859375, 1.13427734375, 1.2160797119140625, 1.297882080078125, 1.3796844482421875, 1.46148681640625, 1.5432891845703125, 1.625091552734375, 1.7068939208984375, 1.7886962890625, 1.8704986572265625, 1.952301025390625, 2.0341033935546875, 2.11590576171875, 2.1977081298828125, 2.279510498046875, 2.3613128662109375, 2.443115234375, 2.5249176025390625, 2.606719970703125, 2.6885223388671875, 2.77032470703125, 2.8521270751953125, 2.933929443359375, 3.0157318115234375, 3.0975341796875, 3.1793365478515625, 3.261138916015625, 3.3429412841796875, 3.42474365234375, 3.5065460205078125, 3.588348388671875, 3.6701507568359375, 3.751953125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 8.0, 8.0, 12.0, 18.0, 21.0, 28.0, 59.0, 76.0, 96.0, 183.0, 282.0, 424.0, 772.0, 1345.0, 3051.0, 7277.0, 19204.0, 57438.0, 177105.0, 405483.0, 248006.0, 82630.0, 27445.0, 9494.0, 4038.0, 1767.0, 907.0, 515.0, 285.0, 193.0, 129.0, 73.0, 41.0, 32.0, 25.0, 34.0, 15.0, 6.0, 5.0, 4.0, 5.0, 5.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.888671875, -3.748077392578125, -3.60748291015625, -3.466888427734375, -3.3262939453125, -3.185699462890625, -3.04510498046875, -2.904510498046875, -2.763916015625, -2.623321533203125, -2.48272705078125, -2.342132568359375, -2.2015380859375, -2.060943603515625, -1.92034912109375, -1.779754638671875, -1.63916015625, -1.498565673828125, -1.35797119140625, -1.217376708984375, -1.0767822265625, -0.936187744140625, -0.79559326171875, -0.654998779296875, -0.514404296875, -0.373809814453125, -0.23321533203125, -0.092620849609375, 0.0479736328125, 0.188568115234375, 0.32916259765625, 0.469757080078125, 0.6103515625, 0.750946044921875, 0.89154052734375, 1.032135009765625, 1.1727294921875, 1.313323974609375, 1.45391845703125, 1.594512939453125, 1.735107421875, 1.875701904296875, 2.01629638671875, 2.156890869140625, 2.2974853515625, 2.438079833984375, 2.57867431640625, 2.719268798828125, 2.85986328125, 3.000457763671875, 3.14105224609375, 3.281646728515625, 3.4222412109375, 3.562835693359375, 3.70343017578125, 3.844024658203125, 3.984619140625, 4.125213623046875, 4.26580810546875, 4.406402587890625, 4.5469970703125, 4.687591552734375, 4.82818603515625, 4.968780517578125, 5.109375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 9.0, 3.0, 8.0, 16.0, 12.0, 28.0, 23.0, 21.0, 28.0, 21.0, 31.0, 31.0, 41.0, 35.0, 62.0, 47.0, 51.0, 50.0, 48.0, 58.0, 43.0, 43.0, 34.0, 38.0, 27.0, 33.0, 32.0, 23.0, 21.0, 16.0, 8.0, 12.0, 10.0, 13.0, 9.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.91015625, -5.70477294921875, -5.4993896484375, -5.29400634765625, -5.088623046875, -4.88323974609375, -4.6778564453125, -4.47247314453125, -4.26708984375, -4.06170654296875, -3.8563232421875, -3.65093994140625, -3.445556640625, -3.24017333984375, -3.0347900390625, -2.82940673828125, -2.6240234375, -2.41864013671875, -2.2132568359375, -2.00787353515625, -1.802490234375, -1.59710693359375, -1.3917236328125, -1.18634033203125, -0.98095703125, -0.77557373046875, -0.5701904296875, -0.36480712890625, -0.159423828125, 0.04595947265625, 0.2513427734375, 0.45672607421875, 0.662109375, 0.86749267578125, 1.0728759765625, 1.27825927734375, 1.483642578125, 1.68902587890625, 1.8944091796875, 2.09979248046875, 2.30517578125, 2.51055908203125, 2.7159423828125, 2.92132568359375, 3.126708984375, 3.33209228515625, 3.5374755859375, 3.74285888671875, 3.9482421875, 4.15362548828125, 4.3590087890625, 4.56439208984375, 4.769775390625, 4.97515869140625, 5.1805419921875, 5.38592529296875, 5.59130859375, 5.79669189453125, 6.0020751953125, 6.20745849609375, 6.412841796875, 6.61822509765625, 6.8236083984375, 7.02899169921875, 7.234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 5.0, 2.0, 6.0, 15.0, 13.0, 17.0, 48.0, 60.0, 88.0, 157.0, 248.0, 479.0, 1056.0, 2739.0, 9463.0, 50905.0, 505642.0, 423073.0, 41725.0, 8191.0, 2603.0, 977.0, 437.0, 250.0, 118.0, 76.0, 60.0, 31.0, 23.0, 14.0, 12.0, 8.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.53515625, -5.37213134765625, -5.2091064453125, -5.04608154296875, -4.883056640625, -4.72003173828125, -4.5570068359375, -4.39398193359375, -4.23095703125, -4.06793212890625, -3.9049072265625, -3.74188232421875, -3.578857421875, -3.41583251953125, -3.2528076171875, -3.08978271484375, -2.9267578125, -2.76373291015625, -2.6007080078125, -2.43768310546875, -2.274658203125, -2.11163330078125, -1.9486083984375, -1.78558349609375, -1.62255859375, -1.45953369140625, -1.2965087890625, -1.13348388671875, -0.970458984375, -0.80743408203125, -0.6444091796875, -0.48138427734375, -0.318359375, -0.15533447265625, 0.0076904296875, 0.17071533203125, 0.333740234375, 0.49676513671875, 0.6597900390625, 0.82281494140625, 0.98583984375, 1.14886474609375, 1.3118896484375, 1.47491455078125, 1.637939453125, 1.80096435546875, 1.9639892578125, 2.12701416015625, 2.2900390625, 2.45306396484375, 2.6160888671875, 2.77911376953125, 2.942138671875, 3.10516357421875, 3.2681884765625, 3.43121337890625, 3.59423828125, 3.75726318359375, 3.9202880859375, 4.08331298828125, 4.246337890625, 4.40936279296875, 4.5723876953125, 4.73541259765625, 4.8984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 13.0, 17.0, 24.0, 36.0, 54.0, 85.0, 187.0, 226.0, 148.0, 78.0, 46.0, 29.0, 18.0, 11.0, 5.0, 9.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005793571472167969, -0.0005564391613006592, -0.0005335211753845215, -0.0005106031894683838, -0.0004876852035522461, -0.0004647672176361084, -0.0004418492317199707, -0.000418931245803833, -0.0003960132598876953, -0.0003730952739715576, -0.0003501772880554199, -0.0003272593021392822, -0.00030434131622314453, -0.00028142333030700684, -0.00025850534439086914, -0.00023558735847473145, -0.00021266937255859375, -0.00018975138664245605, -0.00016683340072631836, -0.00014391541481018066, -0.00012099742889404297, -9.807944297790527e-05, -7.516145706176758e-05, -5.224347114562988e-05, -2.9325485229492188e-05, -6.407499313354492e-06, 1.6510486602783203e-05, 3.94284725189209e-05, 6.23464584350586e-05, 8.526444435119629e-05, 0.00010818243026733398, 0.00013110041618347168, 0.00015401840209960938, 0.00017693638801574707, 0.00019985437393188477, 0.00022277235984802246, 0.00024569034576416016, 0.00026860833168029785, 0.00029152631759643555, 0.00031444430351257324, 0.00033736228942871094, 0.00036028027534484863, 0.00038319826126098633, 0.000406116247177124, 0.0004290342330932617, 0.0004519522190093994, 0.0004748702049255371, 0.0004977881908416748, 0.0005207061767578125, 0.0005436241626739502, 0.0005665421485900879, 0.0005894601345062256, 0.0006123781204223633, 0.000635296106338501, 0.0006582140922546387, 0.0006811320781707764, 0.0007040500640869141, 0.0007269680500030518, 0.0007498860359191895, 0.0007728040218353271, 0.0007957220077514648, 0.0008186399936676025, 0.0008415579795837402, 0.0008644759654998779, 0.0008873939514160156]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 5.0, 9.0, 9.0, 17.0, 21.0, 21.0, 44.0, 71.0, 132.0, 178.0, 340.0, 638.0, 1347.0, 3402.0, 11888.0, 68093.0, 616163.0, 302497.0, 32238.0, 6931.0, 2298.0, 1005.0, 516.0, 253.0, 161.0, 92.0, 58.0, 43.0, 34.0, 13.0, 12.0, 6.0, 4.0, 5.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.609375, -5.4482421875, -5.287109375, -5.1259765625, -4.96484375, -4.8037109375, -4.642578125, -4.4814453125, -4.3203125, -4.1591796875, -3.998046875, -3.8369140625, -3.67578125, -3.5146484375, -3.353515625, -3.1923828125, -3.03125, -2.8701171875, -2.708984375, -2.5478515625, -2.38671875, -2.2255859375, -2.064453125, -1.9033203125, -1.7421875, -1.5810546875, -1.419921875, -1.2587890625, -1.09765625, -0.9365234375, -0.775390625, -0.6142578125, -0.453125, -0.2919921875, -0.130859375, 0.0302734375, 0.19140625, 0.3525390625, 0.513671875, 0.6748046875, 0.8359375, 0.9970703125, 1.158203125, 1.3193359375, 1.48046875, 1.6416015625, 1.802734375, 1.9638671875, 2.125, 2.2861328125, 2.447265625, 2.6083984375, 2.76953125, 2.9306640625, 3.091796875, 3.2529296875, 3.4140625, 3.5751953125, 3.736328125, 3.8974609375, 4.05859375, 4.2197265625, 4.380859375, 4.5419921875, 4.703125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 11.0, 23.0, 40.0, 65.0, 111.0, 190.0, 205.0, 154.0, 80.0, 44.0, 21.0, 16.0, 6.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.4453125, -7.2139892578125, -6.982666015625, -6.7513427734375, -6.52001953125, -6.2886962890625, -6.057373046875, -5.8260498046875, -5.5947265625, -5.3634033203125, -5.132080078125, -4.9007568359375, -4.66943359375, -4.4381103515625, -4.206787109375, -3.9754638671875, -3.744140625, -3.5128173828125, -3.281494140625, -3.0501708984375, -2.81884765625, -2.5875244140625, -2.356201171875, -2.1248779296875, -1.8935546875, -1.6622314453125, -1.430908203125, -1.1995849609375, -0.96826171875, -0.7369384765625, -0.505615234375, -0.2742919921875, -0.04296875, 0.1883544921875, 0.419677734375, 0.6510009765625, 0.88232421875, 1.1136474609375, 1.344970703125, 1.5762939453125, 1.8076171875, 2.0389404296875, 2.270263671875, 2.5015869140625, 2.73291015625, 2.9642333984375, 3.195556640625, 3.4268798828125, 3.658203125, 3.8895263671875, 4.120849609375, 4.3521728515625, 4.58349609375, 4.8148193359375, 5.046142578125, 5.2774658203125, 5.5087890625, 5.7401123046875, 5.971435546875, 6.2027587890625, 6.43408203125, 6.6654052734375, 6.896728515625, 7.1280517578125, 7.359375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 8.0, 17.0, 35.0, 67.0, 143.0, 169.0, 191.0, 159.0, 102.0, 41.0, 27.0, 15.0, 13.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.33306121826172, -57.65902328491211, -55.9849853515625, -54.310943603515625, -52.636905670166016, -50.962867736816406, -49.28882598876953, -47.61478805541992, -45.94075012207031, -44.2667121887207, -42.592674255371094, -40.91863250732422, -39.24459457397461, -37.570556640625, -35.896514892578125, -34.222476959228516, -32.548439025878906, -30.874401092529297, -29.200361251831055, -27.526321411132812, -25.852283477783203, -24.178245544433594, -22.50420570373535, -20.83016586303711, -19.1561279296875, -17.48208999633789, -15.808050155639648, -14.134011268615723, -12.459972381591797, -10.785933494567871, -9.111894607543945, -7.4378557205200195, -5.763820648193359, -4.089781761169434, -2.415742874145508, -0.741703987121582, 0.9323348999023438, 2.6063737869262695, 4.280412673950195, 5.954451560974121, 7.628490447998047, 9.302529335021973, 10.976568222045898, 12.650607109069824, 14.32464599609375, 15.998684883117676, 17.6727237701416, 19.346763610839844, 21.020801544189453, 22.694839477539062, 24.368879318237305, 26.042919158935547, 27.716957092285156, 29.390995025634766, 31.065034866333008, 32.73907470703125, 34.41311264038086, 36.08715057373047, 37.761192321777344, 39.43523025512695, 41.10926818847656, 42.78330612182617, 44.45734405517578, 46.131385803222656, 47.805423736572266]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 9.0, 12.0, 10.0, 8.0, 16.0, 20.0, 26.0, 26.0, 32.0, 33.0, 49.0, 40.0, 45.0, 53.0, 67.0, 50.0, 49.0, 47.0, 47.0, 52.0, 51.0, 35.0, 44.0, 18.0, 29.0, 23.0, 16.0, 16.0, 21.0, 13.0, 13.0, 6.0, 7.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.59803771972656, -41.28614807128906, -39.97426223754883, -38.66237258911133, -37.350486755371094, -36.038597106933594, -34.72671127319336, -33.41482162475586, -32.102935791015625, -30.791048049926758, -29.47916030883789, -28.167272567749023, -26.855384826660156, -25.543495178222656, -24.23160743713379, -22.919719696044922, -21.607830047607422, -20.295942306518555, -18.984054565429688, -17.67216682434082, -16.360279083251953, -15.04839038848877, -13.736501693725586, -12.424613952636719, -11.112726211547852, -9.800838470458984, -8.488950729370117, -7.177062034606934, -5.865174293518066, -4.553286552429199, -3.241398334503174, -1.9295101165771484, -0.6176261901855469, 0.6942617893218994, 2.0061497688293457, 3.318037748336792, 4.629925727844238, 5.9418134689331055, 7.253701686859131, 8.565589904785156, 9.877477645874023, 11.18936538696289, 12.501253128051758, 13.813141822814941, 15.125029563903809, 16.43691635131836, 17.74880599975586, 19.060693740844727, 20.372581481933594, 21.68446922302246, 22.996356964111328, 24.308244705200195, 25.620132446289062, 26.932022094726562, 28.24390983581543, 29.555797576904297, 30.867685317993164, 32.17957305908203, 33.49146270751953, 34.803348541259766, 36.115238189697266, 37.4271240234375, 38.739013671875, 40.0509033203125, 41.362789154052734]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 5.0, 2.0, 5.0, 7.0, 14.0, 9.0, 23.0, 28.0, 37.0, 59.0, 92.0, 138.0, 239.0, 448.0, 789.0, 1610.0, 3607.0, 9011.0, 28559.0, 145896.0, 3478814.0, 448161.0, 52495.0, 14370.0, 5217.0, 2194.0, 1050.0, 543.0, 323.0, 150.0, 98.0, 83.0, 55.0, 45.0, 26.0, 20.0, 14.0, 7.0, 12.0, 6.0, 7.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.07421875, -6.8438720703125, -6.613525390625, -6.3831787109375, -6.15283203125, -5.9224853515625, -5.692138671875, -5.4617919921875, -5.2314453125, -5.0010986328125, -4.770751953125, -4.5404052734375, -4.31005859375, -4.0797119140625, -3.849365234375, -3.6190185546875, -3.388671875, -3.1583251953125, -2.927978515625, -2.6976318359375, -2.46728515625, -2.2369384765625, -2.006591796875, -1.7762451171875, -1.5458984375, -1.3155517578125, -1.085205078125, -0.8548583984375, -0.62451171875, -0.3941650390625, -0.163818359375, 0.0665283203125, 0.296875, 0.5272216796875, 0.757568359375, 0.9879150390625, 1.21826171875, 1.4486083984375, 1.678955078125, 1.9093017578125, 2.1396484375, 2.3699951171875, 2.600341796875, 2.8306884765625, 3.06103515625, 3.2913818359375, 3.521728515625, 3.7520751953125, 3.982421875, 4.2127685546875, 4.443115234375, 4.6734619140625, 4.90380859375, 5.1341552734375, 5.364501953125, 5.5948486328125, 5.8251953125, 6.0555419921875, 6.285888671875, 6.5162353515625, 6.74658203125, 6.9769287109375, 7.207275390625, 7.4376220703125, 7.66796875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 9.0, 14.0, 17.0, 21.0, 31.0, 29.0, 56.0, 62.0, 65.0, 80.0, 80.0, 95.0, 95.0, 69.0, 62.0, 60.0, 44.0, 29.0, 31.0, 12.0, 17.0, 14.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6279296875, -1.5478668212890625, -1.467803955078125, -1.3877410888671875, -1.30767822265625, -1.2276153564453125, -1.147552490234375, -1.0674896240234375, -0.9874267578125, -0.9073638916015625, -0.827301025390625, -0.7472381591796875, -0.66717529296875, -0.5871124267578125, -0.507049560546875, -0.4269866943359375, -0.346923828125, -0.2668609619140625, -0.186798095703125, -0.1067352294921875, -0.02667236328125, 0.0533905029296875, 0.133453369140625, 0.2135162353515625, 0.2935791015625, 0.3736419677734375, 0.453704833984375, 0.5337677001953125, 0.61383056640625, 0.6938934326171875, 0.773956298828125, 0.8540191650390625, 0.93408203125, 1.0141448974609375, 1.094207763671875, 1.1742706298828125, 1.25433349609375, 1.3343963623046875, 1.414459228515625, 1.4945220947265625, 1.5745849609375, 1.6546478271484375, 1.734710693359375, 1.8147735595703125, 1.89483642578125, 1.9748992919921875, 2.054962158203125, 2.1350250244140625, 2.215087890625, 2.2951507568359375, 2.375213623046875, 2.4552764892578125, 2.53533935546875, 2.6154022216796875, 2.695465087890625, 2.7755279541015625, 2.8555908203125, 2.9356536865234375, 3.015716552734375, 3.0957794189453125, 3.17584228515625, 3.2559051513671875, 3.335968017578125, 3.4160308837890625, 3.49609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 9.0, 7.0, 7.0, 16.0, 26.0, 35.0, 53.0, 62.0, 88.0, 110.0, 181.0, 283.0, 687.0, 2091.0, 11705.0, 158429.0, 3834126.0, 170384.0, 12262.0, 2287.0, 640.0, 256.0, 159.0, 118.0, 74.0, 50.0, 25.0, 38.0, 23.0, 12.0, 9.0, 9.0, 7.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.5703125, -11.25341796875, -10.9365234375, -10.61962890625, -10.302734375, -9.98583984375, -9.6689453125, -9.35205078125, -9.03515625, -8.71826171875, -8.4013671875, -8.08447265625, -7.767578125, -7.45068359375, -7.1337890625, -6.81689453125, -6.5, -6.18310546875, -5.8662109375, -5.54931640625, -5.232421875, -4.91552734375, -4.5986328125, -4.28173828125, -3.96484375, -3.64794921875, -3.3310546875, -3.01416015625, -2.697265625, -2.38037109375, -2.0634765625, -1.74658203125, -1.4296875, -1.11279296875, -0.7958984375, -0.47900390625, -0.162109375, 0.15478515625, 0.4716796875, 0.78857421875, 1.10546875, 1.42236328125, 1.7392578125, 2.05615234375, 2.373046875, 2.68994140625, 3.0068359375, 3.32373046875, 3.640625, 3.95751953125, 4.2744140625, 4.59130859375, 4.908203125, 5.22509765625, 5.5419921875, 5.85888671875, 6.17578125, 6.49267578125, 6.8095703125, 7.12646484375, 7.443359375, 7.76025390625, 8.0771484375, 8.39404296875, 8.7109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 7.0, 17.0, 18.0, 33.0, 65.0, 143.0, 283.0, 842.0, 1696.0, 568.0, 192.0, 88.0, 43.0, 24.0, 18.0, 11.0, 9.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.875, -4.767486572265625, -4.65997314453125, -4.552459716796875, -4.4449462890625, -4.337432861328125, -4.22991943359375, -4.122406005859375, -4.014892578125, -3.907379150390625, -3.79986572265625, -3.692352294921875, -3.5848388671875, -3.477325439453125, -3.36981201171875, -3.262298583984375, -3.15478515625, -3.047271728515625, -2.93975830078125, -2.832244873046875, -2.7247314453125, -2.617218017578125, -2.50970458984375, -2.402191162109375, -2.294677734375, -2.187164306640625, -2.07965087890625, -1.972137451171875, -1.8646240234375, -1.757110595703125, -1.64959716796875, -1.542083740234375, -1.4345703125, -1.327056884765625, -1.21954345703125, -1.112030029296875, -1.0045166015625, -0.897003173828125, -0.78948974609375, -0.681976318359375, -0.574462890625, -0.466949462890625, -0.35943603515625, -0.251922607421875, -0.1444091796875, -0.036895751953125, 0.07061767578125, 0.178131103515625, 0.28564453125, 0.393157958984375, 0.50067138671875, 0.608184814453125, 0.7156982421875, 0.823211669921875, 0.93072509765625, 1.038238525390625, 1.145751953125, 1.253265380859375, 1.36077880859375, 1.468292236328125, 1.5758056640625, 1.683319091796875, 1.79083251953125, 1.898345947265625, 2.005859375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 13.0, 30.0, 69.0, 122.0, 199.0, 231.0, 166.0, 87.0, 47.0, 15.0, 7.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.04359245300293, -30.34857177734375, -29.653549194335938, -28.958526611328125, -28.263505935668945, -27.568485260009766, -26.873462677001953, -26.17844009399414, -25.48341941833496, -24.78839874267578, -24.09337615966797, -23.398353576660156, -22.703332901000977, -22.008312225341797, -21.313289642333984, -20.618267059326172, -19.923246383666992, -19.228225708007812, -18.533203125, -17.838180541992188, -17.143159866333008, -16.448139190673828, -15.753116607666016, -15.05809497833252, -14.363073348999023, -13.668051719665527, -12.973030090332031, -12.278008460998535, -11.582986831665039, -10.887965202331543, -10.192943572998047, -9.49792194366455, -8.802900314331055, -8.107878684997559, -7.4128570556640625, -6.717835426330566, -6.02281379699707, -5.327792167663574, -4.632770538330078, -3.937748908996582, -3.242727279663086, -2.54770565032959, -1.8526840209960938, -1.1576623916625977, -0.46264076232910156, 0.23238086700439453, 0.9274024963378906, 1.6224241256713867, 2.317445755004883, 3.012467384338379, 3.707489013671875, 4.402510643005371, 5.097532272338867, 5.792553901672363, 6.487575531005859, 7.1825971603393555, 7.877618789672852, 8.572640419006348, 9.267662048339844, 9.96268367767334, 10.657705307006836, 11.352726936340332, 12.047748565673828, 12.742770195007324, 13.43779182434082]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 9.0, 14.0, 23.0, 27.0, 39.0, 40.0, 76.0, 77.0, 92.0, 91.0, 88.0, 67.0, 81.0, 72.0, 59.0, 49.0, 42.0, 22.0, 10.0, 13.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.350425720214844, -15.85556411743164, -15.360702514648438, -14.865840911865234, -14.370979309082031, -13.876117706298828, -13.381256103515625, -12.886394500732422, -12.391532897949219, -11.896671295166016, -11.401809692382812, -10.90694808959961, -10.412086486816406, -9.917224884033203, -9.42236328125, -8.927501678466797, -8.43264102935791, -7.937779426574707, -7.442917823791504, -6.948056221008301, -6.453194618225098, -5.9583330154418945, -5.46347188949585, -4.9686102867126465, -4.473748683929443, -3.9788870811462402, -3.484025478363037, -2.989164113998413, -2.49430251121521, -1.9994409084320068, -1.5045795440673828, -1.0097179412841797, -0.5148563385009766, -0.019994795322418213, 0.47486674785614014, 0.9697282314300537, 1.4645898342132568, 1.95945143699646, 2.454312801361084, 2.949174404144287, 3.4440360069274902, 3.9388976097106934, 4.4337592124938965, 4.928620338439941, 5.4234819412231445, 5.918343544006348, 6.413205146789551, 6.908066749572754, 7.402928352355957, 7.89778995513916, 8.392651557922363, 8.887513160705566, 9.38237476348877, 9.877236366271973, 10.37209701538086, 10.866958618164062, 11.361820220947266, 11.856681823730469, 12.351543426513672, 12.846405029296875, 13.341266632080078, 13.836128234863281, 14.330989837646484, 14.825851440429688, 15.32071304321289]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 9.0, 7.0, 11.0, 16.0, 18.0, 32.0, 43.0, 51.0, 69.0, 99.0, 155.0, 210.0, 382.0, 525.0, 966.0, 1684.0, 3283.0, 7125.0, 16954.0, 44832.0, 124049.0, 311895.0, 324068.0, 131444.0, 47333.0, 17925.0, 7486.0, 3488.0, 1748.0, 982.0, 600.0, 356.0, 232.0, 154.0, 96.0, 71.0, 47.0, 35.0, 24.0, 18.0, 7.0, 13.0, 9.0, 1.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.94140625, -4.77117919921875, -4.6009521484375, -4.43072509765625, -4.260498046875, -4.09027099609375, -3.9200439453125, -3.74981689453125, -3.57958984375, -3.40936279296875, -3.2391357421875, -3.06890869140625, -2.898681640625, -2.72845458984375, -2.5582275390625, -2.38800048828125, -2.2177734375, -2.04754638671875, -1.8773193359375, -1.70709228515625, -1.536865234375, -1.36663818359375, -1.1964111328125, -1.02618408203125, -0.85595703125, -0.68572998046875, -0.5155029296875, -0.34527587890625, -0.175048828125, -0.00482177734375, 0.1654052734375, 0.33563232421875, 0.505859375, 0.67608642578125, 0.8463134765625, 1.01654052734375, 1.186767578125, 1.35699462890625, 1.5272216796875, 1.69744873046875, 1.86767578125, 2.03790283203125, 2.2081298828125, 2.37835693359375, 2.548583984375, 2.71881103515625, 2.8890380859375, 3.05926513671875, 3.2294921875, 3.39971923828125, 3.5699462890625, 3.74017333984375, 3.910400390625, 4.08062744140625, 4.2508544921875, 4.42108154296875, 4.59130859375, 4.76153564453125, 4.9317626953125, 5.10198974609375, 5.272216796875, 5.44244384765625, 5.6126708984375, 5.78289794921875, 5.953125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 9.0, 11.0, 21.0, 18.0, 31.0, 40.0, 48.0, 40.0, 59.0, 69.0, 79.0, 86.0, 67.0, 94.0, 67.0, 56.0, 34.0, 47.0, 30.0, 22.0, 18.0, 23.0, 13.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.66015625, -1.590423583984375, -1.52069091796875, -1.450958251953125, -1.3812255859375, -1.311492919921875, -1.24176025390625, -1.172027587890625, -1.102294921875, -1.032562255859375, -0.96282958984375, -0.893096923828125, -0.8233642578125, -0.753631591796875, -0.68389892578125, -0.614166259765625, -0.54443359375, -0.474700927734375, -0.40496826171875, -0.335235595703125, -0.2655029296875, -0.195770263671875, -0.12603759765625, -0.056304931640625, 0.013427734375, 0.083160400390625, 0.15289306640625, 0.222625732421875, 0.2923583984375, 0.362091064453125, 0.43182373046875, 0.501556396484375, 0.5712890625, 0.641021728515625, 0.71075439453125, 0.780487060546875, 0.8502197265625, 0.919952392578125, 0.98968505859375, 1.059417724609375, 1.129150390625, 1.198883056640625, 1.26861572265625, 1.338348388671875, 1.4080810546875, 1.477813720703125, 1.54754638671875, 1.617279052734375, 1.68701171875, 1.756744384765625, 1.82647705078125, 1.896209716796875, 1.9659423828125, 2.035675048828125, 2.10540771484375, 2.175140380859375, 2.244873046875, 2.314605712890625, 2.38433837890625, 2.454071044921875, 2.5238037109375, 2.593536376953125, 2.66326904296875, 2.733001708984375, 2.802734375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 2.0, 7.0, 3.0, 4.0, 22.0, 17.0, 33.0, 42.0, 52.0, 78.0, 98.0, 126.0, 226.0, 329.0, 486.0, 822.0, 1471.0, 3129.0, 7341.0, 20056.0, 62826.0, 196843.0, 409941.0, 229464.0, 75329.0, 23600.0, 8459.0, 3519.0, 1643.0, 910.0, 529.0, 348.0, 225.0, 165.0, 116.0, 83.0, 72.0, 40.0, 32.0, 16.0, 17.0, 9.0, 7.0, 7.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.87890625, -4.73779296875, -4.5966796875, -4.45556640625, -4.314453125, -4.17333984375, -4.0322265625, -3.89111328125, -3.75, -3.60888671875, -3.4677734375, -3.32666015625, -3.185546875, -3.04443359375, -2.9033203125, -2.76220703125, -2.62109375, -2.47998046875, -2.3388671875, -2.19775390625, -2.056640625, -1.91552734375, -1.7744140625, -1.63330078125, -1.4921875, -1.35107421875, -1.2099609375, -1.06884765625, -0.927734375, -0.78662109375, -0.6455078125, -0.50439453125, -0.36328125, -0.22216796875, -0.0810546875, 0.06005859375, 0.201171875, 0.34228515625, 0.4833984375, 0.62451171875, 0.765625, 0.90673828125, 1.0478515625, 1.18896484375, 1.330078125, 1.47119140625, 1.6123046875, 1.75341796875, 1.89453125, 2.03564453125, 2.1767578125, 2.31787109375, 2.458984375, 2.60009765625, 2.7412109375, 2.88232421875, 3.0234375, 3.16455078125, 3.3056640625, 3.44677734375, 3.587890625, 3.72900390625, 3.8701171875, 4.01123046875, 4.15234375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 4.0, 7.0, 7.0, 12.0, 9.0, 12.0, 14.0, 16.0, 15.0, 23.0, 30.0, 30.0, 36.0, 37.0, 34.0, 36.0, 37.0, 47.0, 41.0, 34.0, 38.0, 56.0, 44.0, 36.0, 35.0, 24.0, 30.0, 39.0, 25.0, 26.0, 19.0, 26.0, 21.0, 17.0, 17.0, 15.0, 9.0, 5.0, 7.0, 7.0, 5.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.15234375, -4.98309326171875, -4.8138427734375, -4.64459228515625, -4.475341796875, -4.30609130859375, -4.1368408203125, -3.96759033203125, -3.79833984375, -3.62908935546875, -3.4598388671875, -3.29058837890625, -3.121337890625, -2.95208740234375, -2.7828369140625, -2.61358642578125, -2.4443359375, -2.27508544921875, -2.1058349609375, -1.93658447265625, -1.767333984375, -1.59808349609375, -1.4288330078125, -1.25958251953125, -1.09033203125, -0.92108154296875, -0.7518310546875, -0.58258056640625, -0.413330078125, -0.24407958984375, -0.0748291015625, 0.09442138671875, 0.263671875, 0.43292236328125, 0.6021728515625, 0.77142333984375, 0.940673828125, 1.10992431640625, 1.2791748046875, 1.44842529296875, 1.61767578125, 1.78692626953125, 1.9561767578125, 2.12542724609375, 2.294677734375, 2.46392822265625, 2.6331787109375, 2.80242919921875, 2.9716796875, 3.14093017578125, 3.3101806640625, 3.47943115234375, 3.648681640625, 3.81793212890625, 3.9871826171875, 4.15643310546875, 4.32568359375, 4.49493408203125, 4.6641845703125, 4.83343505859375, 5.002685546875, 5.17193603515625, 5.3411865234375, 5.51043701171875, 5.6796875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 4.0, 9.0, 16.0, 38.0, 54.0, 90.0, 202.0, 472.0, 1333.0, 4617.0, 19593.0, 126986.0, 621397.0, 232091.0, 31879.0, 6789.0, 1877.0, 604.0, 231.0, 109.0, 66.0, 31.0, 21.0, 12.0, 11.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.431640625, -3.292388916015625, -3.15313720703125, -3.013885498046875, -2.8746337890625, -2.735382080078125, -2.59613037109375, -2.456878662109375, -2.317626953125, -2.178375244140625, -2.03912353515625, -1.899871826171875, -1.7606201171875, -1.621368408203125, -1.48211669921875, -1.342864990234375, -1.20361328125, -1.064361572265625, -0.92510986328125, -0.785858154296875, -0.6466064453125, -0.507354736328125, -0.36810302734375, -0.228851318359375, -0.089599609375, 0.049652099609375, 0.18890380859375, 0.328155517578125, 0.4674072265625, 0.606658935546875, 0.74591064453125, 0.885162353515625, 1.0244140625, 1.163665771484375, 1.30291748046875, 1.442169189453125, 1.5814208984375, 1.720672607421875, 1.85992431640625, 1.999176025390625, 2.138427734375, 2.277679443359375, 2.41693115234375, 2.556182861328125, 2.6954345703125, 2.834686279296875, 2.97393798828125, 3.113189697265625, 3.25244140625, 3.391693115234375, 3.53094482421875, 3.670196533203125, 3.8094482421875, 3.948699951171875, 4.08795166015625, 4.227203369140625, 4.366455078125, 4.505706787109375, 4.64495849609375, 4.784210205078125, 4.9234619140625, 5.062713623046875, 5.20196533203125, 5.341217041015625, 5.48046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 11.0, 10.0, 12.0, 11.0, 13.0, 26.0, 34.0, 37.0, 47.0, 83.0, 95.0, 128.0, 114.0, 104.0, 73.0, 42.0, 31.0, 32.0, 33.0, 21.0, 17.0, 12.0, 3.0, 9.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004596710205078125, -0.000444754958152771, -0.0004298388957977295, -0.000414922833442688, -0.0004000067710876465, -0.000385090708732605, -0.0003701746463775635, -0.00035525858402252197, -0.00034034252166748047, -0.00032542645931243896, -0.00031051039695739746, -0.00029559433460235596, -0.00028067827224731445, -0.00026576220989227295, -0.00025084614753723145, -0.00023593008518218994, -0.00022101402282714844, -0.00020609796047210693, -0.00019118189811706543, -0.00017626583576202393, -0.00016134977340698242, -0.00014643371105194092, -0.00013151764869689941, -0.00011660158634185791, -0.0001016855239868164, -8.67694616317749e-05, -7.18533992767334e-05, -5.6937336921691895e-05, -4.202127456665039e-05, -2.7105212211608887e-05, -1.2189149856567383e-05, 2.726912498474121e-06, 1.7642974853515625e-05, 3.255903720855713e-05, 4.747509956359863e-05, 6.239116191864014e-05, 7.730722427368164e-05, 9.222328662872314e-05, 0.00010713934898376465, 0.00012205541133880615, 0.00013697147369384766, 0.00015188753604888916, 0.00016680359840393066, 0.00018171966075897217, 0.00019663572311401367, 0.00021155178546905518, 0.00022646784782409668, 0.00024138391017913818, 0.0002562999725341797, 0.0002712160348892212, 0.0002861320972442627, 0.0003010481595993042, 0.0003159642219543457, 0.0003308802843093872, 0.0003457963466644287, 0.0003607124090194702, 0.0003756284713745117, 0.0003905445337295532, 0.0004054605960845947, 0.00042037665843963623, 0.00043529272079467773, 0.00045020878314971924, 0.00046512484550476074, 0.00048004090785980225, 0.0004949569702148438]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 13.0, 7.0, 12.0, 16.0, 39.0, 48.0, 86.0, 136.0, 277.0, 540.0, 1152.0, 3022.0, 9338.0, 40095.0, 256451.0, 584762.0, 121229.0, 21770.0, 5612.0, 2098.0, 872.0, 418.0, 229.0, 117.0, 80.0, 52.0, 26.0, 19.0, 12.0, 10.0, 5.0, 5.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.5859375, -4.4630126953125, -4.340087890625, -4.2171630859375, -4.09423828125, -3.9713134765625, -3.848388671875, -3.7254638671875, -3.6025390625, -3.4796142578125, -3.356689453125, -3.2337646484375, -3.11083984375, -2.9879150390625, -2.864990234375, -2.7420654296875, -2.619140625, -2.4962158203125, -2.373291015625, -2.2503662109375, -2.12744140625, -2.0045166015625, -1.881591796875, -1.7586669921875, -1.6357421875, -1.5128173828125, -1.389892578125, -1.2669677734375, -1.14404296875, -1.0211181640625, -0.898193359375, -0.7752685546875, -0.65234375, -0.5294189453125, -0.406494140625, -0.2835693359375, -0.16064453125, -0.0377197265625, 0.085205078125, 0.2081298828125, 0.3310546875, 0.4539794921875, 0.576904296875, 0.6998291015625, 0.82275390625, 0.9456787109375, 1.068603515625, 1.1915283203125, 1.314453125, 1.4373779296875, 1.560302734375, 1.6832275390625, 1.80615234375, 1.9290771484375, 2.052001953125, 2.1749267578125, 2.2978515625, 2.4207763671875, 2.543701171875, 2.6666259765625, 2.78955078125, 2.9124755859375, 3.035400390625, 3.1583251953125, 3.28125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 8.0, 9.0, 11.0, 24.0, 29.0, 47.0, 74.0, 99.0, 116.0, 128.0, 128.0, 103.0, 90.0, 43.0, 36.0, 20.0, 15.0, 10.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.60546875, -5.470428466796875, -5.33538818359375, -5.200347900390625, -5.0653076171875, -4.930267333984375, -4.79522705078125, -4.660186767578125, -4.525146484375, -4.390106201171875, -4.25506591796875, -4.120025634765625, -3.9849853515625, -3.849945068359375, -3.71490478515625, -3.579864501953125, -3.44482421875, -3.309783935546875, -3.17474365234375, -3.039703369140625, -2.9046630859375, -2.769622802734375, -2.63458251953125, -2.499542236328125, -2.364501953125, -2.229461669921875, -2.09442138671875, -1.959381103515625, -1.8243408203125, -1.689300537109375, -1.55426025390625, -1.419219970703125, -1.2841796875, -1.149139404296875, -1.01409912109375, -0.879058837890625, -0.7440185546875, -0.608978271484375, -0.47393798828125, -0.338897705078125, -0.203857421875, -0.068817138671875, 0.06622314453125, 0.201263427734375, 0.3363037109375, 0.471343994140625, 0.60638427734375, 0.741424560546875, 0.87646484375, 1.011505126953125, 1.14654541015625, 1.281585693359375, 1.4166259765625, 1.551666259765625, 1.68670654296875, 1.821746826171875, 1.956787109375, 2.091827392578125, 2.22686767578125, 2.361907958984375, 2.4969482421875, 2.631988525390625, 2.76702880859375, 2.902069091796875, 3.037109375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 23.0, 43.0, 135.0, 236.0, 268.0, 171.0, 81.0, 21.0, 14.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.855140686035156, -34.44108200073242, -32.02701950073242, -29.612960815429688, -27.19890022277832, -24.784839630126953, -22.37078094482422, -19.95672035217285, -17.542659759521484, -15.128599166870117, -12.714539527893066, -10.300479888916016, -7.886419296264648, -5.472358703613281, -3.0582990646362305, -0.6442394256591797, 1.7698211669921875, 4.1838812828063965, 6.5979413986206055, 9.012001037597656, 11.426061630249023, 13.84012222290039, 16.254180908203125, 18.668241500854492, 21.08230209350586, 23.496362686157227, 25.910423278808594, 28.324481964111328, 30.738542556762695, 33.15260314941406, 35.5666618347168, 37.98072052001953, 40.39478302001953, 42.808841705322266, 45.222904205322266, 47.636962890625, 50.051025390625, 52.465084075927734, 54.87914276123047, 57.29320526123047, 59.7072639465332, 62.12132263183594, 64.53538513183594, 66.94944763183594, 69.3635025024414, 71.7775650024414, 74.1916275024414, 76.60568237304688, 79.01974487304688, 81.43380737304688, 83.84786224365234, 86.26192474365234, 88.67598724365234, 91.09004211425781, 93.50410461425781, 95.91816711425781, 98.33222961425781, 100.74629211425781, 103.16034698486328, 105.57440948486328, 107.98847198486328, 110.40252685546875, 112.81658935546875, 115.23065185546875, 117.64470672607422]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 0.0, 4.0, 4.0, 7.0, 7.0, 5.0, 5.0, 10.0, 9.0, 11.0, 17.0, 22.0, 18.0, 32.0, 27.0, 39.0, 38.0, 51.0, 37.0, 55.0, 35.0, 50.0, 55.0, 68.0, 44.0, 51.0, 44.0, 40.0, 38.0, 26.0, 23.0, 22.0, 22.0, 23.0, 17.0, 7.0, 9.0, 9.0, 4.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-39.85997009277344, -38.75135803222656, -37.64274215698242, -36.53412628173828, -35.425514221191406, -34.31690216064453, -33.20828628540039, -32.09967041015625, -30.991058349609375, -29.882444381713867, -28.77383041381836, -27.66521644592285, -26.556602478027344, -25.447988510131836, -24.339374542236328, -23.23076057434082, -22.122146606445312, -21.013532638549805, -19.904918670654297, -18.79630470275879, -17.68769073486328, -16.579076766967773, -15.470462799072266, -14.361848831176758, -13.25323486328125, -12.144620895385742, -11.036006927490234, -9.927392959594727, -8.818778991699219, -7.710165023803711, -6.601551055908203, -5.492937088012695, -4.38432502746582, -3.2757110595703125, -2.1670970916748047, -1.0584831237792969, 0.05013084411621094, 1.1587448120117188, 2.2673587799072266, 3.3759727478027344, 4.484586715698242, 5.59320068359375, 6.701814651489258, 7.810428619384766, 8.919042587280273, 10.027656555175781, 11.136270523071289, 12.244884490966797, 13.353498458862305, 14.462112426757812, 15.57072639465332, 16.679340362548828, 17.787954330444336, 18.896568298339844, 20.00518226623535, 21.11379623413086, 22.222410202026367, 23.331024169921875, 24.439638137817383, 25.54825210571289, 26.6568660736084, 27.765480041503906, 28.874094009399414, 29.982707977294922, 31.09132194519043]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 8.0, 11.0, 15.0, 18.0, 38.0, 48.0, 69.0, 107.0, 178.0, 233.0, 408.0, 690.0, 1198.0, 2357.0, 5226.0, 13548.0, 44144.0, 246617.0, 3397805.0, 394318.0, 58403.0, 16982.0, 6098.0, 2698.0, 1311.0, 649.0, 399.0, 254.0, 147.0, 96.0, 62.0, 35.0, 29.0, 26.0, 13.0, 5.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.4453125, -6.1934814453125, -5.941650390625, -5.6898193359375, -5.43798828125, -5.1861572265625, -4.934326171875, -4.6824951171875, -4.4306640625, -4.1788330078125, -3.927001953125, -3.6751708984375, -3.42333984375, -3.1715087890625, -2.919677734375, -2.6678466796875, -2.416015625, -2.1641845703125, -1.912353515625, -1.6605224609375, -1.40869140625, -1.1568603515625, -0.905029296875, -0.6531982421875, -0.4013671875, -0.1495361328125, 0.102294921875, 0.3541259765625, 0.60595703125, 0.8577880859375, 1.109619140625, 1.3614501953125, 1.61328125, 1.8651123046875, 2.116943359375, 2.3687744140625, 2.62060546875, 2.8724365234375, 3.124267578125, 3.3760986328125, 3.6279296875, 3.8797607421875, 4.131591796875, 4.3834228515625, 4.63525390625, 4.8870849609375, 5.138916015625, 5.3907470703125, 5.642578125, 5.8944091796875, 6.146240234375, 6.3980712890625, 6.64990234375, 6.9017333984375, 7.153564453125, 7.4053955078125, 7.6572265625, 7.9090576171875, 8.160888671875, 8.4127197265625, 8.66455078125, 8.9163818359375, 9.168212890625, 9.4200439453125, 9.671875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 13.0, 16.0, 15.0, 16.0, 36.0, 38.0, 44.0, 53.0, 52.0, 62.0, 58.0, 80.0, 67.0, 73.0, 74.0, 56.0, 51.0, 37.0, 47.0, 24.0, 19.0, 21.0, 20.0, 10.0, 9.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7470703125, -1.6775970458984375, -1.608123779296875, -1.5386505126953125, -1.46917724609375, -1.3997039794921875, -1.330230712890625, -1.2607574462890625, -1.1912841796875, -1.1218109130859375, -1.052337646484375, -0.9828643798828125, -0.91339111328125, -0.8439178466796875, -0.774444580078125, -0.7049713134765625, -0.635498046875, -0.5660247802734375, -0.496551513671875, -0.4270782470703125, -0.35760498046875, -0.2881317138671875, -0.218658447265625, -0.1491851806640625, -0.0797119140625, -0.0102386474609375, 0.059234619140625, 0.1287078857421875, 0.19818115234375, 0.2676544189453125, 0.337127685546875, 0.4066009521484375, 0.47607421875, 0.5455474853515625, 0.615020751953125, 0.6844940185546875, 0.75396728515625, 0.8234405517578125, 0.892913818359375, 0.9623870849609375, 1.0318603515625, 1.1013336181640625, 1.170806884765625, 1.2402801513671875, 1.30975341796875, 1.3792266845703125, 1.448699951171875, 1.5181732177734375, 1.587646484375, 1.6571197509765625, 1.726593017578125, 1.7960662841796875, 1.86553955078125, 1.9350128173828125, 2.004486083984375, 2.0739593505859375, 2.1434326171875, 2.2129058837890625, 2.282379150390625, 2.3518524169921875, 2.42132568359375, 2.4907989501953125, 2.560272216796875, 2.6297454833984375, 2.69921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 3.0, 3.0, 5.0, 11.0, 13.0, 21.0, 47.0, 73.0, 121.0, 163.0, 315.0, 606.0, 1125.0, 2404.0, 5910.0, 19940.0, 103286.0, 1242626.0, 2614264.0, 162519.0, 27905.0, 7476.0, 2785.0, 1234.0, 590.0, 341.0, 193.0, 109.0, 65.0, 43.0, 19.0, 19.0, 10.0, 14.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.6328125, -5.4393310546875, -5.245849609375, -5.0523681640625, -4.85888671875, -4.6654052734375, -4.471923828125, -4.2784423828125, -4.0849609375, -3.8914794921875, -3.697998046875, -3.5045166015625, -3.31103515625, -3.1175537109375, -2.924072265625, -2.7305908203125, -2.537109375, -2.3436279296875, -2.150146484375, -1.9566650390625, -1.76318359375, -1.5697021484375, -1.376220703125, -1.1827392578125, -0.9892578125, -0.7957763671875, -0.602294921875, -0.4088134765625, -0.21533203125, -0.0218505859375, 0.171630859375, 0.3651123046875, 0.55859375, 0.7520751953125, 0.945556640625, 1.1390380859375, 1.33251953125, 1.5260009765625, 1.719482421875, 1.9129638671875, 2.1064453125, 2.2999267578125, 2.493408203125, 2.6868896484375, 2.88037109375, 3.0738525390625, 3.267333984375, 3.4608154296875, 3.654296875, 3.8477783203125, 4.041259765625, 4.2347412109375, 4.42822265625, 4.6217041015625, 4.815185546875, 5.0086669921875, 5.2021484375, 5.3956298828125, 5.589111328125, 5.7825927734375, 5.97607421875, 6.1695556640625, 6.363037109375, 6.5565185546875, 6.75]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 9.0, 10.0, 6.0, 18.0, 33.0, 49.0, 69.0, 142.0, 256.0, 502.0, 1268.0, 795.0, 407.0, 210.0, 109.0, 64.0, 36.0, 23.0, 19.0, 11.0, 7.0, 4.0, 4.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6640625, -3.558837890625, -3.45361328125, -3.348388671875, -3.2431640625, -3.137939453125, -3.03271484375, -2.927490234375, -2.822265625, -2.717041015625, -2.61181640625, -2.506591796875, -2.4013671875, -2.296142578125, -2.19091796875, -2.085693359375, -1.98046875, -1.875244140625, -1.77001953125, -1.664794921875, -1.5595703125, -1.454345703125, -1.34912109375, -1.243896484375, -1.138671875, -1.033447265625, -0.92822265625, -0.822998046875, -0.7177734375, -0.612548828125, -0.50732421875, -0.402099609375, -0.296875, -0.191650390625, -0.08642578125, 0.018798828125, 0.1240234375, 0.229248046875, 0.33447265625, 0.439697265625, 0.544921875, 0.650146484375, 0.75537109375, 0.860595703125, 0.9658203125, 1.071044921875, 1.17626953125, 1.281494140625, 1.38671875, 1.491943359375, 1.59716796875, 1.702392578125, 1.8076171875, 1.912841796875, 2.01806640625, 2.123291015625, 2.228515625, 2.333740234375, 2.43896484375, 2.544189453125, 2.6494140625, 2.754638671875, 2.85986328125, 2.965087890625, 3.0703125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 6.0, 5.0, 20.0, 50.0, 143.0, 291.0, 290.0, 137.0, 52.0, 9.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.51091003417969, -34.19767379760742, -32.88444137573242, -31.571205139160156, -30.257970809936523, -28.94473648071289, -27.631502151489258, -26.318267822265625, -25.00503158569336, -23.691797256469727, -22.378562927246094, -21.065326690673828, -19.752092361450195, -18.438858032226562, -17.12562370300293, -15.81238842010498, -14.499155044555664, -13.185920715332031, -11.872685432434082, -10.55945110321045, -9.2462158203125, -7.932981491088867, -6.619747161865234, -5.306511878967285, -3.9932775497436523, -2.6800427436828613, -1.3668081760406494, -0.0535736083984375, 1.2596611976623535, 2.5728960037231445, 3.8861303329467773, 5.199365615844727, 6.512599945068359, 7.82583475112915, 9.139069557189941, 10.452303886413574, 11.765539169311523, 13.078773498535156, 14.392007827758789, 15.705243110656738, 17.018478393554688, 18.33171272277832, 19.644947052001953, 20.95818328857422, 22.27141761779785, 23.584651947021484, 24.897886276245117, 26.21112060546875, 27.524354934692383, 28.837589263916016, 30.15082359313965, 31.46405792236328, 32.77729415893555, 34.09053039550781, 35.40376281738281, 36.71699905395508, 38.03023147583008, 39.343467712402344, 40.656700134277344, 41.96993637084961, 43.28316879272461, 44.596405029296875, 45.909637451171875, 47.22287368774414, 48.536109924316406]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 5.0, 5.0, 11.0, 8.0, 13.0, 18.0, 22.0, 31.0, 25.0, 35.0, 39.0, 36.0, 59.0, 48.0, 54.0, 55.0, 48.0, 62.0, 51.0, 63.0, 51.0, 46.0, 38.0, 30.0, 24.0, 24.0, 24.0, 29.0, 21.0, 12.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.892335891723633, -11.476560592651367, -11.060786247253418, -10.645010948181152, -10.229236602783203, -9.813461303710938, -9.397686004638672, -8.981910705566406, -8.566136360168457, -8.150361061096191, -7.734586715698242, -7.318811416625977, -6.903036594390869, -6.487261772155762, -6.071486473083496, -5.655711650848389, -5.239936828613281, -4.824162006378174, -4.408387184143066, -3.992611885070801, -3.5768370628356934, -3.161062240600586, -2.7452871799468994, -2.329512119293213, -1.9137372970581055, -1.4979623556137085, -1.0821874141693115, -0.6664124727249146, -0.2506375312805176, 0.16513729095458984, 0.5809123516082764, 0.9966874122619629, 1.412461280822754, 1.8282362222671509, 2.244011163711548, 2.6597862243652344, 3.075561046600342, 3.491335868835449, 3.9071109294891357, 4.322885990142822, 4.73866081237793, 5.154435634613037, 5.5702104568481445, 5.98598575592041, 6.401760578155518, 6.817535400390625, 7.233310699462891, 7.649085521697998, 8.064860343933105, 8.480635643005371, 8.89640998840332, 9.312185287475586, 9.727960586547852, 10.1437349319458, 10.559510231018066, 10.975284576416016, 11.391059875488281, 11.806835174560547, 12.222609519958496, 12.638384819030762, 13.054159164428711, 13.469934463500977, 13.885709762573242, 14.301485061645508, 14.717259407043457]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 3.0, 5.0, 12.0, 20.0, 26.0, 35.0, 42.0, 77.0, 118.0, 169.0, 249.0, 397.0, 678.0, 1381.0, 2480.0, 6086.0, 15809.0, 51064.0, 199603.0, 559250.0, 148448.0, 39530.0, 12855.0, 5106.0, 2341.0, 1126.0, 644.0, 364.0, 226.0, 128.0, 94.0, 52.0, 35.0, 25.0, 21.0, 16.0, 8.0, 7.0, 10.0, 5.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.91015625, -5.6944580078125, -5.478759765625, -5.2630615234375, -5.04736328125, -4.8316650390625, -4.615966796875, -4.4002685546875, -4.1845703125, -3.9688720703125, -3.753173828125, -3.5374755859375, -3.32177734375, -3.1060791015625, -2.890380859375, -2.6746826171875, -2.458984375, -2.2432861328125, -2.027587890625, -1.8118896484375, -1.59619140625, -1.3804931640625, -1.164794921875, -0.9490966796875, -0.7333984375, -0.5177001953125, -0.302001953125, -0.0863037109375, 0.12939453125, 0.3450927734375, 0.560791015625, 0.7764892578125, 0.9921875, 1.2078857421875, 1.423583984375, 1.6392822265625, 1.85498046875, 2.0706787109375, 2.286376953125, 2.5020751953125, 2.7177734375, 2.9334716796875, 3.149169921875, 3.3648681640625, 3.58056640625, 3.7962646484375, 4.011962890625, 4.2276611328125, 4.443359375, 4.6590576171875, 4.874755859375, 5.0904541015625, 5.30615234375, 5.5218505859375, 5.737548828125, 5.9532470703125, 6.1689453125, 6.3846435546875, 6.600341796875, 6.8160400390625, 7.03173828125, 7.2474365234375, 7.463134765625, 7.6788330078125, 7.89453125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 16.0, 4.0, 14.0, 22.0, 32.0, 38.0, 41.0, 44.0, 61.0, 58.0, 51.0, 69.0, 56.0, 81.0, 69.0, 53.0, 53.0, 50.0, 44.0, 30.0, 28.0, 20.0, 19.0, 18.0, 12.0, 6.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6982421875, -1.6321258544921875, -1.566009521484375, -1.4998931884765625, -1.43377685546875, -1.3676605224609375, -1.301544189453125, -1.2354278564453125, -1.1693115234375, -1.1031951904296875, -1.037078857421875, -0.9709625244140625, -0.90484619140625, -0.8387298583984375, -0.772613525390625, -0.7064971923828125, -0.640380859375, -0.5742645263671875, -0.508148193359375, -0.4420318603515625, -0.37591552734375, -0.3097991943359375, -0.243682861328125, -0.1775665283203125, -0.1114501953125, -0.0453338623046875, 0.020782470703125, 0.0868988037109375, 0.15301513671875, 0.2191314697265625, 0.285247802734375, 0.3513641357421875, 0.41748046875, 0.4835968017578125, 0.549713134765625, 0.6158294677734375, 0.68194580078125, 0.7480621337890625, 0.814178466796875, 0.8802947998046875, 0.9464111328125, 1.0125274658203125, 1.078643798828125, 1.1447601318359375, 1.21087646484375, 1.2769927978515625, 1.343109130859375, 1.4092254638671875, 1.475341796875, 1.5414581298828125, 1.607574462890625, 1.6736907958984375, 1.73980712890625, 1.8059234619140625, 1.872039794921875, 1.9381561279296875, 2.0042724609375, 2.0703887939453125, 2.136505126953125, 2.2026214599609375, 2.26873779296875, 2.3348541259765625, 2.400970458984375, 2.4670867919921875, 2.533203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 17.0, 7.0, 16.0, 20.0, 29.0, 41.0, 66.0, 78.0, 87.0, 132.0, 205.0, 333.0, 529.0, 1016.0, 2222.0, 6411.0, 24378.0, 115598.0, 613918.0, 224992.0, 41657.0, 10343.0, 3245.0, 1363.0, 673.0, 359.0, 265.0, 158.0, 101.0, 70.0, 51.0, 27.0, 27.0, 27.0, 19.0, 16.0, 11.0, 9.0, 4.0, 2.0, 4.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.328125, -6.1075439453125, -5.886962890625, -5.6663818359375, -5.44580078125, -5.2252197265625, -5.004638671875, -4.7840576171875, -4.5634765625, -4.3428955078125, -4.122314453125, -3.9017333984375, -3.68115234375, -3.4605712890625, -3.239990234375, -3.0194091796875, -2.798828125, -2.5782470703125, -2.357666015625, -2.1370849609375, -1.91650390625, -1.6959228515625, -1.475341796875, -1.2547607421875, -1.0341796875, -0.8135986328125, -0.593017578125, -0.3724365234375, -0.15185546875, 0.0687255859375, 0.289306640625, 0.5098876953125, 0.73046875, 0.9510498046875, 1.171630859375, 1.3922119140625, 1.61279296875, 1.8333740234375, 2.053955078125, 2.2745361328125, 2.4951171875, 2.7156982421875, 2.936279296875, 3.1568603515625, 3.37744140625, 3.5980224609375, 3.818603515625, 4.0391845703125, 4.259765625, 4.4803466796875, 4.700927734375, 4.9215087890625, 5.14208984375, 5.3626708984375, 5.583251953125, 5.8038330078125, 6.0244140625, 6.2449951171875, 6.465576171875, 6.6861572265625, 6.90673828125, 7.1273193359375, 7.347900390625, 7.5684814453125, 7.7890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 6.0, 12.0, 11.0, 12.0, 21.0, 21.0, 24.0, 30.0, 21.0, 37.0, 29.0, 42.0, 50.0, 52.0, 55.0, 52.0, 70.0, 47.0, 71.0, 48.0, 43.0, 36.0, 23.0, 37.0, 23.0, 25.0, 17.0, 18.0, 15.0, 7.0, 9.0, 7.0, 5.0, 1.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.5, -7.2613525390625, -7.022705078125, -6.7840576171875, -6.54541015625, -6.3067626953125, -6.068115234375, -5.8294677734375, -5.5908203125, -5.3521728515625, -5.113525390625, -4.8748779296875, -4.63623046875, -4.3975830078125, -4.158935546875, -3.9202880859375, -3.681640625, -3.4429931640625, -3.204345703125, -2.9656982421875, -2.72705078125, -2.4884033203125, -2.249755859375, -2.0111083984375, -1.7724609375, -1.5338134765625, -1.295166015625, -1.0565185546875, -0.81787109375, -0.5792236328125, -0.340576171875, -0.1019287109375, 0.13671875, 0.3753662109375, 0.614013671875, 0.8526611328125, 1.09130859375, 1.3299560546875, 1.568603515625, 1.8072509765625, 2.0458984375, 2.2845458984375, 2.523193359375, 2.7618408203125, 3.00048828125, 3.2391357421875, 3.477783203125, 3.7164306640625, 3.955078125, 4.1937255859375, 4.432373046875, 4.6710205078125, 4.90966796875, 5.1483154296875, 5.386962890625, 5.6256103515625, 5.8642578125, 6.1029052734375, 6.341552734375, 6.5802001953125, 6.81884765625, 7.0574951171875, 7.296142578125, 7.5347900390625, 7.7734375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 6.0, 14.0, 20.0, 24.0, 83.0, 186.0, 501.0, 6765.0, 1027267.0, 12615.0, 663.0, 243.0, 99.0, 39.0, 11.0, 4.0, 7.0, 6.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.734375, -26.954833984375, -26.17529296875, -25.395751953125, -24.6162109375, -23.836669921875, -23.05712890625, -22.277587890625, -21.498046875, -20.718505859375, -19.93896484375, -19.159423828125, -18.3798828125, -17.600341796875, -16.82080078125, -16.041259765625, -15.26171875, -14.482177734375, -13.70263671875, -12.923095703125, -12.1435546875, -11.364013671875, -10.58447265625, -9.804931640625, -9.025390625, -8.245849609375, -7.46630859375, -6.686767578125, -5.9072265625, -5.127685546875, -4.34814453125, -3.568603515625, -2.7890625, -2.009521484375, -1.22998046875, -0.450439453125, 0.3291015625, 1.108642578125, 1.88818359375, 2.667724609375, 3.447265625, 4.226806640625, 5.00634765625, 5.785888671875, 6.5654296875, 7.344970703125, 8.12451171875, 8.904052734375, 9.68359375, 10.463134765625, 11.24267578125, 12.022216796875, 12.8017578125, 13.581298828125, 14.36083984375, 15.140380859375, 15.919921875, 16.699462890625, 17.47900390625, 18.258544921875, 19.0380859375, 19.817626953125, 20.59716796875, 21.376708984375, 22.15625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 6.0, 6.0, 3.0, 12.0, 13.0, 23.0, 26.0, 27.0, 70.0, 234.0, 325.0, 100.0, 49.0, 34.0, 19.0, 19.0, 15.0, 13.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005517005920410156, -0.0005268529057502747, -0.0005020052194595337, -0.0004771575331687927, -0.00045230984687805176, -0.0004274621605873108, -0.0004026144742965698, -0.00037776678800582886, -0.0003529191017150879, -0.0003280714154243469, -0.00030322372913360596, -0.000278376042842865, -0.000253528356552124, -0.00022868067026138306, -0.0002038329839706421, -0.00017898529767990112, -0.00015413761138916016, -0.0001292899250984192, -0.00010444223880767822, -7.959455251693726e-05, -5.474686622619629e-05, -2.9899179935455322e-05, -5.0514936447143555e-06, 1.979619264602661e-05, 4.464387893676758e-05, 6.949156522750854e-05, 9.433925151824951e-05, 0.00011918693780899048, 0.00014403462409973145, 0.0001688823103904724, 0.00019372999668121338, 0.00021857768297195435, 0.0002434253692626953, 0.0002682730555534363, 0.00029312074184417725, 0.0003179684281349182, 0.0003428161144256592, 0.00036766380071640015, 0.0003925114870071411, 0.0004173591732978821, 0.00044220685958862305, 0.000467054545879364, 0.000491902232170105, 0.000516749918460846, 0.0005415976047515869, 0.0005664452910423279, 0.0005912929773330688, 0.0006161406636238098, 0.0006409883499145508, 0.0006658360362052917, 0.0006906837224960327, 0.0007155314087867737, 0.0007403790950775146, 0.0007652267813682556, 0.0007900744676589966, 0.0008149221539497375, 0.0008397698402404785, 0.0008646175265312195, 0.0008894652128219604, 0.0009143128991127014, 0.0009391605854034424, 0.0009640082716941833, 0.0009888559579849243, 0.0010137036442756653, 0.0010385513305664062]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 9.0, 25.0, 58.0, 122.0, 237.0, 1156.0, 542735.0, 502621.0, 1096.0, 258.0, 131.0, 43.0, 28.0, 13.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.21875, -26.24658203125, -25.2744140625, -24.30224609375, -23.330078125, -22.35791015625, -21.3857421875, -20.41357421875, -19.44140625, -18.46923828125, -17.4970703125, -16.52490234375, -15.552734375, -14.58056640625, -13.6083984375, -12.63623046875, -11.6640625, -10.69189453125, -9.7197265625, -8.74755859375, -7.775390625, -6.80322265625, -5.8310546875, -4.85888671875, -3.88671875, -2.91455078125, -1.9423828125, -0.97021484375, 0.001953125, 0.97412109375, 1.9462890625, 2.91845703125, 3.890625, 4.86279296875, 5.8349609375, 6.80712890625, 7.779296875, 8.75146484375, 9.7236328125, 10.69580078125, 11.66796875, 12.64013671875, 13.6123046875, 14.58447265625, 15.556640625, 16.52880859375, 17.5009765625, 18.47314453125, 19.4453125, 20.41748046875, 21.3896484375, 22.36181640625, 23.333984375, 24.30615234375, 25.2783203125, 26.25048828125, 27.22265625, 28.19482421875, 29.1669921875, 30.13916015625, 31.111328125, 32.08349609375, 33.0556640625, 34.02783203125, 35.0]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 10.0, 63.0, 620.0, 276.0, 27.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.046875, -18.246337890625, -17.44580078125, -16.645263671875, -15.8447265625, -15.044189453125, -14.24365234375, -13.443115234375, -12.642578125, -11.842041015625, -11.04150390625, -10.240966796875, -9.4404296875, -8.639892578125, -7.83935546875, -7.038818359375, -6.23828125, -5.437744140625, -4.63720703125, -3.836669921875, -3.0361328125, -2.235595703125, -1.43505859375, -0.634521484375, 0.166015625, 0.966552734375, 1.76708984375, 2.567626953125, 3.3681640625, 4.168701171875, 4.96923828125, 5.769775390625, 6.5703125, 7.370849609375, 8.17138671875, 8.971923828125, 9.7724609375, 10.572998046875, 11.37353515625, 12.174072265625, 12.974609375, 13.775146484375, 14.57568359375, 15.376220703125, 16.1767578125, 16.977294921875, 17.77783203125, 18.578369140625, 19.37890625, 20.179443359375, 20.97998046875, 21.780517578125, 22.5810546875, 23.381591796875, 24.18212890625, 24.982666015625, 25.783203125, 26.583740234375, 27.38427734375, 28.184814453125, 28.9853515625, 29.785888671875, 30.58642578125, 31.386962890625, 32.1875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 23.0, 121.0, 452.0, 340.0, 48.0, 14.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.83174133300781, -61.25709915161133, -55.682456970214844, -50.107818603515625, -44.53317642211914, -38.958534240722656, -33.38389587402344, -27.809253692626953, -22.23461151123047, -16.659969329833984, -11.085329055786133, -5.510688781738281, 0.06395339965820312, 5.6385955810546875, 11.213233947753906, 16.78787612915039, 22.362518310546875, 27.93716049194336, 33.511802673339844, 39.08644104003906, 44.66108322143555, 50.23572540283203, 55.81036376953125, 61.385005950927734, 66.95964813232422, 72.53428649902344, 78.10893249511719, 83.6835708618164, 89.25820922851562, 94.83285522460938, 100.4074935913086, 105.98213195800781, 111.55679321289062, 117.13143157958984, 122.7060775756836, 128.2807159423828, 133.85536193847656, 139.42999267578125, 145.004638671875, 150.57928466796875, 156.1539306640625, 161.72857666015625, 167.30320739746094, 172.8778533935547, 178.45249938964844, 184.02713012695312, 189.60177612304688, 195.17642211914062, 200.7510528564453, 206.32569885253906, 211.90032958984375, 217.4749755859375, 223.04962158203125, 228.624267578125, 234.1988983154297, 239.77354431152344, 245.34817504882812, 250.92282104492188, 256.4974670410156, 262.07208251953125, 267.646728515625, 273.22137451171875, 278.7960205078125, 284.37066650390625, 289.9453125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 6.0, 3.0, 7.0, 10.0, 11.0, 22.0, 27.0, 30.0, 36.0, 45.0, 52.0, 53.0, 51.0, 55.0, 66.0, 61.0, 71.0, 50.0, 63.0, 45.0, 39.0, 45.0, 31.0, 34.0, 28.0, 11.0, 18.0, 10.0, 10.0, 10.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.340576171875, -37.86341094970703, -36.3862419128418, -34.90907287597656, -33.431907653808594, -31.954740524291992, -30.47757339477539, -29.00040626525879, -27.523239135742188, -26.046072006225586, -24.568904876708984, -23.091737747192383, -21.61457061767578, -20.13740348815918, -18.660236358642578, -17.183069229125977, -15.705902099609375, -14.228734970092773, -12.751567840576172, -11.27440071105957, -9.797233581542969, -8.320066452026367, -6.842899322509766, -5.365732192993164, -3.8885650634765625, -2.411397933959961, -0.9342308044433594, 0.5429363250732422, 2.0201034545898438, 3.4972705841064453, 4.974437713623047, 6.451604843139648, 7.928768157958984, 9.405935287475586, 10.883102416992188, 12.360269546508789, 13.83743667602539, 15.314603805541992, 16.791770935058594, 18.268938064575195, 19.746105194091797, 21.2232723236084, 22.700439453125, 24.1776065826416, 25.654773712158203, 27.131940841674805, 28.609107971191406, 30.086275100708008, 31.56344223022461, 33.040611267089844, 34.51777648925781, 35.99494171142578, 37.472110748291016, 38.94927978515625, 40.42644500732422, 41.90361022949219, 43.38077926635742, 44.857948303222656, 46.335113525390625, 47.812278747558594, 49.28944778442383, 50.76661682128906, 52.24378204345703, 53.720947265625, 55.198116302490234]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 6.0, 13.0, 24.0, 31.0, 65.0, 127.0, 247.0, 526.0, 1302.0, 3786.0, 14623.0, 99663.0, 3725706.0, 311002.0, 27881.0, 6193.0, 1810.0, 684.0, 302.0, 127.0, 67.0, 35.0, 25.0, 15.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8984375, -12.4639892578125, -12.029541015625, -11.5950927734375, -11.16064453125, -10.7261962890625, -10.291748046875, -9.8572998046875, -9.4228515625, -8.9884033203125, -8.553955078125, -8.1195068359375, -7.68505859375, -7.2506103515625, -6.816162109375, -6.3817138671875, -5.947265625, -5.5128173828125, -5.078369140625, -4.6439208984375, -4.20947265625, -3.7750244140625, -3.340576171875, -2.9061279296875, -2.4716796875, -2.0372314453125, -1.602783203125, -1.1683349609375, -0.73388671875, -0.2994384765625, 0.135009765625, 0.5694580078125, 1.00390625, 1.4383544921875, 1.872802734375, 2.3072509765625, 2.74169921875, 3.1761474609375, 3.610595703125, 4.0450439453125, 4.4794921875, 4.9139404296875, 5.348388671875, 5.7828369140625, 6.21728515625, 6.6517333984375, 7.086181640625, 7.5206298828125, 7.955078125, 8.3895263671875, 8.823974609375, 9.2584228515625, 9.69287109375, 10.1273193359375, 10.561767578125, 10.9962158203125, 11.4306640625, 11.8651123046875, 12.299560546875, 12.7340087890625, 13.16845703125, 13.6029052734375, 14.037353515625, 14.4718017578125, 14.90625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 8.0, 8.0, 17.0, 18.0, 16.0, 31.0, 53.0, 78.0, 50.0, 66.0, 75.0, 73.0, 66.0, 66.0, 67.0, 67.0, 60.0, 38.0, 42.0, 25.0, 21.0, 13.0, 8.0, 9.0, 12.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.236328125, -2.15673828125, -2.0771484375, -1.99755859375, -1.91796875, -1.83837890625, -1.7587890625, -1.67919921875, -1.599609375, -1.52001953125, -1.4404296875, -1.36083984375, -1.28125, -1.20166015625, -1.1220703125, -1.04248046875, -0.962890625, -0.88330078125, -0.8037109375, -0.72412109375, -0.64453125, -0.56494140625, -0.4853515625, -0.40576171875, -0.326171875, -0.24658203125, -0.1669921875, -0.08740234375, -0.0078125, 0.07177734375, 0.1513671875, 0.23095703125, 0.310546875, 0.39013671875, 0.4697265625, 0.54931640625, 0.62890625, 0.70849609375, 0.7880859375, 0.86767578125, 0.947265625, 1.02685546875, 1.1064453125, 1.18603515625, 1.265625, 1.34521484375, 1.4248046875, 1.50439453125, 1.583984375, 1.66357421875, 1.7431640625, 1.82275390625, 1.90234375, 1.98193359375, 2.0615234375, 2.14111328125, 2.220703125, 2.30029296875, 2.3798828125, 2.45947265625, 2.5390625, 2.61865234375, 2.6982421875, 2.77783203125, 2.857421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 7.0, 17.0, 18.0, 15.0, 28.0, 44.0, 57.0, 88.0, 106.0, 210.0, 370.0, 880.0, 3402.0, 22410.0, 551805.0, 3547103.0, 58398.0, 6680.0, 1499.0, 498.0, 243.0, 136.0, 87.0, 65.0, 39.0, 21.0, 19.0, 16.0, 3.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9375, -13.562744140625, -13.18798828125, -12.813232421875, -12.4384765625, -12.063720703125, -11.68896484375, -11.314208984375, -10.939453125, -10.564697265625, -10.18994140625, -9.815185546875, -9.4404296875, -9.065673828125, -8.69091796875, -8.316162109375, -7.94140625, -7.566650390625, -7.19189453125, -6.817138671875, -6.4423828125, -6.067626953125, -5.69287109375, -5.318115234375, -4.943359375, -4.568603515625, -4.19384765625, -3.819091796875, -3.4443359375, -3.069580078125, -2.69482421875, -2.320068359375, -1.9453125, -1.570556640625, -1.19580078125, -0.821044921875, -0.4462890625, -0.071533203125, 0.30322265625, 0.677978515625, 1.052734375, 1.427490234375, 1.80224609375, 2.177001953125, 2.5517578125, 2.926513671875, 3.30126953125, 3.676025390625, 4.05078125, 4.425537109375, 4.80029296875, 5.175048828125, 5.5498046875, 5.924560546875, 6.29931640625, 6.674072265625, 7.048828125, 7.423583984375, 7.79833984375, 8.173095703125, 8.5478515625, 8.922607421875, 9.29736328125, 9.672119140625, 10.046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 13.0, 28.0, 68.0, 140.0, 452.0, 2104.0, 835.0, 245.0, 94.0, 33.0, 22.0, 16.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0703125, -6.90069580078125, -6.7310791015625, -6.56146240234375, -6.391845703125, -6.22222900390625, -6.0526123046875, -5.88299560546875, -5.71337890625, -5.54376220703125, -5.3741455078125, -5.20452880859375, -5.034912109375, -4.86529541015625, -4.6956787109375, -4.52606201171875, -4.3564453125, -4.18682861328125, -4.0172119140625, -3.84759521484375, -3.677978515625, -3.50836181640625, -3.3387451171875, -3.16912841796875, -2.99951171875, -2.82989501953125, -2.6602783203125, -2.49066162109375, -2.321044921875, -2.15142822265625, -1.9818115234375, -1.81219482421875, -1.642578125, -1.47296142578125, -1.3033447265625, -1.13372802734375, -0.964111328125, -0.79449462890625, -0.6248779296875, -0.45526123046875, -0.28564453125, -0.11602783203125, 0.0535888671875, 0.22320556640625, 0.392822265625, 0.56243896484375, 0.7320556640625, 0.90167236328125, 1.0712890625, 1.24090576171875, 1.4105224609375, 1.58013916015625, 1.749755859375, 1.91937255859375, 2.0889892578125, 2.25860595703125, 2.42822265625, 2.59783935546875, 2.7674560546875, 2.93707275390625, 3.106689453125, 3.27630615234375, 3.4459228515625, 3.61553955078125, 3.78515625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 8.0, 15.0, 20.0, 38.0, 93.0, 166.0, 198.0, 199.0, 145.0, 61.0, 39.0, 10.0, 6.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.742679595947266, -36.914608001708984, -36.08654022216797, -35.25846862792969, -34.430397033691406, -33.602325439453125, -32.77425765991211, -31.946186065673828, -31.11811637878418, -30.29004669189453, -29.46197509765625, -28.6339054107666, -27.805835723876953, -26.977764129638672, -26.149694442749023, -25.321624755859375, -24.493553161621094, -23.665483474731445, -22.837411880493164, -22.009342193603516, -21.181270599365234, -20.353200912475586, -19.525131225585938, -18.697059631347656, -17.868989944458008, -17.04092025756836, -16.212848663330078, -15.38477897644043, -14.556708335876465, -13.7286376953125, -12.900568008422852, -12.072497367858887, -11.244428634643555, -10.41635799407959, -9.588287353515625, -8.760217666625977, -7.932147026062012, -7.104076385498047, -6.27600622177124, -5.447936058044434, -4.619865417480469, -3.791795015335083, -2.9637246131896973, -2.1356542110443115, -1.3075838088989258, -0.47951316833496094, 0.3485569953918457, 1.1766271591186523, 2.004697799682617, 2.832768201828003, 3.6608386039733887, 4.488908767700195, 5.31697940826416, 6.145050048828125, 6.973120212554932, 7.801190376281738, 8.629261016845703, 9.457331657409668, 10.285402297973633, 11.113471984863281, 11.941542625427246, 12.769613265991211, 13.59768295288086, 14.425753593444824, 15.253824234008789]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 6.0, 9.0, 9.0, 13.0, 11.0, 29.0, 25.0, 22.0, 24.0, 42.0, 26.0, 50.0, 53.0, 46.0, 58.0, 45.0, 40.0, 55.0, 43.0, 43.0, 48.0, 45.0, 33.0, 31.0, 26.0, 26.0, 24.0, 15.0, 22.0, 19.0, 25.0, 5.0, 7.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.333694458007812, -9.017455101013184, -8.701214790344238, -8.38497543334961, -8.068735122680664, -7.752495765686035, -7.436255931854248, -7.120016098022461, -6.803776741027832, -6.487536907196045, -6.171297073364258, -5.855057716369629, -5.538817882537842, -5.222578048706055, -4.906338214874268, -4.5900983810424805, -4.273858547210693, -3.9576187133789062, -3.6413791179656982, -3.325139284133911, -3.008899688720703, -2.692659854888916, -2.376420021057129, -2.060180425643921, -1.7439405918121338, -1.4277008771896362, -1.1114611625671387, -0.7952213287353516, -0.478981614112854, -0.16274189949035645, 0.15349793434143066, 0.46973752975463867, 0.7859773635864258, 1.1022170782089233, 1.418456792831421, 1.734696626663208, 2.050936222076416, 2.367176055908203, 2.6834158897399902, 2.9996554851531982, 3.3158953189849854, 3.6321351528167725, 3.9483747482299805, 4.264614582061768, 4.580854415893555, 4.897093772888184, 5.213334083557129, 5.529573440551758, 5.845813274383545, 6.162053108215332, 6.478292942047119, 6.794532775878906, 7.110772132873535, 7.427011966705322, 7.743251800537109, 8.059491157531738, 8.375731468200684, 8.691970825195312, 9.008211135864258, 9.324450492858887, 9.640690803527832, 9.956930160522461, 10.273170471191406, 10.589409828186035, 10.905649185180664]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 10.0, 16.0, 30.0, 38.0, 61.0, 114.0, 200.0, 359.0, 814.0, 2319.0, 8584.0, 49769.0, 478922.0, 447722.0, 47320.0, 8338.0, 2273.0, 807.0, 380.0, 198.0, 105.0, 63.0, 28.0, 23.0, 19.0, 12.0, 11.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.109375, -9.7606201171875, -9.411865234375, -9.0631103515625, -8.71435546875, -8.3656005859375, -8.016845703125, -7.6680908203125, -7.3193359375, -6.9705810546875, -6.621826171875, -6.2730712890625, -5.92431640625, -5.5755615234375, -5.226806640625, -4.8780517578125, -4.529296875, -4.1805419921875, -3.831787109375, -3.4830322265625, -3.13427734375, -2.7855224609375, -2.436767578125, -2.0880126953125, -1.7392578125, -1.3905029296875, -1.041748046875, -0.6929931640625, -0.34423828125, 0.0045166015625, 0.353271484375, 0.7020263671875, 1.05078125, 1.3995361328125, 1.748291015625, 2.0970458984375, 2.44580078125, 2.7945556640625, 3.143310546875, 3.4920654296875, 3.8408203125, 4.1895751953125, 4.538330078125, 4.8870849609375, 5.23583984375, 5.5845947265625, 5.933349609375, 6.2821044921875, 6.630859375, 6.9796142578125, 7.328369140625, 7.6771240234375, 8.02587890625, 8.3746337890625, 8.723388671875, 9.0721435546875, 9.4208984375, 9.7696533203125, 10.118408203125, 10.4671630859375, 10.81591796875, 11.1646728515625, 11.513427734375, 11.8621826171875, 12.2109375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 3.0, 5.0, 7.0, 8.0, 19.0, 19.0, 35.0, 38.0, 50.0, 59.0, 56.0, 76.0, 67.0, 78.0, 73.0, 76.0, 55.0, 68.0, 55.0, 42.0, 30.0, 25.0, 18.0, 10.0, 12.0, 6.0, 10.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.15625, -2.07574462890625, -1.9952392578125, -1.91473388671875, -1.834228515625, -1.75372314453125, -1.6732177734375, -1.59271240234375, -1.51220703125, -1.43170166015625, -1.3511962890625, -1.27069091796875, -1.190185546875, -1.10968017578125, -1.0291748046875, -0.94866943359375, -0.8681640625, -0.78765869140625, -0.7071533203125, -0.62664794921875, -0.546142578125, -0.46563720703125, -0.3851318359375, -0.30462646484375, -0.22412109375, -0.14361572265625, -0.0631103515625, 0.01739501953125, 0.097900390625, 0.17840576171875, 0.2589111328125, 0.33941650390625, 0.419921875, 0.50042724609375, 0.5809326171875, 0.66143798828125, 0.741943359375, 0.82244873046875, 0.9029541015625, 0.98345947265625, 1.06396484375, 1.14447021484375, 1.2249755859375, 1.30548095703125, 1.385986328125, 1.46649169921875, 1.5469970703125, 1.62750244140625, 1.7080078125, 1.78851318359375, 1.8690185546875, 1.94952392578125, 2.030029296875, 2.11053466796875, 2.1910400390625, 2.27154541015625, 2.35205078125, 2.43255615234375, 2.5130615234375, 2.59356689453125, 2.674072265625, 2.75457763671875, 2.8350830078125, 2.91558837890625, 2.99609375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 3.0, 14.0, 13.0, 38.0, 43.0, 63.0, 151.0, 263.0, 620.0, 1813.0, 10022.0, 103632.0, 812155.0, 106565.0, 10234.0, 1715.0, 626.0, 265.0, 147.0, 56.0, 48.0, 18.0, 13.0, 10.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8125, -9.46826171875, -9.1240234375, -8.77978515625, -8.435546875, -8.09130859375, -7.7470703125, -7.40283203125, -7.05859375, -6.71435546875, -6.3701171875, -6.02587890625, -5.681640625, -5.33740234375, -4.9931640625, -4.64892578125, -4.3046875, -3.96044921875, -3.6162109375, -3.27197265625, -2.927734375, -2.58349609375, -2.2392578125, -1.89501953125, -1.55078125, -1.20654296875, -0.8623046875, -0.51806640625, -0.173828125, 0.17041015625, 0.5146484375, 0.85888671875, 1.203125, 1.54736328125, 1.8916015625, 2.23583984375, 2.580078125, 2.92431640625, 3.2685546875, 3.61279296875, 3.95703125, 4.30126953125, 4.6455078125, 4.98974609375, 5.333984375, 5.67822265625, 6.0224609375, 6.36669921875, 6.7109375, 7.05517578125, 7.3994140625, 7.74365234375, 8.087890625, 8.43212890625, 8.7763671875, 9.12060546875, 9.46484375, 9.80908203125, 10.1533203125, 10.49755859375, 10.841796875, 11.18603515625, 11.5302734375, 11.87451171875, 12.21875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 9.0, 11.0, 19.0, 15.0, 22.0, 32.0, 30.0, 55.0, 49.0, 46.0, 51.0, 59.0, 58.0, 76.0, 56.0, 66.0, 50.0, 58.0, 39.0, 41.0, 30.0, 33.0, 27.0, 21.0, 12.0, 13.0, 5.0, 5.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0859375, -8.792724609375, -8.49951171875, -8.206298828125, -7.9130859375, -7.619873046875, -7.32666015625, -7.033447265625, -6.740234375, -6.447021484375, -6.15380859375, -5.860595703125, -5.5673828125, -5.274169921875, -4.98095703125, -4.687744140625, -4.39453125, -4.101318359375, -3.80810546875, -3.514892578125, -3.2216796875, -2.928466796875, -2.63525390625, -2.342041015625, -2.048828125, -1.755615234375, -1.46240234375, -1.169189453125, -0.8759765625, -0.582763671875, -0.28955078125, 0.003662109375, 0.296875, 0.590087890625, 0.88330078125, 1.176513671875, 1.4697265625, 1.762939453125, 2.05615234375, 2.349365234375, 2.642578125, 2.935791015625, 3.22900390625, 3.522216796875, 3.8154296875, 4.108642578125, 4.40185546875, 4.695068359375, 4.98828125, 5.281494140625, 5.57470703125, 5.867919921875, 6.1611328125, 6.454345703125, 6.74755859375, 7.040771484375, 7.333984375, 7.627197265625, 7.92041015625, 8.213623046875, 8.5068359375, 8.800048828125, 9.09326171875, 9.386474609375, 9.6796875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 9.0, 15.0, 20.0, 36.0, 84.0, 164.0, 465.0, 1596.0, 10027.0, 128010.0, 841000.0, 59672.0, 5764.0, 1070.0, 352.0, 131.0, 59.0, 33.0, 17.0, 10.0, 8.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.43359375, -4.26544189453125, -4.0972900390625, -3.92913818359375, -3.760986328125, -3.59283447265625, -3.4246826171875, -3.25653076171875, -3.08837890625, -2.92022705078125, -2.7520751953125, -2.58392333984375, -2.415771484375, -2.24761962890625, -2.0794677734375, -1.91131591796875, -1.7431640625, -1.57501220703125, -1.4068603515625, -1.23870849609375, -1.070556640625, -0.90240478515625, -0.7342529296875, -0.56610107421875, -0.39794921875, -0.22979736328125, -0.0616455078125, 0.10650634765625, 0.274658203125, 0.44281005859375, 0.6109619140625, 0.77911376953125, 0.947265625, 1.11541748046875, 1.2835693359375, 1.45172119140625, 1.619873046875, 1.78802490234375, 1.9561767578125, 2.12432861328125, 2.29248046875, 2.46063232421875, 2.6287841796875, 2.79693603515625, 2.965087890625, 3.13323974609375, 3.3013916015625, 3.46954345703125, 3.6376953125, 3.80584716796875, 3.9739990234375, 4.14215087890625, 4.310302734375, 4.47845458984375, 4.6466064453125, 4.81475830078125, 4.98291015625, 5.15106201171875, 5.3192138671875, 5.48736572265625, 5.655517578125, 5.82366943359375, 5.9918212890625, 6.15997314453125, 6.328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 10.0, 9.0, 6.0, 13.0, 11.0, 24.0, 34.0, 60.0, 99.0, 206.0, 192.0, 120.0, 54.0, 30.0, 23.0, 14.0, 15.0, 21.0, 7.0, 6.0, 3.0, 10.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005307197570800781, -0.0005167946219444275, -0.0005028694868087769, -0.0004889443516731262, -0.0004750192165374756, -0.00046109408140182495, -0.0004471689462661743, -0.0004332438111305237, -0.00041931867599487305, -0.0004053935408592224, -0.0003914684057235718, -0.00037754327058792114, -0.0003636181354522705, -0.0003496930003166199, -0.00033576786518096924, -0.0003218427300453186, -0.00030791759490966797, -0.00029399245977401733, -0.0002800673246383667, -0.00026614218950271606, -0.00025221705436706543, -0.0002382919192314148, -0.00022436678409576416, -0.00021044164896011353, -0.0001965165138244629, -0.00018259137868881226, -0.00016866624355316162, -0.00015474110841751099, -0.00014081597328186035, -0.00012689083814620972, -0.00011296570301055908, -9.904056787490845e-05, -8.511543273925781e-05, -7.119029760360718e-05, -5.726516246795654e-05, -4.334002733230591e-05, -2.9414892196655273e-05, -1.548975706100464e-05, -1.564621925354004e-06, 1.2360513210296631e-05, 2.6285648345947266e-05, 4.02107834815979e-05, 5.4135918617248535e-05, 6.806105375289917e-05, 8.19861888885498e-05, 9.591132402420044e-05, 0.00010983645915985107, 0.0001237615942955017, 0.00013768672943115234, 0.00015161186456680298, 0.0001655369997024536, 0.00017946213483810425, 0.00019338726997375488, 0.00020731240510940552, 0.00022123754024505615, 0.0002351626753807068, 0.0002490878105163574, 0.00026301294565200806, 0.0002769380807876587, 0.0002908632159233093, 0.00030478835105895996, 0.0003187134861946106, 0.00033263862133026123, 0.00034656375646591187, 0.0003604888916015625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 7.0, 11.0, 13.0, 17.0, 33.0, 54.0, 91.0, 168.0, 324.0, 646.0, 1457.0, 3856.0, 14678.0, 87937.0, 746023.0, 161869.0, 22492.0, 5404.0, 1874.0, 785.0, 383.0, 191.0, 88.0, 43.0, 35.0, 21.0, 9.0, 13.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-4.30078125, -4.183380126953125, -4.06597900390625, -3.948577880859375, -3.8311767578125, -3.713775634765625, -3.59637451171875, -3.478973388671875, -3.361572265625, -3.244171142578125, -3.12677001953125, -3.009368896484375, -2.8919677734375, -2.774566650390625, -2.65716552734375, -2.539764404296875, -2.42236328125, -2.304962158203125, -2.18756103515625, -2.070159912109375, -1.9527587890625, -1.835357666015625, -1.71795654296875, -1.600555419921875, -1.483154296875, -1.365753173828125, -1.24835205078125, -1.130950927734375, -1.0135498046875, -0.896148681640625, -0.77874755859375, -0.661346435546875, -0.5439453125, -0.426544189453125, -0.30914306640625, -0.191741943359375, -0.0743408203125, 0.043060302734375, 0.16046142578125, 0.277862548828125, 0.395263671875, 0.512664794921875, 0.63006591796875, 0.747467041015625, 0.8648681640625, 0.982269287109375, 1.09967041015625, 1.217071533203125, 1.33447265625, 1.451873779296875, 1.56927490234375, 1.686676025390625, 1.8040771484375, 1.921478271484375, 2.03887939453125, 2.156280517578125, 2.273681640625, 2.391082763671875, 2.50848388671875, 2.625885009765625, 2.7432861328125, 2.860687255859375, 2.97808837890625, 3.095489501953125, 3.212890625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 15.0, 11.0, 31.0, 33.0, 37.0, 60.0, 91.0, 105.0, 151.0, 138.0, 98.0, 83.0, 57.0, 26.0, 22.0, 10.0, 10.0, 7.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.09375, -3.96527099609375, -3.8367919921875, -3.70831298828125, -3.579833984375, -3.45135498046875, -3.3228759765625, -3.19439697265625, -3.06591796875, -2.93743896484375, -2.8089599609375, -2.68048095703125, -2.552001953125, -2.42352294921875, -2.2950439453125, -2.16656494140625, -2.0380859375, -1.90960693359375, -1.7811279296875, -1.65264892578125, -1.524169921875, -1.39569091796875, -1.2672119140625, -1.13873291015625, -1.01025390625, -0.88177490234375, -0.7532958984375, -0.62481689453125, -0.496337890625, -0.36785888671875, -0.2393798828125, -0.11090087890625, 0.017578125, 0.14605712890625, 0.2745361328125, 0.40301513671875, 0.531494140625, 0.65997314453125, 0.7884521484375, 0.91693115234375, 1.04541015625, 1.17388916015625, 1.3023681640625, 1.43084716796875, 1.559326171875, 1.68780517578125, 1.8162841796875, 1.94476318359375, 2.0732421875, 2.20172119140625, 2.3302001953125, 2.45867919921875, 2.587158203125, 2.71563720703125, 2.8441162109375, 2.97259521484375, 3.10107421875, 3.22955322265625, 3.3580322265625, 3.48651123046875, 3.614990234375, 3.74346923828125, 3.8719482421875, 4.00042724609375, 4.12890625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 45.0, 221.0, 464.0, 221.0, 37.0, 10.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.1803741455078, -164.7919158935547, -160.4034423828125, -156.01498413085938, -151.62652587890625, -147.23805236816406, -142.84959411621094, -138.4611358642578, -134.07266235351562, -129.6842041015625, -125.29573822021484, -120.90727233886719, -116.51880645751953, -112.13034057617188, -107.74188232421875, -103.3534164428711, -98.96495819091797, -94.57649230957031, -90.18803405761719, -85.79956817626953, -81.41110229492188, -77.02264404296875, -72.6341781616211, -68.24571228027344, -63.85725021362305, -59.468788146972656, -55.080322265625, -50.69186019897461, -46.30339813232422, -41.91493225097656, -37.52647018432617, -33.13800811767578, -28.749542236328125, -24.3610782623291, -19.972614288330078, -15.584152221679688, -11.195688247680664, -6.807224273681641, -2.41876220703125, 1.9697017669677734, 6.358165740966797, 10.74662971496582, 15.135092735290527, 19.523555755615234, 23.912019729614258, 28.30048370361328, 32.68894577026367, 37.07740783691406, 41.46587371826172, 45.85433578491211, 50.242801666259766, 54.631263732910156, 59.01972961425781, 63.4081916809082, 67.7966537475586, 72.18511962890625, 76.57357788085938, 80.96204376220703, 85.35050201416016, 89.73896789550781, 94.12743377685547, 98.51589965820312, 102.90435791015625, 107.2928237915039, 111.68128967285156]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 8.0, 8.0, 17.0, 14.0, 23.0, 29.0, 19.0, 21.0, 26.0, 38.0, 39.0, 54.0, 46.0, 42.0, 51.0, 46.0, 49.0, 52.0, 44.0, 35.0, 41.0, 37.0, 41.0, 32.0, 20.0, 26.0, 32.0, 20.0, 16.0, 15.0, 10.0, 9.0, 11.0, 8.0, 5.0, 2.0, 8.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.05866241455078, -33.87992477416992, -32.70118713378906, -31.52245330810547, -30.34371566772461, -29.16497802734375, -27.986242294311523, -26.807506561279297, -25.628768920898438, -24.450031280517578, -23.27129554748535, -22.092559814453125, -20.913822174072266, -19.735084533691406, -18.55634880065918, -17.377613067626953, -16.198875427246094, -15.02013874053955, -13.841402053833008, -12.662665367126465, -11.483928680419922, -10.305191993713379, -9.126455307006836, -7.947718620300293, -6.76898193359375, -5.590245246887207, -4.411508560180664, -3.232771873474121, -2.054035186767578, -0.8752985000610352, 0.3034381866455078, 1.4821748733520508, 2.6609115600585938, 3.8396482467651367, 5.01838493347168, 6.197121620178223, 7.375858306884766, 8.554594993591309, 9.733331680297852, 10.912068367004395, 12.090805053710938, 13.26954174041748, 14.448278427124023, 15.627015113830566, 16.80575180053711, 17.98448944091797, 19.163225173950195, 20.341960906982422, 21.52069854736328, 22.69943618774414, 23.878171920776367, 25.056907653808594, 26.235645294189453, 27.414382934570312, 28.59311866760254, 29.771854400634766, 30.950592041015625, 32.129329681396484, 33.308067321777344, 34.48680114746094, 35.6655387878418, 36.844276428222656, 38.02301025390625, 39.20174789428711, 40.38048553466797]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 9.0, 9.0, 12.0, 19.0, 26.0, 55.0, 79.0, 135.0, 160.0, 303.0, 550.0, 972.0, 1815.0, 3521.0, 7770.0, 20301.0, 67883.0, 544535.0, 3359990.0, 132517.0, 31957.0, 11315.0, 4865.0, 2435.0, 1233.0, 732.0, 408.0, 217.0, 155.0, 92.0, 71.0, 48.0, 20.0, 16.0, 16.0, 10.0, 11.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.2890625, -8.0146484375, -7.740234375, -7.4658203125, -7.19140625, -6.9169921875, -6.642578125, -6.3681640625, -6.09375, -5.8193359375, -5.544921875, -5.2705078125, -4.99609375, -4.7216796875, -4.447265625, -4.1728515625, -3.8984375, -3.6240234375, -3.349609375, -3.0751953125, -2.80078125, -2.5263671875, -2.251953125, -1.9775390625, -1.703125, -1.4287109375, -1.154296875, -0.8798828125, -0.60546875, -0.3310546875, -0.056640625, 0.2177734375, 0.4921875, 0.7666015625, 1.041015625, 1.3154296875, 1.58984375, 1.8642578125, 2.138671875, 2.4130859375, 2.6875, 2.9619140625, 3.236328125, 3.5107421875, 3.78515625, 4.0595703125, 4.333984375, 4.6083984375, 4.8828125, 5.1572265625, 5.431640625, 5.7060546875, 5.98046875, 6.2548828125, 6.529296875, 6.8037109375, 7.078125, 7.3525390625, 7.626953125, 7.9013671875, 8.17578125, 8.4501953125, 8.724609375, 8.9990234375, 9.2734375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 11.0, 12.0, 17.0, 16.0, 31.0, 43.0, 30.0, 48.0, 49.0, 78.0, 57.0, 66.0, 65.0, 68.0, 57.0, 75.0, 52.0, 48.0, 39.0, 32.0, 33.0, 25.0, 17.0, 5.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.02154541015625, -1.9454345703125, -1.86932373046875, -1.793212890625, -1.71710205078125, -1.6409912109375, -1.56488037109375, -1.48876953125, -1.41265869140625, -1.3365478515625, -1.26043701171875, -1.184326171875, -1.10821533203125, -1.0321044921875, -0.95599365234375, -0.8798828125, -0.80377197265625, -0.7276611328125, -0.65155029296875, -0.575439453125, -0.49932861328125, -0.4232177734375, -0.34710693359375, -0.27099609375, -0.19488525390625, -0.1187744140625, -0.04266357421875, 0.033447265625, 0.10955810546875, 0.1856689453125, 0.26177978515625, 0.337890625, 0.41400146484375, 0.4901123046875, 0.56622314453125, 0.642333984375, 0.71844482421875, 0.7945556640625, 0.87066650390625, 0.94677734375, 1.02288818359375, 1.0989990234375, 1.17510986328125, 1.251220703125, 1.32733154296875, 1.4034423828125, 1.47955322265625, 1.5556640625, 1.63177490234375, 1.7078857421875, 1.78399658203125, 1.860107421875, 1.93621826171875, 2.0123291015625, 2.08843994140625, 2.16455078125, 2.24066162109375, 2.3167724609375, 2.39288330078125, 2.468994140625, 2.54510498046875, 2.6212158203125, 2.69732666015625, 2.7734375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 7.0, 5.0, 8.0, 14.0, 8.0, 17.0, 28.0, 37.0, 25.0, 62.0, 88.0, 160.0, 232.0, 501.0, 958.0, 2272.0, 5506.0, 15808.0, 59941.0, 459835.0, 3418577.0, 178867.0, 34009.0, 10276.0, 3800.0, 1615.0, 706.0, 374.0, 184.0, 120.0, 78.0, 36.0, 31.0, 28.0, 21.0, 13.0, 12.0, 10.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.51171875, -6.28167724609375, -6.0516357421875, -5.82159423828125, -5.591552734375, -5.36151123046875, -5.1314697265625, -4.90142822265625, -4.67138671875, -4.44134521484375, -4.2113037109375, -3.98126220703125, -3.751220703125, -3.52117919921875, -3.2911376953125, -3.06109619140625, -2.8310546875, -2.60101318359375, -2.3709716796875, -2.14093017578125, -1.910888671875, -1.68084716796875, -1.4508056640625, -1.22076416015625, -0.99072265625, -0.76068115234375, -0.5306396484375, -0.30059814453125, -0.070556640625, 0.15948486328125, 0.3895263671875, 0.61956787109375, 0.849609375, 1.07965087890625, 1.3096923828125, 1.53973388671875, 1.769775390625, 1.99981689453125, 2.2298583984375, 2.45989990234375, 2.68994140625, 2.91998291015625, 3.1500244140625, 3.38006591796875, 3.610107421875, 3.84014892578125, 4.0701904296875, 4.30023193359375, 4.5302734375, 4.76031494140625, 4.9903564453125, 5.22039794921875, 5.450439453125, 5.68048095703125, 5.9105224609375, 6.14056396484375, 6.37060546875, 6.60064697265625, 6.8306884765625, 7.06072998046875, 7.290771484375, 7.52081298828125, 7.7508544921875, 7.98089599609375, 8.2109375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 11.0, 9.0, 8.0, 23.0, 22.0, 42.0, 80.0, 203.0, 551.0, 2318.0, 430.0, 187.0, 78.0, 44.0, 19.0, 18.0, 10.0, 6.0, 1.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.79296875, -6.6400146484375, -6.487060546875, -6.3341064453125, -6.18115234375, -6.0281982421875, -5.875244140625, -5.7222900390625, -5.5693359375, -5.4163818359375, -5.263427734375, -5.1104736328125, -4.95751953125, -4.8045654296875, -4.651611328125, -4.4986572265625, -4.345703125, -4.1927490234375, -4.039794921875, -3.8868408203125, -3.73388671875, -3.5809326171875, -3.427978515625, -3.2750244140625, -3.1220703125, -2.9691162109375, -2.816162109375, -2.6632080078125, -2.51025390625, -2.3572998046875, -2.204345703125, -2.0513916015625, -1.8984375, -1.7454833984375, -1.592529296875, -1.4395751953125, -1.28662109375, -1.1336669921875, -0.980712890625, -0.8277587890625, -0.6748046875, -0.5218505859375, -0.368896484375, -0.2159423828125, -0.06298828125, 0.0899658203125, 0.242919921875, 0.3958740234375, 0.548828125, 0.7017822265625, 0.854736328125, 1.0076904296875, 1.16064453125, 1.3135986328125, 1.466552734375, 1.6195068359375, 1.7724609375, 1.9254150390625, 2.078369140625, 2.2313232421875, 2.38427734375, 2.5372314453125, 2.690185546875, 2.8431396484375, 2.99609375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 14.0, 42.0, 118.0, 304.0, 295.0, 159.0, 43.0, 11.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.48490524291992, -42.24455642700195, -41.00421142578125, -39.76386260986328, -38.52351379394531, -37.28316879272461, -36.04281997680664, -34.80247497558594, -33.56212615966797, -32.32177734375, -31.081432342529297, -29.841083526611328, -28.600736618041992, -27.360389709472656, -26.120040893554688, -24.87969398498535, -23.639347076416016, -22.39900016784668, -21.158653259277344, -19.918304443359375, -18.67795753479004, -17.437610626220703, -16.197261810302734, -14.956914901733398, -13.716567993164062, -12.476221084594727, -11.235873222351074, -9.995525360107422, -8.755178451538086, -7.514831066131592, -6.274483680725098, -5.034135818481445, -3.793792724609375, -2.553445339202881, -1.3130979537963867, -0.07275056838989258, 1.1675968170166016, 2.4079442024230957, 3.64829158782959, 4.888639450073242, 6.128986358642578, 7.369333744049072, 8.609681129455566, 9.850028991699219, 11.090375900268555, 12.33072280883789, 13.571070671081543, 14.811418533325195, 16.05176544189453, 17.292112350463867, 18.532459259033203, 19.772808074951172, 21.013154983520508, 22.253501892089844, 23.493850708007812, 24.73419761657715, 25.974544525146484, 27.21489143371582, 28.455238342285156, 29.695587158203125, 30.93593406677246, 32.1762809753418, 33.416629791259766, 34.65697479248047, 35.89732360839844]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 7.0, 10.0, 18.0, 17.0, 26.0, 37.0, 47.0, 60.0, 54.0, 66.0, 61.0, 75.0, 93.0, 73.0, 63.0, 62.0, 54.0, 48.0, 23.0, 33.0, 18.0, 14.0, 16.0, 9.0, 5.0, 1.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.734742164611816, -12.249144554138184, -11.76354694366455, -11.277948379516602, -10.792350769042969, -10.306753158569336, -9.821155548095703, -9.33555793762207, -8.849960327148438, -8.364362716674805, -7.878764629364014, -7.393167018890381, -6.90756893157959, -6.421971321105957, -5.936373710632324, -5.450776100158691, -4.965177536010742, -4.479579925537109, -3.9939818382263184, -3.5083842277526855, -3.0227863788604736, -2.5371885299682617, -2.051590919494629, -1.565993070602417, -1.080395221710205, -0.5947974324226379, -0.1091996431350708, 0.37639808654785156, 0.8619959354400635, 1.3475937843322754, 1.8331913948059082, 2.31878924369812, 2.8043880462646484, 3.2899858951568604, 3.7755837440490723, 4.261181354522705, 4.746779441833496, 5.232377052307129, 5.717974662780762, 6.2035722732543945, 6.6891703605651855, 7.174767971038818, 7.660366058349609, 8.145963668823242, 8.631561279296875, 9.117158889770508, 9.60275650024414, 10.08835506439209, 10.573952674865723, 11.059550285339355, 11.545147895812988, 12.030746459960938, 12.51634407043457, 13.001941680908203, 13.487539291381836, 13.973136901855469, 14.458734512329102, 14.944332122802734, 15.429929733276367, 15.91552734375, 16.401124954223633, 16.886722564697266, 17.37232208251953, 17.857919692993164, 18.343517303466797]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 5.0, 12.0, 8.0, 18.0, 25.0, 51.0, 87.0, 130.0, 195.0, 403.0, 726.0, 1388.0, 3065.0, 8212.0, 24045.0, 75574.0, 231808.0, 440663.0, 175332.0, 56968.0, 18300.0, 6412.0, 2520.0, 1144.0, 603.0, 316.0, 199.0, 118.0, 81.0, 34.0, 41.0, 17.0, 12.0, 18.0, 5.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.59375, -7.3958740234375, -7.197998046875, -7.0001220703125, -6.80224609375, -6.6043701171875, -6.406494140625, -6.2086181640625, -6.0107421875, -5.8128662109375, -5.614990234375, -5.4171142578125, -5.21923828125, -5.0213623046875, -4.823486328125, -4.6256103515625, -4.427734375, -4.2298583984375, -4.031982421875, -3.8341064453125, -3.63623046875, -3.4383544921875, -3.240478515625, -3.0426025390625, -2.8447265625, -2.6468505859375, -2.448974609375, -2.2510986328125, -2.05322265625, -1.8553466796875, -1.657470703125, -1.4595947265625, -1.26171875, -1.0638427734375, -0.865966796875, -0.6680908203125, -0.47021484375, -0.2723388671875, -0.074462890625, 0.1234130859375, 0.3212890625, 0.5191650390625, 0.717041015625, 0.9149169921875, 1.11279296875, 1.3106689453125, 1.508544921875, 1.7064208984375, 1.904296875, 2.1021728515625, 2.300048828125, 2.4979248046875, 2.69580078125, 2.8936767578125, 3.091552734375, 3.2894287109375, 3.4873046875, 3.6851806640625, 3.883056640625, 4.0809326171875, 4.27880859375, 4.4766845703125, 4.674560546875, 4.8724365234375, 5.0703125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 11.0, 10.0, 11.0, 20.0, 18.0, 25.0, 31.0, 41.0, 43.0, 53.0, 58.0, 56.0, 53.0, 50.0, 68.0, 64.0, 52.0, 49.0, 50.0, 48.0, 36.0, 37.0, 28.0, 27.0, 15.0, 11.0, 9.0, 3.0, 10.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.62890625, -1.561126708984375, -1.49334716796875, -1.425567626953125, -1.3577880859375, -1.290008544921875, -1.22222900390625, -1.154449462890625, -1.086669921875, -1.018890380859375, -0.95111083984375, -0.883331298828125, -0.8155517578125, -0.747772216796875, -0.67999267578125, -0.612213134765625, -0.54443359375, -0.476654052734375, -0.40887451171875, -0.341094970703125, -0.2733154296875, -0.205535888671875, -0.13775634765625, -0.069976806640625, -0.002197265625, 0.065582275390625, 0.13336181640625, 0.201141357421875, 0.2689208984375, 0.336700439453125, 0.40447998046875, 0.472259521484375, 0.5400390625, 0.607818603515625, 0.67559814453125, 0.743377685546875, 0.8111572265625, 0.878936767578125, 0.94671630859375, 1.014495849609375, 1.082275390625, 1.150054931640625, 1.21783447265625, 1.285614013671875, 1.3533935546875, 1.421173095703125, 1.48895263671875, 1.556732177734375, 1.62451171875, 1.692291259765625, 1.76007080078125, 1.827850341796875, 1.8956298828125, 1.963409423828125, 2.03118896484375, 2.098968505859375, 2.166748046875, 2.234527587890625, 2.30230712890625, 2.370086669921875, 2.4378662109375, 2.505645751953125, 2.57342529296875, 2.641204833984375, 2.708984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 9.0, 12.0, 13.0, 22.0, 34.0, 43.0, 70.0, 101.0, 152.0, 204.0, 323.0, 447.0, 732.0, 1431.0, 3286.0, 11632.0, 56180.0, 288908.0, 531649.0, 120105.0, 23124.0, 5551.0, 1947.0, 901.0, 547.0, 327.0, 216.0, 171.0, 103.0, 75.0, 57.0, 53.0, 28.0, 26.0, 25.0, 11.0, 6.0, 10.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5078125, -6.29254150390625, -6.0772705078125, -5.86199951171875, -5.646728515625, -5.43145751953125, -5.2161865234375, -5.00091552734375, -4.78564453125, -4.57037353515625, -4.3551025390625, -4.13983154296875, -3.924560546875, -3.70928955078125, -3.4940185546875, -3.27874755859375, -3.0634765625, -2.84820556640625, -2.6329345703125, -2.41766357421875, -2.202392578125, -1.98712158203125, -1.7718505859375, -1.55657958984375, -1.34130859375, -1.12603759765625, -0.9107666015625, -0.69549560546875, -0.480224609375, -0.26495361328125, -0.0496826171875, 0.16558837890625, 0.380859375, 0.59613037109375, 0.8114013671875, 1.02667236328125, 1.241943359375, 1.45721435546875, 1.6724853515625, 1.88775634765625, 2.10302734375, 2.31829833984375, 2.5335693359375, 2.74884033203125, 2.964111328125, 3.17938232421875, 3.3946533203125, 3.60992431640625, 3.8251953125, 4.04046630859375, 4.2557373046875, 4.47100830078125, 4.686279296875, 4.90155029296875, 5.1168212890625, 5.33209228515625, 5.54736328125, 5.76263427734375, 5.9779052734375, 6.19317626953125, 6.408447265625, 6.62371826171875, 6.8389892578125, 7.05426025390625, 7.26953125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 6.0, 4.0, 4.0, 5.0, 6.0, 18.0, 10.0, 15.0, 17.0, 21.0, 27.0, 28.0, 34.0, 28.0, 39.0, 48.0, 53.0, 48.0, 35.0, 51.0, 50.0, 38.0, 48.0, 50.0, 41.0, 32.0, 39.0, 31.0, 29.0, 21.0, 22.0, 34.0, 10.0, 11.0, 14.0, 7.0, 7.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.65625, -7.404296875, -7.15234375, -6.900390625, -6.6484375, -6.396484375, -6.14453125, -5.892578125, -5.640625, -5.388671875, -5.13671875, -4.884765625, -4.6328125, -4.380859375, -4.12890625, -3.876953125, -3.625, -3.373046875, -3.12109375, -2.869140625, -2.6171875, -2.365234375, -2.11328125, -1.861328125, -1.609375, -1.357421875, -1.10546875, -0.853515625, -0.6015625, -0.349609375, -0.09765625, 0.154296875, 0.40625, 0.658203125, 0.91015625, 1.162109375, 1.4140625, 1.666015625, 1.91796875, 2.169921875, 2.421875, 2.673828125, 2.92578125, 3.177734375, 3.4296875, 3.681640625, 3.93359375, 4.185546875, 4.4375, 4.689453125, 4.94140625, 5.193359375, 5.4453125, 5.697265625, 5.94921875, 6.201171875, 6.453125, 6.705078125, 6.95703125, 7.208984375, 7.4609375, 7.712890625, 7.96484375, 8.216796875, 8.46875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 9.0, 7.0, 10.0, 15.0, 22.0, 38.0, 42.0, 47.0, 104.0, 207.0, 459.0, 1079.0, 2781.0, 10461.0, 59913.0, 636688.0, 292741.0, 33459.0, 6794.0, 2056.0, 831.0, 353.0, 168.0, 86.0, 55.0, 34.0, 26.0, 26.0, 12.0, 9.0, 11.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.34765625, -6.18426513671875, -6.0208740234375, -5.85748291015625, -5.694091796875, -5.53070068359375, -5.3673095703125, -5.20391845703125, -5.04052734375, -4.87713623046875, -4.7137451171875, -4.55035400390625, -4.386962890625, -4.22357177734375, -4.0601806640625, -3.89678955078125, -3.7333984375, -3.57000732421875, -3.4066162109375, -3.24322509765625, -3.079833984375, -2.91644287109375, -2.7530517578125, -2.58966064453125, -2.42626953125, -2.26287841796875, -2.0994873046875, -1.93609619140625, -1.772705078125, -1.60931396484375, -1.4459228515625, -1.28253173828125, -1.119140625, -0.95574951171875, -0.7923583984375, -0.62896728515625, -0.465576171875, -0.30218505859375, -0.1387939453125, 0.02459716796875, 0.18798828125, 0.35137939453125, 0.5147705078125, 0.67816162109375, 0.841552734375, 1.00494384765625, 1.1683349609375, 1.33172607421875, 1.4951171875, 1.65850830078125, 1.8218994140625, 1.98529052734375, 2.148681640625, 2.31207275390625, 2.4754638671875, 2.63885498046875, 2.80224609375, 2.96563720703125, 3.1290283203125, 3.29241943359375, 3.455810546875, 3.61920166015625, 3.7825927734375, 3.94598388671875, 4.109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 11.0, 7.0, 12.0, 7.0, 15.0, 14.0, 25.0, 30.0, 45.0, 49.0, 68.0, 136.0, 190.0, 91.0, 72.0, 46.0, 45.0, 40.0, 30.0, 16.0, 10.0, 8.0, 7.0, 8.0, 8.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004711151123046875, -0.0004550069570541382, -0.00043889880180358887, -0.00042279064655303955, -0.00040668249130249023, -0.0003905743360519409, -0.0003744661808013916, -0.0003583580255508423, -0.00034224987030029297, -0.00032614171504974365, -0.00031003355979919434, -0.000293925404548645, -0.0002778172492980957, -0.0002617090940475464, -0.00024560093879699707, -0.00022949278354644775, -0.00021338462829589844, -0.00019727647304534912, -0.0001811683177947998, -0.0001650601625442505, -0.00014895200729370117, -0.00013284385204315186, -0.00011673569679260254, -0.00010062754154205322, -8.45193862915039e-05, -6.841123104095459e-05, -5.2303075790405273e-05, -3.619492053985596e-05, -2.008676528930664e-05, -3.978610038757324e-06, 1.2129545211791992e-05, 2.823770046234131e-05, 4.4345855712890625e-05, 6.045401096343994e-05, 7.656216621398926e-05, 9.267032146453857e-05, 0.00010877847671508789, 0.0001248866319656372, 0.00014099478721618652, 0.00015710294246673584, 0.00017321109771728516, 0.00018931925296783447, 0.0002054274082183838, 0.0002215355634689331, 0.00023764371871948242, 0.00025375187397003174, 0.00026986002922058105, 0.00028596818447113037, 0.0003020763397216797, 0.000318184494972229, 0.0003342926502227783, 0.00035040080547332764, 0.00036650896072387695, 0.00038261711597442627, 0.0003987252712249756, 0.0004148334264755249, 0.0004309415817260742, 0.00044704973697662354, 0.00046315789222717285, 0.00047926604747772217, 0.0004953742027282715, 0.0005114823579788208, 0.0005275905132293701, 0.0005436986684799194, 0.0005598068237304688]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 9.0, 11.0, 13.0, 27.0, 31.0, 63.0, 92.0, 141.0, 261.0, 571.0, 1412.0, 4614.0, 30096.0, 646730.0, 338921.0, 19747.0, 3619.0, 1146.0, 482.0, 207.0, 124.0, 87.0, 57.0, 27.0, 19.0, 18.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.5546875, -8.3228759765625, -8.091064453125, -7.8592529296875, -7.62744140625, -7.3956298828125, -7.163818359375, -6.9320068359375, -6.7001953125, -6.4683837890625, -6.236572265625, -6.0047607421875, -5.77294921875, -5.5411376953125, -5.309326171875, -5.0775146484375, -4.845703125, -4.6138916015625, -4.382080078125, -4.1502685546875, -3.91845703125, -3.6866455078125, -3.454833984375, -3.2230224609375, -2.9912109375, -2.7593994140625, -2.527587890625, -2.2957763671875, -2.06396484375, -1.8321533203125, -1.600341796875, -1.3685302734375, -1.13671875, -0.9049072265625, -0.673095703125, -0.4412841796875, -0.20947265625, 0.0223388671875, 0.254150390625, 0.4859619140625, 0.7177734375, 0.9495849609375, 1.181396484375, 1.4132080078125, 1.64501953125, 1.8768310546875, 2.108642578125, 2.3404541015625, 2.572265625, 2.8040771484375, 3.035888671875, 3.2677001953125, 3.49951171875, 3.7313232421875, 3.963134765625, 4.1949462890625, 4.4267578125, 4.6585693359375, 4.890380859375, 5.1221923828125, 5.35400390625, 5.5858154296875, 5.817626953125, 6.0494384765625, 6.28125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 11.0, 14.0, 32.0, 58.0, 106.0, 188.0, 251.0, 153.0, 70.0, 41.0, 24.0, 13.0, 15.0, 7.0, 6.0, 5.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.2890625, -12.0174560546875, -11.745849609375, -11.4742431640625, -11.20263671875, -10.9310302734375, -10.659423828125, -10.3878173828125, -10.1162109375, -9.8446044921875, -9.572998046875, -9.3013916015625, -9.02978515625, -8.7581787109375, -8.486572265625, -8.2149658203125, -7.943359375, -7.6717529296875, -7.400146484375, -7.1285400390625, -6.85693359375, -6.5853271484375, -6.313720703125, -6.0421142578125, -5.7705078125, -5.4989013671875, -5.227294921875, -4.9556884765625, -4.68408203125, -4.4124755859375, -4.140869140625, -3.8692626953125, -3.59765625, -3.3260498046875, -3.054443359375, -2.7828369140625, -2.51123046875, -2.2396240234375, -1.968017578125, -1.6964111328125, -1.4248046875, -1.1531982421875, -0.881591796875, -0.6099853515625, -0.33837890625, -0.0667724609375, 0.204833984375, 0.4764404296875, 0.748046875, 1.0196533203125, 1.291259765625, 1.5628662109375, 1.83447265625, 2.1060791015625, 2.377685546875, 2.6492919921875, 2.9208984375, 3.1925048828125, 3.464111328125, 3.7357177734375, 4.00732421875, 4.2789306640625, 4.550537109375, 4.8221435546875, 5.09375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 9.0, 38.0, 78.0, 198.0, 324.0, 231.0, 92.0, 28.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-185.39590454101562, -181.6613006591797, -177.92669677734375, -174.19210815429688, -170.45750427246094, -166.722900390625, -162.98831176757812, -159.2537078857422, -155.51910400390625, -151.7845001220703, -148.04989624023438, -144.3153076171875, -140.58070373535156, -136.84609985351562, -133.11151123046875, -129.3769073486328, -125.64230346679688, -121.90769958496094, -118.17310333251953, -114.43850708007812, -110.70390319824219, -106.96929931640625, -103.23470306396484, -99.50010681152344, -95.7655029296875, -92.03089904785156, -88.29630279541016, -84.56170654296875, -80.82710266113281, -77.09249877929688, -73.35790252685547, -69.62330627441406, -65.88870239257812, -62.15410232543945, -58.41950225830078, -54.68490219116211, -50.95030212402344, -47.215702056884766, -43.481101989746094, -39.74650192260742, -36.01190185546875, -32.27730178833008, -28.542701721191406, -24.808101654052734, -21.073501586914062, -17.33890151977539, -13.604301452636719, -9.869701385498047, -6.135101318359375, -2.400501251220703, 1.3340988159179688, 5.068698883056641, 8.803298950195312, 12.537899017333984, 16.272499084472656, 20.007099151611328, 23.74169921875, 27.476299285888672, 31.210899353027344, 34.945499420166016, 38.68009948730469, 42.41469955444336, 46.14929962158203, 49.8838996887207, 53.618499755859375]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 8.0, 8.0, 10.0, 13.0, 12.0, 12.0, 17.0, 14.0, 27.0, 34.0, 23.0, 36.0, 30.0, 37.0, 43.0, 39.0, 33.0, 44.0, 46.0, 57.0, 47.0, 40.0, 52.0, 38.0, 35.0, 32.0, 33.0, 34.0, 24.0, 23.0, 18.0, 17.0, 7.0, 8.0, 4.0, 10.0, 8.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.10211181640625, -39.6962890625, -38.290470123291016, -36.884647369384766, -35.47882843017578, -34.07300567626953, -32.66718292236328, -31.261362075805664, -29.855541229248047, -28.44972038269043, -27.043899536132812, -25.638076782226562, -24.232255935668945, -22.826435089111328, -21.420612335205078, -20.01479148864746, -18.608970642089844, -17.203149795532227, -15.797327995300293, -14.39150619506836, -12.985685348510742, -11.579864501953125, -10.174042701721191, -8.768220901489258, -7.362400054931641, -5.956578731536865, -4.55075740814209, -3.1449360847473145, -1.739114761352539, -0.33329343795776367, 1.0725278854370117, 2.4783496856689453, 3.8841705322265625, 5.289991855621338, 6.695813179016113, 8.101634979248047, 9.507455825805664, 10.913276672363281, 12.319098472595215, 13.724920272827148, 15.130741119384766, 16.536561965942383, 17.9423828125, 19.34820556640625, 20.754026412963867, 22.159847259521484, 23.565670013427734, 24.97149085998535, 26.37731170654297, 27.783132553100586, 29.188953399658203, 30.594776153564453, 32.00059509277344, 33.40641784667969, 34.81224060058594, 36.21806335449219, 37.62388229370117, 39.02970504760742, 40.435523986816406, 41.841346740722656, 43.247169494628906, 44.65298843383789, 46.05881118774414, 47.464630126953125, 48.870452880859375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 6.0, 4.0, 14.0, 25.0, 35.0, 48.0, 57.0, 107.0, 213.0, 325.0, 596.0, 1177.0, 2404.0, 5264.0, 13126.0, 41081.0, 225245.0, 3565764.0, 268748.0, 45077.0, 13975.0, 5706.0, 2564.0, 1280.0, 626.0, 379.0, 164.0, 109.0, 55.0, 39.0, 21.0, 17.0, 10.0, 4.0, 7.0, 2.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87109375, -6.63031005859375, -6.3895263671875, -6.14874267578125, -5.907958984375, -5.66717529296875, -5.4263916015625, -5.18560791015625, -4.94482421875, -4.70404052734375, -4.4632568359375, -4.22247314453125, -3.981689453125, -3.74090576171875, -3.5001220703125, -3.25933837890625, -3.0185546875, -2.77777099609375, -2.5369873046875, -2.29620361328125, -2.055419921875, -1.81463623046875, -1.5738525390625, -1.33306884765625, -1.09228515625, -0.85150146484375, -0.6107177734375, -0.36993408203125, -0.129150390625, 0.11163330078125, 0.3524169921875, 0.59320068359375, 0.833984375, 1.07476806640625, 1.3155517578125, 1.55633544921875, 1.797119140625, 2.03790283203125, 2.2786865234375, 2.51947021484375, 2.76025390625, 3.00103759765625, 3.2418212890625, 3.48260498046875, 3.723388671875, 3.96417236328125, 4.2049560546875, 4.44573974609375, 4.6865234375, 4.92730712890625, 5.1680908203125, 5.40887451171875, 5.649658203125, 5.89044189453125, 6.1312255859375, 6.37200927734375, 6.61279296875, 6.85357666015625, 7.0943603515625, 7.33514404296875, 7.575927734375, 7.81671142578125, 8.0574951171875, 8.29827880859375, 8.5390625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 10.0, 14.0, 11.0, 17.0, 22.0, 37.0, 28.0, 34.0, 39.0, 50.0, 44.0, 56.0, 48.0, 61.0, 57.0, 63.0, 62.0, 54.0, 44.0, 60.0, 26.0, 36.0, 30.0, 25.0, 18.0, 14.0, 11.0, 6.0, 9.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.236328125, -2.1600341796875, -2.083740234375, -2.0074462890625, -1.93115234375, -1.8548583984375, -1.778564453125, -1.7022705078125, -1.6259765625, -1.5496826171875, -1.473388671875, -1.3970947265625, -1.32080078125, -1.2445068359375, -1.168212890625, -1.0919189453125, -1.015625, -0.9393310546875, -0.863037109375, -0.7867431640625, -0.71044921875, -0.6341552734375, -0.557861328125, -0.4815673828125, -0.4052734375, -0.3289794921875, -0.252685546875, -0.1763916015625, -0.10009765625, -0.0238037109375, 0.052490234375, 0.1287841796875, 0.205078125, 0.2813720703125, 0.357666015625, 0.4339599609375, 0.51025390625, 0.5865478515625, 0.662841796875, 0.7391357421875, 0.8154296875, 0.8917236328125, 0.968017578125, 1.0443115234375, 1.12060546875, 1.1968994140625, 1.273193359375, 1.3494873046875, 1.42578125, 1.5020751953125, 1.578369140625, 1.6546630859375, 1.73095703125, 1.8072509765625, 1.883544921875, 1.9598388671875, 2.0361328125, 2.1124267578125, 2.188720703125, 2.2650146484375, 2.34130859375, 2.4176025390625, 2.493896484375, 2.5701904296875, 2.646484375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 13.0, 21.0, 19.0, 24.0, 45.0, 84.0, 143.0, 232.0, 407.0, 851.0, 1860.0, 4236.0, 12004.0, 42531.0, 268078.0, 3482867.0, 312849.0, 46768.0, 12861.0, 4543.0, 1892.0, 879.0, 455.0, 243.0, 153.0, 82.0, 47.0, 35.0, 19.0, 15.0, 8.0, 3.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.69140625, -6.4857177734375, -6.280029296875, -6.0743408203125, -5.86865234375, -5.6629638671875, -5.457275390625, -5.2515869140625, -5.0458984375, -4.8402099609375, -4.634521484375, -4.4288330078125, -4.22314453125, -4.0174560546875, -3.811767578125, -3.6060791015625, -3.400390625, -3.1947021484375, -2.989013671875, -2.7833251953125, -2.57763671875, -2.3719482421875, -2.166259765625, -1.9605712890625, -1.7548828125, -1.5491943359375, -1.343505859375, -1.1378173828125, -0.93212890625, -0.7264404296875, -0.520751953125, -0.3150634765625, -0.109375, 0.0963134765625, 0.302001953125, 0.5076904296875, 0.71337890625, 0.9190673828125, 1.124755859375, 1.3304443359375, 1.5361328125, 1.7418212890625, 1.947509765625, 2.1531982421875, 2.35888671875, 2.5645751953125, 2.770263671875, 2.9759521484375, 3.181640625, 3.3873291015625, 3.593017578125, 3.7987060546875, 4.00439453125, 4.2100830078125, 4.415771484375, 4.6214599609375, 4.8271484375, 5.0328369140625, 5.238525390625, 5.4442138671875, 5.64990234375, 5.8555908203125, 6.061279296875, 6.2669677734375, 6.47265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 9.0, 11.0, 11.0, 12.0, 21.0, 23.0, 33.0, 56.0, 87.0, 191.0, 444.0, 1947.0, 676.0, 239.0, 125.0, 66.0, 32.0, 31.0, 16.0, 7.0, 11.0, 2.0, 7.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.828125, -4.696380615234375, -4.56463623046875, -4.432891845703125, -4.3011474609375, -4.169403076171875, -4.03765869140625, -3.905914306640625, -3.774169921875, -3.642425537109375, -3.51068115234375, -3.378936767578125, -3.2471923828125, -3.115447998046875, -2.98370361328125, -2.851959228515625, -2.72021484375, -2.588470458984375, -2.45672607421875, -2.324981689453125, -2.1932373046875, -2.061492919921875, -1.92974853515625, -1.798004150390625, -1.666259765625, -1.534515380859375, -1.40277099609375, -1.271026611328125, -1.1392822265625, -1.007537841796875, -0.87579345703125, -0.744049072265625, -0.6123046875, -0.480560302734375, -0.34881591796875, -0.217071533203125, -0.0853271484375, 0.046417236328125, 0.17816162109375, 0.309906005859375, 0.441650390625, 0.573394775390625, 0.70513916015625, 0.836883544921875, 0.9686279296875, 1.100372314453125, 1.23211669921875, 1.363861083984375, 1.49560546875, 1.627349853515625, 1.75909423828125, 1.890838623046875, 2.0225830078125, 2.154327392578125, 2.28607177734375, 2.417816162109375, 2.549560546875, 2.681304931640625, 2.81304931640625, 2.944793701171875, 3.0765380859375, 3.208282470703125, 3.34002685546875, 3.471771240234375, 3.603515625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 46.0, 109.0, 200.0, 265.0, 207.0, 100.0, 37.0, 13.0, 8.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-56.362586975097656, -55.174278259277344, -53.98596954345703, -52.79766082763672, -51.609352111816406, -50.421043395996094, -49.23273468017578, -48.04442596435547, -46.856117248535156, -45.667808532714844, -44.47949981689453, -43.29119110107422, -42.102882385253906, -40.914573669433594, -39.72626495361328, -38.53795623779297, -37.349647521972656, -36.161338806152344, -34.97303009033203, -33.78472137451172, -32.596412658691406, -31.408103942871094, -30.21979522705078, -29.03148651123047, -27.843181610107422, -26.65487289428711, -25.466564178466797, -24.278255462646484, -23.089946746826172, -21.90163803100586, -20.713329315185547, -19.525020599365234, -18.336711883544922, -17.14840316772461, -15.960094451904297, -14.771785736083984, -13.583477020263672, -12.39516830444336, -11.206860542297363, -10.01855182647705, -8.830243110656738, -7.641934394836426, -6.453625679016113, -5.265317440032959, -4.0770087242126465, -2.888700008392334, -1.7003917694091797, -0.5120830535888672, 0.6762256622314453, 1.8645342588424683, 3.052842855453491, 4.241151332855225, 5.429460048675537, 6.61776876449585, 7.806077003479004, 8.994385719299316, 10.182694435119629, 11.371003150939941, 12.559311866760254, 13.74761962890625, 14.935928344726562, 16.124237060546875, 17.312545776367188, 18.5008544921875, 19.689163208007812]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 6.0, 7.0, 18.0, 22.0, 22.0, 32.0, 38.0, 46.0, 50.0, 72.0, 70.0, 68.0, 79.0, 88.0, 66.0, 65.0, 53.0, 43.0, 46.0, 29.0, 22.0, 24.0, 15.0, 3.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.16061782836914, -20.58466148376465, -20.00870704650879, -19.432750701904297, -18.856796264648438, -18.280839920043945, -17.704885482788086, -17.128929138183594, -16.552974700927734, -15.977019309997559, -15.401063919067383, -14.825108528137207, -14.249153137207031, -13.673196792602539, -13.097241401672363, -12.521286010742188, -11.945329666137695, -11.36937427520752, -10.793418884277344, -10.217463493347168, -9.641508102416992, -9.0655517578125, -8.489596366882324, -7.913640975952148, -7.337685585021973, -6.761730194091797, -6.185774803161621, -5.609818935394287, -5.033863544464111, -4.4579081535339355, -3.8819525241851807, -3.305996894836426, -2.730039596557617, -2.1540842056274414, -1.5781285762786865, -1.0021730661392212, -0.42621755599975586, 0.14973783493041992, 0.7256934642791748, 1.3016490936279297, 1.8776044845581055, 2.4535598754882812, 3.029515504837036, 3.605471134185791, 4.181426525115967, 4.757381916046143, 5.333337783813477, 5.909293174743652, 6.485248565673828, 7.061203956604004, 7.63715934753418, 8.213114738464355, 8.789070129394531, 9.365026473999023, 9.9409818649292, 10.516937255859375, 11.09289264678955, 11.668848037719727, 12.244803428649902, 12.820758819580078, 13.39671516418457, 13.97266960144043, 14.548625946044922, 15.124581336975098, 15.700536727905273]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 8.0, 5.0, 12.0, 10.0, 9.0, 19.0, 24.0, 32.0, 58.0, 97.0, 128.0, 182.0, 349.0, 597.0, 1044.0, 2286.0, 5222.0, 14247.0, 41489.0, 127769.0, 321796.0, 329706.0, 134427.0, 43663.0, 14776.0, 5605.0, 2429.0, 1068.0, 569.0, 325.0, 205.0, 136.0, 82.0, 51.0, 37.0, 39.0, 20.0, 13.0, 8.0, 1.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.59375, -5.4190673828125, -5.244384765625, -5.0697021484375, -4.89501953125, -4.7203369140625, -4.545654296875, -4.3709716796875, -4.1962890625, -4.0216064453125, -3.846923828125, -3.6722412109375, -3.49755859375, -3.3228759765625, -3.148193359375, -2.9735107421875, -2.798828125, -2.6241455078125, -2.449462890625, -2.2747802734375, -2.10009765625, -1.9254150390625, -1.750732421875, -1.5760498046875, -1.4013671875, -1.2266845703125, -1.052001953125, -0.8773193359375, -0.70263671875, -0.5279541015625, -0.353271484375, -0.1785888671875, -0.00390625, 0.1707763671875, 0.345458984375, 0.5201416015625, 0.69482421875, 0.8695068359375, 1.044189453125, 1.2188720703125, 1.3935546875, 1.5682373046875, 1.742919921875, 1.9176025390625, 2.09228515625, 2.2669677734375, 2.441650390625, 2.6163330078125, 2.791015625, 2.9656982421875, 3.140380859375, 3.3150634765625, 3.48974609375, 3.6644287109375, 3.839111328125, 4.0137939453125, 4.1884765625, 4.3631591796875, 4.537841796875, 4.7125244140625, 4.88720703125, 5.0618896484375, 5.236572265625, 5.4112548828125, 5.5859375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 11.0, 8.0, 15.0, 18.0, 19.0, 33.0, 30.0, 42.0, 31.0, 35.0, 49.0, 49.0, 56.0, 53.0, 49.0, 46.0, 68.0, 56.0, 35.0, 49.0, 47.0, 33.0, 29.0, 32.0, 20.0, 26.0, 12.0, 9.0, 10.0, 7.0, 8.0, 8.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.134765625, -2.065673828125, -1.99658203125, -1.927490234375, -1.8583984375, -1.789306640625, -1.72021484375, -1.651123046875, -1.58203125, -1.512939453125, -1.44384765625, -1.374755859375, -1.3056640625, -1.236572265625, -1.16748046875, -1.098388671875, -1.029296875, -0.960205078125, -0.89111328125, -0.822021484375, -0.7529296875, -0.683837890625, -0.61474609375, -0.545654296875, -0.4765625, -0.407470703125, -0.33837890625, -0.269287109375, -0.2001953125, -0.131103515625, -0.06201171875, 0.007080078125, 0.076171875, 0.145263671875, 0.21435546875, 0.283447265625, 0.3525390625, 0.421630859375, 0.49072265625, 0.559814453125, 0.62890625, 0.697998046875, 0.76708984375, 0.836181640625, 0.9052734375, 0.974365234375, 1.04345703125, 1.112548828125, 1.181640625, 1.250732421875, 1.31982421875, 1.388916015625, 1.4580078125, 1.527099609375, 1.59619140625, 1.665283203125, 1.734375, 1.803466796875, 1.87255859375, 1.941650390625, 2.0107421875, 2.079833984375, 2.14892578125, 2.218017578125, 2.287109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 4.0, 11.0, 13.0, 16.0, 22.0, 35.0, 47.0, 86.0, 108.0, 156.0, 216.0, 329.0, 507.0, 880.0, 1752.0, 4767.0, 18336.0, 92963.0, 459104.0, 377150.0, 70193.0, 14265.0, 3894.0, 1469.0, 802.0, 476.0, 309.0, 203.0, 136.0, 95.0, 53.0, 47.0, 45.0, 20.0, 12.0, 15.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5625, -7.332763671875, -7.10302734375, -6.873291015625, -6.6435546875, -6.413818359375, -6.18408203125, -5.954345703125, -5.724609375, -5.494873046875, -5.26513671875, -5.035400390625, -4.8056640625, -4.575927734375, -4.34619140625, -4.116455078125, -3.88671875, -3.656982421875, -3.42724609375, -3.197509765625, -2.9677734375, -2.738037109375, -2.50830078125, -2.278564453125, -2.048828125, -1.819091796875, -1.58935546875, -1.359619140625, -1.1298828125, -0.900146484375, -0.67041015625, -0.440673828125, -0.2109375, 0.018798828125, 0.24853515625, 0.478271484375, 0.7080078125, 0.937744140625, 1.16748046875, 1.397216796875, 1.626953125, 1.856689453125, 2.08642578125, 2.316162109375, 2.5458984375, 2.775634765625, 3.00537109375, 3.235107421875, 3.46484375, 3.694580078125, 3.92431640625, 4.154052734375, 4.3837890625, 4.613525390625, 4.84326171875, 5.072998046875, 5.302734375, 5.532470703125, 5.76220703125, 5.991943359375, 6.2216796875, 6.451416015625, 6.68115234375, 6.910888671875, 7.140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 10.0, 7.0, 8.0, 19.0, 14.0, 12.0, 17.0, 26.0, 20.0, 21.0, 25.0, 32.0, 38.0, 41.0, 45.0, 46.0, 48.0, 60.0, 46.0, 49.0, 36.0, 41.0, 40.0, 30.0, 35.0, 32.0, 37.0, 24.0, 20.0, 18.0, 16.0, 18.0, 13.0, 10.0, 8.0, 12.0, 6.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.421875, -11.1165771484375, -10.811279296875, -10.5059814453125, -10.20068359375, -9.8953857421875, -9.590087890625, -9.2847900390625, -8.9794921875, -8.6741943359375, -8.368896484375, -8.0635986328125, -7.75830078125, -7.4530029296875, -7.147705078125, -6.8424072265625, -6.537109375, -6.2318115234375, -5.926513671875, -5.6212158203125, -5.31591796875, -5.0106201171875, -4.705322265625, -4.4000244140625, -4.0947265625, -3.7894287109375, -3.484130859375, -3.1788330078125, -2.87353515625, -2.5682373046875, -2.262939453125, -1.9576416015625, -1.65234375, -1.3470458984375, -1.041748046875, -0.7364501953125, -0.43115234375, -0.1258544921875, 0.179443359375, 0.4847412109375, 0.7900390625, 1.0953369140625, 1.400634765625, 1.7059326171875, 2.01123046875, 2.3165283203125, 2.621826171875, 2.9271240234375, 3.232421875, 3.5377197265625, 3.843017578125, 4.1483154296875, 4.45361328125, 4.7589111328125, 5.064208984375, 5.3695068359375, 5.6748046875, 5.9801025390625, 6.285400390625, 6.5906982421875, 6.89599609375, 7.2012939453125, 7.506591796875, 7.8118896484375, 8.1171875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0, 9.0, 7.0, 8.0, 25.0, 28.0, 47.0, 68.0, 111.0, 159.0, 321.0, 795.0, 1868.0, 5747.0, 23825.0, 128082.0, 502711.0, 308612.0, 58188.0, 12177.0, 3396.0, 1236.0, 513.0, 250.0, 134.0, 77.0, 58.0, 31.0, 17.0, 16.0, 10.0, 9.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.1328125, -3.027587890625, -2.92236328125, -2.817138671875, -2.7119140625, -2.606689453125, -2.50146484375, -2.396240234375, -2.291015625, -2.185791015625, -2.08056640625, -1.975341796875, -1.8701171875, -1.764892578125, -1.65966796875, -1.554443359375, -1.44921875, -1.343994140625, -1.23876953125, -1.133544921875, -1.0283203125, -0.923095703125, -0.81787109375, -0.712646484375, -0.607421875, -0.502197265625, -0.39697265625, -0.291748046875, -0.1865234375, -0.081298828125, 0.02392578125, 0.129150390625, 0.234375, 0.339599609375, 0.44482421875, 0.550048828125, 0.6552734375, 0.760498046875, 0.86572265625, 0.970947265625, 1.076171875, 1.181396484375, 1.28662109375, 1.391845703125, 1.4970703125, 1.602294921875, 1.70751953125, 1.812744140625, 1.91796875, 2.023193359375, 2.12841796875, 2.233642578125, 2.3388671875, 2.444091796875, 2.54931640625, 2.654541015625, 2.759765625, 2.864990234375, 2.97021484375, 3.075439453125, 3.1806640625, 3.285888671875, 3.39111328125, 3.496337890625, 3.6015625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 2.0, 11.0, 5.0, 9.0, 11.0, 22.0, 25.0, 34.0, 48.0, 72.0, 70.0, 124.0, 121.0, 108.0, 86.0, 58.0, 52.0, 45.0, 20.0, 20.0, 16.0, 14.0, 13.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005102157592773438, -0.0004958994686603546, -0.0004815831780433655, -0.00046726688742637634, -0.0004529505968093872, -0.00043863430619239807, -0.00042431801557540894, -0.0004100017249584198, -0.00039568543434143066, -0.00038136914372444153, -0.0003670528531074524, -0.00035273656249046326, -0.0003384202718734741, -0.000324103981256485, -0.00030978769063949585, -0.0002954714000225067, -0.0002811551094055176, -0.00026683881878852844, -0.0002525225281715393, -0.00023820623755455017, -0.00022388994693756104, -0.0002095736563205719, -0.00019525736570358276, -0.00018094107508659363, -0.0001666247844696045, -0.00015230849385261536, -0.00013799220323562622, -0.00012367591261863708, -0.00010935962200164795, -9.504333138465881e-05, -8.072704076766968e-05, -6.641075015068054e-05, -5.2094459533691406e-05, -3.777816891670227e-05, -2.3461878299713135e-05, -9.145587682723999e-06, 5.170702934265137e-06, 1.9486993551254272e-05, 3.380328416824341e-05, 4.8119574785232544e-05, 6.243586540222168e-05, 7.675215601921082e-05, 9.106844663619995e-05, 0.00010538473725318909, 0.00011970102787017822, 0.00013401731848716736, 0.0001483336091041565, 0.00016264989972114563, 0.00017696619033813477, 0.0001912824809551239, 0.00020559877157211304, 0.00021991506218910217, 0.0002342313528060913, 0.00024854764342308044, 0.0002628639340400696, 0.0002771802246570587, 0.00029149651527404785, 0.000305812805891037, 0.0003201290965080261, 0.00033444538712501526, 0.0003487616777420044, 0.00036307796835899353, 0.00037739425897598267, 0.0003917105495929718, 0.00040602684020996094]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 16.0, 6.0, 16.0, 11.0, 19.0, 34.0, 37.0, 55.0, 91.0, 149.0, 282.0, 517.0, 1108.0, 2828.0, 8715.0, 42897.0, 271530.0, 556905.0, 132589.0, 21666.0, 5272.0, 1859.0, 887.0, 459.0, 229.0, 126.0, 90.0, 40.0, 34.0, 21.0, 22.0, 13.0, 8.0, 5.0, 2.0, 5.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.62890625, -3.512969970703125, -3.39703369140625, -3.281097412109375, -3.1651611328125, -3.049224853515625, -2.93328857421875, -2.817352294921875, -2.701416015625, -2.585479736328125, -2.46954345703125, -2.353607177734375, -2.2376708984375, -2.121734619140625, -2.00579833984375, -1.889862060546875, -1.77392578125, -1.657989501953125, -1.54205322265625, -1.426116943359375, -1.3101806640625, -1.194244384765625, -1.07830810546875, -0.962371826171875, -0.846435546875, -0.730499267578125, -0.61456298828125, -0.498626708984375, -0.3826904296875, -0.266754150390625, -0.15081787109375, -0.034881591796875, 0.0810546875, 0.196990966796875, 0.31292724609375, 0.428863525390625, 0.5447998046875, 0.660736083984375, 0.77667236328125, 0.892608642578125, 1.008544921875, 1.124481201171875, 1.24041748046875, 1.356353759765625, 1.4722900390625, 1.588226318359375, 1.70416259765625, 1.820098876953125, 1.93603515625, 2.051971435546875, 2.16790771484375, 2.283843994140625, 2.3997802734375, 2.515716552734375, 2.63165283203125, 2.747589111328125, 2.863525390625, 2.979461669921875, 3.09539794921875, 3.211334228515625, 3.3272705078125, 3.443206787109375, 3.55914306640625, 3.675079345703125, 3.791015625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 9.0, 13.0, 22.0, 26.0, 52.0, 75.0, 101.0, 116.0, 136.0, 136.0, 110.0, 65.0, 47.0, 37.0, 27.0, 13.0, 14.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.46875, -5.29571533203125, -5.1226806640625, -4.94964599609375, -4.776611328125, -4.60357666015625, -4.4305419921875, -4.25750732421875, -4.08447265625, -3.91143798828125, -3.7384033203125, -3.56536865234375, -3.392333984375, -3.21929931640625, -3.0462646484375, -2.87322998046875, -2.7001953125, -2.52716064453125, -2.3541259765625, -2.18109130859375, -2.008056640625, -1.83502197265625, -1.6619873046875, -1.48895263671875, -1.31591796875, -1.14288330078125, -0.9698486328125, -0.79681396484375, -0.623779296875, -0.45074462890625, -0.2777099609375, -0.10467529296875, 0.068359375, 0.24139404296875, 0.4144287109375, 0.58746337890625, 0.760498046875, 0.93353271484375, 1.1065673828125, 1.27960205078125, 1.45263671875, 1.62567138671875, 1.7987060546875, 1.97174072265625, 2.144775390625, 2.31781005859375, 2.4908447265625, 2.66387939453125, 2.8369140625, 3.00994873046875, 3.1829833984375, 3.35601806640625, 3.529052734375, 3.70208740234375, 3.8751220703125, 4.04815673828125, 4.22119140625, 4.39422607421875, 4.5672607421875, 4.74029541015625, 4.913330078125, 5.08636474609375, 5.2593994140625, 5.43243408203125, 5.60546875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 22.0, 58.0, 124.0, 217.0, 232.0, 187.0, 108.0, 40.0, 7.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0], "bins": [-147.81956481933594, -144.994873046875, -142.17018127441406, -139.34548950195312, -136.5207977294922, -133.69610595703125, -130.8714141845703, -128.04672241210938, -125.22203063964844, -122.3973388671875, -119.57264709472656, -116.74795532226562, -113.92326354980469, -111.09857177734375, -108.27388000488281, -105.44918823242188, -102.62449645996094, -99.7998046875, -96.97511291503906, -94.15042114257812, -91.32572937011719, -88.50103759765625, -85.67634582519531, -82.85165405273438, -80.02696228027344, -77.2022705078125, -74.37757873535156, -71.55288696289062, -68.72819519042969, -65.90350341796875, -63.07881164550781, -60.254119873046875, -57.42943572998047, -54.60474395751953, -51.780052185058594, -48.955360412597656, -46.13066864013672, -43.30597686767578, -40.481285095214844, -37.656593322753906, -34.83190155029297, -32.00720977783203, -29.182518005371094, -26.357826232910156, -23.53313446044922, -20.70844268798828, -17.883750915527344, -15.059059143066406, -12.234367370605469, -9.409675598144531, -6.584983825683594, -3.7602920532226562, -0.9356002807617188, 1.8890914916992188, 4.713783264160156, 7.538475036621094, 10.363166809082031, 13.187858581542969, 16.012550354003906, 18.837242126464844, 21.66193389892578, 24.48662567138672, 27.311317443847656, 30.136009216308594, 32.96070098876953]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 4.0, 9.0, 5.0, 7.0, 7.0, 11.0, 13.0, 9.0, 15.0, 21.0, 23.0, 31.0, 25.0, 34.0, 26.0, 38.0, 35.0, 45.0, 38.0, 52.0, 36.0, 41.0, 43.0, 57.0, 35.0, 36.0, 36.0, 36.0, 33.0, 27.0, 21.0, 23.0, 25.0, 14.0, 18.0, 18.0, 8.0, 10.0, 6.0, 6.0, 11.0, 4.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.94471740722656, -43.548954010009766, -42.15319061279297, -40.75742721557617, -39.361663818359375, -37.96589660644531, -36.570133209228516, -35.17436981201172, -33.77860641479492, -32.382843017578125, -30.987079620361328, -29.5913143157959, -28.1955509185791, -26.799787521362305, -25.404022216796875, -24.008258819580078, -22.61249542236328, -21.216732025146484, -19.820968627929688, -18.425203323364258, -17.02943992614746, -15.633676528930664, -14.23791217803955, -12.842147827148438, -11.44638442993164, -10.050621032714844, -8.65485668182373, -7.259092807769775, -5.86332893371582, -4.467565059661865, -3.07180118560791, -1.6760368347167969, -0.2802734375, 1.115490436553955, 2.51125431060791, 3.9070181846618652, 5.30278205871582, 6.698545932769775, 8.09430980682373, 9.490074157714844, 10.88583755493164, 12.281600952148438, 13.67736530303955, 15.073129653930664, 16.46889305114746, 17.864656448364258, 19.260421752929688, 20.656185150146484, 22.05194854736328, 23.447711944580078, 24.843475341796875, 26.239240646362305, 27.6350040435791, 29.0307674407959, 30.426532745361328, 31.822296142578125, 33.21805953979492, 34.61382293701172, 36.009586334228516, 37.40534973144531, 38.801116943359375, 40.19688034057617, 41.59264373779297, 42.988407135009766, 44.38417053222656]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 4.0, 2.0, 9.0, 8.0, 11.0, 13.0, 21.0, 28.0, 45.0, 44.0, 55.0, 93.0, 118.0, 177.0, 266.0, 419.0, 731.0, 1276.0, 2641.0, 5791.0, 17473.0, 92045.0, 3943217.0, 99487.0, 18294.0, 5950.0, 2601.0, 1386.0, 740.0, 425.0, 275.0, 188.0, 129.0, 80.0, 54.0, 35.0, 39.0, 23.0, 21.0, 17.0, 14.0, 6.0, 9.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.390625, -7.1484375, -6.90625, -6.6640625, -6.421875, -6.1796875, -5.9375, -5.6953125, -5.453125, -5.2109375, -4.96875, -4.7265625, -4.484375, -4.2421875, -4.0, -3.7578125, -3.515625, -3.2734375, -3.03125, -2.7890625, -2.546875, -2.3046875, -2.0625, -1.8203125, -1.578125, -1.3359375, -1.09375, -0.8515625, -0.609375, -0.3671875, -0.125, 0.1171875, 0.359375, 0.6015625, 0.84375, 1.0859375, 1.328125, 1.5703125, 1.8125, 2.0546875, 2.296875, 2.5390625, 2.78125, 3.0234375, 3.265625, 3.5078125, 3.75, 3.9921875, 4.234375, 4.4765625, 4.71875, 4.9609375, 5.203125, 5.4453125, 5.6875, 5.9296875, 6.171875, 6.4140625, 6.65625, 6.8984375, 7.140625, 7.3828125, 7.625, 7.8671875, 8.109375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 7.0, 7.0, 6.0, 2.0, 6.0, 17.0, 11.0, 18.0, 35.0, 28.0, 41.0, 34.0, 37.0, 36.0, 42.0, 53.0, 56.0, 59.0, 60.0, 54.0, 51.0, 44.0, 60.0, 33.0, 33.0, 31.0, 34.0, 25.0, 24.0, 8.0, 10.0, 6.0, 9.0, 5.0, 5.0, 4.0, 1.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.0, -2.918975830078125, -2.83795166015625, -2.756927490234375, -2.6759033203125, -2.594879150390625, -2.51385498046875, -2.432830810546875, -2.351806640625, -2.270782470703125, -2.18975830078125, -2.108734130859375, -2.0277099609375, -1.946685791015625, -1.86566162109375, -1.784637451171875, -1.70361328125, -1.622589111328125, -1.54156494140625, -1.460540771484375, -1.3795166015625, -1.298492431640625, -1.21746826171875, -1.136444091796875, -1.055419921875, -0.974395751953125, -0.89337158203125, -0.812347412109375, -0.7313232421875, -0.650299072265625, -0.56927490234375, -0.488250732421875, -0.4072265625, -0.326202392578125, -0.24517822265625, -0.164154052734375, -0.0831298828125, -0.002105712890625, 0.07891845703125, 0.159942626953125, 0.240966796875, 0.321990966796875, 0.40301513671875, 0.484039306640625, 0.5650634765625, 0.646087646484375, 0.72711181640625, 0.808135986328125, 0.88916015625, 0.970184326171875, 1.05120849609375, 1.132232666015625, 1.2132568359375, 1.294281005859375, 1.37530517578125, 1.456329345703125, 1.537353515625, 1.618377685546875, 1.69940185546875, 1.780426025390625, 1.8614501953125, 1.942474365234375, 2.02349853515625, 2.104522705078125, 2.185546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 8.0, 5.0, 12.0, 11.0, 21.0, 27.0, 50.0, 54.0, 66.0, 109.0, 192.0, 273.0, 507.0, 903.0, 1647.0, 3254.0, 6813.0, 16078.0, 49746.0, 305705.0, 3661342.0, 101555.0, 26196.0, 10059.0, 4478.0, 2289.0, 1216.0, 668.0, 398.0, 198.0, 140.0, 79.0, 59.0, 40.0, 22.0, 21.0, 9.0, 12.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.09765625, -3.974365234375, -3.85107421875, -3.727783203125, -3.6044921875, -3.481201171875, -3.35791015625, -3.234619140625, -3.111328125, -2.988037109375, -2.86474609375, -2.741455078125, -2.6181640625, -2.494873046875, -2.37158203125, -2.248291015625, -2.125, -2.001708984375, -1.87841796875, -1.755126953125, -1.6318359375, -1.508544921875, -1.38525390625, -1.261962890625, -1.138671875, -1.015380859375, -0.89208984375, -0.768798828125, -0.6455078125, -0.522216796875, -0.39892578125, -0.275634765625, -0.15234375, -0.029052734375, 0.09423828125, 0.217529296875, 0.3408203125, 0.464111328125, 0.58740234375, 0.710693359375, 0.833984375, 0.957275390625, 1.08056640625, 1.203857421875, 1.3271484375, 1.450439453125, 1.57373046875, 1.697021484375, 1.8203125, 1.943603515625, 2.06689453125, 2.190185546875, 2.3134765625, 2.436767578125, 2.56005859375, 2.683349609375, 2.806640625, 2.929931640625, 3.05322265625, 3.176513671875, 3.2998046875, 3.423095703125, 3.54638671875, 3.669677734375, 3.79296875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 8.0, 10.0, 22.0, 30.0, 40.0, 108.0, 235.0, 3064.0, 281.0, 107.0, 56.0, 34.0, 21.0, 17.0, 9.0, 8.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.8779296875, -1.8384552001953125, -1.798980712890625, -1.7595062255859375, -1.72003173828125, -1.6805572509765625, -1.641082763671875, -1.6016082763671875, -1.5621337890625, -1.5226593017578125, -1.483184814453125, -1.4437103271484375, -1.40423583984375, -1.3647613525390625, -1.325286865234375, -1.2858123779296875, -1.246337890625, -1.2068634033203125, -1.167388916015625, -1.1279144287109375, -1.08843994140625, -1.0489654541015625, -1.009490966796875, -0.9700164794921875, -0.9305419921875, -0.8910675048828125, -0.851593017578125, -0.8121185302734375, -0.77264404296875, -0.7331695556640625, -0.693695068359375, -0.6542205810546875, -0.61474609375, -0.5752716064453125, -0.535797119140625, -0.4963226318359375, -0.45684814453125, -0.4173736572265625, -0.377899169921875, -0.3384246826171875, -0.2989501953125, -0.2594757080078125, -0.220001220703125, -0.1805267333984375, -0.14105224609375, -0.1015777587890625, -0.062103271484375, -0.0226287841796875, 0.016845703125, 0.0563201904296875, 0.095794677734375, 0.1352691650390625, 0.17474365234375, 0.2142181396484375, 0.253692626953125, 0.2931671142578125, 0.3326416015625, 0.3721160888671875, 0.411590576171875, 0.4510650634765625, 0.49053955078125, 0.5300140380859375, 0.569488525390625, 0.6089630126953125, 0.6484375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 8.0, 20.0, 14.0, 39.0, 58.0, 94.0, 120.0, 130.0, 128.0, 134.0, 91.0, 61.0, 39.0, 17.0, 22.0, 4.0, 8.0, 5.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.845813751220703, -3.7018120288848877, -3.557810068130493, -3.4138083457946777, -3.269806385040283, -3.1258046627044678, -2.9818029403686523, -2.837800979614258, -2.6937992572784424, -2.549797534942627, -2.4057955741882324, -2.261793851852417, -2.1177921295166016, -1.973790168762207, -1.8297884464263916, -1.6857866048812866, -1.5417847633361816, -1.3977829217910767, -1.2537810802459717, -1.1097793579101562, -0.9657775163650513, -0.8217756748199463, -0.6777738928794861, -0.5337721109390259, -0.3897702693939209, -0.2457684576511383, -0.10176664590835571, 0.04223516583442688, 0.18623697757720947, 0.33023881912231445, 0.47424060106277466, 0.6182423830032349, 0.7622442245483398, 0.9062460660934448, 1.0502479076385498, 1.1942496299743652, 1.3382514715194702, 1.4822533130645752, 1.6262550354003906, 1.7702568769454956, 1.9142587184906006, 2.058260440826416, 2.2022624015808105, 2.346264123916626, 2.4902658462524414, 2.634267807006836, 2.7782695293426514, 2.922271251678467, 3.0662732124328613, 3.2102749347686768, 3.3542768955230713, 3.4982786178588867, 3.6422805786132812, 3.7862823009490967, 3.930284023284912, 4.074285984039307, 4.218287467956543, 4.3622894287109375, 4.506290912628174, 4.650292873382568, 4.794294834136963, 4.938296318054199, 5.082298278808594, 5.226300239562988, 5.370302200317383]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 4.0, 6.0, 1.0, 8.0, 11.0, 8.0, 7.0, 17.0, 19.0, 24.0, 25.0, 20.0, 33.0, 32.0, 43.0, 47.0, 33.0, 44.0, 36.0, 49.0, 47.0, 51.0, 40.0, 39.0, 47.0, 41.0, 36.0, 38.0, 29.0, 31.0, 24.0, 21.0, 12.0, 14.0, 14.0, 13.0, 5.0, 10.0, 6.0, 8.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.6375346183776855, -2.5584826469421387, -2.4794304370880127, -2.4003782272338867, -2.32132625579834, -2.242274284362793, -2.163222074508667, -2.084169864654541, -2.005117893218994, -1.9260658025741577, -1.8470137119293213, -1.7679616212844849, -1.6889095306396484, -1.609857439994812, -1.5308053493499756, -1.4517532587051392, -1.3727011680603027, -1.2936490774154663, -1.2145969867706299, -1.1355448961257935, -1.056492805480957, -0.9774407148361206, -0.8983886241912842, -0.8193365335464478, -0.7402844429016113, -0.6612323522567749, -0.5821802616119385, -0.503128170967102, -0.4240760803222656, -0.3450239896774292, -0.2659718990325928, -0.18691980838775635, -0.10786747932434082, -0.028815388679504395, 0.05023670196533203, 0.12928879261016846, 0.20834088325500488, 0.2873929738998413, 0.36644506454467773, 0.44549715518951416, 0.5245492458343506, 0.603601336479187, 0.6826534271240234, 0.7617055177688599, 0.8407576084136963, 0.9198096990585327, 0.9988617897033691, 1.0779138803482056, 1.156965970993042, 1.2360180616378784, 1.3150701522827148, 1.3941222429275513, 1.4731743335723877, 1.5522264242172241, 1.6312785148620605, 1.710330605506897, 1.7893826961517334, 1.8684347867965698, 1.9474868774414062, 2.026538848876953, 2.105591058731079, 2.184643268585205, 2.263695240020752, 2.342747211456299, 2.421799421310425]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 10.0, 14.0, 18.0, 33.0, 42.0, 55.0, 79.0, 164.0, 268.0, 634.0, 1458.0, 4320.0, 14443.0, 55106.0, 219287.0, 468621.0, 210389.0, 52751.0, 13920.0, 4168.0, 1493.0, 636.0, 260.0, 141.0, 80.0, 41.0, 28.0, 21.0, 14.0, 14.0, 9.0, 6.0, 4.0, 5.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-7.35546875, -7.15924072265625, -6.9630126953125, -6.76678466796875, -6.570556640625, -6.37432861328125, -6.1781005859375, -5.98187255859375, -5.78564453125, -5.58941650390625, -5.3931884765625, -5.19696044921875, -5.000732421875, -4.80450439453125, -4.6082763671875, -4.41204833984375, -4.2158203125, -4.01959228515625, -3.8233642578125, -3.62713623046875, -3.430908203125, -3.23468017578125, -3.0384521484375, -2.84222412109375, -2.64599609375, -2.44976806640625, -2.2535400390625, -2.05731201171875, -1.861083984375, -1.66485595703125, -1.4686279296875, -1.27239990234375, -1.076171875, -0.87994384765625, -0.6837158203125, -0.48748779296875, -0.291259765625, -0.09503173828125, 0.1011962890625, 0.29742431640625, 0.49365234375, 0.68988037109375, 0.8861083984375, 1.08233642578125, 1.278564453125, 1.47479248046875, 1.6710205078125, 1.86724853515625, 2.0634765625, 2.25970458984375, 2.4559326171875, 2.65216064453125, 2.848388671875, 3.04461669921875, 3.2408447265625, 3.43707275390625, 3.63330078125, 3.82952880859375, 4.0257568359375, 4.22198486328125, 4.418212890625, 4.61444091796875, 4.8106689453125, 5.00689697265625, 5.203125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 7.0, 4.0, 4.0, 7.0, 15.0, 15.0, 14.0, 22.0, 30.0, 26.0, 36.0, 36.0, 46.0, 37.0, 41.0, 54.0, 59.0, 59.0, 46.0, 44.0, 62.0, 53.0, 40.0, 46.0, 27.0, 27.0, 28.0, 31.0, 21.0, 5.0, 11.0, 12.0, 8.0, 7.0, 4.0, 4.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-2.998046875, -2.91888427734375, -2.8397216796875, -2.76055908203125, -2.681396484375, -2.60223388671875, -2.5230712890625, -2.44390869140625, -2.36474609375, -2.28558349609375, -2.2064208984375, -2.12725830078125, -2.048095703125, -1.96893310546875, -1.8897705078125, -1.81060791015625, -1.7314453125, -1.65228271484375, -1.5731201171875, -1.49395751953125, -1.414794921875, -1.33563232421875, -1.2564697265625, -1.17730712890625, -1.09814453125, -1.01898193359375, -0.9398193359375, -0.86065673828125, -0.781494140625, -0.70233154296875, -0.6231689453125, -0.54400634765625, -0.46484375, -0.38568115234375, -0.3065185546875, -0.22735595703125, -0.148193359375, -0.06903076171875, 0.0101318359375, 0.08929443359375, 0.16845703125, 0.24761962890625, 0.3267822265625, 0.40594482421875, 0.485107421875, 0.56427001953125, 0.6434326171875, 0.72259521484375, 0.8017578125, 0.88092041015625, 0.9600830078125, 1.03924560546875, 1.118408203125, 1.19757080078125, 1.2767333984375, 1.35589599609375, 1.43505859375, 1.51422119140625, 1.5933837890625, 1.67254638671875, 1.751708984375, 1.83087158203125, 1.9100341796875, 1.98919677734375, 2.068359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 5.0, 5.0, 9.0, 12.0, 9.0, 20.0, 36.0, 43.0, 82.0, 137.0, 199.0, 414.0, 867.0, 2200.0, 7289.0, 48961.0, 605946.0, 345923.0, 27958.0, 5245.0, 1620.0, 736.0, 320.0, 183.0, 105.0, 67.0, 57.0, 38.0, 22.0, 13.0, 7.0, 7.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9375, -10.5943603515625, -10.251220703125, -9.9080810546875, -9.56494140625, -9.2218017578125, -8.878662109375, -8.5355224609375, -8.1923828125, -7.8492431640625, -7.506103515625, -7.1629638671875, -6.81982421875, -6.4766845703125, -6.133544921875, -5.7904052734375, -5.447265625, -5.1041259765625, -4.760986328125, -4.4178466796875, -4.07470703125, -3.7315673828125, -3.388427734375, -3.0452880859375, -2.7021484375, -2.3590087890625, -2.015869140625, -1.6727294921875, -1.32958984375, -0.9864501953125, -0.643310546875, -0.3001708984375, 0.04296875, 0.3861083984375, 0.729248046875, 1.0723876953125, 1.41552734375, 1.7586669921875, 2.101806640625, 2.4449462890625, 2.7880859375, 3.1312255859375, 3.474365234375, 3.8175048828125, 4.16064453125, 4.5037841796875, 4.846923828125, 5.1900634765625, 5.533203125, 5.8763427734375, 6.219482421875, 6.5626220703125, 6.90576171875, 7.2489013671875, 7.592041015625, 7.9351806640625, 8.2783203125, 8.6214599609375, 8.964599609375, 9.3077392578125, 9.65087890625, 9.9940185546875, 10.337158203125, 10.6802978515625, 11.0234375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 6.0, 4.0, 13.0, 5.0, 8.0, 12.0, 16.0, 15.0, 26.0, 31.0, 29.0, 31.0, 30.0, 46.0, 43.0, 48.0, 58.0, 64.0, 52.0, 52.0, 53.0, 49.0, 42.0, 36.0, 34.0, 42.0, 21.0, 20.0, 25.0, 12.0, 17.0, 12.0, 13.0, 8.0, 8.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-14.09375, -13.654296875, -13.21484375, -12.775390625, -12.3359375, -11.896484375, -11.45703125, -11.017578125, -10.578125, -10.138671875, -9.69921875, -9.259765625, -8.8203125, -8.380859375, -7.94140625, -7.501953125, -7.0625, -6.623046875, -6.18359375, -5.744140625, -5.3046875, -4.865234375, -4.42578125, -3.986328125, -3.546875, -3.107421875, -2.66796875, -2.228515625, -1.7890625, -1.349609375, -0.91015625, -0.470703125, -0.03125, 0.408203125, 0.84765625, 1.287109375, 1.7265625, 2.166015625, 2.60546875, 3.044921875, 3.484375, 3.923828125, 4.36328125, 4.802734375, 5.2421875, 5.681640625, 6.12109375, 6.560546875, 7.0, 7.439453125, 7.87890625, 8.318359375, 8.7578125, 9.197265625, 9.63671875, 10.076171875, 10.515625, 10.955078125, 11.39453125, 11.833984375, 12.2734375, 12.712890625, 13.15234375, 13.591796875, 14.03125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 7.0, 8.0, 9.0, 15.0, 18.0, 21.0, 38.0, 48.0, 59.0, 81.0, 120.0, 180.0, 349.0, 665.0, 1606.0, 5287.0, 24926.0, 165622.0, 629542.0, 183385.0, 27410.0, 5753.0, 1721.0, 684.0, 350.0, 206.0, 106.0, 81.0, 58.0, 40.0, 33.0, 21.0, 23.0, 23.0, 11.0, 6.0, 6.0, 7.0, 2.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.203125, -3.1103515625, -3.017578125, -2.9248046875, -2.83203125, -2.7392578125, -2.646484375, -2.5537109375, -2.4609375, -2.3681640625, -2.275390625, -2.1826171875, -2.08984375, -1.9970703125, -1.904296875, -1.8115234375, -1.71875, -1.6259765625, -1.533203125, -1.4404296875, -1.34765625, -1.2548828125, -1.162109375, -1.0693359375, -0.9765625, -0.8837890625, -0.791015625, -0.6982421875, -0.60546875, -0.5126953125, -0.419921875, -0.3271484375, -0.234375, -0.1416015625, -0.048828125, 0.0439453125, 0.13671875, 0.2294921875, 0.322265625, 0.4150390625, 0.5078125, 0.6005859375, 0.693359375, 0.7861328125, 0.87890625, 0.9716796875, 1.064453125, 1.1572265625, 1.25, 1.3427734375, 1.435546875, 1.5283203125, 1.62109375, 1.7138671875, 1.806640625, 1.8994140625, 1.9921875, 2.0849609375, 2.177734375, 2.2705078125, 2.36328125, 2.4560546875, 2.548828125, 2.6416015625, 2.734375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 6.0, 16.0, 15.0, 25.0, 28.0, 23.0, 46.0, 69.0, 85.0, 90.0, 101.0, 89.0, 90.0, 68.0, 60.0, 51.0, 39.0, 21.0, 13.0, 14.0, 14.0, 4.0, 4.0, 9.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002703666687011719, -0.00025942176580429077, -0.00024847686290740967, -0.00023753196001052856, -0.00022658705711364746, -0.00021564215421676636, -0.00020469725131988525, -0.00019375234842300415, -0.00018280744552612305, -0.00017186254262924194, -0.00016091763973236084, -0.00014997273683547974, -0.00013902783393859863, -0.00012808293104171753, -0.00011713802814483643, -0.00010619312524795532, -9.524822235107422e-05, -8.430331945419312e-05, -7.335841655731201e-05, -6.241351366043091e-05, -5.1468610763549805e-05, -4.05237078666687e-05, -2.9578804969787598e-05, -1.8633902072906494e-05, -7.68899917602539e-06, 3.255903720855713e-06, 1.4200806617736816e-05, 2.514570951461792e-05, 3.6090612411499023e-05, 4.703551530838013e-05, 5.798041820526123e-05, 6.892532110214233e-05, 7.987022399902344e-05, 9.081512689590454e-05, 0.00010176002979278564, 0.00011270493268966675, 0.00012364983558654785, 0.00013459473848342896, 0.00014553964138031006, 0.00015648454427719116, 0.00016742944717407227, 0.00017837435007095337, 0.00018931925296783447, 0.00020026415586471558, 0.00021120905876159668, 0.00022215396165847778, 0.0002330988645553589, 0.00024404376745224, 0.0002549886703491211, 0.0002659335732460022, 0.0002768784761428833, 0.0002878233790397644, 0.0002987682819366455, 0.0003097131848335266, 0.0003206580877304077, 0.0003316029906272888, 0.0003425478935241699, 0.000353492796421051, 0.00036443769931793213, 0.00037538260221481323, 0.00038632750511169434, 0.00039727240800857544, 0.00040821731090545654, 0.00041916221380233765, 0.00043010711669921875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 9.0, 5.0, 16.0, 15.0, 28.0, 40.0, 63.0, 149.0, 252.0, 459.0, 949.0, 2630.0, 11201.0, 141428.0, 785095.0, 93544.0, 8565.0, 2336.0, 896.0, 404.0, 186.0, 123.0, 50.0, 34.0, 9.0, 21.0, 14.0, 4.0, 5.0, 3.0, 5.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.666015625, -3.527313232421875, -3.38861083984375, -3.249908447265625, -3.1112060546875, -2.972503662109375, -2.83380126953125, -2.695098876953125, -2.556396484375, -2.417694091796875, -2.27899169921875, -2.140289306640625, -2.0015869140625, -1.862884521484375, -1.72418212890625, -1.585479736328125, -1.44677734375, -1.308074951171875, -1.16937255859375, -1.030670166015625, -0.8919677734375, -0.753265380859375, -0.61456298828125, -0.475860595703125, -0.337158203125, -0.198455810546875, -0.05975341796875, 0.078948974609375, 0.2176513671875, 0.356353759765625, 0.49505615234375, 0.633758544921875, 0.7724609375, 0.911163330078125, 1.04986572265625, 1.188568115234375, 1.3272705078125, 1.465972900390625, 1.60467529296875, 1.743377685546875, 1.882080078125, 2.020782470703125, 2.15948486328125, 2.298187255859375, 2.4368896484375, 2.575592041015625, 2.71429443359375, 2.852996826171875, 2.99169921875, 3.130401611328125, 3.26910400390625, 3.407806396484375, 3.5465087890625, 3.685211181640625, 3.82391357421875, 3.962615966796875, 4.101318359375, 4.240020751953125, 4.37872314453125, 4.517425537109375, 4.6561279296875, 4.794830322265625, 4.93353271484375, 5.072235107421875, 5.2109375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 8.0, 11.0, 17.0, 49.0, 76.0, 129.0, 169.0, 190.0, 153.0, 83.0, 43.0, 28.0, 15.0, 20.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.6171875, -9.371826171875, -9.12646484375, -8.881103515625, -8.6357421875, -8.390380859375, -8.14501953125, -7.899658203125, -7.654296875, -7.408935546875, -7.16357421875, -6.918212890625, -6.6728515625, -6.427490234375, -6.18212890625, -5.936767578125, -5.69140625, -5.446044921875, -5.20068359375, -4.955322265625, -4.7099609375, -4.464599609375, -4.21923828125, -3.973876953125, -3.728515625, -3.483154296875, -3.23779296875, -2.992431640625, -2.7470703125, -2.501708984375, -2.25634765625, -2.010986328125, -1.765625, -1.520263671875, -1.27490234375, -1.029541015625, -0.7841796875, -0.538818359375, -0.29345703125, -0.048095703125, 0.197265625, 0.442626953125, 0.68798828125, 0.933349609375, 1.1787109375, 1.424072265625, 1.66943359375, 1.914794921875, 2.16015625, 2.405517578125, 2.65087890625, 2.896240234375, 3.1416015625, 3.386962890625, 3.63232421875, 3.877685546875, 4.123046875, 4.368408203125, 4.61376953125, 4.859130859375, 5.1044921875, 5.349853515625, 5.59521484375, 5.840576171875, 6.0859375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 9.0, 5.0, 14.0, 16.0, 32.0, 67.0, 92.0, 138.0, 161.0, 150.0, 103.0, 86.0, 42.0, 31.0, 26.0, 11.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.989959716796875, -31.4179630279541, -29.845964431762695, -28.273967742919922, -26.701969146728516, -25.129972457885742, -23.55797576904297, -21.985977172851562, -20.41398048400879, -18.841983795166016, -17.26998519897461, -15.697988510131836, -14.125990867614746, -12.553993225097656, -10.981996536254883, -9.409998893737793, -7.838001251220703, -6.266003608703613, -4.694006443023682, -3.12200927734375, -1.5500116348266602, 0.021986007690429688, 1.5939826965332031, 3.165980339050293, 4.737977981567383, 6.309975624084473, 7.881972789764404, 9.453969955444336, 11.025967597961426, 12.597965240478516, 14.169961929321289, 15.741959571838379, 17.31395721435547, 18.885953903198242, 20.45795249938965, 22.029949188232422, 23.601947784423828, 25.1739444732666, 26.745941162109375, 28.31793975830078, 29.889936447143555, 31.461933135986328, 33.033931732177734, 34.605926513671875, 36.17792510986328, 37.74992370605469, 39.321922302246094, 40.893917083740234, 42.46591567993164, 44.03791427612305, 45.60990905761719, 47.181907653808594, 48.75390625, 50.325904846191406, 51.89789962768555, 53.46989822387695, 55.041893005371094, 56.6138916015625, 58.18588638305664, 59.75788497924805, 61.32988357543945, 62.901878356933594, 64.473876953125, 66.0458755493164, 67.61787414550781]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 7.0, 2.0, 6.0, 9.0, 6.0, 7.0, 8.0, 18.0, 11.0, 13.0, 12.0, 10.0, 21.0, 18.0, 21.0, 26.0, 38.0, 45.0, 32.0, 36.0, 39.0, 39.0, 49.0, 37.0, 42.0, 38.0, 33.0, 42.0, 36.0, 44.0, 30.0, 34.0, 24.0, 23.0, 20.0, 20.0, 16.0, 11.0, 17.0, 11.0, 10.0, 11.0, 10.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-45.91868591308594, -44.43265151977539, -42.946617126464844, -41.46058654785156, -39.974552154541016, -38.48851776123047, -37.00248718261719, -35.51645278930664, -34.030418395996094, -32.54438400268555, -31.058351516723633, -29.57231903076172, -28.086284637451172, -26.600250244140625, -25.11421775817871, -23.628185272216797, -22.14215087890625, -20.656116485595703, -19.17008399963379, -17.684051513671875, -16.198017120361328, -14.711983680725098, -13.225950241088867, -11.739916801452637, -10.253883361816406, -8.767849922180176, -7.281816482543945, -5.795783042907715, -4.309749603271484, -2.823716163635254, -1.3376827239990234, 0.14835071563720703, 1.6343803405761719, 3.1204137802124023, 4.606447219848633, 6.092480659484863, 7.578514099121094, 9.064547538757324, 10.550580978393555, 12.036614418029785, 13.522647857666016, 15.008681297302246, 16.494714736938477, 17.98074722290039, 19.466781616210938, 20.952816009521484, 22.4388484954834, 23.924880981445312, 25.41091537475586, 26.896949768066406, 28.38298225402832, 29.869014739990234, 31.35504913330078, 32.84108352661133, 34.327117919921875, 35.813148498535156, 37.2991828918457, 38.78521728515625, 40.27124786376953, 41.75728225708008, 43.243316650390625, 44.72935104370117, 46.21538543701172, 47.701416015625, 49.18745040893555]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 7.0, 7.0, 14.0, 24.0, 27.0, 37.0, 60.0, 112.0, 195.0, 306.0, 652.0, 1332.0, 2945.0, 7839.0, 30780.0, 385302.0, 3705001.0, 43134.0, 9861.0, 3551.0, 1552.0, 659.0, 363.0, 215.0, 99.0, 65.0, 43.0, 27.0, 20.0, 11.0, 10.0, 11.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2578125, -6.0687255859375, -5.879638671875, -5.6905517578125, -5.50146484375, -5.3123779296875, -5.123291015625, -4.9342041015625, -4.7451171875, -4.5560302734375, -4.366943359375, -4.1778564453125, -3.98876953125, -3.7996826171875, -3.610595703125, -3.4215087890625, -3.232421875, -3.0433349609375, -2.854248046875, -2.6651611328125, -2.47607421875, -2.2869873046875, -2.097900390625, -1.9088134765625, -1.7197265625, -1.5306396484375, -1.341552734375, -1.1524658203125, -0.96337890625, -0.7742919921875, -0.585205078125, -0.3961181640625, -0.20703125, -0.0179443359375, 0.171142578125, 0.3602294921875, 0.54931640625, 0.7384033203125, 0.927490234375, 1.1165771484375, 1.3056640625, 1.4947509765625, 1.683837890625, 1.8729248046875, 2.06201171875, 2.2510986328125, 2.440185546875, 2.6292724609375, 2.818359375, 3.0074462890625, 3.196533203125, 3.3856201171875, 3.57470703125, 3.7637939453125, 3.952880859375, 4.1419677734375, 4.3310546875, 4.5201416015625, 4.709228515625, 4.8983154296875, 5.08740234375, 5.2764892578125, 5.465576171875, 5.6546630859375, 5.84375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 6.0, 5.0, 3.0, 9.0, 8.0, 14.0, 22.0, 21.0, 29.0, 32.0, 26.0, 23.0, 35.0, 44.0, 53.0, 57.0, 54.0, 69.0, 61.0, 60.0, 64.0, 36.0, 38.0, 37.0, 43.0, 26.0, 25.0, 23.0, 11.0, 11.0, 14.0, 10.0, 9.0, 3.0, 5.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.171875, -3.085235595703125, -2.99859619140625, -2.911956787109375, -2.8253173828125, -2.738677978515625, -2.65203857421875, -2.565399169921875, -2.478759765625, -2.392120361328125, -2.30548095703125, -2.218841552734375, -2.1322021484375, -2.045562744140625, -1.95892333984375, -1.872283935546875, -1.78564453125, -1.699005126953125, -1.61236572265625, -1.525726318359375, -1.4390869140625, -1.352447509765625, -1.26580810546875, -1.179168701171875, -1.092529296875, -1.005889892578125, -0.91925048828125, -0.832611083984375, -0.7459716796875, -0.659332275390625, -0.57269287109375, -0.486053466796875, -0.3994140625, -0.312774658203125, -0.22613525390625, -0.139495849609375, -0.0528564453125, 0.033782958984375, 0.12042236328125, 0.207061767578125, 0.293701171875, 0.380340576171875, 0.46697998046875, 0.553619384765625, 0.6402587890625, 0.726898193359375, 0.81353759765625, 0.900177001953125, 0.98681640625, 1.073455810546875, 1.16009521484375, 1.246734619140625, 1.3333740234375, 1.420013427734375, 1.50665283203125, 1.593292236328125, 1.679931640625, 1.766571044921875, 1.85321044921875, 1.939849853515625, 2.0264892578125, 2.113128662109375, 2.19976806640625, 2.286407470703125, 2.373046875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 9.0, 14.0, 20.0, 12.0, 19.0, 21.0, 37.0, 43.0, 77.0, 104.0, 195.0, 317.0, 817.0, 2102.0, 7285.0, 38039.0, 3236004.0, 862334.0, 36022.0, 6959.0, 2038.0, 841.0, 362.0, 195.0, 111.0, 72.0, 68.0, 35.0, 37.0, 25.0, 19.0, 16.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.66015625, -6.48931884765625, -6.3184814453125, -6.14764404296875, -5.976806640625, -5.80596923828125, -5.6351318359375, -5.46429443359375, -5.29345703125, -5.12261962890625, -4.9517822265625, -4.78094482421875, -4.610107421875, -4.43927001953125, -4.2684326171875, -4.09759521484375, -3.9267578125, -3.75592041015625, -3.5850830078125, -3.41424560546875, -3.243408203125, -3.07257080078125, -2.9017333984375, -2.73089599609375, -2.56005859375, -2.38922119140625, -2.2183837890625, -2.04754638671875, -1.876708984375, -1.70587158203125, -1.5350341796875, -1.36419677734375, -1.193359375, -1.02252197265625, -0.8516845703125, -0.68084716796875, -0.510009765625, -0.33917236328125, -0.1683349609375, 0.00250244140625, 0.17333984375, 0.34417724609375, 0.5150146484375, 0.68585205078125, 0.856689453125, 1.02752685546875, 1.1983642578125, 1.36920166015625, 1.5400390625, 1.71087646484375, 1.8817138671875, 2.05255126953125, 2.223388671875, 2.39422607421875, 2.5650634765625, 2.73590087890625, 2.90673828125, 3.07757568359375, 3.2484130859375, 3.41925048828125, 3.590087890625, 3.76092529296875, 3.9317626953125, 4.10260009765625, 4.2734375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 12.0, 23.0, 44.0, 84.0, 295.0, 3176.0, 265.0, 85.0, 41.0, 19.0, 14.0, 10.0, 3.0, 7.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.03515625, -2.9761276245117188, -2.9170989990234375, -2.8580703735351562, -2.799041748046875, -2.7400131225585938, -2.6809844970703125, -2.6219558715820312, -2.56292724609375, -2.5038986206054688, -2.4448699951171875, -2.3858413696289062, -2.326812744140625, -2.2677841186523438, -2.2087554931640625, -2.1497268676757812, -2.0906982421875, -2.0316696166992188, -1.9726409912109375, -1.9136123657226562, -1.854583740234375, -1.7955551147460938, -1.7365264892578125, -1.6774978637695312, -1.61846923828125, -1.5594406127929688, -1.5004119873046875, -1.4413833618164062, -1.382354736328125, -1.3233261108398438, -1.2642974853515625, -1.2052688598632812, -1.146240234375, -1.0872116088867188, -1.0281829833984375, -0.9691543579101562, -0.910125732421875, -0.8510971069335938, -0.7920684814453125, -0.7330398559570312, -0.67401123046875, -0.6149826049804688, -0.5559539794921875, -0.49692535400390625, -0.437896728515625, -0.37886810302734375, -0.3198394775390625, -0.26081085205078125, -0.2017822265625, -0.14275360107421875, -0.0837249755859375, -0.02469635009765625, 0.034332275390625, 0.09336090087890625, 0.1523895263671875, 0.21141815185546875, 0.27044677734375, 0.32947540283203125, 0.3885040283203125, 0.44753265380859375, 0.506561279296875, 0.5655899047851562, 0.6246185302734375, 0.6836471557617188, 0.74267578125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 11.0, 32.0, 68.0, 129.0, 181.0, 208.0, 137.0, 101.0, 63.0, 31.0, 12.0, 7.0, 8.0, 3.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.283803939819336, -5.0614471435546875, -4.839089870452881, -4.616733074188232, -4.394375801086426, -4.172019004821777, -3.94966197013855, -3.7273049354553223, -3.5049479007720947, -3.282590866088867, -3.0602338314056396, -2.837876796722412, -2.6155200004577637, -2.393162727355957, -2.1708059310913086, -1.948448896408081, -1.7260918617248535, -1.503734827041626, -1.2813777923583984, -1.0590208768844604, -0.8366638422012329, -0.6143068075180054, -0.3919498920440674, -0.16959285736083984, 0.052764177322387695, 0.27512118220329285, 0.497478187084198, 0.7198351621627808, 0.9421921968460083, 1.1645492315292358, 1.3869061470031738, 1.6092631816864014, 1.831620216369629, 2.0539772510528564, 2.276334285736084, 2.4986910820007324, 2.721048355102539, 2.9434051513671875, 3.165762186050415, 3.3881192207336426, 3.61047625541687, 3.8328332901000977, 4.055190086364746, 4.277547359466553, 4.499904155731201, 4.722261428833008, 4.944618225097656, 5.166975021362305, 5.389332294464111, 5.61168909072876, 5.834046363830566, 6.056403160095215, 6.2787604331970215, 6.50111722946167, 6.723474502563477, 6.945831298828125, 7.168188095092773, 7.390544891357422, 7.6129021644592285, 7.835258960723877, 8.057616233825684, 8.279973030090332, 8.50232982635498, 8.724687576293945, 8.947044372558594]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 3.0, 2.0, 9.0, 12.0, 15.0, 9.0, 14.0, 19.0, 23.0, 28.0, 25.0, 34.0, 36.0, 39.0, 46.0, 44.0, 52.0, 50.0, 47.0, 43.0, 49.0, 39.0, 49.0, 45.0, 45.0, 23.0, 45.0, 31.0, 30.0, 19.0, 10.0, 12.0, 9.0, 8.0, 11.0, 14.0, 1.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3758206367492676, -3.2708516120910645, -3.1658825874328613, -3.060913562774658, -2.955944538116455, -2.850975513458252, -2.746006488800049, -2.6410374641418457, -2.5360684394836426, -2.4310994148254395, -2.3261303901672363, -2.221161365509033, -2.11619234085083, -2.011223316192627, -1.9062541723251343, -1.8012851476669312, -1.6963160037994385, -1.5913469791412354, -1.4863779544830322, -1.381408929824829, -1.276439905166626, -1.1714708805084229, -1.0665017366409302, -0.961532711982727, -0.8565636873245239, -0.7515946626663208, -0.6466256380081177, -0.5416565537452698, -0.43668752908706665, -0.3317185044288635, -0.22674942016601562, -0.1217803955078125, -0.016811132431030273, 0.08815790712833405, 0.19312694668769836, 0.2980960011482239, 0.403065025806427, 0.5080340504646301, 0.613003134727478, 0.7179721593856812, 0.8229411840438843, 0.9279102087020874, 1.0328792333602905, 1.1378483772277832, 1.2428174018859863, 1.3477864265441895, 1.4527554512023926, 1.5577244758605957, 1.6626935005187988, 1.767662525177002, 1.872631549835205, 1.9776005744934082, 2.0825695991516113, 2.1875386238098145, 2.2925076484680176, 2.3974766731262207, 2.502445697784424, 2.607414722442627, 2.71238374710083, 2.817352771759033, 2.9223217964172363, 3.0272908210754395, 3.1322598457336426, 3.2372288703918457, 3.342198133468628]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 12.0, 9.0, 20.0, 22.0, 22.0, 56.0, 72.0, 93.0, 128.0, 239.0, 375.0, 756.0, 1555.0, 3305.0, 8761.0, 25282.0, 80687.0, 246199.0, 388522.0, 197561.0, 62475.0, 19499.0, 7064.0, 2893.0, 1352.0, 659.0, 350.0, 207.0, 109.0, 76.0, 53.0, 37.0, 28.0, 20.0, 10.0, 8.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.88671875, -3.74981689453125, -3.6129150390625, -3.47601318359375, -3.339111328125, -3.20220947265625, -3.0653076171875, -2.92840576171875, -2.79150390625, -2.65460205078125, -2.5177001953125, -2.38079833984375, -2.243896484375, -2.10699462890625, -1.9700927734375, -1.83319091796875, -1.6962890625, -1.55938720703125, -1.4224853515625, -1.28558349609375, -1.148681640625, -1.01177978515625, -0.8748779296875, -0.73797607421875, -0.60107421875, -0.46417236328125, -0.3272705078125, -0.19036865234375, -0.053466796875, 0.08343505859375, 0.2203369140625, 0.35723876953125, 0.494140625, 0.63104248046875, 0.7679443359375, 0.90484619140625, 1.041748046875, 1.17864990234375, 1.3155517578125, 1.45245361328125, 1.58935546875, 1.72625732421875, 1.8631591796875, 2.00006103515625, 2.136962890625, 2.27386474609375, 2.4107666015625, 2.54766845703125, 2.6845703125, 2.82147216796875, 2.9583740234375, 3.09527587890625, 3.232177734375, 3.36907958984375, 3.5059814453125, 3.64288330078125, 3.77978515625, 3.91668701171875, 4.0535888671875, 4.19049072265625, 4.327392578125, 4.46429443359375, 4.6011962890625, 4.73809814453125, 4.875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 8.0, 7.0, 17.0, 18.0, 18.0, 22.0, 27.0, 36.0, 25.0, 32.0, 44.0, 36.0, 56.0, 63.0, 50.0, 75.0, 60.0, 60.0, 48.0, 29.0, 43.0, 44.0, 27.0, 35.0, 19.0, 16.0, 5.0, 17.0, 13.0, 8.0, 8.0, 3.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.18359375, -3.097503662109375, -3.01141357421875, -2.925323486328125, -2.8392333984375, -2.753143310546875, -2.66705322265625, -2.580963134765625, -2.494873046875, -2.408782958984375, -2.32269287109375, -2.236602783203125, -2.1505126953125, -2.064422607421875, -1.97833251953125, -1.892242431640625, -1.80615234375, -1.720062255859375, -1.63397216796875, -1.547882080078125, -1.4617919921875, -1.375701904296875, -1.28961181640625, -1.203521728515625, -1.117431640625, -1.031341552734375, -0.94525146484375, -0.859161376953125, -0.7730712890625, -0.686981201171875, -0.60089111328125, -0.514801025390625, -0.4287109375, -0.342620849609375, -0.25653076171875, -0.170440673828125, -0.0843505859375, 0.001739501953125, 0.08782958984375, 0.173919677734375, 0.260009765625, 0.346099853515625, 0.43218994140625, 0.518280029296875, 0.6043701171875, 0.690460205078125, 0.77655029296875, 0.862640380859375, 0.94873046875, 1.034820556640625, 1.12091064453125, 1.207000732421875, 1.2930908203125, 1.379180908203125, 1.46527099609375, 1.551361083984375, 1.637451171875, 1.723541259765625, 1.80963134765625, 1.895721435546875, 1.9818115234375, 2.067901611328125, 2.15399169921875, 2.240081787109375, 2.326171875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 7.0, 5.0, 5.0, 6.0, 10.0, 18.0, 29.0, 21.0, 53.0, 119.0, 227.0, 477.0, 1704.0, 8273.0, 215890.0, 797206.0, 20333.0, 2735.0, 798.0, 329.0, 138.0, 70.0, 45.0, 21.0, 8.0, 9.0, 7.0, 6.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-19.1875, -18.6978759765625, -18.208251953125, -17.7186279296875, -17.22900390625, -16.7393798828125, -16.249755859375, -15.7601318359375, -15.2705078125, -14.7808837890625, -14.291259765625, -13.8016357421875, -13.31201171875, -12.8223876953125, -12.332763671875, -11.8431396484375, -11.353515625, -10.8638916015625, -10.374267578125, -9.8846435546875, -9.39501953125, -8.9053955078125, -8.415771484375, -7.9261474609375, -7.4365234375, -6.9468994140625, -6.457275390625, -5.9676513671875, -5.47802734375, -4.9884033203125, -4.498779296875, -4.0091552734375, -3.51953125, -3.0299072265625, -2.540283203125, -2.0506591796875, -1.56103515625, -1.0714111328125, -0.581787109375, -0.0921630859375, 0.3974609375, 0.8870849609375, 1.376708984375, 1.8663330078125, 2.35595703125, 2.8455810546875, 3.335205078125, 3.8248291015625, 4.314453125, 4.8040771484375, 5.293701171875, 5.7833251953125, 6.27294921875, 6.7625732421875, 7.252197265625, 7.7418212890625, 8.2314453125, 8.7210693359375, 9.210693359375, 9.7003173828125, 10.18994140625, 10.6795654296875, 11.169189453125, 11.6588134765625, 12.1484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 2.0, 5.0, 10.0, 12.0, 15.0, 22.0, 25.0, 42.0, 52.0, 47.0, 52.0, 86.0, 80.0, 72.0, 85.0, 94.0, 76.0, 58.0, 48.0, 39.0, 22.0, 11.0, 14.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.0625, -20.400390625, -19.73828125, -19.076171875, -18.4140625, -17.751953125, -17.08984375, -16.427734375, -15.765625, -15.103515625, -14.44140625, -13.779296875, -13.1171875, -12.455078125, -11.79296875, -11.130859375, -10.46875, -9.806640625, -9.14453125, -8.482421875, -7.8203125, -7.158203125, -6.49609375, -5.833984375, -5.171875, -4.509765625, -3.84765625, -3.185546875, -2.5234375, -1.861328125, -1.19921875, -0.537109375, 0.125, 0.787109375, 1.44921875, 2.111328125, 2.7734375, 3.435546875, 4.09765625, 4.759765625, 5.421875, 6.083984375, 6.74609375, 7.408203125, 8.0703125, 8.732421875, 9.39453125, 10.056640625, 10.71875, 11.380859375, 12.04296875, 12.705078125, 13.3671875, 14.029296875, 14.69140625, 15.353515625, 16.015625, 16.677734375, 17.33984375, 18.001953125, 18.6640625, 19.326171875, 19.98828125, 20.650390625, 21.3125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 6.0, 1.0, 8.0, 20.0, 19.0, 34.0, 62.0, 104.0, 148.0, 330.0, 809.0, 4513.0, 170808.0, 853937.0, 15317.0, 1473.0, 473.0, 224.0, 101.0, 64.0, 34.0, 18.0, 15.0, 19.0, 7.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9296875, -4.707763671875, -4.48583984375, -4.263916015625, -4.0419921875, -3.820068359375, -3.59814453125, -3.376220703125, -3.154296875, -2.932373046875, -2.71044921875, -2.488525390625, -2.2666015625, -2.044677734375, -1.82275390625, -1.600830078125, -1.37890625, -1.156982421875, -0.93505859375, -0.713134765625, -0.4912109375, -0.269287109375, -0.04736328125, 0.174560546875, 0.396484375, 0.618408203125, 0.84033203125, 1.062255859375, 1.2841796875, 1.506103515625, 1.72802734375, 1.949951171875, 2.171875, 2.393798828125, 2.61572265625, 2.837646484375, 3.0595703125, 3.281494140625, 3.50341796875, 3.725341796875, 3.947265625, 4.169189453125, 4.39111328125, 4.613037109375, 4.8349609375, 5.056884765625, 5.27880859375, 5.500732421875, 5.72265625, 5.944580078125, 6.16650390625, 6.388427734375, 6.6103515625, 6.832275390625, 7.05419921875, 7.276123046875, 7.498046875, 7.719970703125, 7.94189453125, 8.163818359375, 8.3857421875, 8.607666015625, 8.82958984375, 9.051513671875, 9.2734375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 11.0, 9.0, 10.0, 35.0, 27.0, 35.0, 67.0, 91.0, 128.0, 152.0, 119.0, 97.0, 64.0, 45.0, 34.0, 28.0, 15.0, 10.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004718303680419922, -0.0004573352634906769, -0.00044284015893936157, -0.00042834505438804626, -0.00041384994983673096, -0.00039935484528541565, -0.00038485974073410034, -0.00037036463618278503, -0.0003558695316314697, -0.0003413744270801544, -0.0003268793225288391, -0.0003123842179775238, -0.0002978891134262085, -0.0002833940088748932, -0.0002688989043235779, -0.0002544037997722626, -0.00023990869522094727, -0.00022541359066963196, -0.00021091848611831665, -0.00019642338156700134, -0.00018192827701568604, -0.00016743317246437073, -0.00015293806791305542, -0.0001384429633617401, -0.0001239478588104248, -0.0001094527542591095, -9.495764970779419e-05, -8.046254515647888e-05, -6.596744060516357e-05, -5.1472336053848267e-05, -3.697723150253296e-05, -2.248212695121765e-05, -7.987022399902344e-06, 6.508082151412964e-06, 2.100318670272827e-05, 3.549829125404358e-05, 4.999339580535889e-05, 6.44885003566742e-05, 7.89836049079895e-05, 9.347870945930481e-05, 0.00010797381401062012, 0.00012246891856193542, 0.00013696402311325073, 0.00015145912766456604, 0.00016595423221588135, 0.00018044933676719666, 0.00019494444131851196, 0.00020943954586982727, 0.00022393465042114258, 0.00023842975497245789, 0.0002529248595237732, 0.0002674199640750885, 0.0002819150686264038, 0.0002964101731777191, 0.0003109052777290344, 0.00032540038228034973, 0.00033989548683166504, 0.00035439059138298035, 0.00036888569593429565, 0.00038338080048561096, 0.00039787590503692627, 0.0004123710095882416, 0.0004268661141395569, 0.0004413612186908722, 0.0004558563232421875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 13.0, 12.0, 31.0, 46.0, 89.0, 213.0, 601.0, 1968.0, 19471.0, 908611.0, 111722.0, 4233.0, 946.0, 318.0, 138.0, 57.0, 36.0, 22.0, 11.0, 7.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.0546875, -9.81927490234375, -9.5838623046875, -9.34844970703125, -9.113037109375, -8.87762451171875, -8.6422119140625, -8.40679931640625, -8.17138671875, -7.93597412109375, -7.7005615234375, -7.46514892578125, -7.229736328125, -6.99432373046875, -6.7589111328125, -6.52349853515625, -6.2880859375, -6.05267333984375, -5.8172607421875, -5.58184814453125, -5.346435546875, -5.11102294921875, -4.8756103515625, -4.64019775390625, -4.40478515625, -4.16937255859375, -3.9339599609375, -3.69854736328125, -3.463134765625, -3.22772216796875, -2.9923095703125, -2.75689697265625, -2.521484375, -2.28607177734375, -2.0506591796875, -1.81524658203125, -1.579833984375, -1.34442138671875, -1.1090087890625, -0.87359619140625, -0.63818359375, -0.40277099609375, -0.1673583984375, 0.06805419921875, 0.303466796875, 0.53887939453125, 0.7742919921875, 1.00970458984375, 1.2451171875, 1.48052978515625, 1.7159423828125, 1.95135498046875, 2.186767578125, 2.42218017578125, 2.6575927734375, 2.89300537109375, 3.12841796875, 3.36383056640625, 3.5992431640625, 3.83465576171875, 4.070068359375, 4.30548095703125, 4.5408935546875, 4.77630615234375, 5.01171875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 9.0, 15.0, 16.0, 35.0, 51.0, 135.0, 161.0, 186.0, 165.0, 107.0, 53.0, 22.0, 18.0, 12.0, 4.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.84375, -10.60504150390625, -10.3663330078125, -10.12762451171875, -9.888916015625, -9.65020751953125, -9.4114990234375, -9.17279052734375, -8.93408203125, -8.69537353515625, -8.4566650390625, -8.21795654296875, -7.979248046875, -7.74053955078125, -7.5018310546875, -7.26312255859375, -7.0244140625, -6.78570556640625, -6.5469970703125, -6.30828857421875, -6.069580078125, -5.83087158203125, -5.5921630859375, -5.35345458984375, -5.11474609375, -4.87603759765625, -4.6373291015625, -4.39862060546875, -4.159912109375, -3.92120361328125, -3.6824951171875, -3.44378662109375, -3.205078125, -2.96636962890625, -2.7276611328125, -2.48895263671875, -2.250244140625, -2.01153564453125, -1.7728271484375, -1.53411865234375, -1.29541015625, -1.05670166015625, -0.8179931640625, -0.57928466796875, -0.340576171875, -0.10186767578125, 0.1368408203125, 0.37554931640625, 0.6142578125, 0.85296630859375, 1.0916748046875, 1.33038330078125, 1.569091796875, 1.80780029296875, 2.0465087890625, 2.28521728515625, 2.52392578125, 2.76263427734375, 3.0013427734375, 3.24005126953125, 3.478759765625, 3.71746826171875, 3.9561767578125, 4.19488525390625, 4.43359375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 11.0, 8.0, 18.0, 44.0, 121.0, 240.0, 296.0, 180.0, 60.0, 18.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.734859466552734, -38.39486312866211, -35.054866790771484, -31.71487045288086, -28.374874114990234, -25.034879684448242, -21.694883346557617, -18.354887008666992, -15.014890670776367, -11.674894332885742, -8.334897994995117, -4.994902610778809, -1.6549062728881836, 1.685089111328125, 5.02508544921875, 8.365081787109375, 11.705078125, 15.045074462890625, 18.38507080078125, 21.725067138671875, 25.0650634765625, 28.405057907104492, 31.745054244995117, 35.085052490234375, 38.425048828125, 41.765045166015625, 45.10504150390625, 48.445037841796875, 51.7850341796875, 55.125030517578125, 58.46502685546875, 61.805023193359375, 65.14501190185547, 68.4850082397461, 71.82500457763672, 75.16500091552734, 78.50499725341797, 81.8449935913086, 85.18498992919922, 88.52498626708984, 91.86498260498047, 95.2049789428711, 98.54497528076172, 101.88497161865234, 105.22496795654297, 108.5649642944336, 111.90496063232422, 115.24495697021484, 118.58494567871094, 121.92494201660156, 125.26493835449219, 128.6049346923828, 131.94493103027344, 135.28492736816406, 138.6249237060547, 141.9649200439453, 145.30491638183594, 148.64491271972656, 151.9849090576172, 155.3249053955078, 158.66490173339844, 162.00489807128906, 165.3448944091797, 168.6848907470703, 172.02488708496094]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 6.0, 12.0, 14.0, 11.0, 12.0, 7.0, 20.0, 18.0, 15.0, 22.0, 24.0, 42.0, 31.0, 32.0, 40.0, 43.0, 39.0, 48.0, 40.0, 44.0, 41.0, 42.0, 40.0, 36.0, 26.0, 28.0, 28.0, 25.0, 24.0, 24.0, 26.0, 24.0, 16.0, 13.0, 12.0, 14.0, 7.0, 10.0, 9.0, 6.0, 4.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-47.39202117919922, -45.92927551269531, -44.466529846191406, -43.0037841796875, -41.541038513183594, -40.07828903198242, -38.615543365478516, -37.15279769897461, -35.6900520324707, -34.2273063659668, -32.76456069946289, -31.30181312561035, -29.839067459106445, -28.37632179260254, -26.91357421875, -25.450828552246094, -23.988082885742188, -22.52533721923828, -21.062591552734375, -19.599843978881836, -18.13709831237793, -16.674352645874023, -15.2116060256958, -13.748859405517578, -12.286113739013672, -10.823368072509766, -9.360621452331543, -7.8978753089904785, -6.435129165649414, -4.97238302230835, -3.509636878967285, -2.0468902587890625, -0.5841407775878906, 0.8786053657531738, 2.3413515090942383, 3.8040976524353027, 5.266843795776367, 6.729589939117432, 8.192336082458496, 9.655082702636719, 11.117828369140625, 12.580574035644531, 14.043320655822754, 15.506067276000977, 16.968812942504883, 18.43155860900879, 19.894306182861328, 21.357051849365234, 22.81979751586914, 24.282543182373047, 25.745288848876953, 27.208036422729492, 28.6707820892334, 30.133527755737305, 31.596275329589844, 33.05902099609375, 34.521766662597656, 35.98451232910156, 37.44725799560547, 38.910003662109375, 40.37274932861328, 41.83549880981445, 43.29824447631836, 44.760990142822266, 46.22373580932617]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 3.0, 10.0, 6.0, 21.0, 12.0, 24.0, 39.0, 59.0, 64.0, 122.0, 196.0, 298.0, 499.0, 970.0, 1906.0, 4380.0, 11253.0, 40178.0, 3825322.0, 261116.0, 30872.0, 9378.0, 3791.0, 1696.0, 822.0, 459.0, 252.0, 173.0, 118.0, 77.0, 38.0, 35.0, 23.0, 18.0, 14.0, 8.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.0703125, -5.89642333984375, -5.7225341796875, -5.54864501953125, -5.374755859375, -5.20086669921875, -5.0269775390625, -4.85308837890625, -4.67919921875, -4.50531005859375, -4.3314208984375, -4.15753173828125, -3.983642578125, -3.80975341796875, -3.6358642578125, -3.46197509765625, -3.2880859375, -3.11419677734375, -2.9403076171875, -2.76641845703125, -2.592529296875, -2.41864013671875, -2.2447509765625, -2.07086181640625, -1.89697265625, -1.72308349609375, -1.5491943359375, -1.37530517578125, -1.201416015625, -1.02752685546875, -0.8536376953125, -0.67974853515625, -0.505859375, -0.33197021484375, -0.1580810546875, 0.01580810546875, 0.189697265625, 0.36358642578125, 0.5374755859375, 0.71136474609375, 0.88525390625, 1.05914306640625, 1.2330322265625, 1.40692138671875, 1.580810546875, 1.75469970703125, 1.9285888671875, 2.10247802734375, 2.2763671875, 2.45025634765625, 2.6241455078125, 2.79803466796875, 2.971923828125, 3.14581298828125, 3.3197021484375, 3.49359130859375, 3.66748046875, 3.84136962890625, 4.0152587890625, 4.18914794921875, 4.363037109375, 4.53692626953125, 4.7108154296875, 4.88470458984375, 5.05859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 5.0, 14.0, 17.0, 12.0, 26.0, 22.0, 32.0, 42.0, 26.0, 50.0, 56.0, 86.0, 75.0, 66.0, 59.0, 54.0, 61.0, 53.0, 47.0, 43.0, 32.0, 30.0, 17.0, 14.0, 7.0, 11.0, 12.0, 3.0, 7.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-4.171875, -4.068817138671875, -3.96575927734375, -3.862701416015625, -3.7596435546875, -3.656585693359375, -3.55352783203125, -3.450469970703125, -3.347412109375, -3.244354248046875, -3.14129638671875, -3.038238525390625, -2.9351806640625, -2.832122802734375, -2.72906494140625, -2.626007080078125, -2.52294921875, -2.419891357421875, -2.31683349609375, -2.213775634765625, -2.1107177734375, -2.007659912109375, -1.90460205078125, -1.801544189453125, -1.698486328125, -1.595428466796875, -1.49237060546875, -1.389312744140625, -1.2862548828125, -1.183197021484375, -1.08013916015625, -0.977081298828125, -0.8740234375, -0.770965576171875, -0.66790771484375, -0.564849853515625, -0.4617919921875, -0.358734130859375, -0.25567626953125, -0.152618408203125, -0.049560546875, 0.053497314453125, 0.15655517578125, 0.259613037109375, 0.3626708984375, 0.465728759765625, 0.56878662109375, 0.671844482421875, 0.77490234375, 0.877960205078125, 0.98101806640625, 1.084075927734375, 1.1871337890625, 1.290191650390625, 1.39324951171875, 1.496307373046875, 1.599365234375, 1.702423095703125, 1.80548095703125, 1.908538818359375, 2.0115966796875, 2.114654541015625, 2.21771240234375, 2.320770263671875, 2.423828125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 8.0, 14.0, 16.0, 34.0, 30.0, 42.0, 61.0, 104.0, 119.0, 179.0, 272.0, 452.0, 832.0, 1581.0, 3247.0, 7866.0, 22059.0, 91637.0, 3853636.0, 161710.0, 31442.0, 10350.0, 4079.0, 1937.0, 973.0, 585.0, 336.0, 221.0, 132.0, 80.0, 62.0, 63.0, 34.0, 25.0, 17.0, 13.0, 7.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-3.09375, -2.9959716796875, -2.898193359375, -2.8004150390625, -2.70263671875, -2.6048583984375, -2.507080078125, -2.4093017578125, -2.3115234375, -2.2137451171875, -2.115966796875, -2.0181884765625, -1.92041015625, -1.8226318359375, -1.724853515625, -1.6270751953125, -1.529296875, -1.4315185546875, -1.333740234375, -1.2359619140625, -1.13818359375, -1.0404052734375, -0.942626953125, -0.8448486328125, -0.7470703125, -0.6492919921875, -0.551513671875, -0.4537353515625, -0.35595703125, -0.2581787109375, -0.160400390625, -0.0626220703125, 0.03515625, 0.1329345703125, 0.230712890625, 0.3284912109375, 0.42626953125, 0.5240478515625, 0.621826171875, 0.7196044921875, 0.8173828125, 0.9151611328125, 1.012939453125, 1.1107177734375, 1.20849609375, 1.3062744140625, 1.404052734375, 1.5018310546875, 1.599609375, 1.6973876953125, 1.795166015625, 1.8929443359375, 1.99072265625, 2.0885009765625, 2.186279296875, 2.2840576171875, 2.3818359375, 2.4796142578125, 2.577392578125, 2.6751708984375, 2.77294921875, 2.8707275390625, 2.968505859375, 3.0662841796875, 3.1640625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 7.0, 22.0, 23.0, 59.0, 91.0, 413.0, 3195.0, 121.0, 66.0, 23.0, 17.0, 12.0, 4.0, 9.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7734375, -0.7349090576171875, -0.696380615234375, -0.6578521728515625, -0.61932373046875, -0.5807952880859375, -0.542266845703125, -0.5037384033203125, -0.4652099609375, -0.4266815185546875, -0.388153076171875, -0.3496246337890625, -0.31109619140625, -0.2725677490234375, -0.234039306640625, -0.1955108642578125, -0.156982421875, -0.1184539794921875, -0.079925537109375, -0.0413970947265625, -0.00286865234375, 0.0356597900390625, 0.074188232421875, 0.1127166748046875, 0.1512451171875, 0.1897735595703125, 0.228302001953125, 0.2668304443359375, 0.30535888671875, 0.3438873291015625, 0.382415771484375, 0.4209442138671875, 0.45947265625, 0.4980010986328125, 0.536529541015625, 0.5750579833984375, 0.61358642578125, 0.6521148681640625, 0.690643310546875, 0.7291717529296875, 0.7677001953125, 0.8062286376953125, 0.844757080078125, 0.8832855224609375, 0.92181396484375, 0.9603424072265625, 0.998870849609375, 1.0373992919921875, 1.075927734375, 1.1144561767578125, 1.152984619140625, 1.1915130615234375, 1.23004150390625, 1.2685699462890625, 1.307098388671875, 1.3456268310546875, 1.3841552734375, 1.4226837158203125, 1.461212158203125, 1.4997406005859375, 1.53826904296875, 1.5767974853515625, 1.615325927734375, 1.6538543701171875, 1.6923828125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 13.0, 17.0, 34.0, 69.0, 128.0, 169.0, 184.0, 155.0, 115.0, 57.0, 33.0, 14.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3867790699005127, -3.2246382236480713, -3.062497615814209, -2.9003567695617676, -2.738215923309326, -2.5760750770568848, -2.4139344692230225, -2.251793622970581, -2.0896530151367188, -1.927512288093567, -1.7653714418411255, -1.6032307147979736, -1.4410898685455322, -1.2789491415023804, -1.1168084144592285, -0.9546675682067871, -0.7925267219543457, -0.6303859353065491, -0.46824517846107483, -0.3061044216156006, -0.14396363496780396, 0.018177151679992676, 0.18031787872314453, 0.34245872497558594, 0.5045994520187378, 0.6667402386665344, 0.828881025314331, 0.9910217523574829, 1.1531624794006348, 1.3153033256530762, 1.477444052696228, 1.6395848989486694, 1.8017258644104004, 1.9638665914535522, 2.126007318496704, 2.2881481647491455, 2.450289011001587, 2.612429618835449, 2.7745704650878906, 2.936711311340332, 3.0988521575927734, 3.260993003845215, 3.423133611679077, 3.5852744579315186, 3.74741530418396, 3.9095559120178223, 4.071696758270264, 4.233837604522705, 4.395977973937988, 4.55811882019043, 4.720259666442871, 4.8824005126953125, 5.044540882110596, 5.206681728363037, 5.3688225746154785, 5.53096342086792, 5.693104267120361, 5.855245113372803, 6.017385959625244, 6.179526329040527, 6.341667175292969, 6.50380802154541, 6.665948867797852, 6.828089714050293, 6.990230560302734]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 17.0, 16.0, 28.0, 24.0, 39.0, 36.0, 63.0, 58.0, 66.0, 65.0, 69.0, 62.0, 69.0, 69.0, 62.0, 56.0, 42.0, 25.0, 31.0, 26.0, 23.0, 20.0, 9.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0220165252685547, -1.931532859802246, -1.841049313545227, -1.7505656480789185, -1.6600821018218994, -1.5695984363555908, -1.4791147708892822, -1.3886312246322632, -1.2981476783752441, -1.2076640129089355, -1.1171804666519165, -1.026696801185608, -0.9362132549285889, -0.8457295894622803, -0.7552459836006165, -0.6647623777389526, -0.574278712272644, -0.4837951064109802, -0.3933115005493164, -0.3028278648853302, -0.21234425902366638, -0.12186065316200256, -0.03137701749801636, 0.05910658836364746, 0.14959019422531128, 0.2400738000869751, 0.3305574059486389, 0.4210410416126251, 0.5115246772766113, 0.6020082235336304, 0.692491888999939, 0.7829754948616028, 0.8734591007232666, 0.9639427065849304, 1.0544263124465942, 1.1449099779129028, 1.2353935241699219, 1.3258771896362305, 1.416360855102539, 1.506844401359558, 1.5973279476165771, 1.6878116130828857, 1.7782951593399048, 1.8687788248062134, 1.9592623710632324, 2.049746036529541, 2.1402297019958496, 2.230713367462158, 2.321197032928467, 2.4116806983947754, 2.502164363861084, 2.5926477909088135, 2.683131456375122, 2.7736151218414307, 2.8640987873077393, 2.9545822143554688, 3.0450658798217773, 3.135549545288086, 3.2260332107543945, 3.316516637802124, 3.4070003032684326, 3.497483968734741, 3.58796763420105, 3.6784510612487793, 3.768934726715088]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 10.0, 20.0, 15.0, 24.0, 42.0, 59.0, 95.0, 134.0, 258.0, 467.0, 934.0, 1827.0, 3955.0, 9907.0, 27595.0, 83629.0, 243675.0, 385130.0, 192019.0, 62917.0, 21357.0, 7855.0, 3234.0, 1490.0, 758.0, 452.0, 247.0, 148.0, 101.0, 63.0, 48.0, 32.0, 18.0, 11.0, 7.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1484375, -3.019287109375, -2.89013671875, -2.760986328125, -2.6318359375, -2.502685546875, -2.37353515625, -2.244384765625, -2.115234375, -1.986083984375, -1.85693359375, -1.727783203125, -1.5986328125, -1.469482421875, -1.34033203125, -1.211181640625, -1.08203125, -0.952880859375, -0.82373046875, -0.694580078125, -0.5654296875, -0.436279296875, -0.30712890625, -0.177978515625, -0.048828125, 0.080322265625, 0.20947265625, 0.338623046875, 0.4677734375, 0.596923828125, 0.72607421875, 0.855224609375, 0.984375, 1.113525390625, 1.24267578125, 1.371826171875, 1.5009765625, 1.630126953125, 1.75927734375, 1.888427734375, 2.017578125, 2.146728515625, 2.27587890625, 2.405029296875, 2.5341796875, 2.663330078125, 2.79248046875, 2.921630859375, 3.05078125, 3.179931640625, 3.30908203125, 3.438232421875, 3.5673828125, 3.696533203125, 3.82568359375, 3.954833984375, 4.083984375, 4.213134765625, 4.34228515625, 4.471435546875, 4.6005859375, 4.729736328125, 4.85888671875, 4.988037109375, 5.1171875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 9.0, 11.0, 10.0, 18.0, 19.0, 23.0, 24.0, 45.0, 32.0, 39.0, 56.0, 64.0, 79.0, 73.0, 59.0, 60.0, 55.0, 67.0, 44.0, 24.0, 45.0, 33.0, 28.0, 13.0, 19.0, 2.0, 14.0, 5.0, 6.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-4.16015625, -4.058380126953125, -3.95660400390625, -3.854827880859375, -3.7530517578125, -3.651275634765625, -3.54949951171875, -3.447723388671875, -3.345947265625, -3.244171142578125, -3.14239501953125, -3.040618896484375, -2.9388427734375, -2.837066650390625, -2.73529052734375, -2.633514404296875, -2.53173828125, -2.429962158203125, -2.32818603515625, -2.226409912109375, -2.1246337890625, -2.022857666015625, -1.92108154296875, -1.819305419921875, -1.717529296875, -1.615753173828125, -1.51397705078125, -1.412200927734375, -1.3104248046875, -1.208648681640625, -1.10687255859375, -1.005096435546875, -0.9033203125, -0.801544189453125, -0.69976806640625, -0.597991943359375, -0.4962158203125, -0.394439697265625, -0.29266357421875, -0.190887451171875, -0.089111328125, 0.012664794921875, 0.11444091796875, 0.216217041015625, 0.3179931640625, 0.419769287109375, 0.52154541015625, 0.623321533203125, 0.72509765625, 0.826873779296875, 0.92864990234375, 1.030426025390625, 1.1322021484375, 1.233978271484375, 1.33575439453125, 1.437530517578125, 1.539306640625, 1.641082763671875, 1.74285888671875, 1.844635009765625, 1.9464111328125, 2.048187255859375, 2.14996337890625, 2.251739501953125, 2.353515625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 9.0, 7.0, 16.0, 22.0, 26.0, 36.0, 58.0, 106.0, 268.0, 665.0, 2266.0, 13161.0, 613530.0, 404113.0, 11141.0, 1975.0, 578.0, 261.0, 133.0, 71.0, 33.0, 24.0, 18.0, 12.0, 8.0, 4.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.796875, -22.1962890625, -21.595703125, -20.9951171875, -20.39453125, -19.7939453125, -19.193359375, -18.5927734375, -17.9921875, -17.3916015625, -16.791015625, -16.1904296875, -15.58984375, -14.9892578125, -14.388671875, -13.7880859375, -13.1875, -12.5869140625, -11.986328125, -11.3857421875, -10.78515625, -10.1845703125, -9.583984375, -8.9833984375, -8.3828125, -7.7822265625, -7.181640625, -6.5810546875, -5.98046875, -5.3798828125, -4.779296875, -4.1787109375, -3.578125, -2.9775390625, -2.376953125, -1.7763671875, -1.17578125, -0.5751953125, 0.025390625, 0.6259765625, 1.2265625, 1.8271484375, 2.427734375, 3.0283203125, 3.62890625, 4.2294921875, 4.830078125, 5.4306640625, 6.03125, 6.6318359375, 7.232421875, 7.8330078125, 8.43359375, 9.0341796875, 9.634765625, 10.2353515625, 10.8359375, 11.4365234375, 12.037109375, 12.6376953125, 13.23828125, 13.8388671875, 14.439453125, 15.0400390625, 15.640625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 9.0, 17.0, 15.0, 15.0, 15.0, 18.0, 42.0, 46.0, 69.0, 70.0, 81.0, 92.0, 90.0, 82.0, 69.0, 72.0, 64.0, 36.0, 26.0, 12.0, 13.0, 9.0, 6.0, 8.0, 4.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-31.8125, -30.97412109375, -30.1357421875, -29.29736328125, -28.458984375, -27.62060546875, -26.7822265625, -25.94384765625, -25.10546875, -24.26708984375, -23.4287109375, -22.59033203125, -21.751953125, -20.91357421875, -20.0751953125, -19.23681640625, -18.3984375, -17.56005859375, -16.7216796875, -15.88330078125, -15.044921875, -14.20654296875, -13.3681640625, -12.52978515625, -11.69140625, -10.85302734375, -10.0146484375, -9.17626953125, -8.337890625, -7.49951171875, -6.6611328125, -5.82275390625, -4.984375, -4.14599609375, -3.3076171875, -2.46923828125, -1.630859375, -0.79248046875, 0.0458984375, 0.88427734375, 1.72265625, 2.56103515625, 3.3994140625, 4.23779296875, 5.076171875, 5.91455078125, 6.7529296875, 7.59130859375, 8.4296875, 9.26806640625, 10.1064453125, 10.94482421875, 11.783203125, 12.62158203125, 13.4599609375, 14.29833984375, 15.13671875, 15.97509765625, 16.8134765625, 17.65185546875, 18.490234375, 19.32861328125, 20.1669921875, 21.00537109375, 21.84375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 12.0, 13.0, 19.0, 26.0, 44.0, 52.0, 101.0, 148.0, 287.0, 644.0, 2628.0, 87680.0, 946968.0, 7860.0, 1137.0, 423.0, 164.0, 102.0, 77.0, 37.0, 28.0, 27.0, 29.0, 13.0, 10.0, 10.0, 8.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.265625, -12.93585205078125, -12.6060791015625, -12.27630615234375, -11.946533203125, -11.61676025390625, -11.2869873046875, -10.95721435546875, -10.62744140625, -10.29766845703125, -9.9678955078125, -9.63812255859375, -9.308349609375, -8.97857666015625, -8.6488037109375, -8.31903076171875, -7.9892578125, -7.65948486328125, -7.3297119140625, -6.99993896484375, -6.670166015625, -6.34039306640625, -6.0106201171875, -5.68084716796875, -5.35107421875, -5.02130126953125, -4.6915283203125, -4.36175537109375, -4.031982421875, -3.70220947265625, -3.3724365234375, -3.04266357421875, -2.712890625, -2.38311767578125, -2.0533447265625, -1.72357177734375, -1.393798828125, -1.06402587890625, -0.7342529296875, -0.40447998046875, -0.07470703125, 0.25506591796875, 0.5848388671875, 0.91461181640625, 1.244384765625, 1.57415771484375, 1.9039306640625, 2.23370361328125, 2.5634765625, 2.89324951171875, 3.2230224609375, 3.55279541015625, 3.882568359375, 4.21234130859375, 4.5421142578125, 4.87188720703125, 5.20166015625, 5.53143310546875, 5.8612060546875, 6.19097900390625, 6.520751953125, 6.85052490234375, 7.1802978515625, 7.51007080078125, 7.83984375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 1.0, 3.0, 3.0, 5.0, 8.0, 9.0, 17.0, 15.0, 11.0, 26.0, 22.0, 37.0, 51.0, 49.0, 92.0, 85.0, 98.0, 111.0, 68.0, 62.0, 54.0, 30.0, 35.0, 27.0, 26.0, 17.0, 11.0, 12.0, 7.0, 9.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018596649169921875, -0.00017645210027694702, -0.0001669377088546753, -0.00015742331743240356, -0.00014790892601013184, -0.0001383945345878601, -0.00012888014316558838, -0.00011936575174331665, -0.00010985136032104492, -0.0001003369688987732, -9.082257747650146e-05, -8.130818605422974e-05, -7.179379463195801e-05, -6.227940320968628e-05, -5.276501178741455e-05, -4.325062036514282e-05, -3.3736228942871094e-05, -2.4221837520599365e-05, -1.4707446098327637e-05, -5.193054676055908e-06, 4.32133674621582e-06, 1.3835728168487549e-05, 2.3350119590759277e-05, 3.2864511013031006e-05, 4.2378902435302734e-05, 5.189329385757446e-05, 6.140768527984619e-05, 7.092207670211792e-05, 8.043646812438965e-05, 8.995085954666138e-05, 9.94652509689331e-05, 0.00010897964239120483, 0.00011849403381347656, 0.0001280084252357483, 0.00013752281665802002, 0.00014703720808029175, 0.00015655159950256348, 0.0001660659909248352, 0.00017558038234710693, 0.00018509477376937866, 0.0001946091651916504, 0.00020412355661392212, 0.00021363794803619385, 0.00022315233945846558, 0.0002326667308807373, 0.00024218112230300903, 0.00025169551372528076, 0.0002612099051475525, 0.0002707242965698242, 0.00028023868799209595, 0.0002897530794143677, 0.0002992674708366394, 0.00030878186225891113, 0.00031829625368118286, 0.0003278106451034546, 0.0003373250365257263, 0.00034683942794799805, 0.0003563538193702698, 0.0003658682107925415, 0.00037538260221481323, 0.00038489699363708496, 0.0003944113850593567, 0.0004039257764816284, 0.00041344016790390015, 0.0004229545593261719]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 1.0, 4.0, 6.0, 10.0, 11.0, 24.0, 31.0, 41.0, 65.0, 156.0, 268.0, 578.0, 1686.0, 8685.0, 313147.0, 708378.0, 12197.0, 2030.0, 622.0, 269.0, 140.0, 73.0, 38.0, 38.0, 23.0, 10.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.21875, -7.97027587890625, -7.7218017578125, -7.47332763671875, -7.224853515625, -6.97637939453125, -6.7279052734375, -6.47943115234375, -6.23095703125, -5.98248291015625, -5.7340087890625, -5.48553466796875, -5.237060546875, -4.98858642578125, -4.7401123046875, -4.49163818359375, -4.2431640625, -3.99468994140625, -3.7462158203125, -3.49774169921875, -3.249267578125, -3.00079345703125, -2.7523193359375, -2.50384521484375, -2.25537109375, -2.00689697265625, -1.7584228515625, -1.50994873046875, -1.261474609375, -1.01300048828125, -0.7645263671875, -0.51605224609375, -0.267578125, -0.01910400390625, 0.2293701171875, 0.47784423828125, 0.726318359375, 0.97479248046875, 1.2232666015625, 1.47174072265625, 1.72021484375, 1.96868896484375, 2.2171630859375, 2.46563720703125, 2.714111328125, 2.96258544921875, 3.2110595703125, 3.45953369140625, 3.7080078125, 3.95648193359375, 4.2049560546875, 4.45343017578125, 4.701904296875, 4.95037841796875, 5.1988525390625, 5.44732666015625, 5.69580078125, 5.94427490234375, 6.1927490234375, 6.44122314453125, 6.689697265625, 6.93817138671875, 7.1866455078125, 7.43511962890625, 7.68359375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 8.0, 4.0, 16.0, 28.0, 66.0, 206.0, 376.0, 172.0, 49.0, 21.0, 15.0, 7.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-21.03125, -20.578125, -20.125, -19.671875, -19.21875, -18.765625, -18.3125, -17.859375, -17.40625, -16.953125, -16.5, -16.046875, -15.59375, -15.140625, -14.6875, -14.234375, -13.78125, -13.328125, -12.875, -12.421875, -11.96875, -11.515625, -11.0625, -10.609375, -10.15625, -9.703125, -9.25, -8.796875, -8.34375, -7.890625, -7.4375, -6.984375, -6.53125, -6.078125, -5.625, -5.171875, -4.71875, -4.265625, -3.8125, -3.359375, -2.90625, -2.453125, -2.0, -1.546875, -1.09375, -0.640625, -0.1875, 0.265625, 0.71875, 1.171875, 1.625, 2.078125, 2.53125, 2.984375, 3.4375, 3.890625, 4.34375, 4.796875, 5.25, 5.703125, 6.15625, 6.609375, 7.0625, 7.515625, 7.96875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 9.0, 20.0, 101.0, 369.0, 364.0, 106.0, 24.0, 5.0, 6.0, 2.0, 1.0, 2.0], "bins": [-289.10589599609375, -283.93951416015625, -278.7731018066406, -273.6067199707031, -268.4403076171875, -263.27392578125, -258.1075134277344, -252.94113159179688, -247.77471923828125, -242.6083221435547, -237.44192504882812, -232.27552795410156, -227.109130859375, -221.94273376464844, -216.77633666992188, -211.60995483398438, -206.4435577392578, -201.27716064453125, -196.1107635498047, -190.94436645507812, -185.77796936035156, -180.611572265625, -175.44517517089844, -170.27877807617188, -165.11239624023438, -159.9459991455078, -154.77960205078125, -149.6132049560547, -144.44680786132812, -139.28041076660156, -134.114013671875, -128.9476318359375, -123.78121948242188, -118.61482238769531, -113.44842529296875, -108.28202819824219, -103.11563110351562, -97.94923400878906, -92.78284454345703, -87.61644744873047, -82.45004272460938, -77.28364562988281, -72.11724853515625, -66.95085144042969, -61.78445816040039, -56.61806106567383, -51.45166778564453, -46.28527069091797, -41.11887741088867, -35.95248031616211, -30.78608512878418, -25.61968994140625, -20.453292846679688, -15.286895751953125, -10.120500564575195, -4.954105377197266, 0.21229171752929688, 5.378687858581543, 10.545083999633789, 15.711480140686035, 20.87787628173828, 26.044273376464844, 31.210668563842773, 36.3770637512207, 41.543460845947266]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 11.0, 11.0, 14.0, 13.0, 15.0, 18.0, 24.0, 31.0, 25.0, 51.0, 36.0, 41.0, 58.0, 44.0, 46.0, 61.0, 56.0, 60.0, 39.0, 43.0, 49.0, 36.0, 39.0, 32.0, 27.0, 27.0, 20.0, 14.0, 10.0, 11.0, 9.0, 5.0, 4.0, 4.0, 1.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.098533630371094, -59.790096282958984, -57.481658935546875, -55.173221588134766, -52.864784240722656, -50.55634689331055, -48.24790954589844, -45.93947219848633, -43.63103485107422, -41.32259750366211, -39.01416015625, -36.70572280883789, -34.39728546142578, -32.08884811401367, -29.780410766601562, -27.471973419189453, -25.163536071777344, -22.855098724365234, -20.546661376953125, -18.238224029541016, -15.929786682128906, -13.621349334716797, -11.312911987304688, -9.004474639892578, -6.696037292480469, -4.387599945068359, -2.07916259765625, 0.22927474975585938, 2.5377120971679688, 4.846149444580078, 7.1545867919921875, 9.463024139404297, 11.771453857421875, 14.079891204833984, 16.388328552246094, 18.696765899658203, 21.005203247070312, 23.313640594482422, 25.62207794189453, 27.93051528930664, 30.23895263671875, 32.54738998413086, 34.85582733154297, 37.16426467895508, 39.47270202636719, 41.7811393737793, 44.089576721191406, 46.398014068603516, 48.706451416015625, 51.014888763427734, 53.323326110839844, 55.63176345825195, 57.94020080566406, 60.24863815307617, 62.55707550048828, 64.86550903320312, 67.1739501953125, 69.48239135742188, 71.79082489013672, 74.09925842285156, 76.40769958496094, 78.71614074707031, 81.02457427978516, 83.3330078125, 85.64144897460938]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 10.0, 19.0, 18.0, 44.0, 40.0, 59.0, 125.0, 291.0, 612.0, 1609.0, 4753.0, 19060.0, 163381.0, 3921041.0, 66165.0, 11601.0, 3222.0, 1154.0, 512.0, 238.0, 118.0, 73.0, 48.0, 28.0, 20.0, 14.0, 9.0, 9.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.25, -7.0557861328125, -6.861572265625, -6.6673583984375, -6.47314453125, -6.2789306640625, -6.084716796875, -5.8905029296875, -5.6962890625, -5.5020751953125, -5.307861328125, -5.1136474609375, -4.91943359375, -4.7252197265625, -4.531005859375, -4.3367919921875, -4.142578125, -3.9483642578125, -3.754150390625, -3.5599365234375, -3.36572265625, -3.1715087890625, -2.977294921875, -2.7830810546875, -2.5888671875, -2.3946533203125, -2.200439453125, -2.0062255859375, -1.81201171875, -1.6177978515625, -1.423583984375, -1.2293701171875, -1.03515625, -0.8409423828125, -0.646728515625, -0.4525146484375, -0.25830078125, -0.0640869140625, 0.130126953125, 0.3243408203125, 0.5185546875, 0.7127685546875, 0.906982421875, 1.1011962890625, 1.29541015625, 1.4896240234375, 1.683837890625, 1.8780517578125, 2.072265625, 2.2664794921875, 2.460693359375, 2.6549072265625, 2.84912109375, 3.0433349609375, 3.237548828125, 3.4317626953125, 3.6259765625, 3.8201904296875, 4.014404296875, 4.2086181640625, 4.40283203125, 4.5970458984375, 4.791259765625, 4.9854736328125, 5.1796875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 13.0, 20.0, 25.0, 49.0, 36.0, 76.0, 89.0, 114.0, 117.0, 100.0, 102.0, 86.0, 49.0, 40.0, 30.0, 12.0, 9.0, 7.0, 12.0, 5.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.10546875, -3.932861328125, -3.76025390625, -3.587646484375, -3.4150390625, -3.242431640625, -3.06982421875, -2.897216796875, -2.724609375, -2.552001953125, -2.37939453125, -2.206787109375, -2.0341796875, -1.861572265625, -1.68896484375, -1.516357421875, -1.34375, -1.171142578125, -0.99853515625, -0.825927734375, -0.6533203125, -0.480712890625, -0.30810546875, -0.135498046875, 0.037109375, 0.209716796875, 0.38232421875, 0.554931640625, 0.7275390625, 0.900146484375, 1.07275390625, 1.245361328125, 1.41796875, 1.590576171875, 1.76318359375, 1.935791015625, 2.1083984375, 2.281005859375, 2.45361328125, 2.626220703125, 2.798828125, 2.971435546875, 3.14404296875, 3.316650390625, 3.4892578125, 3.661865234375, 3.83447265625, 4.007080078125, 4.1796875, 4.352294921875, 4.52490234375, 4.697509765625, 4.8701171875, 5.042724609375, 5.21533203125, 5.387939453125, 5.560546875, 5.733154296875, 5.90576171875, 6.078369140625, 6.2509765625, 6.423583984375, 6.59619140625, 6.768798828125, 6.94140625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 6.0, 10.0, 5.0, 9.0, 13.0, 16.0, 22.0, 21.0, 21.0, 30.0, 46.0, 50.0, 54.0, 76.0, 65.0, 69.0, 91.0, 96.0, 113.0, 416.0, 6415.0, 4144485.0, 40382.0, 941.0, 151.0, 93.0, 69.0, 70.0, 62.0, 69.0, 54.0, 47.0, 37.0, 48.0, 24.0, 25.0, 21.0, 12.0, 14.0, 17.0, 6.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-19.953125, -19.39404296875, -18.8349609375, -18.27587890625, -17.716796875, -17.15771484375, -16.5986328125, -16.03955078125, -15.48046875, -14.92138671875, -14.3623046875, -13.80322265625, -13.244140625, -12.68505859375, -12.1259765625, -11.56689453125, -11.0078125, -10.44873046875, -9.8896484375, -9.33056640625, -8.771484375, -8.21240234375, -7.6533203125, -7.09423828125, -6.53515625, -5.97607421875, -5.4169921875, -4.85791015625, -4.298828125, -3.73974609375, -3.1806640625, -2.62158203125, -2.0625, -1.50341796875, -0.9443359375, -0.38525390625, 0.173828125, 0.73291015625, 1.2919921875, 1.85107421875, 2.41015625, 2.96923828125, 3.5283203125, 4.08740234375, 4.646484375, 5.20556640625, 5.7646484375, 6.32373046875, 6.8828125, 7.44189453125, 8.0009765625, 8.56005859375, 9.119140625, 9.67822265625, 10.2373046875, 10.79638671875, 11.35546875, 11.91455078125, 12.4736328125, 13.03271484375, 13.591796875, 14.15087890625, 14.7099609375, 15.26904296875, 15.828125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 48.0, 3100.0, 878.0, 40.0, 11.0, 1.0, 2.0, 2.0], "bins": [-19.9375, -19.59344482421875, -19.2493896484375, -18.90533447265625, -18.561279296875, -18.21722412109375, -17.8731689453125, -17.52911376953125, -17.18505859375, -16.84100341796875, -16.4969482421875, -16.15289306640625, -15.808837890625, -15.46478271484375, -15.1207275390625, -14.77667236328125, -14.4326171875, -14.08856201171875, -13.7445068359375, -13.40045166015625, -13.056396484375, -12.71234130859375, -12.3682861328125, -12.02423095703125, -11.68017578125, -11.33612060546875, -10.9920654296875, -10.64801025390625, -10.303955078125, -9.95989990234375, -9.6158447265625, -9.27178955078125, -8.927734375, -8.58367919921875, -8.2396240234375, -7.89556884765625, -7.551513671875, -7.20745849609375, -6.8634033203125, -6.51934814453125, -6.17529296875, -5.83123779296875, -5.4871826171875, -5.14312744140625, -4.799072265625, -4.45501708984375, -4.1109619140625, -3.76690673828125, -3.4228515625, -3.07879638671875, -2.7347412109375, -2.39068603515625, -2.046630859375, -1.70257568359375, -1.3585205078125, -1.01446533203125, -0.67041015625, -0.32635498046875, 0.0177001953125, 0.36175537109375, 0.705810546875, 1.04986572265625, 1.3939208984375, 1.73797607421875, 2.08203125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 6.0, 25.0, 162.0, 444.0, 274.0, 59.0, 22.0, 5.0, 10.0, 1.0, 1.0, 1.0, 1.0], "bins": [-69.4361343383789, -68.16034698486328, -66.88455200195312, -65.6087646484375, -64.33296966552734, -63.05718231201172, -61.78139114379883, -60.50559997558594, -59.22980880737305, -57.954017639160156, -56.678226470947266, -55.402435302734375, -54.12664794921875, -52.85085678100586, -51.57506561279297, -50.29927444458008, -49.02348327636719, -47.7476921081543, -46.471900939941406, -45.19611358642578, -43.92032241821289, -42.64453125, -41.36874008178711, -40.09294891357422, -38.817161560058594, -37.5413703918457, -36.26557922363281, -34.98979187011719, -33.7140007019043, -32.438209533691406, -31.162418365478516, -29.886627197265625, -28.610836029052734, -27.335044860839844, -26.059255599975586, -24.783464431762695, -23.507673263549805, -22.231884002685547, -20.956092834472656, -19.680301666259766, -18.404510498046875, -17.128719329833984, -15.85292911529541, -14.577138900756836, -13.301347732543945, -12.025557518005371, -10.749767303466797, -9.473976135253906, -8.198185920715332, -6.9223952293396, -5.646604537963867, -4.370814323425293, -3.0950236320495605, -1.8192329406738281, -0.5434427261352539, 0.7323484420776367, 2.008138656616211, 3.2839293479919434, 4.559720039367676, 5.83551025390625, 7.111300945281982, 8.387091636657715, 9.662881851196289, 10.93867301940918, 12.214463233947754]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 12.0, 15.0, 19.0, 22.0, 34.0, 41.0, 53.0, 74.0, 84.0, 108.0, 98.0, 95.0, 77.0, 81.0, 55.0, 38.0, 26.0, 17.0, 18.0, 7.0, 8.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.626962661743164, -27.79433822631836, -26.961715698242188, -26.129091262817383, -25.296466827392578, -24.463842391967773, -23.63121795654297, -22.798595428466797, -21.965970993041992, -21.133346557617188, -20.300724029541016, -19.46809959411621, -18.635475158691406, -17.8028507232666, -16.970226287841797, -16.137603759765625, -15.30497932434082, -14.472354888916016, -13.639731407165527, -12.807107925415039, -11.974483489990234, -11.14185905456543, -10.309235572814941, -9.476612091064453, -8.643987655639648, -7.811363697052002, -6.9787397384643555, -6.146115779876709, -5.3134918212890625, -4.480867862701416, -3.6482439041137695, -2.815619945526123, -1.9829978942871094, -1.150373935699463, -0.3177499771118164, 0.5148739814758301, 1.3474979400634766, 2.180121898651123, 3.0127458572387695, 3.845369815826416, 4.6779937744140625, 5.510617733001709, 6.3432416915893555, 7.175865650177002, 8.008489608764648, 8.841114044189453, 9.673737525939941, 10.50636100769043, 11.338985443115234, 12.171609878540039, 13.004233360290527, 13.836856842041016, 14.66948127746582, 15.502105712890625, 16.334728240966797, 17.1673526763916, 17.999977111816406, 18.83260154724121, 19.665225982666016, 20.497848510742188, 21.330472946166992, 22.163097381591797, 22.99571990966797, 23.828344345092773, 24.660968780517578]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 8.0, 6.0, 12.0, 16.0, 26.0, 37.0, 31.0, 81.0, 90.0, 136.0, 226.0, 334.0, 543.0, 960.0, 1841.0, 3744.0, 8809.0, 24330.0, 82437.0, 304922.0, 426653.0, 133375.0, 37026.0, 12435.0, 5032.0, 2412.0, 1177.0, 678.0, 395.0, 258.0, 184.0, 110.0, 64.0, 59.0, 30.0, 22.0, 11.0, 12.0, 10.0, 3.0, 8.0, 5.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.5390625, -5.37701416015625, -5.2149658203125, -5.05291748046875, -4.890869140625, -4.72882080078125, -4.5667724609375, -4.40472412109375, -4.24267578125, -4.08062744140625, -3.9185791015625, -3.75653076171875, -3.594482421875, -3.43243408203125, -3.2703857421875, -3.10833740234375, -2.9462890625, -2.78424072265625, -2.6221923828125, -2.46014404296875, -2.298095703125, -2.13604736328125, -1.9739990234375, -1.81195068359375, -1.64990234375, -1.48785400390625, -1.3258056640625, -1.16375732421875, -1.001708984375, -0.83966064453125, -0.6776123046875, -0.51556396484375, -0.353515625, -0.19146728515625, -0.0294189453125, 0.13262939453125, 0.294677734375, 0.45672607421875, 0.6187744140625, 0.78082275390625, 0.94287109375, 1.10491943359375, 1.2669677734375, 1.42901611328125, 1.591064453125, 1.75311279296875, 1.9151611328125, 2.07720947265625, 2.2392578125, 2.40130615234375, 2.5633544921875, 2.72540283203125, 2.887451171875, 3.04949951171875, 3.2115478515625, 3.37359619140625, 3.53564453125, 3.69769287109375, 3.8597412109375, 4.02178955078125, 4.183837890625, 4.34588623046875, 4.5079345703125, 4.66998291015625, 4.83203125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 10.0, 7.0, 19.0, 26.0, 34.0, 40.0, 51.0, 49.0, 82.0, 92.0, 108.0, 95.0, 92.0, 82.0, 63.0, 41.0, 29.0, 17.0, 17.0, 16.0, 11.0, 3.0, 7.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.06640625, -3.90838623046875, -3.7503662109375, -3.59234619140625, -3.434326171875, -3.27630615234375, -3.1182861328125, -2.96026611328125, -2.80224609375, -2.64422607421875, -2.4862060546875, -2.32818603515625, -2.170166015625, -2.01214599609375, -1.8541259765625, -1.69610595703125, -1.5380859375, -1.38006591796875, -1.2220458984375, -1.06402587890625, -0.906005859375, -0.74798583984375, -0.5899658203125, -0.43194580078125, -0.27392578125, -0.11590576171875, 0.0421142578125, 0.20013427734375, 0.358154296875, 0.51617431640625, 0.6741943359375, 0.83221435546875, 0.990234375, 1.14825439453125, 1.3062744140625, 1.46429443359375, 1.622314453125, 1.78033447265625, 1.9383544921875, 2.09637451171875, 2.25439453125, 2.41241455078125, 2.5704345703125, 2.72845458984375, 2.886474609375, 3.04449462890625, 3.2025146484375, 3.36053466796875, 3.5185546875, 3.67657470703125, 3.8345947265625, 3.99261474609375, 4.150634765625, 4.30865478515625, 4.4666748046875, 4.62469482421875, 4.78271484375, 4.94073486328125, 5.0987548828125, 5.25677490234375, 5.414794921875, 5.57281494140625, 5.7308349609375, 5.88885498046875, 6.046875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 7.0, 13.0, 12.0, 18.0, 32.0, 24.0, 45.0, 67.0, 107.0, 212.0, 396.0, 773.0, 2178.0, 8321.0, 116983.0, 876334.0, 35516.0, 4640.0, 1488.0, 622.0, 295.0, 173.0, 90.0, 59.0, 46.0, 26.0, 16.0, 13.0, 14.0, 9.0, 8.0, 3.0, 4.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.234375, -15.7471923828125, -15.260009765625, -14.7728271484375, -14.28564453125, -13.7984619140625, -13.311279296875, -12.8240966796875, -12.3369140625, -11.8497314453125, -11.362548828125, -10.8753662109375, -10.38818359375, -9.9010009765625, -9.413818359375, -8.9266357421875, -8.439453125, -7.9522705078125, -7.465087890625, -6.9779052734375, -6.49072265625, -6.0035400390625, -5.516357421875, -5.0291748046875, -4.5419921875, -4.0548095703125, -3.567626953125, -3.0804443359375, -2.59326171875, -2.1060791015625, -1.618896484375, -1.1317138671875, -0.64453125, -0.1573486328125, 0.329833984375, 0.8170166015625, 1.30419921875, 1.7913818359375, 2.278564453125, 2.7657470703125, 3.2529296875, 3.7401123046875, 4.227294921875, 4.7144775390625, 5.20166015625, 5.6888427734375, 6.176025390625, 6.6632080078125, 7.150390625, 7.6375732421875, 8.124755859375, 8.6119384765625, 9.09912109375, 9.5863037109375, 10.073486328125, 10.5606689453125, 11.0478515625, 11.5350341796875, 12.022216796875, 12.5093994140625, 12.99658203125, 13.4837646484375, 13.970947265625, 14.4581298828125, 14.9453125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 9.0, 6.0, 6.0, 20.0, 20.0, 26.0, 38.0, 42.0, 60.0, 71.0, 80.0, 89.0, 105.0, 98.0, 80.0, 69.0, 51.0, 40.0, 19.0, 17.0, 17.0, 7.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-27.140625, -26.4111328125, -25.681640625, -24.9521484375, -24.22265625, -23.4931640625, -22.763671875, -22.0341796875, -21.3046875, -20.5751953125, -19.845703125, -19.1162109375, -18.38671875, -17.6572265625, -16.927734375, -16.1982421875, -15.46875, -14.7392578125, -14.009765625, -13.2802734375, -12.55078125, -11.8212890625, -11.091796875, -10.3623046875, -9.6328125, -8.9033203125, -8.173828125, -7.4443359375, -6.71484375, -5.9853515625, -5.255859375, -4.5263671875, -3.796875, -3.0673828125, -2.337890625, -1.6083984375, -0.87890625, -0.1494140625, 0.580078125, 1.3095703125, 2.0390625, 2.7685546875, 3.498046875, 4.2275390625, 4.95703125, 5.6865234375, 6.416015625, 7.1455078125, 7.875, 8.6044921875, 9.333984375, 10.0634765625, 10.79296875, 11.5224609375, 12.251953125, 12.9814453125, 13.7109375, 14.4404296875, 15.169921875, 15.8994140625, 16.62890625, 17.3583984375, 18.087890625, 18.8173828125, 19.546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 9.0, 20.0, 22.0, 24.0, 42.0, 41.0, 70.0, 96.0, 122.0, 169.0, 258.0, 397.0, 726.0, 1973.0, 7752.0, 59161.0, 725248.0, 226352.0, 19770.0, 3590.0, 1121.0, 531.0, 317.0, 214.0, 140.0, 92.0, 66.0, 46.0, 44.0, 28.0, 26.0, 19.0, 14.0, 10.0, 11.0, 8.0, 4.0, 1.0, 4.0, 1.0, 4.0], "bins": [-4.01171875, -3.910797119140625, -3.80987548828125, -3.708953857421875, -3.6080322265625, -3.507110595703125, -3.40618896484375, -3.305267333984375, -3.204345703125, -3.103424072265625, -3.00250244140625, -2.901580810546875, -2.8006591796875, -2.699737548828125, -2.59881591796875, -2.497894287109375, -2.39697265625, -2.296051025390625, -2.19512939453125, -2.094207763671875, -1.9932861328125, -1.892364501953125, -1.79144287109375, -1.690521240234375, -1.589599609375, -1.488677978515625, -1.38775634765625, -1.286834716796875, -1.1859130859375, -1.084991455078125, -0.98406982421875, -0.883148193359375, -0.7822265625, -0.681304931640625, -0.58038330078125, -0.479461669921875, -0.3785400390625, -0.277618408203125, -0.17669677734375, -0.075775146484375, 0.025146484375, 0.126068115234375, 0.22698974609375, 0.327911376953125, 0.4288330078125, 0.529754638671875, 0.63067626953125, 0.731597900390625, 0.83251953125, 0.933441162109375, 1.03436279296875, 1.135284423828125, 1.2362060546875, 1.337127685546875, 1.43804931640625, 1.538970947265625, 1.639892578125, 1.740814208984375, 1.84173583984375, 1.942657470703125, 2.0435791015625, 2.144500732421875, 2.24542236328125, 2.346343994140625, 2.447265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 9.0, 10.0, 13.0, 25.0, 18.0, 30.0, 40.0, 54.0, 74.0, 106.0, 130.0, 116.0, 73.0, 70.0, 42.0, 41.0, 33.0, 21.0, 15.0, 14.0, 6.0, 9.0, 8.0, 4.0, 5.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003025531768798828, -0.0002912096679210663, -0.00027986615896224976, -0.00026852265000343323, -0.0002571791410446167, -0.00024583563208580017, -0.00023449212312698364, -0.00022314861416816711, -0.00021180510520935059, -0.00020046159625053406, -0.00018911808729171753, -0.000177774578332901, -0.00016643106937408447, -0.00015508756041526794, -0.00014374405145645142, -0.0001324005424976349, -0.00012105703353881836, -0.00010971352458000183, -9.83700156211853e-05, -8.702650666236877e-05, -7.568299770355225e-05, -6.433948874473572e-05, -5.299597978591919e-05, -4.165247082710266e-05, -3.0308961868286133e-05, -1.8965452909469604e-05, -7.621943950653076e-06, 3.721565008163452e-06, 1.506507396697998e-05, 2.640858292579651e-05, 3.775209188461304e-05, 4.9095600843429565e-05, 6.0439109802246094e-05, 7.178261876106262e-05, 8.312612771987915e-05, 9.446963667869568e-05, 0.00010581314563751221, 0.00011715665459632874, 0.00012850016355514526, 0.0001398436725139618, 0.00015118718147277832, 0.00016253069043159485, 0.00017387419939041138, 0.0001852177083492279, 0.00019656121730804443, 0.00020790472626686096, 0.0002192482352256775, 0.00023059174418449402, 0.00024193525314331055, 0.0002532787621021271, 0.0002646222710609436, 0.00027596578001976013, 0.00028730928897857666, 0.0002986527979373932, 0.0003099963068962097, 0.00032133981585502625, 0.0003326833248138428, 0.0003440268337726593, 0.00035537034273147583, 0.00036671385169029236, 0.0003780573606491089, 0.0003894008696079254, 0.00040074437856674194, 0.00041208788752555847, 0.000423431396484375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 4.0, 9.0, 21.0, 30.0, 38.0, 43.0, 79.0, 112.0, 235.0, 450.0, 991.0, 3333.0, 22093.0, 671677.0, 331483.0, 13748.0, 2498.0, 794.0, 392.0, 201.0, 104.0, 80.0, 40.0, 29.0, 25.0, 14.0, 11.0, 6.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.22265625, -5.08111572265625, -4.9395751953125, -4.79803466796875, -4.656494140625, -4.51495361328125, -4.3734130859375, -4.23187255859375, -4.09033203125, -3.94879150390625, -3.8072509765625, -3.66571044921875, -3.524169921875, -3.38262939453125, -3.2410888671875, -3.09954833984375, -2.9580078125, -2.81646728515625, -2.6749267578125, -2.53338623046875, -2.391845703125, -2.25030517578125, -2.1087646484375, -1.96722412109375, -1.82568359375, -1.68414306640625, -1.5426025390625, -1.40106201171875, -1.259521484375, -1.11798095703125, -0.9764404296875, -0.83489990234375, -0.693359375, -0.55181884765625, -0.4102783203125, -0.26873779296875, -0.127197265625, 0.01434326171875, 0.1558837890625, 0.29742431640625, 0.43896484375, 0.58050537109375, 0.7220458984375, 0.86358642578125, 1.005126953125, 1.14666748046875, 1.2882080078125, 1.42974853515625, 1.5712890625, 1.71282958984375, 1.8543701171875, 1.99591064453125, 2.137451171875, 2.27899169921875, 2.4205322265625, 2.56207275390625, 2.70361328125, 2.84515380859375, 2.9866943359375, 3.12823486328125, 3.269775390625, 3.41131591796875, 3.5528564453125, 3.69439697265625, 3.8359375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 8.0, 17.0, 25.0, 46.0, 73.0, 107.0, 159.0, 181.0, 132.0, 99.0, 53.0, 28.0, 19.0, 20.0, 10.0, 10.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -4.99847412109375, -4.8328857421875, -4.66729736328125, -4.501708984375, -4.33612060546875, -4.1705322265625, -4.00494384765625, -3.83935546875, -3.67376708984375, -3.5081787109375, -3.34259033203125, -3.177001953125, -3.01141357421875, -2.8458251953125, -2.68023681640625, -2.5146484375, -2.34906005859375, -2.1834716796875, -2.01788330078125, -1.852294921875, -1.68670654296875, -1.5211181640625, -1.35552978515625, -1.18994140625, -1.02435302734375, -0.8587646484375, -0.69317626953125, -0.527587890625, -0.36199951171875, -0.1964111328125, -0.03082275390625, 0.134765625, 0.30035400390625, 0.4659423828125, 0.63153076171875, 0.797119140625, 0.96270751953125, 1.1282958984375, 1.29388427734375, 1.45947265625, 1.62506103515625, 1.7906494140625, 1.95623779296875, 2.121826171875, 2.28741455078125, 2.4530029296875, 2.61859130859375, 2.7841796875, 2.94976806640625, 3.1153564453125, 3.28094482421875, 3.446533203125, 3.61212158203125, 3.7777099609375, 3.94329833984375, 4.10888671875, 4.27447509765625, 4.4400634765625, 4.60565185546875, 4.771240234375, 4.93682861328125, 5.1024169921875, 5.26800537109375, 5.43359375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 30.0, 100.0, 318.0, 374.0, 126.0, 34.0, 12.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.09017944335938, -163.9984130859375, -158.90663146972656, -153.81484985351562, -148.72308349609375, -143.63131713867188, -138.53953552246094, -133.44775390625, -128.35598754882812, -123.26421356201172, -118.17243957519531, -113.0806655883789, -107.9888916015625, -102.8971176147461, -97.80534362792969, -92.71356964111328, -87.62179565429688, -82.53002166748047, -77.43824768066406, -72.34647369384766, -67.25469970703125, -62.162925720214844, -57.07115173339844, -51.97937774658203, -46.887603759765625, -41.79582977294922, -36.70405578613281, -31.612281799316406, -26.5205078125, -21.428733825683594, -16.336959838867188, -11.245185852050781, -6.1534271240234375, -1.0616531372070312, 4.030120849609375, 9.121894836425781, 14.213668823242188, 19.305442810058594, 24.397216796875, 29.488990783691406, 34.58076477050781, 39.67253875732422, 44.764312744140625, 49.85608673095703, 54.94786071777344, 60.039634704589844, 65.13140869140625, 70.22318267822266, 75.31495666503906, 80.40673065185547, 85.49850463867188, 90.59027862548828, 95.68205261230469, 100.7738265991211, 105.8656005859375, 110.9573745727539, 116.04914855957031, 121.14092254638672, 126.23269653320312, 131.324462890625, 136.41624450683594, 141.50802612304688, 146.59979248046875, 151.69155883789062, 156.78334045410156]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 8.0, 7.0, 10.0, 9.0, 15.0, 21.0, 19.0, 18.0, 30.0, 32.0, 42.0, 45.0, 41.0, 40.0, 46.0, 60.0, 59.0, 68.0, 52.0, 50.0, 60.0, 48.0, 38.0, 29.0, 30.0, 24.0, 19.0, 12.0, 11.0, 10.0, 9.0, 6.0, 4.0, 3.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-85.27381896972656, -82.86646270751953, -80.45909881591797, -78.05174255371094, -75.64437866210938, -73.23702239990234, -70.82966613769531, -68.42230224609375, -66.01494598388672, -63.60758590698242, -61.200225830078125, -58.792869567871094, -56.3855094909668, -53.9781494140625, -51.5707893371582, -49.163429260253906, -46.75606918334961, -44.34870910644531, -41.941349029541016, -39.53398895263672, -37.12663269042969, -34.71927261352539, -32.311912536621094, -29.90455436706543, -27.497194290161133, -25.089834213256836, -22.682476043701172, -20.275115966796875, -17.867755889892578, -15.460397720336914, -13.053037643432617, -10.645679473876953, -8.238319396972656, -5.830960273742676, -3.423600673675537, -1.0162410736083984, 1.391118049621582, 3.7984771728515625, 6.205837249755859, 8.613195419311523, 11.02055549621582, 13.4279146194458, 15.835273742675781, 18.242633819580078, 20.649993896484375, 23.05735206604004, 25.464712142944336, 27.8720703125, 30.279430389404297, 32.686790466308594, 35.09415054321289, 37.50151062011719, 39.90886688232422, 42.316226959228516, 44.72358703613281, 47.130943298339844, 49.538307189941406, 51.9456672668457, 54.35302734375, 56.76038360595703, 59.16774368286133, 61.575103759765625, 63.98246383666992, 66.38982391357422, 68.79718017578125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 4.0, 3.0, 5.0, 7.0, 11.0, 16.0, 21.0, 48.0, 41.0, 70.0, 92.0, 164.0, 232.0, 356.0, 528.0, 946.0, 1563.0, 2751.0, 5224.0, 11480.0, 31883.0, 148951.0, 2444560.0, 1390419.0, 107404.0, 26543.0, 10150.0, 4623.0, 2442.0, 1423.0, 819.0, 486.0, 309.0, 233.0, 151.0, 112.0, 63.0, 54.0, 35.0, 20.0, 10.0, 9.0, 12.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.94140625, -3.834625244140625, -3.72784423828125, -3.621063232421875, -3.5142822265625, -3.407501220703125, -3.30072021484375, -3.193939208984375, -3.087158203125, -2.980377197265625, -2.87359619140625, -2.766815185546875, -2.6600341796875, -2.553253173828125, -2.44647216796875, -2.339691162109375, -2.23291015625, -2.126129150390625, -2.01934814453125, -1.912567138671875, -1.8057861328125, -1.699005126953125, -1.59222412109375, -1.485443115234375, -1.378662109375, -1.271881103515625, -1.16510009765625, -1.058319091796875, -0.9515380859375, -0.844757080078125, -0.73797607421875, -0.631195068359375, -0.5244140625, -0.417633056640625, -0.31085205078125, -0.204071044921875, -0.0972900390625, 0.009490966796875, 0.11627197265625, 0.223052978515625, 0.329833984375, 0.436614990234375, 0.54339599609375, 0.650177001953125, 0.7569580078125, 0.863739013671875, 0.97052001953125, 1.077301025390625, 1.18408203125, 1.290863037109375, 1.39764404296875, 1.504425048828125, 1.6112060546875, 1.717987060546875, 1.82476806640625, 1.931549072265625, 2.038330078125, 2.145111083984375, 2.25189208984375, 2.358673095703125, 2.4654541015625, 2.572235107421875, 2.67901611328125, 2.785797119140625, 2.892578125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 9.0, 7.0, 12.0, 15.0, 13.0, 13.0, 33.0, 25.0, 43.0, 21.0, 30.0, 45.0, 46.0, 55.0, 48.0, 64.0, 61.0, 73.0, 63.0, 52.0, 47.0, 42.0, 29.0, 25.0, 25.0, 16.0, 20.0, 15.0, 8.0, 10.0, 6.0, 8.0, 4.0, 5.0, 4.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.240234375, -3.154815673828125, -3.06939697265625, -2.983978271484375, -2.8985595703125, -2.813140869140625, -2.72772216796875, -2.642303466796875, -2.556884765625, -2.471466064453125, -2.38604736328125, -2.300628662109375, -2.2152099609375, -2.129791259765625, -2.04437255859375, -1.958953857421875, -1.87353515625, -1.788116455078125, -1.70269775390625, -1.617279052734375, -1.5318603515625, -1.446441650390625, -1.36102294921875, -1.275604248046875, -1.190185546875, -1.104766845703125, -1.01934814453125, -0.933929443359375, -0.8485107421875, -0.763092041015625, -0.67767333984375, -0.592254638671875, -0.5068359375, -0.421417236328125, -0.33599853515625, -0.250579833984375, -0.1651611328125, -0.079742431640625, 0.00567626953125, 0.091094970703125, 0.176513671875, 0.261932373046875, 0.34735107421875, 0.432769775390625, 0.5181884765625, 0.603607177734375, 0.68902587890625, 0.774444580078125, 0.85986328125, 0.945281982421875, 1.03070068359375, 1.116119384765625, 1.2015380859375, 1.286956787109375, 1.37237548828125, 1.457794189453125, 1.543212890625, 1.628631591796875, 1.71405029296875, 1.799468994140625, 1.8848876953125, 1.970306396484375, 2.05572509765625, 2.141143798828125, 2.2265625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 3.0, 12.0, 19.0, 18.0, 27.0, 85.0, 222.0, 663.0, 3364.0, 49752.0, 4055983.0, 78507.0, 4426.0, 761.0, 231.0, 91.0, 42.0, 26.0, 18.0, 9.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.65625, -11.286865234375, -10.91748046875, -10.548095703125, -10.1787109375, -9.809326171875, -9.43994140625, -9.070556640625, -8.701171875, -8.331787109375, -7.96240234375, -7.593017578125, -7.2236328125, -6.854248046875, -6.48486328125, -6.115478515625, -5.74609375, -5.376708984375, -5.00732421875, -4.637939453125, -4.2685546875, -3.899169921875, -3.52978515625, -3.160400390625, -2.791015625, -2.421630859375, -2.05224609375, -1.682861328125, -1.3134765625, -0.944091796875, -0.57470703125, -0.205322265625, 0.1640625, 0.533447265625, 0.90283203125, 1.272216796875, 1.6416015625, 2.010986328125, 2.38037109375, 2.749755859375, 3.119140625, 3.488525390625, 3.85791015625, 4.227294921875, 4.5966796875, 4.966064453125, 5.33544921875, 5.704833984375, 6.07421875, 6.443603515625, 6.81298828125, 7.182373046875, 7.5517578125, 7.921142578125, 8.29052734375, 8.659912109375, 9.029296875, 9.398681640625, 9.76806640625, 10.137451171875, 10.5068359375, 10.876220703125, 11.24560546875, 11.614990234375, 11.984375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 1.0, 7.0, 16.0, 19.0, 30.0, 61.0, 149.0, 540.0, 2031.0, 852.0, 187.0, 72.0, 32.0, 21.0, 18.0, 12.0, 11.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.78125, -10.4945068359375, -10.207763671875, -9.9210205078125, -9.63427734375, -9.3475341796875, -9.060791015625, -8.7740478515625, -8.4873046875, -8.2005615234375, -7.913818359375, -7.6270751953125, -7.34033203125, -7.0535888671875, -6.766845703125, -6.4801025390625, -6.193359375, -5.9066162109375, -5.619873046875, -5.3331298828125, -5.04638671875, -4.7596435546875, -4.472900390625, -4.1861572265625, -3.8994140625, -3.6126708984375, -3.325927734375, -3.0391845703125, -2.75244140625, -2.4656982421875, -2.178955078125, -1.8922119140625, -1.60546875, -1.3187255859375, -1.031982421875, -0.7452392578125, -0.45849609375, -0.1717529296875, 0.114990234375, 0.4017333984375, 0.6884765625, 0.9752197265625, 1.261962890625, 1.5487060546875, 1.83544921875, 2.1221923828125, 2.408935546875, 2.6956787109375, 2.982421875, 3.2691650390625, 3.555908203125, 3.8426513671875, 4.12939453125, 4.4161376953125, 4.702880859375, 4.9896240234375, 5.2763671875, 5.5631103515625, 5.849853515625, 6.1365966796875, 6.42333984375, 6.7100830078125, 6.996826171875, 7.2835693359375, 7.5703125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 4.0, 11.0, 24.0, 40.0, 73.0, 124.0, 164.0, 180.0, 147.0, 81.0, 51.0, 28.0, 15.0, 15.0, 9.0, 5.0, 5.0, 1.0, 6.0, 2.0, 5.0, 5.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.610336303710938, -11.34864616394043, -10.086955070495605, -8.825263977050781, -7.563573837280273, -6.301883220672607, -5.040192604064941, -3.778501510620117, -2.5168113708496094, -1.2551207542419434, 0.006569862365722656, 1.2682604789733887, 2.5299510955810547, 3.7916417121887207, 5.053332328796387, 6.315023422241211, 7.576713562011719, 8.838403701782227, 10.10009479522705, 11.361785888671875, 12.623476028442383, 13.88516616821289, 15.146857261657715, 16.40854835510254, 17.670238494873047, 18.931928634643555, 20.193618774414062, 21.455310821533203, 22.71700096130371, 23.97869110107422, 25.24038314819336, 26.502073287963867, 27.763763427734375, 29.025453567504883, 30.28714370727539, 31.54883575439453, 32.810523986816406, 34.07221603393555, 35.33390808105469, 36.59559631347656, 37.8572883605957, 39.118980407714844, 40.38066864013672, 41.64236068725586, 42.904052734375, 44.165740966796875, 45.427433013916016, 46.689125061035156, 47.95081329345703, 49.21250534057617, 50.47419357299805, 51.73588562011719, 52.99757385253906, 54.2592658996582, 55.520957946777344, 56.78264617919922, 58.04433822631836, 59.3060302734375, 60.567718505859375, 61.829410552978516, 63.091102600097656, 64.35279083251953, 65.6144790649414, 66.87617492675781, 68.13786315917969]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 3.0, 2.0, 6.0, 7.0, 10.0, 8.0, 18.0, 13.0, 12.0, 23.0, 24.0, 33.0, 26.0, 34.0, 41.0, 40.0, 39.0, 48.0, 47.0, 43.0, 47.0, 48.0, 38.0, 44.0, 41.0, 28.0, 27.0, 31.0, 34.0, 22.0, 22.0, 30.0, 17.0, 17.0, 8.0, 11.0, 9.0, 7.0, 7.0, 5.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-23.848102569580078, -23.170127868652344, -22.49215316772461, -21.814176559448242, -21.136201858520508, -20.458227157592773, -19.78025245666504, -19.102275848388672, -18.424301147460938, -17.746326446533203, -17.06835174560547, -16.3903751373291, -15.712400436401367, -15.034425735473633, -14.356451034545898, -13.678475379943848, -13.000500679016113, -12.322525978088379, -11.644550323486328, -10.966575622558594, -10.288599967956543, -9.610625267028809, -8.932649612426758, -8.254674911499023, -7.576699733734131, -6.898724555969238, -6.220749378204346, -5.542774200439453, -4.864799499511719, -4.186823844909668, -3.5088491439819336, -2.830873966217041, -2.1528987884521484, -1.4749236106872559, -0.7969485521316528, -0.1189734935760498, 0.5590016841888428, 1.2369768619537354, 1.9149518013000488, 2.5929269790649414, 3.270902156829834, 3.9488773345947266, 4.626852512359619, 5.304827690124512, 5.982802391052246, 6.660778045654297, 7.338752746582031, 8.016727447509766, 8.694703102111816, 9.37267780303955, 10.050653457641602, 10.728628158569336, 11.406603813171387, 12.084578514099121, 12.762554168701172, 13.440528869628906, 14.11850357055664, 14.796478271484375, 15.474453926086426, 16.152429580688477, 16.83040428161621, 17.508378982543945, 18.18635368347168, 18.864330291748047, 19.54230499267578]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 11.0, 15.0, 14.0, 30.0, 37.0, 66.0, 76.0, 125.0, 217.0, 319.0, 574.0, 999.0, 1665.0, 3189.0, 6263.0, 13169.0, 28698.0, 65344.0, 154505.0, 324602.0, 253530.0, 107635.0, 46620.0, 20653.0, 9704.0, 4670.0, 2478.0, 1363.0, 743.0, 458.0, 257.0, 159.0, 108.0, 65.0, 53.0, 43.0, 37.0, 20.0, 9.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01953125, -2.918182373046875, -2.81683349609375, -2.715484619140625, -2.6141357421875, -2.512786865234375, -2.41143798828125, -2.310089111328125, -2.208740234375, -2.107391357421875, -2.00604248046875, -1.904693603515625, -1.8033447265625, -1.701995849609375, -1.60064697265625, -1.499298095703125, -1.39794921875, -1.296600341796875, -1.19525146484375, -1.093902587890625, -0.9925537109375, -0.891204833984375, -0.78985595703125, -0.688507080078125, -0.587158203125, -0.485809326171875, -0.38446044921875, -0.283111572265625, -0.1817626953125, -0.080413818359375, 0.02093505859375, 0.122283935546875, 0.2236328125, 0.324981689453125, 0.42633056640625, 0.527679443359375, 0.6290283203125, 0.730377197265625, 0.83172607421875, 0.933074951171875, 1.034423828125, 1.135772705078125, 1.23712158203125, 1.338470458984375, 1.4398193359375, 1.541168212890625, 1.64251708984375, 1.743865966796875, 1.84521484375, 1.946563720703125, 2.04791259765625, 2.149261474609375, 2.2506103515625, 2.351959228515625, 2.45330810546875, 2.554656982421875, 2.656005859375, 2.757354736328125, 2.85870361328125, 2.960052490234375, 3.0614013671875, 3.162750244140625, 3.26409912109375, 3.365447998046875, 3.466796875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 6.0, 12.0, 8.0, 4.0, 8.0, 11.0, 17.0, 19.0, 21.0, 22.0, 20.0, 21.0, 29.0, 33.0, 27.0, 33.0, 40.0, 40.0, 41.0, 42.0, 48.0, 39.0, 49.0, 46.0, 41.0, 46.0, 44.0, 23.0, 30.0, 27.0, 13.0, 25.0, 14.0, 15.0, 10.0, 14.0, 15.0, 11.0, 3.0, 4.0, 6.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0], "bins": [-2.029296875, -1.968719482421875, -1.90814208984375, -1.847564697265625, -1.7869873046875, -1.726409912109375, -1.66583251953125, -1.605255126953125, -1.544677734375, -1.484100341796875, -1.42352294921875, -1.362945556640625, -1.3023681640625, -1.241790771484375, -1.18121337890625, -1.120635986328125, -1.06005859375, -0.999481201171875, -0.93890380859375, -0.878326416015625, -0.8177490234375, -0.757171630859375, -0.69659423828125, -0.636016845703125, -0.575439453125, -0.514862060546875, -0.45428466796875, -0.393707275390625, -0.3331298828125, -0.272552490234375, -0.21197509765625, -0.151397705078125, -0.0908203125, -0.030242919921875, 0.03033447265625, 0.090911865234375, 0.1514892578125, 0.212066650390625, 0.27264404296875, 0.333221435546875, 0.393798828125, 0.454376220703125, 0.51495361328125, 0.575531005859375, 0.6361083984375, 0.696685791015625, 0.75726318359375, 0.817840576171875, 0.87841796875, 0.938995361328125, 0.99957275390625, 1.060150146484375, 1.1207275390625, 1.181304931640625, 1.24188232421875, 1.302459716796875, 1.363037109375, 1.423614501953125, 1.48419189453125, 1.544769287109375, 1.6053466796875, 1.665924072265625, 1.72650146484375, 1.787078857421875, 1.84765625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 1.0, 1.0, 7.0, 8.0, 9.0, 13.0, 19.0, 24.0, 38.0, 64.0, 85.0, 178.0, 289.0, 569.0, 1398.0, 4413.0, 34691.0, 804667.0, 186829.0, 10959.0, 2447.0, 873.0, 410.0, 210.0, 104.0, 85.0, 48.0, 32.0, 23.0, 17.0, 17.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.8203125, -11.4481201171875, -11.075927734375, -10.7037353515625, -10.33154296875, -9.9593505859375, -9.587158203125, -9.2149658203125, -8.8427734375, -8.4705810546875, -8.098388671875, -7.7261962890625, -7.35400390625, -6.9818115234375, -6.609619140625, -6.2374267578125, -5.865234375, -5.4930419921875, -5.120849609375, -4.7486572265625, -4.37646484375, -4.0042724609375, -3.632080078125, -3.2598876953125, -2.8876953125, -2.5155029296875, -2.143310546875, -1.7711181640625, -1.39892578125, -1.0267333984375, -0.654541015625, -0.2823486328125, 0.08984375, 0.4620361328125, 0.834228515625, 1.2064208984375, 1.57861328125, 1.9508056640625, 2.322998046875, 2.6951904296875, 3.0673828125, 3.4395751953125, 3.811767578125, 4.1839599609375, 4.55615234375, 4.9283447265625, 5.300537109375, 5.6727294921875, 6.044921875, 6.4171142578125, 6.789306640625, 7.1614990234375, 7.53369140625, 7.9058837890625, 8.278076171875, 8.6502685546875, 9.0224609375, 9.3946533203125, 9.766845703125, 10.1390380859375, 10.51123046875, 10.8834228515625, 11.255615234375, 11.6278076171875, 12.0]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 6.0, 7.0, 9.0, 15.0, 26.0, 21.0, 29.0, 53.0, 33.0, 60.0, 52.0, 60.0, 73.0, 81.0, 68.0, 62.0, 64.0, 54.0, 57.0, 20.0, 31.0, 27.0, 24.0, 10.0, 14.0, 12.0, 9.0, 0.0, 5.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.90625, -10.5010986328125, -10.095947265625, -9.6907958984375, -9.28564453125, -8.8804931640625, -8.475341796875, -8.0701904296875, -7.6650390625, -7.2598876953125, -6.854736328125, -6.4495849609375, -6.04443359375, -5.6392822265625, -5.234130859375, -4.8289794921875, -4.423828125, -4.0186767578125, -3.613525390625, -3.2083740234375, -2.80322265625, -2.3980712890625, -1.992919921875, -1.5877685546875, -1.1826171875, -0.7774658203125, -0.372314453125, 0.0328369140625, 0.43798828125, 0.8431396484375, 1.248291015625, 1.6534423828125, 2.05859375, 2.4637451171875, 2.868896484375, 3.2740478515625, 3.67919921875, 4.0843505859375, 4.489501953125, 4.8946533203125, 5.2998046875, 5.7049560546875, 6.110107421875, 6.5152587890625, 6.92041015625, 7.3255615234375, 7.730712890625, 8.1358642578125, 8.541015625, 8.9461669921875, 9.351318359375, 9.7564697265625, 10.16162109375, 10.5667724609375, 10.971923828125, 11.3770751953125, 11.7822265625, 12.1873779296875, 12.592529296875, 12.9976806640625, 13.40283203125, 13.8079833984375, 14.213134765625, 14.6182861328125, 15.0234375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 9.0, 8.0, 4.0, 11.0, 16.0, 20.0, 31.0, 41.0, 65.0, 100.0, 169.0, 395.0, 1028.0, 3955.0, 37378.0, 907554.0, 88868.0, 6502.0, 1347.0, 461.0, 210.0, 122.0, 69.0, 47.0, 32.0, 27.0, 21.0, 14.0, 4.0, 11.0, 5.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.98828125, -4.825439453125, -4.66259765625, -4.499755859375, -4.3369140625, -4.174072265625, -4.01123046875, -3.848388671875, -3.685546875, -3.522705078125, -3.35986328125, -3.197021484375, -3.0341796875, -2.871337890625, -2.70849609375, -2.545654296875, -2.3828125, -2.219970703125, -2.05712890625, -1.894287109375, -1.7314453125, -1.568603515625, -1.40576171875, -1.242919921875, -1.080078125, -0.917236328125, -0.75439453125, -0.591552734375, -0.4287109375, -0.265869140625, -0.10302734375, 0.059814453125, 0.22265625, 0.385498046875, 0.54833984375, 0.711181640625, 0.8740234375, 1.036865234375, 1.19970703125, 1.362548828125, 1.525390625, 1.688232421875, 1.85107421875, 2.013916015625, 2.1767578125, 2.339599609375, 2.50244140625, 2.665283203125, 2.828125, 2.990966796875, 3.15380859375, 3.316650390625, 3.4794921875, 3.642333984375, 3.80517578125, 3.968017578125, 4.130859375, 4.293701171875, 4.45654296875, 4.619384765625, 4.7822265625, 4.945068359375, 5.10791015625, 5.270751953125, 5.43359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 3.0, 3.0, 10.0, 10.0, 8.0, 14.0, 17.0, 16.0, 38.0, 57.0, 120.0, 191.0, 180.0, 95.0, 48.0, 48.0, 22.0, 35.0, 20.0, 10.0, 8.0, 13.0, 5.0, 5.0, 5.0, 3.0, 2.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00055694580078125, -0.0005394518375396729, -0.0005219578742980957, -0.0005044639110565186, -0.0004869699478149414, -0.00046947598457336426, -0.0004519820213317871, -0.00043448805809020996, -0.0004169940948486328, -0.00039950013160705566, -0.0003820061683654785, -0.00036451220512390137, -0.0003470182418823242, -0.00032952427864074707, -0.0003120303153991699, -0.0002945363521575928, -0.0002770423889160156, -0.0002595484256744385, -0.00024205446243286133, -0.00022456049919128418, -0.00020706653594970703, -0.00018957257270812988, -0.00017207860946655273, -0.00015458464622497559, -0.00013709068298339844, -0.00011959671974182129, -0.00010210275650024414, -8.460879325866699e-05, -6.711483001708984e-05, -4.9620866775512695e-05, -3.212690353393555e-05, -1.4632940292358398e-05, 2.86102294921875e-06, 2.03549861907959e-05, 3.784894943237305e-05, 5.5342912673950195e-05, 7.283687591552734e-05, 9.033083915710449e-05, 0.00010782480239868164, 0.0001253187656402588, 0.00014281272888183594, 0.00016030669212341309, 0.00017780065536499023, 0.00019529461860656738, 0.00021278858184814453, 0.00023028254508972168, 0.00024777650833129883, 0.000265270471572876, 0.0002827644348144531, 0.0003002583980560303, 0.0003177523612976074, 0.00033524632453918457, 0.0003527402877807617, 0.00037023425102233887, 0.000387728214263916, 0.00040522217750549316, 0.0004227161407470703, 0.00044021010398864746, 0.0004577040672302246, 0.00047519803047180176, 0.0004926919937133789, 0.0005101859569549561, 0.0005276799201965332, 0.0005451738834381104, 0.0005626678466796875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 7.0, 7.0, 15.0, 20.0, 16.0, 34.0, 45.0, 59.0, 124.0, 216.0, 356.0, 822.0, 2248.0, 8983.0, 76663.0, 870802.0, 75412.0, 8816.0, 2251.0, 791.0, 321.0, 196.0, 108.0, 85.0, 45.0, 28.0, 25.0, 9.0, 8.0, 9.0, 8.0, 4.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5, -3.36273193359375, -3.2254638671875, -3.08819580078125, -2.950927734375, -2.81365966796875, -2.6763916015625, -2.53912353515625, -2.40185546875, -2.26458740234375, -2.1273193359375, -1.99005126953125, -1.852783203125, -1.71551513671875, -1.5782470703125, -1.44097900390625, -1.3037109375, -1.16644287109375, -1.0291748046875, -0.89190673828125, -0.754638671875, -0.61737060546875, -0.4801025390625, -0.34283447265625, -0.20556640625, -0.06829833984375, 0.0689697265625, 0.20623779296875, 0.343505859375, 0.48077392578125, 0.6180419921875, 0.75531005859375, 0.892578125, 1.02984619140625, 1.1671142578125, 1.30438232421875, 1.441650390625, 1.57891845703125, 1.7161865234375, 1.85345458984375, 1.99072265625, 2.12799072265625, 2.2652587890625, 2.40252685546875, 2.539794921875, 2.67706298828125, 2.8143310546875, 2.95159912109375, 3.0888671875, 3.22613525390625, 3.3634033203125, 3.50067138671875, 3.637939453125, 3.77520751953125, 3.9124755859375, 4.04974365234375, 4.18701171875, 4.32427978515625, 4.4615478515625, 4.59881591796875, 4.736083984375, 4.87335205078125, 5.0106201171875, 5.14788818359375, 5.28515625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 4.0, 1.0, 7.0, 3.0, 3.0, 13.0, 9.0, 14.0, 20.0, 29.0, 38.0, 61.0, 73.0, 91.0, 115.0, 96.0, 98.0, 95.0, 55.0, 44.0, 30.0, 22.0, 19.0, 13.0, 11.0, 6.0, 9.0, 6.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8125, -2.7015380859375, -2.590576171875, -2.4796142578125, -2.36865234375, -2.2576904296875, -2.146728515625, -2.0357666015625, -1.9248046875, -1.8138427734375, -1.702880859375, -1.5919189453125, -1.48095703125, -1.3699951171875, -1.259033203125, -1.1480712890625, -1.037109375, -0.9261474609375, -0.815185546875, -0.7042236328125, -0.59326171875, -0.4822998046875, -0.371337890625, -0.2603759765625, -0.1494140625, -0.0384521484375, 0.072509765625, 0.1834716796875, 0.29443359375, 0.4053955078125, 0.516357421875, 0.6273193359375, 0.73828125, 0.8492431640625, 0.960205078125, 1.0711669921875, 1.18212890625, 1.2930908203125, 1.404052734375, 1.5150146484375, 1.6259765625, 1.7369384765625, 1.847900390625, 1.9588623046875, 2.06982421875, 2.1807861328125, 2.291748046875, 2.4027099609375, 2.513671875, 2.6246337890625, 2.735595703125, 2.8465576171875, 2.95751953125, 3.0684814453125, 3.179443359375, 3.2904052734375, 3.4013671875, 3.5123291015625, 3.623291015625, 3.7342529296875, 3.84521484375, 3.9561767578125, 4.067138671875, 4.1781005859375, 4.2890625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 12.0, 39.0, 90.0, 235.0, 326.0, 175.0, 80.0, 20.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-113.10572814941406, -110.43189239501953, -107.758056640625, -105.08422088623047, -102.41038513183594, -99.7365493774414, -97.06271362304688, -94.38887786865234, -91.71504211425781, -89.04120635986328, -86.36737060546875, -83.69353485107422, -81.01969909667969, -78.34586334228516, -75.67202758789062, -72.9981918334961, -70.32435607910156, -67.65052032470703, -64.9766845703125, -62.30284881591797, -59.62901306152344, -56.955177307128906, -54.281341552734375, -51.607505798339844, -48.93367004394531, -46.25983428955078, -43.58599853515625, -40.91216278076172, -38.23832702636719, -35.564491271972656, -32.890655517578125, -30.216819763183594, -27.542984008789062, -24.86914825439453, -22.1953125, -19.52147674560547, -16.847640991210938, -14.173805236816406, -11.499969482421875, -8.826133728027344, -6.1522979736328125, -3.4784622192382812, -0.80462646484375, 1.8692092895507812, 4.5430450439453125, 7.216880798339844, 9.890716552734375, 12.564552307128906, 15.238388061523438, 17.91222381591797, 20.5860595703125, 23.25989532470703, 25.933731079101562, 28.607566833496094, 31.281402587890625, 33.955238342285156, 36.62907409667969, 39.30290985107422, 41.97674560546875, 44.65058135986328, 47.32441711425781, 49.998252868652344, 52.672088623046875, 55.345924377441406, 58.01976013183594]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 7.0, 8.0, 9.0, 15.0, 20.0, 30.0, 20.0, 45.0, 40.0, 44.0, 61.0, 77.0, 93.0, 71.0, 87.0, 60.0, 58.0, 51.0, 58.0, 44.0, 23.0, 19.0, 16.0, 14.0, 18.0, 7.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.3303108215332, -41.397457122802734, -39.464603424072266, -37.53174591064453, -35.59889221191406, -33.666038513183594, -31.733184814453125, -29.800331115722656, -27.867475509643555, -25.934621810913086, -24.001766204833984, -22.068912506103516, -20.136058807373047, -18.203203201293945, -16.270349502563477, -14.337494850158691, -12.404640197753906, -10.471785545349121, -8.538930892944336, -6.606077194213867, -4.673222541809082, -2.740367889404297, -0.8075141906738281, 1.125340461730957, 3.058195114135742, 4.991049766540527, 6.923903942108154, 8.856758117675781, 10.789612770080566, 12.722467422485352, 14.65532112121582, 16.588176727294922, 18.521034240722656, 20.453887939453125, 22.386743545532227, 24.319597244262695, 26.252452850341797, 28.185306549072266, 30.118160247802734, 32.0510139465332, 33.98387145996094, 35.916725158691406, 37.849578857421875, 39.782432556152344, 41.71529006958008, 43.64814376831055, 45.580997467041016, 47.513851165771484, 49.44670486450195, 51.37955856323242, 53.31241226196289, 55.245269775390625, 57.178123474121094, 59.11097717285156, 61.04383087158203, 62.9766845703125, 64.90953826904297, 66.84239196777344, 68.7752456665039, 70.70809936523438, 72.64095306396484, 74.57380676269531, 76.50666809082031, 78.43952178955078, 80.37237548828125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 7.0, 0.0, 2.0, 11.0, 21.0, 19.0, 39.0, 69.0, 116.0, 247.0, 1413.0, 71369.0, 4113359.0, 6526.0, 600.0, 203.0, 112.0, 67.0, 47.0, 15.0, 21.0, 11.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.0, -27.367431640625, -26.73486328125, -26.102294921875, -25.4697265625, -24.837158203125, -24.20458984375, -23.572021484375, -22.939453125, -22.306884765625, -21.67431640625, -21.041748046875, -20.4091796875, -19.776611328125, -19.14404296875, -18.511474609375, -17.87890625, -17.246337890625, -16.61376953125, -15.981201171875, -15.3486328125, -14.716064453125, -14.08349609375, -13.450927734375, -12.818359375, -12.185791015625, -11.55322265625, -10.920654296875, -10.2880859375, -9.655517578125, -9.02294921875, -8.390380859375, -7.7578125, -7.125244140625, -6.49267578125, -5.860107421875, -5.2275390625, -4.594970703125, -3.96240234375, -3.329833984375, -2.697265625, -2.064697265625, -1.43212890625, -0.799560546875, -0.1669921875, 0.465576171875, 1.09814453125, 1.730712890625, 2.36328125, 2.995849609375, 3.62841796875, 4.260986328125, 4.8935546875, 5.526123046875, 6.15869140625, 6.791259765625, 7.423828125, 8.056396484375, 8.68896484375, 9.321533203125, 9.9541015625, 10.586669921875, 11.21923828125, 11.851806640625, 12.484375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 11.0, 16.0, 28.0, 37.0, 74.0, 97.0, 124.0, 132.0, 139.0, 106.0, 96.0, 69.0, 30.0, 27.0, 13.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.083984375, -2.891143798828125, -2.69830322265625, -2.505462646484375, -2.3126220703125, -2.119781494140625, -1.92694091796875, -1.734100341796875, -1.541259765625, -1.348419189453125, -1.15557861328125, -0.962738037109375, -0.7698974609375, -0.577056884765625, -0.38421630859375, -0.191375732421875, 0.00146484375, 0.194305419921875, 0.38714599609375, 0.579986572265625, 0.7728271484375, 0.965667724609375, 1.15850830078125, 1.351348876953125, 1.544189453125, 1.737030029296875, 1.92987060546875, 2.122711181640625, 2.3155517578125, 2.508392333984375, 2.70123291015625, 2.894073486328125, 3.0869140625, 3.279754638671875, 3.47259521484375, 3.665435791015625, 3.8582763671875, 4.051116943359375, 4.24395751953125, 4.436798095703125, 4.629638671875, 4.822479248046875, 5.01531982421875, 5.208160400390625, 5.4010009765625, 5.593841552734375, 5.78668212890625, 5.979522705078125, 6.17236328125, 6.365203857421875, 6.55804443359375, 6.750885009765625, 6.9437255859375, 7.136566162109375, 7.32940673828125, 7.522247314453125, 7.715087890625, 7.907928466796875, 8.10076904296875, 8.293609619140625, 8.4864501953125, 8.679290771484375, 8.87213134765625, 9.064971923828125, 9.2578125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 15.0, 22.0, 36.0, 68.0, 81.0, 184.0, 378.0, 718.0, 1455.0, 3217.0, 8182.0, 27526.0, 171736.0, 3351934.0, 562533.0, 47397.0, 11569.0, 4103.0, 1637.0, 766.0, 335.0, 178.0, 78.0, 45.0, 24.0, 16.0, 13.0, 5.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.5078125, -4.36993408203125, -4.2320556640625, -4.09417724609375, -3.956298828125, -3.81842041015625, -3.6805419921875, -3.54266357421875, -3.40478515625, -3.26690673828125, -3.1290283203125, -2.99114990234375, -2.853271484375, -2.71539306640625, -2.5775146484375, -2.43963623046875, -2.3017578125, -2.16387939453125, -2.0260009765625, -1.88812255859375, -1.750244140625, -1.61236572265625, -1.4744873046875, -1.33660888671875, -1.19873046875, -1.06085205078125, -0.9229736328125, -0.78509521484375, -0.647216796875, -0.50933837890625, -0.3714599609375, -0.23358154296875, -0.095703125, 0.04217529296875, 0.1800537109375, 0.31793212890625, 0.455810546875, 0.59368896484375, 0.7315673828125, 0.86944580078125, 1.00732421875, 1.14520263671875, 1.2830810546875, 1.42095947265625, 1.558837890625, 1.69671630859375, 1.8345947265625, 1.97247314453125, 2.1103515625, 2.24822998046875, 2.3861083984375, 2.52398681640625, 2.661865234375, 2.79974365234375, 2.9376220703125, 3.07550048828125, 3.21337890625, 3.35125732421875, 3.4891357421875, 3.62701416015625, 3.764892578125, 3.90277099609375, 4.0406494140625, 4.17852783203125, 4.31640625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 4.0, 7.0, 10.0, 13.0, 16.0, 27.0, 47.0, 51.0, 119.0, 235.0, 512.0, 1086.0, 998.0, 488.0, 220.0, 97.0, 48.0, 18.0, 19.0, 15.0, 11.0, 2.0, 5.0, 6.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.12890625, -5.96722412109375, -5.8055419921875, -5.64385986328125, -5.482177734375, -5.32049560546875, -5.1588134765625, -4.99713134765625, -4.83544921875, -4.67376708984375, -4.5120849609375, -4.35040283203125, -4.188720703125, -4.02703857421875, -3.8653564453125, -3.70367431640625, -3.5419921875, -3.38031005859375, -3.2186279296875, -3.05694580078125, -2.895263671875, -2.73358154296875, -2.5718994140625, -2.41021728515625, -2.24853515625, -2.08685302734375, -1.9251708984375, -1.76348876953125, -1.601806640625, -1.44012451171875, -1.2784423828125, -1.11676025390625, -0.955078125, -0.79339599609375, -0.6317138671875, -0.47003173828125, -0.308349609375, -0.14666748046875, 0.0150146484375, 0.17669677734375, 0.33837890625, 0.50006103515625, 0.6617431640625, 0.82342529296875, 0.985107421875, 1.14678955078125, 1.3084716796875, 1.47015380859375, 1.6318359375, 1.79351806640625, 1.9552001953125, 2.11688232421875, 2.278564453125, 2.44024658203125, 2.6019287109375, 2.76361083984375, 2.92529296875, 3.08697509765625, 3.2486572265625, 3.41033935546875, 3.572021484375, 3.73370361328125, 3.8953857421875, 4.05706787109375, 4.21875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 6.0, 16.0, 29.0, 80.0, 162.0, 231.0, 210.0, 138.0, 67.0, 25.0, 10.0, 9.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-63.12578582763672, -61.80710983276367, -60.48843765258789, -59.169761657714844, -57.85108947753906, -56.532413482666016, -55.213741302490234, -53.89506530761719, -52.576393127441406, -51.25771713256836, -49.93904495239258, -48.62036895751953, -47.30169677734375, -45.9830207824707, -44.66434860229492, -43.345672607421875, -42.027000427246094, -40.70832443237305, -39.389652252197266, -38.07097625732422, -36.75230407714844, -35.43362808227539, -34.11495590209961, -32.79627990722656, -31.477603912353516, -30.1589298248291, -28.840255737304688, -27.521581649780273, -26.20290756225586, -24.884233474731445, -23.56555938720703, -22.246883392333984, -20.928211212158203, -19.60953712463379, -18.290863037109375, -16.97218894958496, -15.653514862060547, -14.334840774536133, -13.016165733337402, -11.697491645812988, -10.378817558288574, -9.06014347076416, -7.741469383239746, -6.422794818878174, -5.10412073135376, -3.7854466438293457, -2.4667720794677734, -1.1480979919433594, 0.1705760955810547, 1.4892503023147583, 2.807924509048462, 4.126598834991455, 5.445272922515869, 6.763947010040283, 8.082621574401855, 9.40129566192627, 10.719969749450684, 12.038643836975098, 13.357317924499512, 14.675992965698242, 15.994667053222656, 17.31334114074707, 18.632015228271484, 19.9506893157959, 21.269363403320312]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 13.0, 18.0, 22.0, 33.0, 38.0, 53.0, 62.0, 73.0, 77.0, 75.0, 100.0, 78.0, 70.0, 75.0, 45.0, 42.0, 37.0, 34.0, 19.0, 8.0, 11.0, 9.0, 3.0, 3.0, 1.0, 1.0], "bins": [-46.01859664916992, -45.05628967285156, -44.09398651123047, -43.13167953491211, -42.169376373291016, -41.207069396972656, -40.24476623535156, -39.2824592590332, -38.320152282714844, -37.357845306396484, -36.39554214477539, -35.43323516845703, -34.47093200683594, -33.50862503051758, -32.546321868896484, -31.584014892578125, -30.62171173095703, -29.659406661987305, -28.697101593017578, -27.73479652404785, -26.772491455078125, -25.810184478759766, -24.84787940979004, -23.885574340820312, -22.923269271850586, -21.96096420288086, -20.998659133911133, -20.036354064941406, -19.074047088623047, -18.111743927001953, -17.149436950683594, -16.187131881713867, -15.224828720092773, -14.262523651123047, -13.30021858215332, -12.337912559509277, -11.37560749053955, -10.413302421569824, -9.450996398925781, -8.488691329956055, -7.526386260986328, -6.564081192016602, -5.601775646209717, -4.639470100402832, -3.6771650314331055, -2.714859962463379, -1.7525544166564941, -0.7902488708496094, 0.1720561981201172, 1.1343615055084229, 2.0966668128967285, 3.058972120285034, 4.02127742767334, 4.983582496643066, 5.945888042449951, 6.908193588256836, 7.8704986572265625, 8.832803726196289, 9.795108795166016, 10.757414817810059, 11.719719886779785, 12.682024955749512, 13.644330978393555, 14.606636047363281, 15.568941116333008]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 8.0, 6.0, 10.0, 24.0, 13.0, 31.0, 44.0, 61.0, 110.0, 164.0, 264.0, 385.0, 697.0, 1225.0, 2211.0, 4341.0, 8622.0, 17977.0, 39404.0, 93745.0, 242009.0, 356563.0, 160928.0, 64561.0, 28143.0, 13196.0, 6408.0, 3272.0, 1731.0, 942.0, 540.0, 328.0, 205.0, 128.0, 85.0, 53.0, 37.0, 19.0, 19.0, 11.0, 12.0, 6.0, 4.0, 5.0, 8.0, 1.0, 2.0], "bins": [-3.615234375, -3.52081298828125, -3.4263916015625, -3.33197021484375, -3.237548828125, -3.14312744140625, -3.0487060546875, -2.95428466796875, -2.85986328125, -2.76544189453125, -2.6710205078125, -2.57659912109375, -2.482177734375, -2.38775634765625, -2.2933349609375, -2.19891357421875, -2.1044921875, -2.01007080078125, -1.9156494140625, -1.82122802734375, -1.726806640625, -1.63238525390625, -1.5379638671875, -1.44354248046875, -1.34912109375, -1.25469970703125, -1.1602783203125, -1.06585693359375, -0.971435546875, -0.87701416015625, -0.7825927734375, -0.68817138671875, -0.59375, -0.49932861328125, -0.4049072265625, -0.31048583984375, -0.216064453125, -0.12164306640625, -0.0272216796875, 0.06719970703125, 0.16162109375, 0.25604248046875, 0.3504638671875, 0.44488525390625, 0.539306640625, 0.63372802734375, 0.7281494140625, 0.82257080078125, 0.9169921875, 1.01141357421875, 1.1058349609375, 1.20025634765625, 1.294677734375, 1.38909912109375, 1.4835205078125, 1.57794189453125, 1.67236328125, 1.76678466796875, 1.8612060546875, 1.95562744140625, 2.050048828125, 2.14447021484375, 2.2388916015625, 2.33331298828125, 2.427734375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 4.0, 7.0, 9.0, 18.0, 16.0, 18.0, 25.0, 28.0, 37.0, 49.0, 45.0, 59.0, 42.0, 58.0, 66.0, 55.0, 72.0, 64.0, 58.0, 41.0, 36.0, 38.0, 34.0, 30.0, 25.0, 13.0, 12.0, 11.0, 8.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.299102783203125, -2.21734619140625, -2.135589599609375, -2.0538330078125, -1.972076416015625, -1.89031982421875, -1.808563232421875, -1.726806640625, -1.645050048828125, -1.56329345703125, -1.481536865234375, -1.3997802734375, -1.318023681640625, -1.23626708984375, -1.154510498046875, -1.07275390625, -0.990997314453125, -0.90924072265625, -0.827484130859375, -0.7457275390625, -0.663970947265625, -0.58221435546875, -0.500457763671875, -0.418701171875, -0.336944580078125, -0.25518798828125, -0.173431396484375, -0.0916748046875, -0.009918212890625, 0.07183837890625, 0.153594970703125, 0.2353515625, 0.317108154296875, 0.39886474609375, 0.480621337890625, 0.5623779296875, 0.644134521484375, 0.72589111328125, 0.807647705078125, 0.889404296875, 0.971160888671875, 1.05291748046875, 1.134674072265625, 1.2164306640625, 1.298187255859375, 1.37994384765625, 1.461700439453125, 1.54345703125, 1.625213623046875, 1.70697021484375, 1.788726806640625, 1.8704833984375, 1.952239990234375, 2.03399658203125, 2.115753173828125, 2.197509765625, 2.279266357421875, 2.36102294921875, 2.442779541015625, 2.5245361328125, 2.606292724609375, 2.68804931640625, 2.769805908203125, 2.8515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 7.0, 10.0, 7.0, 16.0, 26.0, 28.0, 42.0, 58.0, 79.0, 126.0, 185.0, 288.0, 559.0, 1109.0, 2524.0, 7601.0, 31945.0, 208360.0, 669877.0, 98937.0, 18085.0, 4799.0, 1754.0, 877.0, 468.0, 265.0, 178.0, 114.0, 70.0, 45.0, 32.0, 22.0, 11.0, 14.0, 11.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3203125, -5.12554931640625, -4.9307861328125, -4.73602294921875, -4.541259765625, -4.34649658203125, -4.1517333984375, -3.95697021484375, -3.76220703125, -3.56744384765625, -3.3726806640625, -3.17791748046875, -2.983154296875, -2.78839111328125, -2.5936279296875, -2.39886474609375, -2.2041015625, -2.00933837890625, -1.8145751953125, -1.61981201171875, -1.425048828125, -1.23028564453125, -1.0355224609375, -0.84075927734375, -0.64599609375, -0.45123291015625, -0.2564697265625, -0.06170654296875, 0.133056640625, 0.32781982421875, 0.5225830078125, 0.71734619140625, 0.912109375, 1.10687255859375, 1.3016357421875, 1.49639892578125, 1.691162109375, 1.88592529296875, 2.0806884765625, 2.27545166015625, 2.47021484375, 2.66497802734375, 2.8597412109375, 3.05450439453125, 3.249267578125, 3.44403076171875, 3.6387939453125, 3.83355712890625, 4.0283203125, 4.22308349609375, 4.4178466796875, 4.61260986328125, 4.807373046875, 5.00213623046875, 5.1968994140625, 5.39166259765625, 5.58642578125, 5.78118896484375, 5.9759521484375, 6.17071533203125, 6.365478515625, 6.56024169921875, 6.7550048828125, 6.94976806640625, 7.14453125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 12.0, 12.0, 13.0, 19.0, 12.0, 27.0, 28.0, 31.0, 32.0, 45.0, 48.0, 61.0, 66.0, 63.0, 59.0, 64.0, 61.0, 48.0, 48.0, 45.0, 39.0, 32.0, 23.0, 24.0, 16.0, 16.0, 10.0, 8.0, 12.0, 2.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.0, -9.6983642578125, -9.396728515625, -9.0950927734375, -8.79345703125, -8.4918212890625, -8.190185546875, -7.8885498046875, -7.5869140625, -7.2852783203125, -6.983642578125, -6.6820068359375, -6.38037109375, -6.0787353515625, -5.777099609375, -5.4754638671875, -5.173828125, -4.8721923828125, -4.570556640625, -4.2689208984375, -3.96728515625, -3.6656494140625, -3.364013671875, -3.0623779296875, -2.7607421875, -2.4591064453125, -2.157470703125, -1.8558349609375, -1.55419921875, -1.2525634765625, -0.950927734375, -0.6492919921875, -0.34765625, -0.0460205078125, 0.255615234375, 0.5572509765625, 0.85888671875, 1.1605224609375, 1.462158203125, 1.7637939453125, 2.0654296875, 2.3670654296875, 2.668701171875, 2.9703369140625, 3.27197265625, 3.5736083984375, 3.875244140625, 4.1768798828125, 4.478515625, 4.7801513671875, 5.081787109375, 5.3834228515625, 5.68505859375, 5.9866943359375, 6.288330078125, 6.5899658203125, 6.8916015625, 7.1932373046875, 7.494873046875, 7.7965087890625, 8.09814453125, 8.3997802734375, 8.701416015625, 9.0030517578125, 9.3046875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 2.0, 6.0, 7.0, 9.0, 31.0, 36.0, 83.0, 154.0, 564.0, 2394.0, 52571.0, 980609.0, 10176.0, 1311.0, 342.0, 121.0, 45.0, 36.0, 15.0, 9.0, 13.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.09375, -7.85076904296875, -7.6077880859375, -7.36480712890625, -7.121826171875, -6.87884521484375, -6.6358642578125, -6.39288330078125, -6.14990234375, -5.90692138671875, -5.6639404296875, -5.42095947265625, -5.177978515625, -4.93499755859375, -4.6920166015625, -4.44903564453125, -4.2060546875, -3.96307373046875, -3.7200927734375, -3.47711181640625, -3.234130859375, -2.99114990234375, -2.7481689453125, -2.50518798828125, -2.26220703125, -2.01922607421875, -1.7762451171875, -1.53326416015625, -1.290283203125, -1.04730224609375, -0.8043212890625, -0.56134033203125, -0.318359375, -0.07537841796875, 0.1676025390625, 0.41058349609375, 0.653564453125, 0.89654541015625, 1.1395263671875, 1.38250732421875, 1.62548828125, 1.86846923828125, 2.1114501953125, 2.35443115234375, 2.597412109375, 2.84039306640625, 3.0833740234375, 3.32635498046875, 3.5693359375, 3.81231689453125, 4.0552978515625, 4.29827880859375, 4.541259765625, 4.78424072265625, 5.0272216796875, 5.27020263671875, 5.51318359375, 5.75616455078125, 5.9991455078125, 6.24212646484375, 6.485107421875, 6.72808837890625, 6.9710693359375, 7.21405029296875, 7.45703125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 7.0, 6.0, 15.0, 24.0, 31.0, 61.0, 114.0, 179.0, 227.0, 148.0, 77.0, 47.0, 20.0, 15.0, 10.0, 8.0, 6.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003781318664550781, -0.00035613030195236206, -0.000334128737449646, -0.00031212717294692993, -0.00029012560844421387, -0.0002681240439414978, -0.00024612247943878174, -0.00022412091493606567, -0.0002021193504333496, -0.00018011778593063354, -0.00015811622142791748, -0.00013611465692520142, -0.00011411309242248535, -9.211152791976929e-05, -7.010996341705322e-05, -4.810839891433716e-05, -2.6106834411621094e-05, -4.105269908905029e-06, 1.7896294593811035e-05, 3.98978590965271e-05, 6.189942359924316e-05, 8.390098810195923e-05, 0.00010590255260467529, 0.00012790411710739136, 0.00014990568161010742, 0.00017190724611282349, 0.00019390881061553955, 0.00021591037511825562, 0.00023791193962097168, 0.00025991350412368774, 0.0002819150686264038, 0.0003039166331291199, 0.00032591819763183594, 0.000347919762134552, 0.00036992132663726807, 0.00039192289113998413, 0.0004139244556427002, 0.00043592602014541626, 0.0004579275846481323, 0.0004799291491508484, 0.0005019307136535645, 0.0005239322781562805, 0.0005459338426589966, 0.0005679354071617126, 0.0005899369716644287, 0.0006119385361671448, 0.0006339401006698608, 0.0006559416651725769, 0.000677943229675293, 0.000699944794178009, 0.0007219463586807251, 0.0007439479231834412, 0.0007659494876861572, 0.0007879510521888733, 0.0008099526166915894, 0.0008319541811943054, 0.0008539557456970215, 0.0008759573101997375, 0.0008979588747024536, 0.0009199604392051697, 0.0009419620037078857, 0.0009639635682106018, 0.0009859651327133179, 0.001007966697216034, 0.00102996826171875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 10.0, 6.0, 14.0, 21.0, 34.0, 43.0, 58.0, 84.0, 178.0, 297.0, 640.0, 1653.0, 5418.0, 28894.0, 583012.0, 396720.0, 23925.0, 4768.0, 1474.0, 600.0, 279.0, 148.0, 84.0, 59.0, 50.0, 26.0, 16.0, 14.0, 3.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.154296875, -3.052398681640625, -2.95050048828125, -2.848602294921875, -2.7467041015625, -2.644805908203125, -2.54290771484375, -2.441009521484375, -2.339111328125, -2.237213134765625, -2.13531494140625, -2.033416748046875, -1.9315185546875, -1.829620361328125, -1.72772216796875, -1.625823974609375, -1.52392578125, -1.422027587890625, -1.32012939453125, -1.218231201171875, -1.1163330078125, -1.014434814453125, -0.91253662109375, -0.810638427734375, -0.708740234375, -0.606842041015625, -0.50494384765625, -0.403045654296875, -0.3011474609375, -0.199249267578125, -0.09735107421875, 0.004547119140625, 0.1064453125, 0.208343505859375, 0.31024169921875, 0.412139892578125, 0.5140380859375, 0.615936279296875, 0.71783447265625, 0.819732666015625, 0.921630859375, 1.023529052734375, 1.12542724609375, 1.227325439453125, 1.3292236328125, 1.431121826171875, 1.53302001953125, 1.634918212890625, 1.73681640625, 1.838714599609375, 1.94061279296875, 2.042510986328125, 2.1444091796875, 2.246307373046875, 2.34820556640625, 2.450103759765625, 2.552001953125, 2.653900146484375, 2.75579833984375, 2.857696533203125, 2.9595947265625, 3.061492919921875, 3.16339111328125, 3.265289306640625, 3.3671875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 4.0, 10.0, 11.0, 12.0, 20.0, 19.0, 34.0, 52.0, 72.0, 102.0, 108.0, 126.0, 96.0, 97.0, 62.0, 50.0, 38.0, 22.0, 18.0, 15.0, 5.0, 3.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.80078125, -2.716552734375, -2.63232421875, -2.548095703125, -2.4638671875, -2.379638671875, -2.29541015625, -2.211181640625, -2.126953125, -2.042724609375, -1.95849609375, -1.874267578125, -1.7900390625, -1.705810546875, -1.62158203125, -1.537353515625, -1.453125, -1.368896484375, -1.28466796875, -1.200439453125, -1.1162109375, -1.031982421875, -0.94775390625, -0.863525390625, -0.779296875, -0.695068359375, -0.61083984375, -0.526611328125, -0.4423828125, -0.358154296875, -0.27392578125, -0.189697265625, -0.10546875, -0.021240234375, 0.06298828125, 0.147216796875, 0.2314453125, 0.315673828125, 0.39990234375, 0.484130859375, 0.568359375, 0.652587890625, 0.73681640625, 0.821044921875, 0.9052734375, 0.989501953125, 1.07373046875, 1.157958984375, 1.2421875, 1.326416015625, 1.41064453125, 1.494873046875, 1.5791015625, 1.663330078125, 1.74755859375, 1.831787109375, 1.916015625, 2.000244140625, 2.08447265625, 2.168701171875, 2.2529296875, 2.337158203125, 2.42138671875, 2.505615234375, 2.58984375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 5.0, 16.0, 34.0, 86.0, 173.0, 295.0, 189.0, 107.0, 47.0, 20.0, 9.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.12120819091797, -68.15371704101562, -66.18622589111328, -64.21873474121094, -62.251243591308594, -60.28375244140625, -58.316261291503906, -56.34877014160156, -54.38127899169922, -52.413787841796875, -50.44629669189453, -48.47880554199219, -46.511314392089844, -44.5438232421875, -42.576332092285156, -40.60884094238281, -38.64134979248047, -36.673858642578125, -34.70636749267578, -32.73887634277344, -30.771385192871094, -28.80389404296875, -26.836402893066406, -24.868911743164062, -22.90142059326172, -20.933929443359375, -18.96643829345703, -16.998947143554688, -15.031455993652344, -13.06396484375, -11.096473693847656, -9.128982543945312, -7.161491394042969, -5.194000244140625, -3.2265090942382812, -1.2590179443359375, 0.7084732055664062, 2.67596435546875, 4.643455505371094, 6.6109466552734375, 8.578437805175781, 10.545928955078125, 12.513420104980469, 14.480911254882812, 16.448402404785156, 18.4158935546875, 20.383384704589844, 22.350875854492188, 24.31836700439453, 26.285858154296875, 28.25334930419922, 30.220840454101562, 32.188331604003906, 34.15582275390625, 36.123313903808594, 38.09080505371094, 40.05829620361328, 42.025787353515625, 43.99327850341797, 45.96076965332031, 47.928260803222656, 49.895751953125, 51.863243103027344, 53.83073425292969, 55.79822540283203]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 10.0, 4.0, 5.0, 8.0, 10.0, 12.0, 11.0, 15.0, 13.0, 25.0, 20.0, 32.0, 38.0, 37.0, 38.0, 43.0, 44.0, 55.0, 58.0, 58.0, 47.0, 56.0, 49.0, 36.0, 36.0, 34.0, 27.0, 20.0, 34.0, 29.0, 21.0, 18.0, 15.0, 13.0, 9.0, 6.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.916412353515625, -35.87670135498047, -34.83698654174805, -33.79727554321289, -32.757564544677734, -31.717851638793945, -30.678138732910156, -29.638427734375, -28.59871482849121, -27.559001922607422, -26.519290924072266, -25.479578018188477, -24.439865112304688, -23.40015411376953, -22.360441207885742, -21.320728302001953, -20.281017303466797, -19.241304397583008, -18.20159339904785, -17.161880493164062, -16.122169494628906, -15.082456588745117, -14.042743682861328, -13.003031730651855, -11.963319778442383, -10.92360782623291, -9.883895874023438, -8.844182968139648, -7.804471015930176, -6.764759063720703, -5.725046634674072, -4.685334205627441, -3.645618438720703, -2.6059062480926514, -1.5661940574645996, -0.5264818668365479, 0.5132303237915039, 1.5529422760009766, 2.5926547050476074, 3.6323671340942383, 4.672079086303711, 5.711791038513184, 6.7515034675598145, 7.791215896606445, 8.830927848815918, 9.87063980102539, 10.91035270690918, 11.950064659118652, 12.989776611328125, 14.029488563537598, 15.06920051574707, 16.10891342163086, 17.148624420166016, 18.188337326049805, 19.228050231933594, 20.26776123046875, 21.30747413635254, 22.347187042236328, 23.386898040771484, 24.426610946655273, 25.466323852539062, 26.50603485107422, 27.545747756958008, 28.585460662841797, 29.625171661376953]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 8.0, 9.0, 18.0, 26.0, 39.0, 113.0, 194.0, 477.0, 1382.0, 4630.0, 22584.0, 263734.0, 3546345.0, 321821.0, 25566.0, 5007.0, 1434.0, 476.0, 207.0, 103.0, 51.0, 27.0, 15.0, 9.0, 7.0, 3.0, 3.0, 3.0, 1.0], "bins": [-7.1171875, -6.967437744140625, -6.81768798828125, -6.667938232421875, -6.5181884765625, -6.368438720703125, -6.21868896484375, -6.068939208984375, -5.919189453125, -5.769439697265625, -5.61968994140625, -5.469940185546875, -5.3201904296875, -5.170440673828125, -5.02069091796875, -4.870941162109375, -4.72119140625, -4.571441650390625, -4.42169189453125, -4.271942138671875, -4.1221923828125, -3.972442626953125, -3.82269287109375, -3.672943115234375, -3.523193359375, -3.373443603515625, -3.22369384765625, -3.073944091796875, -2.9241943359375, -2.774444580078125, -2.62469482421875, -2.474945068359375, -2.3251953125, -2.175445556640625, -2.02569580078125, -1.875946044921875, -1.7261962890625, -1.576446533203125, -1.42669677734375, -1.276947021484375, -1.127197265625, -0.977447509765625, -0.82769775390625, -0.677947998046875, -0.5281982421875, -0.378448486328125, -0.22869873046875, -0.078948974609375, 0.07080078125, 0.220550537109375, 0.37030029296875, 0.520050048828125, 0.6697998046875, 0.819549560546875, 0.96929931640625, 1.119049072265625, 1.268798828125, 1.418548583984375, 1.56829833984375, 1.718048095703125, 1.8677978515625, 2.017547607421875, 2.16729736328125, 2.317047119140625, 2.466796875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 3.0, 7.0, 10.0, 15.0, 12.0, 17.0, 16.0, 20.0, 17.0, 27.0, 34.0, 35.0, 29.0, 47.0, 48.0, 49.0, 54.0, 42.0, 56.0, 55.0, 53.0, 49.0, 41.0, 40.0, 42.0, 38.0, 26.0, 22.0, 11.0, 18.0, 11.0, 15.0, 6.0, 12.0, 4.0, 3.0, 6.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7734375, -1.7177276611328125, -1.662017822265625, -1.6063079833984375, -1.55059814453125, -1.4948883056640625, -1.439178466796875, -1.3834686279296875, -1.3277587890625, -1.2720489501953125, -1.216339111328125, -1.1606292724609375, -1.10491943359375, -1.0492095947265625, -0.993499755859375, -0.9377899169921875, -0.882080078125, -0.8263702392578125, -0.770660400390625, -0.7149505615234375, -0.65924072265625, -0.6035308837890625, -0.547821044921875, -0.4921112060546875, -0.4364013671875, -0.3806915283203125, -0.324981689453125, -0.2692718505859375, -0.21356201171875, -0.1578521728515625, -0.102142333984375, -0.0464324951171875, 0.00927734375, 0.0649871826171875, 0.120697021484375, 0.1764068603515625, 0.23211669921875, 0.2878265380859375, 0.343536376953125, 0.3992462158203125, 0.4549560546875, 0.5106658935546875, 0.566375732421875, 0.6220855712890625, 0.67779541015625, 0.7335052490234375, 0.789215087890625, 0.8449249267578125, 0.900634765625, 0.9563446044921875, 1.012054443359375, 1.0677642822265625, 1.12347412109375, 1.1791839599609375, 1.234893798828125, 1.2906036376953125, 1.3463134765625, 1.4020233154296875, 1.457733154296875, 1.5134429931640625, 1.56915283203125, 1.6248626708984375, 1.680572509765625, 1.7362823486328125, 1.7919921875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 2.0, 6.0, 9.0, 8.0, 14.0, 21.0, 45.0, 71.0, 145.0, 282.0, 717.0, 2016.0, 7888.0, 41494.0, 485069.0, 3403948.0, 215984.0, 27033.0, 6164.0, 1919.0, 707.0, 326.0, 151.0, 118.0, 43.0, 26.0, 21.0, 22.0, 9.0, 6.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.40625, -4.2657470703125, -4.125244140625, -3.9847412109375, -3.84423828125, -3.7037353515625, -3.563232421875, -3.4227294921875, -3.2822265625, -3.1417236328125, -3.001220703125, -2.8607177734375, -2.72021484375, -2.5797119140625, -2.439208984375, -2.2987060546875, -2.158203125, -2.0177001953125, -1.877197265625, -1.7366943359375, -1.59619140625, -1.4556884765625, -1.315185546875, -1.1746826171875, -1.0341796875, -0.8936767578125, -0.753173828125, -0.6126708984375, -0.47216796875, -0.3316650390625, -0.191162109375, -0.0506591796875, 0.08984375, 0.2303466796875, 0.370849609375, 0.5113525390625, 0.65185546875, 0.7923583984375, 0.932861328125, 1.0733642578125, 1.2138671875, 1.3543701171875, 1.494873046875, 1.6353759765625, 1.77587890625, 1.9163818359375, 2.056884765625, 2.1973876953125, 2.337890625, 2.4783935546875, 2.618896484375, 2.7593994140625, 2.89990234375, 3.0404052734375, 3.180908203125, 3.3214111328125, 3.4619140625, 3.6024169921875, 3.742919921875, 3.8834228515625, 4.02392578125, 4.1644287109375, 4.304931640625, 4.4454345703125, 4.5859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 14.0, 21.0, 16.0, 24.0, 42.0, 77.0, 109.0, 150.0, 285.0, 468.0, 701.0, 765.0, 500.0, 305.0, 185.0, 110.0, 93.0, 46.0, 38.0, 24.0, 15.0, 12.0, 10.0, 8.0, 4.0, 8.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.34375, -3.21551513671875, -3.0872802734375, -2.95904541015625, -2.830810546875, -2.70257568359375, -2.5743408203125, -2.44610595703125, -2.31787109375, -2.18963623046875, -2.0614013671875, -1.93316650390625, -1.804931640625, -1.67669677734375, -1.5484619140625, -1.42022705078125, -1.2919921875, -1.16375732421875, -1.0355224609375, -0.90728759765625, -0.779052734375, -0.65081787109375, -0.5225830078125, -0.39434814453125, -0.26611328125, -0.13787841796875, -0.0096435546875, 0.11859130859375, 0.246826171875, 0.37506103515625, 0.5032958984375, 0.63153076171875, 0.759765625, 0.88800048828125, 1.0162353515625, 1.14447021484375, 1.272705078125, 1.40093994140625, 1.5291748046875, 1.65740966796875, 1.78564453125, 1.91387939453125, 2.0421142578125, 2.17034912109375, 2.298583984375, 2.42681884765625, 2.5550537109375, 2.68328857421875, 2.8115234375, 2.93975830078125, 3.0679931640625, 3.19622802734375, 3.324462890625, 3.45269775390625, 3.5809326171875, 3.70916748046875, 3.83740234375, 3.96563720703125, 4.0938720703125, 4.22210693359375, 4.350341796875, 4.47857666015625, 4.6068115234375, 4.73504638671875, 4.86328125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 12.0, 24.0, 34.0, 60.0, 138.0, 163.0, 190.0, 173.0, 88.0, 49.0, 19.0, 13.0, 9.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.071008682250977, -28.827295303344727, -27.583581924438477, -26.339868545532227, -25.096155166625977, -23.852441787719727, -22.60873031616211, -21.36501693725586, -20.12130355834961, -18.87759017944336, -17.63387680053711, -16.39016342163086, -15.14645004272461, -13.90273666381836, -12.659024238586426, -11.415310859680176, -10.17159652709961, -8.92788314819336, -7.684169769287109, -6.440456867218018, -5.196743488311768, -3.9530301094055176, -2.709317207336426, -1.4656038284301758, -0.22189044952392578, 1.0218228101730347, 2.265536069869995, 3.509249210357666, 4.752962589263916, 5.996675968170166, 7.240388870239258, 8.484102249145508, 9.727813720703125, 10.971527099609375, 12.215240478515625, 13.458953857421875, 14.702667236328125, 15.946380615234375, 17.190093994140625, 18.433807373046875, 19.677520751953125, 20.921234130859375, 22.164947509765625, 23.408660888671875, 24.652374267578125, 25.896087646484375, 27.139801025390625, 28.383514404296875, 29.627225875854492, 30.870939254760742, 32.11465072631836, 33.35836410522461, 34.60207748413086, 35.84579086303711, 37.08950424194336, 38.33321762084961, 39.57693099975586, 40.82064437866211, 42.06435775756836, 43.30807113647461, 44.55178451538086, 45.79549789428711, 47.03921127319336, 48.28292465209961, 49.52663803100586]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 9.0, 5.0, 17.0, 19.0, 16.0, 32.0, 20.0, 38.0, 43.0, 44.0, 48.0, 40.0, 51.0, 34.0, 56.0, 48.0, 50.0, 48.0, 44.0, 42.0, 32.0, 44.0, 41.0, 32.0, 17.0, 23.0, 22.0, 19.0, 9.0, 7.0, 6.0, 5.0, 12.0, 3.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.57982635498047, -18.961090087890625, -18.342355728149414, -17.72361946105957, -17.10488510131836, -16.486148834228516, -15.867412567138672, -15.248677253723145, -14.629941940307617, -14.01120662689209, -13.392471313476562, -12.773735046386719, -12.154999732971191, -11.536264419555664, -10.91752815246582, -10.298792839050293, -9.680057525634766, -9.061322212219238, -8.442586898803711, -7.823850631713867, -7.20511531829834, -6.5863800048828125, -5.967644214630127, -5.348908424377441, -4.730173110961914, -4.111437797546387, -3.492702007293701, -2.8739664554595947, -2.2552309036254883, -1.6364953517913818, -1.0177597999572754, -0.39902400970458984, 0.2197113037109375, 0.838446855545044, 1.4571824073791504, 2.075917959213257, 2.6946535110473633, 3.3133890628814697, 3.932124614715576, 4.550860404968262, 5.169595718383789, 5.788331031799316, 6.407066822052002, 7.0258026123046875, 7.644537925720215, 8.263273239135742, 8.882009506225586, 9.500744819641113, 10.11948013305664, 10.738215446472168, 11.356950759887695, 11.975687026977539, 12.594422340393066, 13.213157653808594, 13.831893920898438, 14.450629234313965, 15.069364547729492, 15.68809986114502, 16.306835174560547, 16.92557144165039, 17.544307708740234, 18.163042068481445, 18.78177833557129, 19.4005126953125, 20.019248962402344]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 9.0, 12.0, 26.0, 29.0, 96.0, 164.0, 317.0, 610.0, 1398.0, 3548.0, 10770.0, 37624.0, 146948.0, 460437.0, 283277.0, 73678.0, 19646.0, 5979.0, 2200.0, 879.0, 417.0, 228.0, 105.0, 69.0, 37.0, 10.0, 16.0, 9.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.40234375, -4.263671875, -4.125, -3.986328125, -3.84765625, -3.708984375, -3.5703125, -3.431640625, -3.29296875, -3.154296875, -3.015625, -2.876953125, -2.73828125, -2.599609375, -2.4609375, -2.322265625, -2.18359375, -2.044921875, -1.90625, -1.767578125, -1.62890625, -1.490234375, -1.3515625, -1.212890625, -1.07421875, -0.935546875, -0.796875, -0.658203125, -0.51953125, -0.380859375, -0.2421875, -0.103515625, 0.03515625, 0.173828125, 0.3125, 0.451171875, 0.58984375, 0.728515625, 0.8671875, 1.005859375, 1.14453125, 1.283203125, 1.421875, 1.560546875, 1.69921875, 1.837890625, 1.9765625, 2.115234375, 2.25390625, 2.392578125, 2.53125, 2.669921875, 2.80859375, 2.947265625, 3.0859375, 3.224609375, 3.36328125, 3.501953125, 3.640625, 3.779296875, 3.91796875, 4.056640625, 4.1953125, 4.333984375, 4.47265625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 5.0, 8.0, 9.0, 11.0, 11.0, 13.0, 22.0, 25.0, 22.0, 27.0, 26.0, 39.0, 37.0, 41.0, 46.0, 40.0, 54.0, 53.0, 48.0, 41.0, 44.0, 48.0, 48.0, 42.0, 30.0, 34.0, 29.0, 30.0, 30.0, 17.0, 16.0, 18.0, 8.0, 5.0, 3.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.53125, -1.47845458984375, -1.4256591796875, -1.37286376953125, -1.320068359375, -1.26727294921875, -1.2144775390625, -1.16168212890625, -1.10888671875, -1.05609130859375, -1.0032958984375, -0.95050048828125, -0.897705078125, -0.84490966796875, -0.7921142578125, -0.73931884765625, -0.6865234375, -0.63372802734375, -0.5809326171875, -0.52813720703125, -0.475341796875, -0.42254638671875, -0.3697509765625, -0.31695556640625, -0.26416015625, -0.21136474609375, -0.1585693359375, -0.10577392578125, -0.052978515625, -0.00018310546875, 0.0526123046875, 0.10540771484375, 0.158203125, 0.21099853515625, 0.2637939453125, 0.31658935546875, 0.369384765625, 0.42218017578125, 0.4749755859375, 0.52777099609375, 0.58056640625, 0.63336181640625, 0.6861572265625, 0.73895263671875, 0.791748046875, 0.84454345703125, 0.8973388671875, 0.95013427734375, 1.0029296875, 1.05572509765625, 1.1085205078125, 1.16131591796875, 1.214111328125, 1.26690673828125, 1.3197021484375, 1.37249755859375, 1.42529296875, 1.47808837890625, 1.5308837890625, 1.58367919921875, 1.636474609375, 1.68927001953125, 1.7420654296875, 1.79486083984375, 1.84765625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 7.0, 7.0, 6.0, 8.0, 12.0, 18.0, 20.0, 35.0, 54.0, 78.0, 125.0, 169.0, 312.0, 456.0, 730.0, 1369.0, 2787.0, 8485.0, 59143.0, 735356.0, 210890.0, 19532.0, 4451.0, 1835.0, 996.0, 590.0, 355.0, 216.0, 159.0, 104.0, 81.0, 49.0, 22.0, 25.0, 27.0, 11.0, 9.0, 5.0, 6.0, 4.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.86907958984375, -7.6287841796875, -7.38848876953125, -7.148193359375, -6.90789794921875, -6.6676025390625, -6.42730712890625, -6.18701171875, -5.94671630859375, -5.7064208984375, -5.46612548828125, -5.225830078125, -4.98553466796875, -4.7452392578125, -4.50494384765625, -4.2646484375, -4.02435302734375, -3.7840576171875, -3.54376220703125, -3.303466796875, -3.06317138671875, -2.8228759765625, -2.58258056640625, -2.34228515625, -2.10198974609375, -1.8616943359375, -1.62139892578125, -1.381103515625, -1.14080810546875, -0.9005126953125, -0.66021728515625, -0.419921875, -0.17962646484375, 0.0606689453125, 0.30096435546875, 0.541259765625, 0.78155517578125, 1.0218505859375, 1.26214599609375, 1.50244140625, 1.74273681640625, 1.9830322265625, 2.22332763671875, 2.463623046875, 2.70391845703125, 2.9442138671875, 3.18450927734375, 3.4248046875, 3.66510009765625, 3.9053955078125, 4.14569091796875, 4.385986328125, 4.62628173828125, 4.8665771484375, 5.10687255859375, 5.34716796875, 5.58746337890625, 5.8277587890625, 6.06805419921875, 6.308349609375, 6.54864501953125, 6.7889404296875, 7.02923583984375, 7.26953125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 6.0, 12.0, 12.0, 16.0, 19.0, 29.0, 32.0, 39.0, 41.0, 53.0, 57.0, 72.0, 60.0, 55.0, 63.0, 48.0, 65.0, 47.0, 44.0, 48.0, 40.0, 22.0, 26.0, 19.0, 24.0, 11.0, 7.0, 9.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.921875, -8.6505126953125, -8.379150390625, -8.1077880859375, -7.83642578125, -7.5650634765625, -7.293701171875, -7.0223388671875, -6.7509765625, -6.4796142578125, -6.208251953125, -5.9368896484375, -5.66552734375, -5.3941650390625, -5.122802734375, -4.8514404296875, -4.580078125, -4.3087158203125, -4.037353515625, -3.7659912109375, -3.49462890625, -3.2232666015625, -2.951904296875, -2.6805419921875, -2.4091796875, -2.1378173828125, -1.866455078125, -1.5950927734375, -1.32373046875, -1.0523681640625, -0.781005859375, -0.5096435546875, -0.23828125, 0.0330810546875, 0.304443359375, 0.5758056640625, 0.84716796875, 1.1185302734375, 1.389892578125, 1.6612548828125, 1.9326171875, 2.2039794921875, 2.475341796875, 2.7467041015625, 3.01806640625, 3.2894287109375, 3.560791015625, 3.8321533203125, 4.103515625, 4.3748779296875, 4.646240234375, 4.9176025390625, 5.18896484375, 5.4603271484375, 5.731689453125, 6.0030517578125, 6.2744140625, 6.5457763671875, 6.817138671875, 7.0885009765625, 7.35986328125, 7.6312255859375, 7.902587890625, 8.1739501953125, 8.4453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 13.0, 9.0, 19.0, 24.0, 25.0, 45.0, 79.0, 144.0, 356.0, 1260.0, 10549.0, 782157.0, 246697.0, 5615.0, 905.0, 306.0, 151.0, 77.0, 42.0, 27.0, 15.0, 13.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.0625, -3.921875, -3.78125, -3.640625, -3.5, -3.359375, -3.21875, -3.078125, -2.9375, -2.796875, -2.65625, -2.515625, -2.375, -2.234375, -2.09375, -1.953125, -1.8125, -1.671875, -1.53125, -1.390625, -1.25, -1.109375, -0.96875, -0.828125, -0.6875, -0.546875, -0.40625, -0.265625, -0.125, 0.015625, 0.15625, 0.296875, 0.4375, 0.578125, 0.71875, 0.859375, 1.0, 1.140625, 1.28125, 1.421875, 1.5625, 1.703125, 1.84375, 1.984375, 2.125, 2.265625, 2.40625, 2.546875, 2.6875, 2.828125, 2.96875, 3.109375, 3.25, 3.390625, 3.53125, 3.671875, 3.8125, 3.953125, 4.09375, 4.234375, 4.375, 4.515625, 4.65625, 4.796875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 6.0, 13.0, 8.0, 9.0, 16.0, 22.0, 22.0, 26.0, 32.0, 50.0, 45.0, 55.0, 78.0, 109.0, 124.0, 94.0, 62.0, 49.0, 42.0, 26.0, 29.0, 15.0, 14.0, 11.0, 7.0, 9.0, 8.0, 6.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003383159637451172, -0.0003262832760810852, -0.0003142505884170532, -0.00030221790075302124, -0.00029018521308898926, -0.0002781525254249573, -0.0002661198377609253, -0.0002540871500968933, -0.00024205446243286133, -0.00023002177476882935, -0.00021798908710479736, -0.00020595639944076538, -0.0001939237117767334, -0.00018189102411270142, -0.00016985833644866943, -0.00015782564878463745, -0.00014579296112060547, -0.00013376027345657349, -0.0001217275857925415, -0.00010969489812850952, -9.766221046447754e-05, -8.562952280044556e-05, -7.359683513641357e-05, -6.156414747238159e-05, -4.953145980834961e-05, -3.749877214431763e-05, -2.5466084480285645e-05, -1.3433396816253662e-05, -1.4007091522216797e-06, 1.0631978511810303e-05, 2.2664666175842285e-05, 3.469735383987427e-05, 4.673004150390625e-05, 5.876272916793823e-05, 7.079541683197021e-05, 8.28281044960022e-05, 9.486079216003418e-05, 0.00010689347982406616, 0.00011892616748809814, 0.00013095885515213013, 0.0001429915428161621, 0.0001550242304801941, 0.00016705691814422607, 0.00017908960580825806, 0.00019112229347229004, 0.00020315498113632202, 0.000215187668800354, 0.00022722035646438599, 0.00023925304412841797, 0.00025128573179244995, 0.00026331841945648193, 0.0002753511071205139, 0.0002873837947845459, 0.0002994164824485779, 0.00031144917011260986, 0.00032348185777664185, 0.00033551454544067383, 0.0003475472331047058, 0.0003595799207687378, 0.0003716126084327698, 0.00038364529609680176, 0.00039567798376083374, 0.0004077106714248657, 0.0004197433590888977, 0.0004317760467529297]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 0.0, 3.0, 3.0, 9.0, 7.0, 7.0, 16.0, 16.0, 40.0, 50.0, 96.0, 147.0, 186.0, 280.0, 554.0, 1179.0, 3271.0, 11898.0, 89710.0, 841350.0, 82591.0, 11402.0, 3153.0, 1214.0, 546.0, 323.0, 174.0, 108.0, 63.0, 41.0, 31.0, 25.0, 17.0, 13.0, 13.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.87109375, -2.787841796875, -2.70458984375, -2.621337890625, -2.5380859375, -2.454833984375, -2.37158203125, -2.288330078125, -2.205078125, -2.121826171875, -2.03857421875, -1.955322265625, -1.8720703125, -1.788818359375, -1.70556640625, -1.622314453125, -1.5390625, -1.455810546875, -1.37255859375, -1.289306640625, -1.2060546875, -1.122802734375, -1.03955078125, -0.956298828125, -0.873046875, -0.789794921875, -0.70654296875, -0.623291015625, -0.5400390625, -0.456787109375, -0.37353515625, -0.290283203125, -0.20703125, -0.123779296875, -0.04052734375, 0.042724609375, 0.1259765625, 0.209228515625, 0.29248046875, 0.375732421875, 0.458984375, 0.542236328125, 0.62548828125, 0.708740234375, 0.7919921875, 0.875244140625, 0.95849609375, 1.041748046875, 1.125, 1.208251953125, 1.29150390625, 1.374755859375, 1.4580078125, 1.541259765625, 1.62451171875, 1.707763671875, 1.791015625, 1.874267578125, 1.95751953125, 2.040771484375, 2.1240234375, 2.207275390625, 2.29052734375, 2.373779296875, 2.45703125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 7.0, 4.0, 3.0, 5.0, 9.0, 3.0, 9.0, 17.0, 39.0, 33.0, 71.0, 94.0, 119.0, 123.0, 126.0, 126.0, 73.0, 48.0, 30.0, 14.0, 13.0, 10.0, 5.0, 2.0, 6.0, 3.0, 3.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62890625, -2.546600341796875, -2.46429443359375, -2.381988525390625, -2.2996826171875, -2.217376708984375, -2.13507080078125, -2.052764892578125, -1.970458984375, -1.888153076171875, -1.80584716796875, -1.723541259765625, -1.6412353515625, -1.558929443359375, -1.47662353515625, -1.394317626953125, -1.31201171875, -1.229705810546875, -1.14739990234375, -1.065093994140625, -0.9827880859375, -0.900482177734375, -0.81817626953125, -0.735870361328125, -0.653564453125, -0.571258544921875, -0.48895263671875, -0.406646728515625, -0.3243408203125, -0.242034912109375, -0.15972900390625, -0.077423095703125, 0.0048828125, 0.087188720703125, 0.16949462890625, 0.251800537109375, 0.3341064453125, 0.416412353515625, 0.49871826171875, 0.581024169921875, 0.663330078125, 0.745635986328125, 0.82794189453125, 0.910247802734375, 0.9925537109375, 1.074859619140625, 1.15716552734375, 1.239471435546875, 1.32177734375, 1.404083251953125, 1.48638916015625, 1.568695068359375, 1.6510009765625, 1.733306884765625, 1.81561279296875, 1.897918701171875, 1.980224609375, 2.062530517578125, 2.14483642578125, 2.227142333984375, 2.3094482421875, 2.391754150390625, 2.47406005859375, 2.556365966796875, 2.638671875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 2.0, 9.0, 11.0, 44.0, 75.0, 170.0, 327.0, 198.0, 98.0, 32.0, 10.0, 7.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.619117736816406, -41.846126556396484, -40.07313919067383, -38.300148010253906, -36.527156829833984, -34.75416564941406, -32.981178283691406, -31.208187103271484, -29.435197830200195, -27.662208557128906, -25.889217376708984, -24.116228103637695, -22.343238830566406, -20.570247650146484, -18.797258377075195, -17.024269104003906, -15.251277923583984, -13.478287696838379, -11.705297470092773, -9.932308197021484, -8.159317970275879, -6.386327743530273, -4.613338470458984, -2.840348243713379, -1.0673580169677734, 0.7056319713592529, 2.4786219596862793, 4.251611709594727, 6.024601936340332, 7.7975921630859375, 9.570581436157227, 11.343571662902832, 13.116561889648438, 14.889552116394043, 16.66254234313965, 18.435531616210938, 20.20852279663086, 21.98151206970215, 23.754501342773438, 25.52749252319336, 27.30048179626465, 29.073471069335938, 30.84646224975586, 32.61945343017578, 34.39244079589844, 36.16543197631836, 37.93842315673828, 39.71141052246094, 41.48440170288086, 43.25739288330078, 45.03038024902344, 46.80337142944336, 48.57636260986328, 50.34934997558594, 52.12234115600586, 53.89533233642578, 55.66831970214844, 57.44131088256836, 59.214298248291016, 60.98728942871094, 62.76028060913086, 64.53327178955078, 66.30625915527344, 68.0792465209961, 69.85224151611328]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 3.0, 1.0, 8.0, 14.0, 9.0, 7.0, 10.0, 13.0, 21.0, 24.0, 24.0, 28.0, 29.0, 23.0, 33.0, 33.0, 48.0, 66.0, 72.0, 65.0, 66.0, 44.0, 45.0, 41.0, 24.0, 32.0, 23.0, 35.0, 20.0, 24.0, 22.0, 17.0, 11.0, 15.0, 7.0, 7.0, 6.0, 9.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-26.612018585205078, -25.818632125854492, -25.025245666503906, -24.23185920715332, -23.438472747802734, -22.64508819580078, -21.851699829101562, -21.05831527709961, -20.264928817749023, -19.471542358398438, -18.67815589904785, -17.884769439697266, -17.09138298034668, -16.297996520996094, -15.504611015319824, -14.711225509643555, -13.917838096618652, -13.124451637268066, -12.33106517791748, -11.537679672241211, -10.744293212890625, -9.950906753540039, -9.157520294189453, -8.364133834838867, -7.5707478523254395, -6.7773613929748535, -5.983975410461426, -5.19058895111084, -4.397202491760254, -3.603816509246826, -2.8104300498962402, -2.0170440673828125, -1.2236576080322266, -0.43027132749557495, 0.36311495304107666, 1.156501293182373, 1.9498875141143799, 2.7432737350463867, 3.5366601943969727, 4.3300461769104, 5.123432636260986, 5.916819095611572, 6.710205078125, 7.503591537475586, 8.296977996826172, 9.090364456176758, 9.883750915527344, 10.677136421203613, 11.4705228805542, 12.263909339904785, 13.057295799255371, 13.85068130493164, 14.644067764282227, 15.437454223632812, 16.2308406829834, 17.024227142333984, 17.81761360168457, 18.611000061035156, 19.404386520385742, 20.197772979736328, 20.991159439086914, 21.7845458984375, 22.577930450439453, 23.37131690979004, 24.164703369140625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 10.0, 13.0, 16.0, 18.0, 30.0, 65.0, 111.0, 241.0, 524.0, 1307.0, 3766.0, 14697.0, 91336.0, 1971153.0, 1994760.0, 94641.0, 15091.0, 3958.0, 1314.0, 597.0, 281.0, 135.0, 90.0, 42.0, 29.0, 15.0, 7.0, 7.0, 7.0, 2.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.404296875, -3.29449462890625, -3.1846923828125, -3.07489013671875, -2.965087890625, -2.85528564453125, -2.7454833984375, -2.63568115234375, -2.52587890625, -2.41607666015625, -2.3062744140625, -2.19647216796875, -2.086669921875, -1.97686767578125, -1.8670654296875, -1.75726318359375, -1.6474609375, -1.53765869140625, -1.4278564453125, -1.31805419921875, -1.208251953125, -1.09844970703125, -0.9886474609375, -0.87884521484375, -0.76904296875, -0.65924072265625, -0.5494384765625, -0.43963623046875, -0.329833984375, -0.22003173828125, -0.1102294921875, -0.00042724609375, 0.109375, 0.21917724609375, 0.3289794921875, 0.43878173828125, 0.548583984375, 0.65838623046875, 0.7681884765625, 0.87799072265625, 0.98779296875, 1.09759521484375, 1.2073974609375, 1.31719970703125, 1.427001953125, 1.53680419921875, 1.6466064453125, 1.75640869140625, 1.8662109375, 1.97601318359375, 2.0858154296875, 2.19561767578125, 2.305419921875, 2.41522216796875, 2.5250244140625, 2.63482666015625, 2.74462890625, 2.85443115234375, 2.9642333984375, 3.07403564453125, 3.183837890625, 3.29364013671875, 3.4034423828125, 3.51324462890625, 3.623046875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 9.0, 8.0, 8.0, 17.0, 17.0, 22.0, 31.0, 31.0, 51.0, 58.0, 49.0, 53.0, 74.0, 60.0, 69.0, 60.0, 69.0, 66.0, 45.0, 40.0, 34.0, 30.0, 31.0, 23.0, 12.0, 13.0, 6.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.6328125, -2.56512451171875, -2.4974365234375, -2.42974853515625, -2.362060546875, -2.29437255859375, -2.2266845703125, -2.15899658203125, -2.09130859375, -2.02362060546875, -1.9559326171875, -1.88824462890625, -1.820556640625, -1.75286865234375, -1.6851806640625, -1.61749267578125, -1.5498046875, -1.48211669921875, -1.4144287109375, -1.34674072265625, -1.279052734375, -1.21136474609375, -1.1436767578125, -1.07598876953125, -1.00830078125, -0.94061279296875, -0.8729248046875, -0.80523681640625, -0.737548828125, -0.66986083984375, -0.6021728515625, -0.53448486328125, -0.466796875, -0.39910888671875, -0.3314208984375, -0.26373291015625, -0.196044921875, -0.12835693359375, -0.0606689453125, 0.00701904296875, 0.07470703125, 0.14239501953125, 0.2100830078125, 0.27777099609375, 0.345458984375, 0.41314697265625, 0.4808349609375, 0.54852294921875, 0.6162109375, 0.68389892578125, 0.7515869140625, 0.81927490234375, 0.886962890625, 0.95465087890625, 1.0223388671875, 1.09002685546875, 1.15771484375, 1.22540283203125, 1.2930908203125, 1.36077880859375, 1.428466796875, 1.49615478515625, 1.5638427734375, 1.63153076171875, 1.69921875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 16.0, 26.0, 38.0, 69.0, 110.0, 265.0, 457.0, 1004.0, 2889.0, 14021.0, 156170.0, 3741517.0, 253115.0, 18652.0, 3568.0, 1199.0, 514.0, 283.0, 157.0, 81.0, 38.0, 32.0, 17.0, 6.0, 3.0, 4.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.669921875, -3.499786376953125, -3.32965087890625, -3.159515380859375, -2.9893798828125, -2.819244384765625, -2.64910888671875, -2.478973388671875, -2.308837890625, -2.138702392578125, -1.96856689453125, -1.798431396484375, -1.6282958984375, -1.458160400390625, -1.28802490234375, -1.117889404296875, -0.94775390625, -0.777618408203125, -0.60748291015625, -0.437347412109375, -0.2672119140625, -0.097076416015625, 0.07305908203125, 0.243194580078125, 0.413330078125, 0.583465576171875, 0.75360107421875, 0.923736572265625, 1.0938720703125, 1.264007568359375, 1.43414306640625, 1.604278564453125, 1.7744140625, 1.944549560546875, 2.11468505859375, 2.284820556640625, 2.4549560546875, 2.625091552734375, 2.79522705078125, 2.965362548828125, 3.135498046875, 3.305633544921875, 3.47576904296875, 3.645904541015625, 3.8160400390625, 3.986175537109375, 4.15631103515625, 4.326446533203125, 4.49658203125, 4.666717529296875, 4.83685302734375, 5.006988525390625, 5.1771240234375, 5.347259521484375, 5.51739501953125, 5.687530517578125, 5.857666015625, 6.027801513671875, 6.19793701171875, 6.368072509765625, 6.5382080078125, 6.708343505859375, 6.87847900390625, 7.048614501953125, 7.21875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 1.0, 6.0, 8.0, 20.0, 12.0, 23.0, 36.0, 94.0, 173.0, 329.0, 849.0, 1212.0, 677.0, 318.0, 131.0, 77.0, 31.0, 25.0, 18.0, 11.0, 5.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.52734375, -6.35284423828125, -6.1783447265625, -6.00384521484375, -5.829345703125, -5.65484619140625, -5.4803466796875, -5.30584716796875, -5.13134765625, -4.95684814453125, -4.7823486328125, -4.60784912109375, -4.433349609375, -4.25885009765625, -4.0843505859375, -3.90985107421875, -3.7353515625, -3.56085205078125, -3.3863525390625, -3.21185302734375, -3.037353515625, -2.86285400390625, -2.6883544921875, -2.51385498046875, -2.33935546875, -2.16485595703125, -1.9903564453125, -1.81585693359375, -1.641357421875, -1.46685791015625, -1.2923583984375, -1.11785888671875, -0.943359375, -0.76885986328125, -0.5943603515625, -0.41986083984375, -0.245361328125, -0.07086181640625, 0.1036376953125, 0.27813720703125, 0.45263671875, 0.62713623046875, 0.8016357421875, 0.97613525390625, 1.150634765625, 1.32513427734375, 1.4996337890625, 1.67413330078125, 1.8486328125, 2.02313232421875, 2.1976318359375, 2.37213134765625, 2.546630859375, 2.72113037109375, 2.8956298828125, 3.07012939453125, 3.24462890625, 3.41912841796875, 3.5936279296875, 3.76812744140625, 3.942626953125, 4.11712646484375, 4.2916259765625, 4.46612548828125, 4.640625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 22.0, 49.0, 169.0, 334.0, 264.0, 102.0, 34.0, 11.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.25945281982422, -84.24256896972656, -82.2256851196289, -80.20879364013672, -78.19190979003906, -76.1750259399414, -74.15814208984375, -72.1412582397461, -70.12437438964844, -68.10749053955078, -66.09060668945312, -64.07371520996094, -62.05683135986328, -60.039947509765625, -58.02306365966797, -56.00617980957031, -53.989288330078125, -51.97240447998047, -49.95551681518555, -47.93863296508789, -45.92174530029297, -43.90486145019531, -41.887977600097656, -39.87109375, -37.85420608520508, -35.83732223510742, -33.8204345703125, -31.803550720214844, -29.786664962768555, -27.769779205322266, -25.75289535522461, -23.73600959777832, -21.71912384033203, -19.702238082885742, -17.685352325439453, -15.668468475341797, -13.651582717895508, -11.634696960449219, -9.617812156677246, -7.600927352905273, -5.584041595458984, -3.5671563148498535, -1.5502710342407227, 0.4666142463684082, 2.483499526977539, 4.500385284423828, 6.517270088195801, 8.534154891967773, 10.551040649414062, 12.567926406860352, 14.584811210632324, 16.601696014404297, 18.618581771850586, 20.635467529296875, 22.65235137939453, 24.66923713684082, 26.68612289428711, 28.7030086517334, 30.719894409179688, 32.736778259277344, 34.753662109375, 36.77054977416992, 38.78743362426758, 40.8043212890625, 42.821205139160156]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 12.0, 13.0, 16.0, 18.0, 27.0, 47.0, 50.0, 46.0, 69.0, 63.0, 63.0, 82.0, 80.0, 76.0, 70.0, 66.0, 46.0, 36.0, 30.0, 30.0, 18.0, 12.0, 10.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.398324966430664, -28.576370239257812, -27.75441551208496, -26.93246078491211, -26.11050796508789, -25.28855323791504, -24.466598510742188, -23.644643783569336, -22.822689056396484, -22.000734329223633, -21.17877960205078, -20.356826782226562, -19.53487205505371, -18.71291732788086, -17.890962600708008, -17.069007873535156, -16.247055053710938, -15.425100326538086, -14.60314655303955, -13.7811918258667, -12.959238052368164, -12.137283325195312, -11.315328598022461, -10.49337387084961, -9.671420097351074, -8.849465370178223, -8.027511596679688, -7.205556869506836, -6.383602619171143, -5.561648368835449, -4.739693641662598, -3.9177393913269043, -3.095783233642578, -2.2738289833068848, -1.4518744945526123, -0.6299200057983398, 0.19203424453735352, 1.0139884948730469, 1.8359432220458984, 2.657897472381592, 3.479851722717285, 4.3018059730529785, 5.123760223388672, 5.945714950561523, 6.767669200897217, 7.58962345123291, 8.411578178405762, 9.233531951904297, 10.055486679077148, 10.87744140625, 11.699395179748535, 12.521349906921387, 13.343303680419922, 14.165258407592773, 14.987213134765625, 15.809167861938477, 16.631122589111328, 17.45307731628418, 18.27503204345703, 19.09698486328125, 19.9189395904541, 20.740894317626953, 21.562849044799805, 22.384803771972656, 23.206756591796875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 12.0, 7.0, 6.0, 18.0, 24.0, 30.0, 51.0, 82.0, 133.0, 207.0, 441.0, 913.0, 1992.0, 4838.0, 13689.0, 46058.0, 183975.0, 521463.0, 201508.0, 49211.0, 14675.0, 5129.0, 2104.0, 929.0, 493.0, 238.0, 110.0, 72.0, 50.0, 24.0, 22.0, 20.0, 10.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.38671875, -4.259674072265625, -4.13262939453125, -4.005584716796875, -3.8785400390625, -3.751495361328125, -3.62445068359375, -3.497406005859375, -3.370361328125, -3.243316650390625, -3.11627197265625, -2.989227294921875, -2.8621826171875, -2.735137939453125, -2.60809326171875, -2.481048583984375, -2.35400390625, -2.226959228515625, -2.09991455078125, -1.972869873046875, -1.8458251953125, -1.718780517578125, -1.59173583984375, -1.464691162109375, -1.337646484375, -1.210601806640625, -1.08355712890625, -0.956512451171875, -0.8294677734375, -0.702423095703125, -0.57537841796875, -0.448333740234375, -0.3212890625, -0.194244384765625, -0.06719970703125, 0.059844970703125, 0.1868896484375, 0.313934326171875, 0.44097900390625, 0.568023681640625, 0.695068359375, 0.822113037109375, 0.94915771484375, 1.076202392578125, 1.2032470703125, 1.330291748046875, 1.45733642578125, 1.584381103515625, 1.71142578125, 1.838470458984375, 1.96551513671875, 2.092559814453125, 2.2196044921875, 2.346649169921875, 2.47369384765625, 2.600738525390625, 2.727783203125, 2.854827880859375, 2.98187255859375, 3.108917236328125, 3.2359619140625, 3.363006591796875, 3.49005126953125, 3.617095947265625, 3.744140625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 0.0, 3.0, 5.0, 7.0, 7.0, 13.0, 15.0, 11.0, 20.0, 24.0, 26.0, 22.0, 30.0, 31.0, 43.0, 31.0, 38.0, 39.0, 48.0, 44.0, 49.0, 40.0, 51.0, 44.0, 47.0, 40.0, 46.0, 38.0, 35.0, 24.0, 22.0, 18.0, 21.0, 17.0, 13.0, 9.0, 5.0, 4.0, 5.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.388671875, -1.34014892578125, -1.2916259765625, -1.24310302734375, -1.194580078125, -1.14605712890625, -1.0975341796875, -1.04901123046875, -1.00048828125, -0.95196533203125, -0.9034423828125, -0.85491943359375, -0.806396484375, -0.75787353515625, -0.7093505859375, -0.66082763671875, -0.6123046875, -0.56378173828125, -0.5152587890625, -0.46673583984375, -0.418212890625, -0.36968994140625, -0.3211669921875, -0.27264404296875, -0.22412109375, -0.17559814453125, -0.1270751953125, -0.07855224609375, -0.030029296875, 0.01849365234375, 0.0670166015625, 0.11553955078125, 0.1640625, 0.21258544921875, 0.2611083984375, 0.30963134765625, 0.358154296875, 0.40667724609375, 0.4552001953125, 0.50372314453125, 0.55224609375, 0.60076904296875, 0.6492919921875, 0.69781494140625, 0.746337890625, 0.79486083984375, 0.8433837890625, 0.89190673828125, 0.9404296875, 0.98895263671875, 1.0374755859375, 1.08599853515625, 1.134521484375, 1.18304443359375, 1.2315673828125, 1.28009033203125, 1.32861328125, 1.37713623046875, 1.4256591796875, 1.47418212890625, 1.522705078125, 1.57122802734375, 1.6197509765625, 1.66827392578125, 1.716796875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 3.0, 8.0, 12.0, 13.0, 27.0, 18.0, 36.0, 38.0, 59.0, 91.0, 142.0, 234.0, 369.0, 615.0, 1158.0, 2484.0, 8488.0, 57883.0, 762023.0, 188849.0, 18202.0, 4016.0, 1661.0, 765.0, 476.0, 307.0, 164.0, 146.0, 82.0, 36.0, 41.0, 28.0, 28.0, 9.0, 8.0, 8.0, 6.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-8.6953125, -8.45196533203125, -8.2086181640625, -7.96527099609375, -7.721923828125, -7.47857666015625, -7.2352294921875, -6.99188232421875, -6.74853515625, -6.50518798828125, -6.2618408203125, -6.01849365234375, -5.775146484375, -5.53179931640625, -5.2884521484375, -5.04510498046875, -4.8017578125, -4.55841064453125, -4.3150634765625, -4.07171630859375, -3.828369140625, -3.58502197265625, -3.3416748046875, -3.09832763671875, -2.85498046875, -2.61163330078125, -2.3682861328125, -2.12493896484375, -1.881591796875, -1.63824462890625, -1.3948974609375, -1.15155029296875, -0.908203125, -0.66485595703125, -0.4215087890625, -0.17816162109375, 0.065185546875, 0.30853271484375, 0.5518798828125, 0.79522705078125, 1.03857421875, 1.28192138671875, 1.5252685546875, 1.76861572265625, 2.011962890625, 2.25531005859375, 2.4986572265625, 2.74200439453125, 2.9853515625, 3.22869873046875, 3.4720458984375, 3.71539306640625, 3.958740234375, 4.20208740234375, 4.4454345703125, 4.68878173828125, 4.93212890625, 5.17547607421875, 5.4188232421875, 5.66217041015625, 5.905517578125, 6.14886474609375, 6.3922119140625, 6.63555908203125, 6.87890625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 9.0, 6.0, 11.0, 17.0, 16.0, 20.0, 23.0, 28.0, 28.0, 50.0, 41.0, 51.0, 67.0, 70.0, 70.0, 73.0, 72.0, 62.0, 52.0, 39.0, 26.0, 37.0, 28.0, 23.0, 10.0, 16.0, 12.0, 15.0, 10.0, 8.0, 1.0, 9.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.34765625, -7.08563232421875, -6.8236083984375, -6.56158447265625, -6.299560546875, -6.03753662109375, -5.7755126953125, -5.51348876953125, -5.25146484375, -4.98944091796875, -4.7274169921875, -4.46539306640625, -4.203369140625, -3.94134521484375, -3.6793212890625, -3.41729736328125, -3.1552734375, -2.89324951171875, -2.6312255859375, -2.36920166015625, -2.107177734375, -1.84515380859375, -1.5831298828125, -1.32110595703125, -1.05908203125, -0.79705810546875, -0.5350341796875, -0.27301025390625, -0.010986328125, 0.25103759765625, 0.5130615234375, 0.77508544921875, 1.037109375, 1.29913330078125, 1.5611572265625, 1.82318115234375, 2.085205078125, 2.34722900390625, 2.6092529296875, 2.87127685546875, 3.13330078125, 3.39532470703125, 3.6573486328125, 3.91937255859375, 4.181396484375, 4.44342041015625, 4.7054443359375, 4.96746826171875, 5.2294921875, 5.49151611328125, 5.7535400390625, 6.01556396484375, 6.277587890625, 6.53961181640625, 6.8016357421875, 7.06365966796875, 7.32568359375, 7.58770751953125, 7.8497314453125, 8.11175537109375, 8.373779296875, 8.63580322265625, 8.8978271484375, 9.15985107421875, 9.421875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 14.0, 5.0, 9.0, 21.0, 12.0, 26.0, 51.0, 42.0, 121.0, 123.0, 236.0, 406.0, 1135.0, 4413.0, 35033.0, 825736.0, 166396.0, 11094.0, 2129.0, 704.0, 317.0, 170.0, 105.0, 61.0, 39.0, 32.0, 24.0, 20.0, 14.0, 11.0, 16.0, 7.0, 7.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.625, -2.536773681640625, -2.44854736328125, -2.360321044921875, -2.2720947265625, -2.183868408203125, -2.09564208984375, -2.007415771484375, -1.919189453125, -1.830963134765625, -1.74273681640625, -1.654510498046875, -1.5662841796875, -1.478057861328125, -1.38983154296875, -1.301605224609375, -1.21337890625, -1.125152587890625, -1.03692626953125, -0.948699951171875, -0.8604736328125, -0.772247314453125, -0.68402099609375, -0.595794677734375, -0.507568359375, -0.419342041015625, -0.33111572265625, -0.242889404296875, -0.1546630859375, -0.066436767578125, 0.02178955078125, 0.110015869140625, 0.1982421875, 0.286468505859375, 0.37469482421875, 0.462921142578125, 0.5511474609375, 0.639373779296875, 0.72760009765625, 0.815826416015625, 0.904052734375, 0.992279052734375, 1.08050537109375, 1.168731689453125, 1.2569580078125, 1.345184326171875, 1.43341064453125, 1.521636962890625, 1.60986328125, 1.698089599609375, 1.78631591796875, 1.874542236328125, 1.9627685546875, 2.050994873046875, 2.13922119140625, 2.227447509765625, 2.315673828125, 2.403900146484375, 2.49212646484375, 2.580352783203125, 2.6685791015625, 2.756805419921875, 2.84503173828125, 2.933258056640625, 3.021484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 6.0, 1.0, 5.0, 3.0, 3.0, 9.0, 6.0, 8.0, 9.0, 13.0, 18.0, 18.0, 20.0, 20.0, 27.0, 32.0, 44.0, 70.0, 82.0, 95.0, 92.0, 85.0, 62.0, 46.0, 41.0, 21.0, 23.0, 24.0, 23.0, 20.0, 14.0, 13.0, 9.0, 3.0, 6.0, 4.0, 7.0, 0.0, 8.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0], "bins": [-0.0003025531768798828, -0.0002939067780971527, -0.0002852603793144226, -0.0002766139805316925, -0.0002679675817489624, -0.0002593211829662323, -0.0002506747841835022, -0.0002420283854007721, -0.000233381986618042, -0.0002247355878353119, -0.0002160891890525818, -0.00020744279026985168, -0.00019879639148712158, -0.00019014999270439148, -0.00018150359392166138, -0.00017285719513893127, -0.00016421079635620117, -0.00015556439757347107, -0.00014691799879074097, -0.00013827160000801086, -0.00012962520122528076, -0.00012097880244255066, -0.00011233240365982056, -0.00010368600487709045, -9.503960609436035e-05, -8.639320731163025e-05, -7.774680852890015e-05, -6.910040974617004e-05, -6.045401096343994e-05, -5.180761218070984e-05, -4.3161213397979736e-05, -3.4514814615249634e-05, -2.586841583251953e-05, -1.722201704978943e-05, -8.575618267059326e-06, 7.078051567077637e-08, 8.717179298400879e-06, 1.736357808113098e-05, 2.6009976863861084e-05, 3.4656375646591187e-05, 4.330277442932129e-05, 5.194917321205139e-05, 6.0595571994781494e-05, 6.92419707775116e-05, 7.78883695602417e-05, 8.65347683429718e-05, 9.51811671257019e-05, 0.00010382756590843201, 0.00011247396469116211, 0.00012112036347389221, 0.00012976676225662231, 0.00013841316103935242, 0.00014705955982208252, 0.00015570595860481262, 0.00016435235738754272, 0.00017299875617027283, 0.00018164515495300293, 0.00019029155373573303, 0.00019893795251846313, 0.00020758435130119324, 0.00021623075008392334, 0.00022487714886665344, 0.00023352354764938354, 0.00024216994643211365, 0.00025081634521484375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 8.0, 10.0, 19.0, 13.0, 28.0, 54.0, 70.0, 130.0, 249.0, 511.0, 1154.0, 3631.0, 17630.0, 264168.0, 722164.0, 30573.0, 5347.0, 1524.0, 571.0, 275.0, 148.0, 80.0, 54.0, 43.0, 35.0, 17.0, 11.0, 8.0, 10.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3125, -2.233123779296875, -2.15374755859375, -2.074371337890625, -1.9949951171875, -1.915618896484375, -1.83624267578125, -1.756866455078125, -1.677490234375, -1.598114013671875, -1.51873779296875, -1.439361572265625, -1.3599853515625, -1.280609130859375, -1.20123291015625, -1.121856689453125, -1.04248046875, -0.963104248046875, -0.88372802734375, -0.804351806640625, -0.7249755859375, -0.645599365234375, -0.56622314453125, -0.486846923828125, -0.407470703125, -0.328094482421875, -0.24871826171875, -0.169342041015625, -0.0899658203125, -0.010589599609375, 0.06878662109375, 0.148162841796875, 0.2275390625, 0.306915283203125, 0.38629150390625, 0.465667724609375, 0.5450439453125, 0.624420166015625, 0.70379638671875, 0.783172607421875, 0.862548828125, 0.941925048828125, 1.02130126953125, 1.100677490234375, 1.1800537109375, 1.259429931640625, 1.33880615234375, 1.418182373046875, 1.49755859375, 1.576934814453125, 1.65631103515625, 1.735687255859375, 1.8150634765625, 1.894439697265625, 1.97381591796875, 2.053192138671875, 2.132568359375, 2.211944580078125, 2.29132080078125, 2.370697021484375, 2.4500732421875, 2.529449462890625, 2.60882568359375, 2.688201904296875, 2.767578125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 2.0, 5.0, 7.0, 6.0, 12.0, 9.0, 11.0, 20.0, 16.0, 30.0, 31.0, 53.0, 71.0, 93.0, 122.0, 123.0, 108.0, 78.0, 59.0, 36.0, 22.0, 16.0, 21.0, 11.0, 11.0, 5.0, 6.0, 4.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6103515625, -1.5530548095703125, -1.495758056640625, -1.4384613037109375, -1.38116455078125, -1.3238677978515625, -1.266571044921875, -1.2092742919921875, -1.1519775390625, -1.0946807861328125, -1.037384033203125, -0.9800872802734375, -0.92279052734375, -0.8654937744140625, -0.808197021484375, -0.7509002685546875, -0.693603515625, -0.6363067626953125, -0.579010009765625, -0.5217132568359375, -0.46441650390625, -0.4071197509765625, -0.349822998046875, -0.2925262451171875, -0.2352294921875, -0.1779327392578125, -0.120635986328125, -0.0633392333984375, -0.00604248046875, 0.0512542724609375, 0.108551025390625, 0.1658477783203125, 0.22314453125, 0.2804412841796875, 0.337738037109375, 0.3950347900390625, 0.45233154296875, 0.5096282958984375, 0.566925048828125, 0.6242218017578125, 0.6815185546875, 0.7388153076171875, 0.796112060546875, 0.8534088134765625, 0.91070556640625, 0.9680023193359375, 1.025299072265625, 1.0825958251953125, 1.139892578125, 1.1971893310546875, 1.254486083984375, 1.3117828369140625, 1.36907958984375, 1.4263763427734375, 1.483673095703125, 1.5409698486328125, 1.5982666015625, 1.6555633544921875, 1.712860107421875, 1.7701568603515625, 1.82745361328125, 1.8847503662109375, 1.942047119140625, 1.9993438720703125, 2.056640625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 7.0, 5.0, 6.0, 19.0, 39.0, 116.0, 249.0, 328.0, 125.0, 51.0, 20.0, 10.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.89119338989258, -60.13451385498047, -58.377830505371094, -56.621150970458984, -54.86446762084961, -53.1077880859375, -51.351104736328125, -49.594425201416016, -47.837745666503906, -46.0810661315918, -44.32438278198242, -42.56770324707031, -40.81101989746094, -39.05434036254883, -37.29766082763672, -35.540977478027344, -33.78429412841797, -32.02761459350586, -30.270931243896484, -28.514251708984375, -26.757568359375, -25.00088882446289, -23.24420738220215, -21.487525939941406, -19.730844497680664, -17.974163055419922, -16.21748161315918, -14.460801124572754, -12.704119682312012, -10.94743824005127, -9.190757751464844, -7.434076309204102, -5.677398681640625, -3.920717477798462, -2.164036273956299, -0.40735530853271484, 1.3493261337280273, 3.1060075759887695, 4.862688064575195, 6.6193695068359375, 8.37605094909668, 10.132732391357422, 11.889413833618164, 13.64609432220459, 15.402775764465332, 17.15945816040039, 18.9161376953125, 20.672819137573242, 22.429500579833984, 24.186182022094727, 25.94286346435547, 27.699542999267578, 29.456226348876953, 31.212905883789062, 32.96958923339844, 34.72626876831055, 36.482948303222656, 38.239627838134766, 39.99631118774414, 41.75299072265625, 43.509674072265625, 45.266353607177734, 47.023033142089844, 48.77971649169922, 50.536399841308594]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 9.0, 6.0, 11.0, 8.0, 19.0, 20.0, 23.0, 23.0, 30.0, 35.0, 31.0, 36.0, 46.0, 58.0, 91.0, 109.0, 75.0, 62.0, 54.0, 46.0, 40.0, 22.0, 18.0, 28.0, 28.0, 20.0, 10.0, 14.0, 5.0, 5.0, 3.0, 3.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.73558235168457, -22.764131546020508, -21.792680740356445, -20.821231842041016, -19.849781036376953, -18.87833023071289, -17.906879425048828, -16.935428619384766, -15.96397876739502, -14.992527961730957, -14.021078109741211, -13.049627304077148, -12.078176498413086, -11.10672664642334, -10.135275840759277, -9.163825988769531, -8.192375183105469, -7.2209248542785645, -6.24947452545166, -5.278023719787598, -4.306573390960693, -3.335123062133789, -2.3636722564697266, -1.3922219276428223, -0.42077159881591797, 0.5506788492202759, 1.5221292972564697, 2.493579864501953, 3.4650301933288574, 4.436480522155762, 5.407931327819824, 6.3793816566467285, 7.350833892822266, 8.322284698486328, 9.293734550476074, 10.265185356140137, 11.236635208129883, 12.208086013793945, 13.179536819458008, 14.15098762512207, 15.122437477111816, 16.093887329101562, 17.065338134765625, 18.036788940429688, 19.00823974609375, 19.979690551757812, 20.951141357421875, 21.922590255737305, 22.894041061401367, 23.86549186706543, 24.836942672729492, 25.808391571044922, 26.779842376708984, 27.751293182373047, 28.72274398803711, 29.694194793701172, 30.665645599365234, 31.637096405029297, 32.60854721069336, 33.57999801635742, 34.551448822021484, 35.52289581298828, 36.494346618652344, 37.465797424316406, 38.43724822998047]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 6.0, 4.0, 9.0, 8.0, 20.0, 38.0, 46.0, 105.0, 157.0, 366.0, 816.0, 2449.0, 10103.0, 96133.0, 3544438.0, 513128.0, 20432.0, 3846.0, 1185.0, 490.0, 225.0, 114.0, 70.0, 29.0, 19.0, 18.0, 13.0, 5.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3046875, -5.167633056640625, -5.03057861328125, -4.893524169921875, -4.7564697265625, -4.619415283203125, -4.48236083984375, -4.345306396484375, -4.208251953125, -4.071197509765625, -3.93414306640625, -3.797088623046875, -3.6600341796875, -3.522979736328125, -3.38592529296875, -3.248870849609375, -3.11181640625, -2.974761962890625, -2.83770751953125, -2.700653076171875, -2.5635986328125, -2.426544189453125, -2.28948974609375, -2.152435302734375, -2.015380859375, -1.878326416015625, -1.74127197265625, -1.604217529296875, -1.4671630859375, -1.330108642578125, -1.19305419921875, -1.055999755859375, -0.9189453125, -0.781890869140625, -0.64483642578125, -0.507781982421875, -0.3707275390625, -0.233673095703125, -0.09661865234375, 0.040435791015625, 0.177490234375, 0.314544677734375, 0.45159912109375, 0.588653564453125, 0.7257080078125, 0.862762451171875, 0.99981689453125, 1.136871337890625, 1.27392578125, 1.410980224609375, 1.54803466796875, 1.685089111328125, 1.8221435546875, 1.959197998046875, 2.09625244140625, 2.233306884765625, 2.370361328125, 2.507415771484375, 2.64447021484375, 2.781524658203125, 2.9185791015625, 3.055633544921875, 3.19268798828125, 3.329742431640625, 3.466796875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 10.0, 7.0, 7.0, 12.0, 17.0, 21.0, 24.0, 25.0, 35.0, 35.0, 54.0, 35.0, 44.0, 60.0, 61.0, 53.0, 65.0, 58.0, 57.0, 45.0, 54.0, 40.0, 30.0, 26.0, 35.0, 28.0, 15.0, 15.0, 6.0, 8.0, 4.0, 3.0, 2.0, 5.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4443359375, -1.3903350830078125, -1.336334228515625, -1.2823333740234375, -1.22833251953125, -1.1743316650390625, -1.120330810546875, -1.0663299560546875, -1.0123291015625, -0.9583282470703125, -0.904327392578125, -0.8503265380859375, -0.79632568359375, -0.7423248291015625, -0.688323974609375, -0.6343231201171875, -0.580322265625, -0.5263214111328125, -0.472320556640625, -0.4183197021484375, -0.36431884765625, -0.3103179931640625, -0.256317138671875, -0.2023162841796875, -0.1483154296875, -0.0943145751953125, -0.040313720703125, 0.0136871337890625, 0.06768798828125, 0.1216888427734375, 0.175689697265625, 0.2296905517578125, 0.28369140625, 0.3376922607421875, 0.391693115234375, 0.4456939697265625, 0.49969482421875, 0.5536956787109375, 0.607696533203125, 0.6616973876953125, 0.7156982421875, 0.7696990966796875, 0.823699951171875, 0.8777008056640625, 0.93170166015625, 0.9857025146484375, 1.039703369140625, 1.0937042236328125, 1.147705078125, 1.2017059326171875, 1.255706787109375, 1.3097076416015625, 1.36370849609375, 1.4177093505859375, 1.471710205078125, 1.5257110595703125, 1.5797119140625, 1.6337127685546875, 1.687713623046875, 1.7417144775390625, 1.79571533203125, 1.8497161865234375, 1.903717041015625, 1.9577178955078125, 2.01171875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 11.0, 17.0, 7.0, 30.0, 50.0, 93.0, 194.0, 440.0, 921.0, 2484.0, 9327.0, 89567.0, 3770886.0, 295450.0, 18247.0, 3899.0, 1402.0, 579.0, 284.0, 162.0, 88.0, 49.0, 31.0, 12.0, 13.0, 12.0, 10.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.17578125, -5.0069580078125, -4.838134765625, -4.6693115234375, -4.50048828125, -4.3316650390625, -4.162841796875, -3.9940185546875, -3.8251953125, -3.6563720703125, -3.487548828125, -3.3187255859375, -3.14990234375, -2.9810791015625, -2.812255859375, -2.6434326171875, -2.474609375, -2.3057861328125, -2.136962890625, -1.9681396484375, -1.79931640625, -1.6304931640625, -1.461669921875, -1.2928466796875, -1.1240234375, -0.9552001953125, -0.786376953125, -0.6175537109375, -0.44873046875, -0.2799072265625, -0.111083984375, 0.0577392578125, 0.2265625, 0.3953857421875, 0.564208984375, 0.7330322265625, 0.90185546875, 1.0706787109375, 1.239501953125, 1.4083251953125, 1.5771484375, 1.7459716796875, 1.914794921875, 2.0836181640625, 2.25244140625, 2.4212646484375, 2.590087890625, 2.7589111328125, 2.927734375, 3.0965576171875, 3.265380859375, 3.4342041015625, 3.60302734375, 3.7718505859375, 3.940673828125, 4.1094970703125, 4.2783203125, 4.4471435546875, 4.615966796875, 4.7847900390625, 4.95361328125, 5.1224365234375, 5.291259765625, 5.4600830078125, 5.62890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 8.0, 6.0, 7.0, 21.0, 27.0, 45.0, 89.0, 164.0, 399.0, 891.0, 1184.0, 636.0, 256.0, 126.0, 78.0, 47.0, 21.0, 24.0, 16.0, 9.0, 6.0, 7.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6640625, -4.50994873046875, -4.3558349609375, -4.20172119140625, -4.047607421875, -3.89349365234375, -3.7393798828125, -3.58526611328125, -3.43115234375, -3.27703857421875, -3.1229248046875, -2.96881103515625, -2.814697265625, -2.66058349609375, -2.5064697265625, -2.35235595703125, -2.1982421875, -2.04412841796875, -1.8900146484375, -1.73590087890625, -1.581787109375, -1.42767333984375, -1.2735595703125, -1.11944580078125, -0.96533203125, -0.81121826171875, -0.6571044921875, -0.50299072265625, -0.348876953125, -0.19476318359375, -0.0406494140625, 0.11346435546875, 0.267578125, 0.42169189453125, 0.5758056640625, 0.72991943359375, 0.884033203125, 1.03814697265625, 1.1922607421875, 1.34637451171875, 1.50048828125, 1.65460205078125, 1.8087158203125, 1.96282958984375, 2.116943359375, 2.27105712890625, 2.4251708984375, 2.57928466796875, 2.7333984375, 2.88751220703125, 3.0416259765625, 3.19573974609375, 3.349853515625, 3.50396728515625, 3.6580810546875, 3.81219482421875, 3.96630859375, 4.12042236328125, 4.2745361328125, 4.42864990234375, 4.582763671875, 4.73687744140625, 4.8909912109375, 5.04510498046875, 5.19921875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 9.0, 34.0, 300.0, 522.0, 96.0, 22.0, 4.0, 5.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-129.88209533691406, -126.72681427001953, -123.57154083251953, -120.416259765625, -117.26097869873047, -114.10569763183594, -110.95042419433594, -107.7951431274414, -104.63986206054688, -101.48458099365234, -98.32930755615234, -95.17402648925781, -92.01874542236328, -88.86346435546875, -85.70819091796875, -82.55290985107422, -79.39763641357422, -76.24235534667969, -73.08708190917969, -69.93180084228516, -66.77651977539062, -63.62124252319336, -60.465965270996094, -57.31068420410156, -54.1554069519043, -51.00012969970703, -47.8448486328125, -44.689571380615234, -41.53429412841797, -38.37901306152344, -35.22373580932617, -32.068458557128906, -28.913177490234375, -25.757898330688477, -22.602619171142578, -19.447341918945312, -16.292062759399414, -13.136783599853516, -9.98150634765625, -6.826227188110352, -3.670948028564453, -0.5156693458557129, 2.6396093368530273, 5.794887542724609, 8.950166702270508, 12.105445861816406, 15.260723114013672, 18.41600227355957, 21.57128143310547, 24.726560592651367, 27.881839752197266, 31.03711700439453, 34.19239807128906, 37.34767532348633, 40.502952575683594, 43.658233642578125, 46.81351089477539, 49.968788146972656, 53.12406921386719, 56.27934646606445, 59.43462371826172, 62.58990478515625, 65.74517822265625, 68.90045928955078, 72.05574035644531]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 11.0, 5.0, 7.0, 9.0, 11.0, 13.0, 20.0, 17.0, 18.0, 20.0, 26.0, 27.0, 34.0, 32.0, 30.0, 40.0, 38.0, 49.0, 51.0, 51.0, 47.0, 36.0, 38.0, 56.0, 38.0, 41.0, 32.0, 30.0, 23.0, 30.0, 25.0, 22.0, 15.0, 8.0, 10.0, 12.0, 8.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-16.217727661132812, -15.789100646972656, -15.3604736328125, -14.931846618652344, -14.503219604492188, -14.074592590332031, -13.645965576171875, -13.217338562011719, -12.788711547851562, -12.360084533691406, -11.93145751953125, -11.502830505371094, -11.074203491210938, -10.645576477050781, -10.216949462890625, -9.788322448730469, -9.359694480895996, -8.93106746673584, -8.502440452575684, -8.073813438415527, -7.645186424255371, -7.216559410095215, -6.7879319190979, -6.359304904937744, -5.930677890777588, -5.502050876617432, -5.073423862457275, -4.644796371459961, -4.216169357299805, -3.7875425815582275, -3.358915328979492, -2.930288314819336, -2.5016613006591797, -2.0730342864990234, -1.6444071531295776, -1.2157800197601318, -0.7871530055999756, -0.35852599143981934, 0.07010126113891602, 0.49872827529907227, 0.9273552894592285, 1.3559823036193848, 1.7846094369888306, 2.2132365703582764, 2.6418635845184326, 3.070490598678589, 3.499117851257324, 3.9277448654174805, 4.356371879577637, 4.784998893737793, 5.213625907897949, 5.6422529220581055, 6.070879936218262, 6.499506950378418, 6.928134441375732, 7.356761455535889, 7.785388469696045, 8.21401596069336, 8.642642974853516, 9.071269989013672, 9.499897003173828, 9.928524017333984, 10.35715103149414, 10.785778045654297, 11.214405059814453]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 7.0, 19.0, 25.0, 24.0, 34.0, 59.0, 95.0, 163.0, 302.0, 608.0, 1469.0, 3914.0, 13519.0, 60840.0, 332153.0, 495760.0, 108395.0, 21750.0, 5767.0, 1978.0, 768.0, 366.0, 172.0, 110.0, 58.0, 48.0, 44.0, 27.0, 19.0, 9.0, 11.0, 8.0, 8.0, 8.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7734375, -3.652374267578125, -3.53131103515625, -3.410247802734375, -3.2891845703125, -3.168121337890625, -3.04705810546875, -2.925994873046875, -2.804931640625, -2.683868408203125, -2.56280517578125, -2.441741943359375, -2.3206787109375, -2.199615478515625, -2.07855224609375, -1.957489013671875, -1.83642578125, -1.715362548828125, -1.59429931640625, -1.473236083984375, -1.3521728515625, -1.231109619140625, -1.11004638671875, -0.988983154296875, -0.867919921875, -0.746856689453125, -0.62579345703125, -0.504730224609375, -0.3836669921875, -0.262603759765625, -0.14154052734375, -0.020477294921875, 0.1005859375, 0.221649169921875, 0.34271240234375, 0.463775634765625, 0.5848388671875, 0.705902099609375, 0.82696533203125, 0.948028564453125, 1.069091796875, 1.190155029296875, 1.31121826171875, 1.432281494140625, 1.5533447265625, 1.674407958984375, 1.79547119140625, 1.916534423828125, 2.03759765625, 2.158660888671875, 2.27972412109375, 2.400787353515625, 2.5218505859375, 2.642913818359375, 2.76397705078125, 2.885040283203125, 3.006103515625, 3.127166748046875, 3.24822998046875, 3.369293212890625, 3.4903564453125, 3.611419677734375, 3.73248291015625, 3.853546142578125, 3.974609375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 8.0, 7.0, 15.0, 14.0, 13.0, 24.0, 29.0, 26.0, 41.0, 43.0, 47.0, 48.0, 45.0, 56.0, 59.0, 55.0, 58.0, 60.0, 43.0, 42.0, 53.0, 33.0, 37.0, 29.0, 24.0, 27.0, 15.0, 14.0, 10.0, 4.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.56640625, -1.512786865234375, -1.45916748046875, -1.405548095703125, -1.3519287109375, -1.298309326171875, -1.24468994140625, -1.191070556640625, -1.137451171875, -1.083831787109375, -1.03021240234375, -0.976593017578125, -0.9229736328125, -0.869354248046875, -0.81573486328125, -0.762115478515625, -0.70849609375, -0.654876708984375, -0.60125732421875, -0.547637939453125, -0.4940185546875, -0.440399169921875, -0.38677978515625, -0.333160400390625, -0.279541015625, -0.225921630859375, -0.17230224609375, -0.118682861328125, -0.0650634765625, -0.011444091796875, 0.04217529296875, 0.095794677734375, 0.1494140625, 0.203033447265625, 0.25665283203125, 0.310272216796875, 0.3638916015625, 0.417510986328125, 0.47113037109375, 0.524749755859375, 0.578369140625, 0.631988525390625, 0.68560791015625, 0.739227294921875, 0.7928466796875, 0.846466064453125, 0.90008544921875, 0.953704833984375, 1.00732421875, 1.060943603515625, 1.11456298828125, 1.168182373046875, 1.2218017578125, 1.275421142578125, 1.32904052734375, 1.382659912109375, 1.436279296875, 1.489898681640625, 1.54351806640625, 1.597137451171875, 1.6507568359375, 1.704376220703125, 1.75799560546875, 1.811614990234375, 1.865234375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 0.0, 2.0, 10.0, 6.0, 16.0, 20.0, 23.0, 28.0, 48.0, 82.0, 133.0, 211.0, 435.0, 932.0, 2495.0, 7971.0, 35008.0, 207853.0, 656723.0, 108120.0, 20178.0, 5105.0, 1691.0, 660.0, 334.0, 171.0, 109.0, 67.0, 35.0, 27.0, 15.0, 15.0, 8.0, 12.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.38671875, -3.258056640625, -3.12939453125, -3.000732421875, -2.8720703125, -2.743408203125, -2.61474609375, -2.486083984375, -2.357421875, -2.228759765625, -2.10009765625, -1.971435546875, -1.8427734375, -1.714111328125, -1.58544921875, -1.456787109375, -1.328125, -1.199462890625, -1.07080078125, -0.942138671875, -0.8134765625, -0.684814453125, -0.55615234375, -0.427490234375, -0.298828125, -0.170166015625, -0.04150390625, 0.087158203125, 0.2158203125, 0.344482421875, 0.47314453125, 0.601806640625, 0.73046875, 0.859130859375, 0.98779296875, 1.116455078125, 1.2451171875, 1.373779296875, 1.50244140625, 1.631103515625, 1.759765625, 1.888427734375, 2.01708984375, 2.145751953125, 2.2744140625, 2.403076171875, 2.53173828125, 2.660400390625, 2.7890625, 2.917724609375, 3.04638671875, 3.175048828125, 3.3037109375, 3.432373046875, 3.56103515625, 3.689697265625, 3.818359375, 3.947021484375, 4.07568359375, 4.204345703125, 4.3330078125, 4.461669921875, 4.59033203125, 4.718994140625, 4.84765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 9.0, 9.0, 12.0, 12.0, 6.0, 23.0, 28.0, 17.0, 36.0, 34.0, 45.0, 37.0, 49.0, 36.0, 61.0, 56.0, 44.0, 51.0, 51.0, 51.0, 33.0, 46.0, 34.0, 34.0, 39.0, 30.0, 34.0, 13.0, 21.0, 12.0, 8.0, 10.0, 7.0, 1.0, 3.0, 3.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.69921875, -5.52587890625, -5.3525390625, -5.17919921875, -5.005859375, -4.83251953125, -4.6591796875, -4.48583984375, -4.3125, -4.13916015625, -3.9658203125, -3.79248046875, -3.619140625, -3.44580078125, -3.2724609375, -3.09912109375, -2.92578125, -2.75244140625, -2.5791015625, -2.40576171875, -2.232421875, -2.05908203125, -1.8857421875, -1.71240234375, -1.5390625, -1.36572265625, -1.1923828125, -1.01904296875, -0.845703125, -0.67236328125, -0.4990234375, -0.32568359375, -0.15234375, 0.02099609375, 0.1943359375, 0.36767578125, 0.541015625, 0.71435546875, 0.8876953125, 1.06103515625, 1.234375, 1.40771484375, 1.5810546875, 1.75439453125, 1.927734375, 2.10107421875, 2.2744140625, 2.44775390625, 2.62109375, 2.79443359375, 2.9677734375, 3.14111328125, 3.314453125, 3.48779296875, 3.6611328125, 3.83447265625, 4.0078125, 4.18115234375, 4.3544921875, 4.52783203125, 4.701171875, 4.87451171875, 5.0478515625, 5.22119140625, 5.39453125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 4.0, 9.0, 10.0, 8.0, 14.0, 29.0, 41.0, 68.0, 118.0, 222.0, 562.0, 1417.0, 4496.0, 18602.0, 110265.0, 706253.0, 170815.0, 26545.0, 5964.0, 1799.0, 665.0, 263.0, 148.0, 82.0, 40.0, 33.0, 24.0, 20.0, 10.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2041015625, -1.164764404296875, -1.12542724609375, -1.086090087890625, -1.0467529296875, -1.007415771484375, -0.96807861328125, -0.928741455078125, -0.889404296875, -0.850067138671875, -0.81072998046875, -0.771392822265625, -0.7320556640625, -0.692718505859375, -0.65338134765625, -0.614044189453125, -0.57470703125, -0.535369873046875, -0.49603271484375, -0.456695556640625, -0.4173583984375, -0.378021240234375, -0.33868408203125, -0.299346923828125, -0.260009765625, -0.220672607421875, -0.18133544921875, -0.141998291015625, -0.1026611328125, -0.063323974609375, -0.02398681640625, 0.015350341796875, 0.0546875, 0.094024658203125, 0.13336181640625, 0.172698974609375, 0.2120361328125, 0.251373291015625, 0.29071044921875, 0.330047607421875, 0.369384765625, 0.408721923828125, 0.44805908203125, 0.487396240234375, 0.5267333984375, 0.566070556640625, 0.60540771484375, 0.644744873046875, 0.68408203125, 0.723419189453125, 0.76275634765625, 0.802093505859375, 0.8414306640625, 0.880767822265625, 0.92010498046875, 0.959442138671875, 0.998779296875, 1.038116455078125, 1.07745361328125, 1.116790771484375, 1.1561279296875, 1.195465087890625, 1.23480224609375, 1.274139404296875, 1.3134765625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 5.0, 13.0, 5.0, 19.0, 15.0, 41.0, 57.0, 59.0, 84.0, 116.0, 131.0, 119.0, 98.0, 64.0, 57.0, 30.0, 31.0, 12.0, 9.0, 5.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033926963806152344, -0.0003299899399280548, -0.0003207102417945862, -0.00031143054366111755, -0.0003021508455276489, -0.0002928711473941803, -0.00028359144926071167, -0.00027431175112724304, -0.0002650320529937744, -0.0002557523548603058, -0.00024647265672683716, -0.00023719295859336853, -0.0002279132604598999, -0.00021863356232643127, -0.00020935386419296265, -0.00020007416605949402, -0.0001907944679260254, -0.00018151476979255676, -0.00017223507165908813, -0.0001629553735256195, -0.00015367567539215088, -0.00014439597725868225, -0.00013511627912521362, -0.000125836580991745, -0.00011655688285827637, -0.00010727718472480774, -9.799748659133911e-05, -8.871778845787048e-05, -7.943809032440186e-05, -7.015839219093323e-05, -6.08786940574646e-05, -5.159899592399597e-05, -4.2319297790527344e-05, -3.3039599657058716e-05, -2.3759901523590088e-05, -1.448020339012146e-05, -5.200505256652832e-06, 4.079192876815796e-06, 1.3358891010284424e-05, 2.2638589143753052e-05, 3.191828727722168e-05, 4.119798541069031e-05, 5.0477683544158936e-05, 5.9757381677627563e-05, 6.903707981109619e-05, 7.831677794456482e-05, 8.759647607803345e-05, 9.687617421150208e-05, 0.0001061558723449707, 0.00011543557047843933, 0.00012471526861190796, 0.0001339949667453766, 0.00014327466487884521, 0.00015255436301231384, 0.00016183406114578247, 0.0001711137592792511, 0.00018039345741271973, 0.00018967315554618835, 0.00019895285367965698, 0.0002082325518131256, 0.00021751224994659424, 0.00022679194808006287, 0.0002360716462135315, 0.0002453513443470001, 0.00025463104248046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 8.0, 11.0, 13.0, 17.0, 19.0, 47.0, 63.0, 106.0, 257.0, 490.0, 1242.0, 3548.0, 12850.0, 67306.0, 606994.0, 298435.0, 43482.0, 9017.0, 2748.0, 1005.0, 397.0, 208.0, 123.0, 64.0, 31.0, 31.0, 19.0, 8.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.568359375, -1.5258331298828125, -1.483306884765625, -1.4407806396484375, -1.39825439453125, -1.3557281494140625, -1.313201904296875, -1.2706756591796875, -1.2281494140625, -1.1856231689453125, -1.143096923828125, -1.1005706787109375, -1.05804443359375, -1.0155181884765625, -0.972991943359375, -0.9304656982421875, -0.887939453125, -0.8454132080078125, -0.802886962890625, -0.7603607177734375, -0.71783447265625, -0.6753082275390625, -0.632781982421875, -0.5902557373046875, -0.5477294921875, -0.5052032470703125, -0.462677001953125, -0.4201507568359375, -0.37762451171875, -0.3350982666015625, -0.292572021484375, -0.2500457763671875, -0.20751953125, -0.1649932861328125, -0.122467041015625, -0.0799407958984375, -0.03741455078125, 0.0051116943359375, 0.047637939453125, 0.0901641845703125, 0.1326904296875, 0.1752166748046875, 0.217742919921875, 0.2602691650390625, 0.30279541015625, 0.3453216552734375, 0.387847900390625, 0.4303741455078125, 0.472900390625, 0.5154266357421875, 0.557952880859375, 0.6004791259765625, 0.64300537109375, 0.6855316162109375, 0.728057861328125, 0.7705841064453125, 0.8131103515625, 0.8556365966796875, 0.898162841796875, 0.9406890869140625, 0.98321533203125, 1.0257415771484375, 1.068267822265625, 1.1107940673828125, 1.1533203125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 10.0, 11.0, 9.0, 11.0, 19.0, 26.0, 29.0, 51.0, 53.0, 65.0, 75.0, 83.0, 72.0, 86.0, 91.0, 59.0, 49.0, 50.0, 46.0, 22.0, 15.0, 17.0, 8.0, 10.0, 9.0, 5.0, 2.0, 5.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.107421875, -1.0723876953125, -1.037353515625, -1.0023193359375, -0.96728515625, -0.9322509765625, -0.897216796875, -0.8621826171875, -0.8271484375, -0.7921142578125, -0.757080078125, -0.7220458984375, -0.68701171875, -0.6519775390625, -0.616943359375, -0.5819091796875, -0.546875, -0.5118408203125, -0.476806640625, -0.4417724609375, -0.40673828125, -0.3717041015625, -0.336669921875, -0.3016357421875, -0.2666015625, -0.2315673828125, -0.196533203125, -0.1614990234375, -0.12646484375, -0.0914306640625, -0.056396484375, -0.0213623046875, 0.013671875, 0.0487060546875, 0.083740234375, 0.1187744140625, 0.15380859375, 0.1888427734375, 0.223876953125, 0.2589111328125, 0.2939453125, 0.3289794921875, 0.364013671875, 0.3990478515625, 0.43408203125, 0.4691162109375, 0.504150390625, 0.5391845703125, 0.57421875, 0.6092529296875, 0.644287109375, 0.6793212890625, 0.71435546875, 0.7493896484375, 0.784423828125, 0.8194580078125, 0.8544921875, 0.8895263671875, 0.924560546875, 0.9595947265625, 0.99462890625, 1.0296630859375, 1.064697265625, 1.0997314453125, 1.134765625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 6.0, 5.0, 5.0, 4.0, 12.0, 23.0, 38.0, 70.0, 84.0, 130.0, 232.0, 154.0, 89.0, 56.0, 30.0, 23.0, 6.0, 8.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.97100067138672, -24.20693016052246, -23.442861557006836, -22.678791046142578, -21.914722442626953, -21.150651931762695, -20.386581420898438, -19.622512817382812, -18.858442306518555, -18.094371795654297, -17.330303192138672, -16.566232681274414, -15.802163124084473, -15.038093566894531, -14.27402400970459, -13.509954452514648, -12.745884895324707, -11.981815338134766, -11.217745780944824, -10.453676223754883, -9.689605712890625, -8.925536155700684, -8.161466598510742, -7.397396564483643, -6.633327007293701, -5.86925745010376, -5.10518741607666, -4.341117858886719, -3.5770480632781982, -2.8129782676696777, -2.0489087104797363, -1.2848386764526367, -0.5207691192626953, 0.24330061674118042, 1.0073703527450562, 1.771440029144287, 2.5355098247528076, 3.299579620361328, 4.0636491775512695, 4.827719211578369, 5.5917887687683105, 6.355858325958252, 7.119928359985352, 7.883997917175293, 8.648067474365234, 9.412137985229492, 10.176206588745117, 10.940277099609375, 11.704346656799316, 12.468416213989258, 13.2324857711792, 13.99655532836914, 14.760625839233398, 15.52469539642334, 16.28876495361328, 17.05283546447754, 17.816904067993164, 18.580974578857422, 19.345043182373047, 20.109113693237305, 20.87318229675293, 21.637252807617188, 22.401321411132812, 23.16539192199707, 23.929462432861328]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 8.0, 6.0, 13.0, 16.0, 20.0, 18.0, 25.0, 19.0, 15.0, 28.0, 25.0, 29.0, 39.0, 60.0, 63.0, 79.0, 72.0, 53.0, 48.0, 48.0, 40.0, 31.0, 35.0, 23.0, 31.0, 23.0, 14.0, 27.0, 17.0, 19.0, 7.0, 8.0, 6.0, 6.0, 2.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.89944076538086, -18.296358108520508, -17.69327735900879, -17.090194702148438, -16.48711395263672, -15.884032249450684, -15.280950546264648, -14.677867889404297, -14.074787139892578, -13.471705436706543, -12.868623733520508, -12.265542030334473, -11.662460327148438, -11.059378623962402, -10.456296920776367, -9.853214263916016, -9.25013256072998, -8.647050857543945, -8.04396915435791, -7.440887451171875, -6.83780574798584, -6.234724044799805, -5.631641864776611, -5.028560161590576, -4.425478458404541, -3.822396755218506, -3.2193150520324707, -2.6162331104278564, -2.0131514072418213, -1.4100697040557861, -0.8069877624511719, -0.20390605926513672, 0.39917564392089844, 1.0022573471069336, 1.6053391695022583, 2.208420991897583, 2.811502695083618, 3.4145843982696533, 4.017666339874268, 4.620748043060303, 5.223829746246338, 5.826911449432373, 6.429993152618408, 7.033075332641602, 7.636157035827637, 8.239238739013672, 8.842320442199707, 9.445402145385742, 10.048483848571777, 10.651565551757812, 11.254647254943848, 11.857728958129883, 12.460810661315918, 13.063892364501953, 13.666975021362305, 14.270055770874023, 14.873138427734375, 15.47622013092041, 16.079301834106445, 16.682384490966797, 17.285465240478516, 17.888547897338867, 18.491628646850586, 19.094711303710938, 19.697792053222656]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 9.0, 11.0, 11.0, 21.0, 13.0, 34.0, 33.0, 65.0, 144.0, 221.0, 439.0, 1072.0, 2417.0, 7576.0, 36706.0, 489325.0, 3206387.0, 405384.0, 33481.0, 6850.0, 2281.0, 909.0, 399.0, 212.0, 105.0, 74.0, 39.0, 25.0, 14.0, 9.0, 7.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.17578125, -3.0953216552734375, -3.014862060546875, -2.9344024658203125, -2.85394287109375, -2.7734832763671875, -2.693023681640625, -2.6125640869140625, -2.5321044921875, -2.4516448974609375, -2.371185302734375, -2.2907257080078125, -2.21026611328125, -2.1298065185546875, -2.049346923828125, -1.9688873291015625, -1.888427734375, -1.8079681396484375, -1.727508544921875, -1.6470489501953125, -1.56658935546875, -1.4861297607421875, -1.405670166015625, -1.3252105712890625, -1.2447509765625, -1.1642913818359375, -1.083831787109375, -1.0033721923828125, -0.92291259765625, -0.8424530029296875, -0.761993408203125, -0.6815338134765625, -0.60107421875, -0.5206146240234375, -0.440155029296875, -0.3596954345703125, -0.27923583984375, -0.1987762451171875, -0.118316650390625, -0.0378570556640625, 0.0426025390625, 0.1230621337890625, 0.203521728515625, 0.2839813232421875, 0.36444091796875, 0.4449005126953125, 0.525360107421875, 0.6058197021484375, 0.686279296875, 0.7667388916015625, 0.847198486328125, 0.9276580810546875, 1.00811767578125, 1.0885772705078125, 1.169036865234375, 1.2494964599609375, 1.3299560546875, 1.4104156494140625, 1.490875244140625, 1.5713348388671875, 1.65179443359375, 1.7322540283203125, 1.812713623046875, 1.8931732177734375, 1.9736328125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 2.0, 1.0, 8.0, 7.0, 7.0, 11.0, 18.0, 15.0, 14.0, 23.0, 11.0, 42.0, 49.0, 39.0, 47.0, 47.0, 56.0, 50.0, 46.0, 47.0, 50.0, 45.0, 38.0, 51.0, 37.0, 38.0, 32.0, 37.0, 27.0, 22.0, 26.0, 10.0, 11.0, 11.0, 5.0, 10.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.404296875, -1.35919189453125, -1.3140869140625, -1.26898193359375, -1.223876953125, -1.17877197265625, -1.1336669921875, -1.08856201171875, -1.04345703125, -0.99835205078125, -0.9532470703125, -0.90814208984375, -0.863037109375, -0.81793212890625, -0.7728271484375, -0.72772216796875, -0.6826171875, -0.63751220703125, -0.5924072265625, -0.54730224609375, -0.502197265625, -0.45709228515625, -0.4119873046875, -0.36688232421875, -0.32177734375, -0.27667236328125, -0.2315673828125, -0.18646240234375, -0.141357421875, -0.09625244140625, -0.0511474609375, -0.00604248046875, 0.0390625, 0.08416748046875, 0.1292724609375, 0.17437744140625, 0.219482421875, 0.26458740234375, 0.3096923828125, 0.35479736328125, 0.39990234375, 0.44500732421875, 0.4901123046875, 0.53521728515625, 0.580322265625, 0.62542724609375, 0.6705322265625, 0.71563720703125, 0.7607421875, 0.80584716796875, 0.8509521484375, 0.89605712890625, 0.941162109375, 0.98626708984375, 1.0313720703125, 1.07647705078125, 1.12158203125, 1.16668701171875, 1.2117919921875, 1.25689697265625, 1.302001953125, 1.34710693359375, 1.3922119140625, 1.43731689453125, 1.482421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 12.0, 17.0, 27.0, 106.0, 234.0, 928.0, 17710.0, 4080824.0, 91765.0, 2072.0, 351.0, 126.0, 60.0, 25.0, 12.0, 9.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0859375, -9.8031005859375, -9.520263671875, -9.2374267578125, -8.95458984375, -8.6717529296875, -8.388916015625, -8.1060791015625, -7.8232421875, -7.5404052734375, -7.257568359375, -6.9747314453125, -6.69189453125, -6.4090576171875, -6.126220703125, -5.8433837890625, -5.560546875, -5.2777099609375, -4.994873046875, -4.7120361328125, -4.42919921875, -4.1463623046875, -3.863525390625, -3.5806884765625, -3.2978515625, -3.0150146484375, -2.732177734375, -2.4493408203125, -2.16650390625, -1.8836669921875, -1.600830078125, -1.3179931640625, -1.03515625, -0.7523193359375, -0.469482421875, -0.1866455078125, 0.09619140625, 0.3790283203125, 0.661865234375, 0.9447021484375, 1.2275390625, 1.5103759765625, 1.793212890625, 2.0760498046875, 2.35888671875, 2.6417236328125, 2.924560546875, 3.2073974609375, 3.490234375, 3.7730712890625, 4.055908203125, 4.3387451171875, 4.62158203125, 4.9044189453125, 5.187255859375, 5.4700927734375, 5.7529296875, 6.0357666015625, 6.318603515625, 6.6014404296875, 6.88427734375, 7.1671142578125, 7.449951171875, 7.7327880859375, 8.015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 9.0, 11.0, 19.0, 31.0, 65.0, 136.0, 301.0, 674.0, 1204.0, 869.0, 392.0, 178.0, 70.0, 48.0, 22.0, 16.0, 12.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.072265625, -2.930145263671875, -2.78802490234375, -2.645904541015625, -2.5037841796875, -2.361663818359375, -2.21954345703125, -2.077423095703125, -1.935302734375, -1.793182373046875, -1.65106201171875, -1.508941650390625, -1.3668212890625, -1.224700927734375, -1.08258056640625, -0.940460205078125, -0.79833984375, -0.656219482421875, -0.51409912109375, -0.371978759765625, -0.2298583984375, -0.087738037109375, 0.05438232421875, 0.196502685546875, 0.338623046875, 0.480743408203125, 0.62286376953125, 0.764984130859375, 0.9071044921875, 1.049224853515625, 1.19134521484375, 1.333465576171875, 1.4755859375, 1.617706298828125, 1.75982666015625, 1.901947021484375, 2.0440673828125, 2.186187744140625, 2.32830810546875, 2.470428466796875, 2.612548828125, 2.754669189453125, 2.89678955078125, 3.038909912109375, 3.1810302734375, 3.323150634765625, 3.46527099609375, 3.607391357421875, 3.74951171875, 3.891632080078125, 4.03375244140625, 4.175872802734375, 4.3179931640625, 4.460113525390625, 4.60223388671875, 4.744354248046875, 4.886474609375, 5.028594970703125, 5.17071533203125, 5.312835693359375, 5.4549560546875, 5.597076416015625, 5.73919677734375, 5.881317138671875, 6.0234375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 7.0, 13.0, 22.0, 35.0, 67.0, 78.0, 151.0, 162.0, 157.0, 132.0, 71.0, 43.0, 16.0, 14.0, 7.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.51131820678711, -23.798194885253906, -23.085071563720703, -22.3719482421875, -21.658824920654297, -20.945701599121094, -20.23257827758789, -19.519453048706055, -18.80632972717285, -18.09320640563965, -17.380083084106445, -16.666959762573242, -15.953835487365723, -15.24071216583252, -14.527588844299316, -13.814464569091797, -13.10134220123291, -12.388218879699707, -11.675095558166504, -10.961971282958984, -10.248847961425781, -9.535724639892578, -8.822601318359375, -8.109477996826172, -7.3963541984558105, -6.683230876922607, -5.970107078552246, -5.256983757019043, -4.54386043548584, -3.8307366371154785, -3.1176133155822754, -2.404489517211914, -1.691366195678711, -0.9782426953315735, -0.26511919498443604, 0.44800424575805664, 1.1611278057098389, 1.874251365661621, 2.587374687194824, 3.3004984855651855, 4.013621807098389, 4.726745128631592, 5.439868927001953, 6.152992248535156, 6.866115570068359, 7.579239368438721, 8.292362213134766, 9.005486488342285, 9.718609809875488, 10.431733131408691, 11.144856452941895, 11.857980728149414, 12.571104049682617, 13.28422737121582, 13.997350692749023, 14.710474014282227, 15.42359733581543, 16.136720657348633, 16.849843978881836, 17.56296730041504, 18.276090621948242, 18.989215850830078, 19.70233917236328, 20.415462493896484, 21.128585815429688]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 8.0, 5.0, 6.0, 5.0, 14.0, 19.0, 19.0, 18.0, 18.0, 23.0, 20.0, 44.0, 34.0, 37.0, 39.0, 43.0, 33.0, 46.0, 59.0, 35.0, 47.0, 47.0, 42.0, 42.0, 41.0, 42.0, 34.0, 29.0, 26.0, 20.0, 20.0, 25.0, 11.0, 7.0, 7.0, 6.0, 5.0, 3.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.209583282470703, -11.830857276916504, -11.452132225036621, -11.073406219482422, -10.694680213928223, -10.31595516204834, -9.93722915649414, -9.558504104614258, -9.179778099060059, -8.80105209350586, -8.422327041625977, -8.043601036071777, -7.664875507354736, -7.286149978637695, -6.907423973083496, -6.528698444366455, -6.149972438812256, -5.771246910095215, -5.392520904541016, -5.013795375823975, -4.635069847106934, -4.256343841552734, -3.8776183128356934, -3.4988927841186523, -3.1201670169830322, -2.741441249847412, -2.362715721130371, -1.983989953994751, -1.6052643060684204, -1.2265386581420898, -0.8478128910064697, -0.4690873622894287, -0.0903615951538086, 0.28836408257484436, 0.6670897603034973, 1.0458154678344727, 1.4245411157608032, 1.8032667636871338, 2.181992530822754, 2.560718059539795, 2.939443826675415, 3.318169593811035, 3.696895122528076, 4.075620651245117, 4.454346656799316, 4.833072185516357, 5.211797714233398, 5.590523719787598, 5.969249248504639, 6.34797477722168, 6.726700782775879, 7.10542631149292, 7.484151840209961, 7.86287784576416, 8.24160385131836, 8.620328903198242, 8.999054908752441, 9.37778091430664, 9.756505966186523, 10.135231971740723, 10.513957977294922, 10.892683029174805, 11.271409034729004, 11.650135040283203, 12.028860092163086]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 9.0, 5.0, 15.0, 9.0, 20.0, 46.0, 70.0, 120.0, 229.0, 481.0, 1327.0, 4280.0, 18543.0, 102389.0, 567372.0, 295583.0, 44767.0, 9325.0, 2448.0, 808.0, 322.0, 151.0, 92.0, 47.0, 39.0, 21.0, 16.0, 9.0, 1.0, 1.0, 6.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.947265625, -3.83038330078125, -3.7135009765625, -3.59661865234375, -3.479736328125, -3.36285400390625, -3.2459716796875, -3.12908935546875, -3.01220703125, -2.89532470703125, -2.7784423828125, -2.66156005859375, -2.544677734375, -2.42779541015625, -2.3109130859375, -2.19403076171875, -2.0771484375, -1.96026611328125, -1.8433837890625, -1.72650146484375, -1.609619140625, -1.49273681640625, -1.3758544921875, -1.25897216796875, -1.14208984375, -1.02520751953125, -0.9083251953125, -0.79144287109375, -0.674560546875, -0.55767822265625, -0.4407958984375, -0.32391357421875, -0.20703125, -0.09014892578125, 0.0267333984375, 0.14361572265625, 0.260498046875, 0.37738037109375, 0.4942626953125, 0.61114501953125, 0.72802734375, 0.84490966796875, 0.9617919921875, 1.07867431640625, 1.195556640625, 1.31243896484375, 1.4293212890625, 1.54620361328125, 1.6630859375, 1.77996826171875, 1.8968505859375, 2.01373291015625, 2.130615234375, 2.24749755859375, 2.3643798828125, 2.48126220703125, 2.59814453125, 2.71502685546875, 2.8319091796875, 2.94879150390625, 3.065673828125, 3.18255615234375, 3.2994384765625, 3.41632080078125, 3.533203125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 10.0, 1.0, 4.0, 8.0, 7.0, 4.0, 9.0, 13.0, 18.0, 23.0, 27.0, 29.0, 37.0, 21.0, 24.0, 33.0, 41.0, 33.0, 47.0, 50.0, 55.0, 49.0, 54.0, 61.0, 42.0, 37.0, 38.0, 42.0, 28.0, 25.0, 21.0, 24.0, 17.0, 20.0, 14.0, 13.0, 8.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3466796875, -1.30303955078125, -1.2593994140625, -1.21575927734375, -1.172119140625, -1.12847900390625, -1.0848388671875, -1.04119873046875, -0.99755859375, -0.95391845703125, -0.9102783203125, -0.86663818359375, -0.822998046875, -0.77935791015625, -0.7357177734375, -0.69207763671875, -0.6484375, -0.60479736328125, -0.5611572265625, -0.51751708984375, -0.473876953125, -0.43023681640625, -0.3865966796875, -0.34295654296875, -0.29931640625, -0.25567626953125, -0.2120361328125, -0.16839599609375, -0.124755859375, -0.08111572265625, -0.0374755859375, 0.00616455078125, 0.0498046875, 0.09344482421875, 0.1370849609375, 0.18072509765625, 0.224365234375, 0.26800537109375, 0.3116455078125, 0.35528564453125, 0.39892578125, 0.44256591796875, 0.4862060546875, 0.52984619140625, 0.573486328125, 0.61712646484375, 0.6607666015625, 0.70440673828125, 0.748046875, 0.79168701171875, 0.8353271484375, 0.87896728515625, 0.922607421875, 0.96624755859375, 1.0098876953125, 1.05352783203125, 1.09716796875, 1.14080810546875, 1.1844482421875, 1.22808837890625, 1.271728515625, 1.31536865234375, 1.3590087890625, 1.40264892578125, 1.4462890625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 6.0, 3.0, 6.0, 9.0, 12.0, 17.0, 29.0, 34.0, 73.0, 98.0, 165.0, 252.0, 613.0, 1404.0, 4921.0, 37340.0, 800761.0, 185847.0, 12756.0, 2475.0, 833.0, 365.0, 199.0, 122.0, 85.0, 45.0, 36.0, 19.0, 16.0, 5.0, 6.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.828125, -5.6446533203125, -5.461181640625, -5.2777099609375, -5.09423828125, -4.9107666015625, -4.727294921875, -4.5438232421875, -4.3603515625, -4.1768798828125, -3.993408203125, -3.8099365234375, -3.62646484375, -3.4429931640625, -3.259521484375, -3.0760498046875, -2.892578125, -2.7091064453125, -2.525634765625, -2.3421630859375, -2.15869140625, -1.9752197265625, -1.791748046875, -1.6082763671875, -1.4248046875, -1.2413330078125, -1.057861328125, -0.8743896484375, -0.69091796875, -0.5074462890625, -0.323974609375, -0.1405029296875, 0.04296875, 0.2264404296875, 0.409912109375, 0.5933837890625, 0.77685546875, 0.9603271484375, 1.143798828125, 1.3272705078125, 1.5107421875, 1.6942138671875, 1.877685546875, 2.0611572265625, 2.24462890625, 2.4281005859375, 2.611572265625, 2.7950439453125, 2.978515625, 3.1619873046875, 3.345458984375, 3.5289306640625, 3.71240234375, 3.8958740234375, 4.079345703125, 4.2628173828125, 4.4462890625, 4.6297607421875, 4.813232421875, 4.9967041015625, 5.18017578125, 5.3636474609375, 5.547119140625, 5.7305908203125, 5.9140625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 6.0, 5.0, 4.0, 9.0, 8.0, 11.0, 21.0, 20.0, 23.0, 23.0, 22.0, 40.0, 34.0, 52.0, 45.0, 47.0, 59.0, 49.0, 48.0, 58.0, 49.0, 54.0, 38.0, 41.0, 41.0, 37.0, 30.0, 24.0, 26.0, 14.0, 9.0, 12.0, 5.0, 8.0, 7.0, 6.0, 7.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.16015625, -4.0157470703125, -3.871337890625, -3.7269287109375, -3.58251953125, -3.4381103515625, -3.293701171875, -3.1492919921875, -3.0048828125, -2.8604736328125, -2.716064453125, -2.5716552734375, -2.42724609375, -2.2828369140625, -2.138427734375, -1.9940185546875, -1.849609375, -1.7052001953125, -1.560791015625, -1.4163818359375, -1.27197265625, -1.1275634765625, -0.983154296875, -0.8387451171875, -0.6943359375, -0.5499267578125, -0.405517578125, -0.2611083984375, -0.11669921875, 0.0277099609375, 0.172119140625, 0.3165283203125, 0.4609375, 0.6053466796875, 0.749755859375, 0.8941650390625, 1.03857421875, 1.1829833984375, 1.327392578125, 1.4718017578125, 1.6162109375, 1.7606201171875, 1.905029296875, 2.0494384765625, 2.19384765625, 2.3382568359375, 2.482666015625, 2.6270751953125, 2.771484375, 2.9158935546875, 3.060302734375, 3.2047119140625, 3.34912109375, 3.4935302734375, 3.637939453125, 3.7823486328125, 3.9267578125, 4.0711669921875, 4.215576171875, 4.3599853515625, 4.50439453125, 4.6488037109375, 4.793212890625, 4.9376220703125, 5.08203125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 8.0, 6.0, 6.0, 11.0, 19.0, 30.0, 36.0, 51.0, 58.0, 102.0, 153.0, 229.0, 353.0, 575.0, 1101.0, 2085.0, 4301.0, 10393.0, 32572.0, 160958.0, 707677.0, 90908.0, 21924.0, 7676.0, 3422.0, 1616.0, 879.0, 506.0, 283.0, 159.0, 138.0, 83.0, 59.0, 39.0, 37.0, 34.0, 14.0, 13.0, 9.0, 5.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0], "bins": [-0.939453125, -0.9104080200195312, -0.8813629150390625, -0.8523178100585938, -0.823272705078125, -0.7942276000976562, -0.7651824951171875, -0.7361373901367188, -0.70709228515625, -0.6780471801757812, -0.6490020751953125, -0.6199569702148438, -0.590911865234375, -0.5618667602539062, -0.5328216552734375, -0.5037765502929688, -0.4747314453125, -0.44568634033203125, -0.4166412353515625, -0.38759613037109375, -0.358551025390625, -0.32950592041015625, -0.3004608154296875, -0.27141571044921875, -0.24237060546875, -0.21332550048828125, -0.1842803955078125, -0.15523529052734375, -0.126190185546875, -0.09714508056640625, -0.0680999755859375, -0.03905487060546875, -0.010009765625, 0.01903533935546875, 0.0480804443359375, 0.07712554931640625, 0.106170654296875, 0.13521575927734375, 0.1642608642578125, 0.19330596923828125, 0.22235107421875, 0.25139617919921875, 0.2804412841796875, 0.30948638916015625, 0.338531494140625, 0.36757659912109375, 0.3966217041015625, 0.42566680908203125, 0.4547119140625, 0.48375701904296875, 0.5128021240234375, 0.5418472290039062, 0.570892333984375, 0.5999374389648438, 0.6289825439453125, 0.6580276489257812, 0.68707275390625, 0.7161178588867188, 0.7451629638671875, 0.7742080688476562, 0.803253173828125, 0.8322982788085938, 0.8613433837890625, 0.8903884887695312, 0.91943359375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 1.0, 11.0, 7.0, 7.0, 8.0, 15.0, 12.0, 21.0, 38.0, 55.0, 107.0, 192.0, 204.0, 120.0, 71.0, 48.0, 24.0, 18.0, 15.0, 5.0, 6.0, 8.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003421306610107422, -0.00033040717244148254, -0.0003186836838722229, -0.00030696019530296326, -0.0002952367067337036, -0.00028351321816444397, -0.0002717897295951843, -0.0002600662410259247, -0.00024834275245666504, -0.0002366192638874054, -0.00022489577531814575, -0.0002131722867488861, -0.00020144879817962646, -0.00018972530961036682, -0.00017800182104110718, -0.00016627833247184753, -0.0001545548439025879, -0.00014283135533332825, -0.0001311078667640686, -0.00011938437819480896, -0.00010766088962554932, -9.593740105628967e-05, -8.421391248703003e-05, -7.249042391777039e-05, -6.076693534851074e-05, -4.90434467792511e-05, -3.7319958209991455e-05, -2.559646964073181e-05, -1.3872981071472168e-05, -2.1494925022125244e-06, 9.573996067047119e-06, 2.1297484636306763e-05, 3.3020973205566406e-05, 4.474446177482605e-05, 5.646795034408569e-05, 6.819143891334534e-05, 7.991492748260498e-05, 9.163841605186462e-05, 0.00010336190462112427, 0.00011508539319038391, 0.00012680888175964355, 0.0001385323703289032, 0.00015025585889816284, 0.00016197934746742249, 0.00017370283603668213, 0.00018542632460594177, 0.00019714981317520142, 0.00020887330174446106, 0.0002205967903137207, 0.00023232027888298035, 0.00024404376745224, 0.00025576725602149963, 0.0002674907445907593, 0.0002792142331600189, 0.00029093772172927856, 0.0003026612102985382, 0.00031438469886779785, 0.0003261081874370575, 0.00033783167600631714, 0.0003495551645755768, 0.0003612786531448364, 0.00037300214171409607, 0.0003847256302833557, 0.00039644911885261536, 0.000408172607421875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 8.0, 14.0, 7.0, 17.0, 22.0, 32.0, 40.0, 53.0, 64.0, 104.0, 164.0, 246.0, 442.0, 732.0, 1406.0, 2897.0, 6685.0, 17555.0, 61186.0, 504045.0, 363117.0, 59688.0, 17266.0, 6482.0, 2974.0, 1332.0, 751.0, 408.0, 271.0, 156.0, 119.0, 79.0, 52.0, 42.0, 36.0, 11.0, 9.0, 9.0, 10.0, 4.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.87939453125, -0.8519058227539062, -0.8244171142578125, -0.7969284057617188, -0.769439697265625, -0.7419509887695312, -0.7144622802734375, -0.6869735717773438, -0.65948486328125, -0.6319961547851562, -0.6045074462890625, -0.5770187377929688, -0.549530029296875, -0.5220413208007812, -0.4945526123046875, -0.46706390380859375, -0.4395751953125, -0.41208648681640625, -0.3845977783203125, -0.35710906982421875, -0.329620361328125, -0.30213165283203125, -0.2746429443359375, -0.24715423583984375, -0.21966552734375, -0.19217681884765625, -0.1646881103515625, -0.13719940185546875, -0.109710693359375, -0.08222198486328125, -0.0547332763671875, -0.02724456787109375, 0.000244140625, 0.02773284912109375, 0.0552215576171875, 0.08271026611328125, 0.110198974609375, 0.13768768310546875, 0.1651763916015625, 0.19266510009765625, 0.22015380859375, 0.24764251708984375, 0.2751312255859375, 0.30261993408203125, 0.330108642578125, 0.35759735107421875, 0.3850860595703125, 0.41257476806640625, 0.4400634765625, 0.46755218505859375, 0.4950408935546875, 0.5225296020507812, 0.550018310546875, 0.5775070190429688, 0.6049957275390625, 0.6324844360351562, 0.65997314453125, 0.6874618530273438, 0.7149505615234375, 0.7424392700195312, 0.769927978515625, 0.7974166870117188, 0.8249053955078125, 0.8523941040039062, 0.8798828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 3.0, 2.0, 4.0, 2.0, 4.0, 9.0, 9.0, 11.0, 15.0, 19.0, 30.0, 41.0, 58.0, 61.0, 109.0, 109.0, 111.0, 94.0, 87.0, 52.0, 40.0, 36.0, 15.0, 12.0, 10.0, 12.0, 8.0, 4.0, 8.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.083984375, -1.053009033203125, -1.02203369140625, -0.991058349609375, -0.9600830078125, -0.929107666015625, -0.89813232421875, -0.867156982421875, -0.836181640625, -0.805206298828125, -0.77423095703125, -0.743255615234375, -0.7122802734375, -0.681304931640625, -0.65032958984375, -0.619354248046875, -0.58837890625, -0.557403564453125, -0.52642822265625, -0.495452880859375, -0.4644775390625, -0.433502197265625, -0.40252685546875, -0.371551513671875, -0.340576171875, -0.309600830078125, -0.27862548828125, -0.247650146484375, -0.2166748046875, -0.185699462890625, -0.15472412109375, -0.123748779296875, -0.0927734375, -0.061798095703125, -0.03082275390625, 0.000152587890625, 0.0311279296875, 0.062103271484375, 0.09307861328125, 0.124053955078125, 0.155029296875, 0.186004638671875, 0.21697998046875, 0.247955322265625, 0.2789306640625, 0.309906005859375, 0.34088134765625, 0.371856689453125, 0.40283203125, 0.433807373046875, 0.46478271484375, 0.495758056640625, 0.5267333984375, 0.557708740234375, 0.58868408203125, 0.619659423828125, 0.650634765625, 0.681610107421875, 0.71258544921875, 0.743560791015625, 0.7745361328125, 0.805511474609375, 0.83648681640625, 0.867462158203125, 0.8984375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 6.0, 29.0, 57.0, 179.0, 428.0, 164.0, 76.0, 26.0, 9.0, 7.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.633563995361328, -19.302579879760742, -17.97159767150879, -16.640613555908203, -15.309630393981934, -13.978647232055664, -12.647663116455078, -11.316679954528809, -9.985696792602539, -8.65471363067627, -7.323729991912842, -5.992746353149414, -4.6617631912231445, -3.330780029296875, -1.9997963905334473, -0.6688127517700195, 0.66217041015625, 1.9931538105010986, 3.3241372108459473, 4.655120849609375, 5.9861040115356445, 7.317087173461914, 8.6480712890625, 9.97905445098877, 11.310037612915039, 12.641020774841309, 13.972003936767578, 15.302988052368164, 16.63397216796875, 17.964954376220703, 19.29593849182129, 20.626922607421875, 21.957908630371094, 23.28889274597168, 24.619874954223633, 25.95085906982422, 27.281841278076172, 28.612825393676758, 29.943809509277344, 31.274791717529297, 32.60577392578125, 33.9367561340332, 35.26774215698242, 36.598724365234375, 37.92970657348633, 39.26068878173828, 40.5916748046875, 41.92265701293945, 43.25364303588867, 44.584625244140625, 45.915611267089844, 47.2465934753418, 48.57757568359375, 49.90856170654297, 51.23954391479492, 52.570526123046875, 53.901512145996094, 55.23249435424805, 56.563480377197266, 57.89446258544922, 59.22544479370117, 60.556427001953125, 61.887413024902344, 63.2183952331543, 64.54937744140625]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 9.0, 4.0, 8.0, 6.0, 16.0, 20.0, 21.0, 20.0, 27.0, 32.0, 31.0, 33.0, 37.0, 42.0, 63.0, 101.0, 97.0, 85.0, 43.0, 37.0, 37.0, 28.0, 35.0, 22.0, 22.0, 28.0, 16.0, 21.0, 7.0, 11.0, 6.0, 6.0, 7.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.488295555114746, -14.91494083404541, -14.341586112976074, -13.768231391906738, -13.194877624511719, -12.621522903442383, -12.048168182373047, -11.474813461303711, -10.901458740234375, -10.328104019165039, -9.754749298095703, -9.181394577026367, -8.608039855957031, -8.034685134887695, -7.461331367492676, -6.88797664642334, -6.314621925354004, -5.741267204284668, -5.167912483215332, -4.594558238983154, -4.021203517913818, -3.4478487968444824, -2.8744943141937256, -2.3011398315429688, -1.7277851104736328, -1.1544305086135864, -0.58107590675354, -0.007721304893493652, 0.5656332969665527, 1.1389880180358887, 1.7123425006866455, 2.2856969833374023, 2.8590526580810547, 3.4324073791503906, 4.005762100219727, 4.579116344451904, 5.15247106552124, 5.725825786590576, 6.299180030822754, 6.87253475189209, 7.445889472961426, 8.019244194030762, 8.592598915100098, 9.165953636169434, 9.739307403564453, 10.312662124633789, 10.886016845703125, 11.459371566772461, 12.032726287841797, 12.606081008911133, 13.179435729980469, 13.752790451049805, 14.32614517211914, 14.899499893188477, 15.472853660583496, 16.046207427978516, 16.619564056396484, 17.19291877746582, 17.766273498535156, 18.339628219604492, 18.912982940673828, 19.486337661743164, 20.0596923828125, 20.633045196533203, 21.20639991760254]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 15.0, 22.0, 38.0, 68.0, 68.0, 127.0, 248.0, 375.0, 751.0, 1834.0, 4821.0, 18947.0, 131005.0, 1643452.0, 2166722.0, 191298.0, 24315.0, 6000.0, 2219.0, 884.0, 445.0, 257.0, 149.0, 85.0, 41.0, 26.0, 22.0, 12.0, 8.0, 7.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.59765625, -2.527587890625, -2.45751953125, -2.387451171875, -2.3173828125, -2.247314453125, -2.17724609375, -2.107177734375, -2.037109375, -1.967041015625, -1.89697265625, -1.826904296875, -1.7568359375, -1.686767578125, -1.61669921875, -1.546630859375, -1.4765625, -1.406494140625, -1.33642578125, -1.266357421875, -1.1962890625, -1.126220703125, -1.05615234375, -0.986083984375, -0.916015625, -0.845947265625, -0.77587890625, -0.705810546875, -0.6357421875, -0.565673828125, -0.49560546875, -0.425537109375, -0.35546875, -0.285400390625, -0.21533203125, -0.145263671875, -0.0751953125, -0.005126953125, 0.06494140625, 0.135009765625, 0.205078125, 0.275146484375, 0.34521484375, 0.415283203125, 0.4853515625, 0.555419921875, 0.62548828125, 0.695556640625, 0.765625, 0.835693359375, 0.90576171875, 0.975830078125, 1.0458984375, 1.115966796875, 1.18603515625, 1.256103515625, 1.326171875, 1.396240234375, 1.46630859375, 1.536376953125, 1.6064453125, 1.676513671875, 1.74658203125, 1.816650390625, 1.88671875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 6.0, 10.0, 9.0, 13.0, 5.0, 14.0, 15.0, 19.0, 16.0, 27.0, 25.0, 30.0, 26.0, 30.0, 29.0, 29.0, 36.0, 48.0, 44.0, 48.0, 47.0, 43.0, 51.0, 36.0, 34.0, 41.0, 31.0, 34.0, 32.0, 25.0, 28.0, 28.0, 13.0, 16.0, 7.0, 7.0, 13.0, 4.0, 6.0, 3.0, 5.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1962890625, -1.1597747802734375, -1.123260498046875, -1.0867462158203125, -1.05023193359375, -1.0137176513671875, -0.977203369140625, -0.9406890869140625, -0.9041748046875, -0.8676605224609375, -0.831146240234375, -0.7946319580078125, -0.75811767578125, -0.7216033935546875, -0.685089111328125, -0.6485748291015625, -0.612060546875, -0.5755462646484375, -0.539031982421875, -0.5025177001953125, -0.46600341796875, -0.4294891357421875, -0.392974853515625, -0.3564605712890625, -0.3199462890625, -0.2834320068359375, -0.246917724609375, -0.2104034423828125, -0.17388916015625, -0.1373748779296875, -0.100860595703125, -0.0643463134765625, -0.02783203125, 0.0086822509765625, 0.045196533203125, 0.0817108154296875, 0.11822509765625, 0.1547393798828125, 0.191253662109375, 0.2277679443359375, 0.2642822265625, 0.3007965087890625, 0.337310791015625, 0.3738250732421875, 0.41033935546875, 0.4468536376953125, 0.483367919921875, 0.5198822021484375, 0.556396484375, 0.5929107666015625, 0.629425048828125, 0.6659393310546875, 0.70245361328125, 0.7389678955078125, 0.775482177734375, 0.8119964599609375, 0.8485107421875, 0.8850250244140625, 0.921539306640625, 0.9580535888671875, 0.99456787109375, 1.0310821533203125, 1.067596435546875, 1.1041107177734375, 1.140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 9.0, 3.0, 8.0, 9.0, 13.0, 21.0, 29.0, 46.0, 59.0, 79.0, 144.0, 323.0, 826.0, 2369.0, 10639.0, 84939.0, 2602130.0, 1425360.0, 55917.0, 8184.0, 1865.0, 645.0, 276.0, 133.0, 72.0, 58.0, 36.0, 25.0, 19.0, 11.0, 8.0, 13.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.953125, -2.854400634765625, -2.75567626953125, -2.656951904296875, -2.5582275390625, -2.459503173828125, -2.36077880859375, -2.262054443359375, -2.163330078125, -2.064605712890625, -1.96588134765625, -1.867156982421875, -1.7684326171875, -1.669708251953125, -1.57098388671875, -1.472259521484375, -1.37353515625, -1.274810791015625, -1.17608642578125, -1.077362060546875, -0.9786376953125, -0.879913330078125, -0.78118896484375, -0.682464599609375, -0.583740234375, -0.485015869140625, -0.38629150390625, -0.287567138671875, -0.1888427734375, -0.090118408203125, 0.00860595703125, 0.107330322265625, 0.2060546875, 0.304779052734375, 0.40350341796875, 0.502227783203125, 0.6009521484375, 0.699676513671875, 0.79840087890625, 0.897125244140625, 0.995849609375, 1.094573974609375, 1.19329833984375, 1.292022705078125, 1.3907470703125, 1.489471435546875, 1.58819580078125, 1.686920166015625, 1.78564453125, 1.884368896484375, 1.98309326171875, 2.081817626953125, 2.1805419921875, 2.279266357421875, 2.37799072265625, 2.476715087890625, 2.575439453125, 2.674163818359375, 2.77288818359375, 2.871612548828125, 2.9703369140625, 3.069061279296875, 3.16778564453125, 3.266510009765625, 3.365234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 7.0, 9.0, 14.0, 17.0, 29.0, 31.0, 56.0, 62.0, 116.0, 184.0, 265.0, 460.0, 621.0, 658.0, 508.0, 346.0, 207.0, 161.0, 83.0, 61.0, 36.0, 33.0, 24.0, 21.0, 16.0, 11.0, 6.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.208984375, -3.129180908203125, -3.04937744140625, -2.969573974609375, -2.8897705078125, -2.809967041015625, -2.73016357421875, -2.650360107421875, -2.570556640625, -2.490753173828125, -2.41094970703125, -2.331146240234375, -2.2513427734375, -2.171539306640625, -2.09173583984375, -2.011932373046875, -1.93212890625, -1.852325439453125, -1.77252197265625, -1.692718505859375, -1.6129150390625, -1.533111572265625, -1.45330810546875, -1.373504638671875, -1.293701171875, -1.213897705078125, -1.13409423828125, -1.054290771484375, -0.9744873046875, -0.894683837890625, -0.81488037109375, -0.735076904296875, -0.6552734375, -0.575469970703125, -0.49566650390625, -0.415863037109375, -0.3360595703125, -0.256256103515625, -0.17645263671875, -0.096649169921875, -0.016845703125, 0.062957763671875, 0.14276123046875, 0.222564697265625, 0.3023681640625, 0.382171630859375, 0.46197509765625, 0.541778564453125, 0.62158203125, 0.701385498046875, 0.78118896484375, 0.860992431640625, 0.9407958984375, 1.020599365234375, 1.10040283203125, 1.180206298828125, 1.260009765625, 1.339813232421875, 1.41961669921875, 1.499420166015625, 1.5792236328125, 1.659027099609375, 1.73883056640625, 1.818634033203125, 1.8984375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 4.0, 3.0, 17.0, 40.0, 121.0, 247.0, 307.0, 170.0, 57.0, 21.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-58.03443908691406, -56.85390853881836, -55.673377990722656, -54.49284362792969, -53.312313079833984, -52.13178253173828, -50.95125198364258, -49.770721435546875, -48.59019088745117, -47.40966033935547, -46.229129791259766, -45.04859924316406, -43.868064880371094, -42.68753433227539, -41.50700378417969, -40.326473236083984, -39.14594268798828, -37.96541213989258, -36.784881591796875, -35.604347229003906, -34.4238166809082, -33.2432861328125, -32.0627555847168, -30.882225036621094, -29.701690673828125, -28.521160125732422, -27.340627670288086, -26.160097122192383, -24.97956657409668, -23.799034118652344, -22.61850357055664, -21.437973022460938, -20.257444381713867, -19.076913833618164, -17.896381378173828, -16.715850830078125, -15.535320281982422, -14.354788780212402, -13.174257278442383, -11.99372673034668, -10.81319522857666, -9.63266372680664, -8.452133178710938, -7.271601676940918, -6.091070652008057, -4.910539627075195, -3.730008125305176, -2.5494775772094727, -1.3689460754394531, -0.18841493129730225, 0.9921162128448486, 2.172647476196289, 3.3531785011291504, 4.533709526062012, 5.714241027832031, 6.894771575927734, 8.075303077697754, 9.255834579467773, 10.436365127563477, 11.616896629333496, 12.797428131103516, 13.977958679199219, 15.158490180969238, 16.339019775390625, 17.51955223083496]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 3.0, 9.0, 6.0, 12.0, 18.0, 15.0, 24.0, 21.0, 47.0, 35.0, 44.0, 33.0, 52.0, 75.0, 61.0, 56.0, 61.0, 62.0, 54.0, 38.0, 49.0, 35.0, 41.0, 32.0, 24.0, 31.0, 10.0, 16.0, 10.0, 7.0, 4.0, 9.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.297502517700195, -13.884312629699707, -13.471122741699219, -13.05793285369873, -12.644742965698242, -12.231552124023438, -11.818363189697266, -11.405172348022461, -10.991982460021973, -10.578792572021484, -10.165602684020996, -9.752412796020508, -9.33922290802002, -8.926033020019531, -8.512842178344727, -8.099652290344238, -7.686462879180908, -7.27327299118042, -6.860083103179932, -6.446892738342285, -6.033702850341797, -5.620512962341309, -5.20732307434082, -4.794133186340332, -4.380943298339844, -3.9677534103393555, -3.554563283920288, -3.1413733959198, -2.7281832695007324, -2.314993381500244, -1.9018034934997559, -1.4886133670806885, -1.075423240661621, -0.6622332334518433, -0.2490432858467102, 0.16414666175842285, 0.5773366689682007, 0.9905266761779785, 1.4037165641784668, 1.8169066905975342, 2.2300965785980225, 2.6432864665985107, 3.056476593017578, 3.4696664810180664, 3.8828563690185547, 4.296046257019043, 4.709236145019531, 5.122426509857178, 5.535616397857666, 5.948806285858154, 6.361996173858643, 6.775186538696289, 7.188376426696777, 7.601566314697266, 8.014756202697754, 8.427946090698242, 8.84113597869873, 9.254325866699219, 9.667515754699707, 10.080705642700195, 10.493895530700684, 10.907085418701172, 11.320276260375977, 11.733466148376465, 12.146656036376953]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 17.0, 18.0, 28.0, 39.0, 84.0, 128.0, 255.0, 457.0, 1088.0, 2664.0, 7323.0, 23789.0, 98746.0, 478573.0, 342222.0, 65939.0, 17589.0, 5663.0, 2114.0, 897.0, 421.0, 222.0, 88.0, 64.0, 44.0, 26.0, 18.0, 10.0, 3.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.69140625, -3.582427978515625, -3.47344970703125, -3.364471435546875, -3.2554931640625, -3.146514892578125, -3.03753662109375, -2.928558349609375, -2.819580078125, -2.710601806640625, -2.60162353515625, -2.492645263671875, -2.3836669921875, -2.274688720703125, -2.16571044921875, -2.056732177734375, -1.94775390625, -1.838775634765625, -1.72979736328125, -1.620819091796875, -1.5118408203125, -1.402862548828125, -1.29388427734375, -1.184906005859375, -1.075927734375, -0.966949462890625, -0.85797119140625, -0.748992919921875, -0.6400146484375, -0.531036376953125, -0.42205810546875, -0.313079833984375, -0.2041015625, -0.095123291015625, 0.01385498046875, 0.122833251953125, 0.2318115234375, 0.340789794921875, 0.44976806640625, 0.558746337890625, 0.667724609375, 0.776702880859375, 0.88568115234375, 0.994659423828125, 1.1036376953125, 1.212615966796875, 1.32159423828125, 1.430572509765625, 1.53955078125, 1.648529052734375, 1.75750732421875, 1.866485595703125, 1.9754638671875, 2.084442138671875, 2.19342041015625, 2.302398681640625, 2.411376953125, 2.520355224609375, 2.62933349609375, 2.738311767578125, 2.8472900390625, 2.956268310546875, 3.06524658203125, 3.174224853515625, 3.283203125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 3.0, 10.0, 4.0, 4.0, 8.0, 8.0, 7.0, 8.0, 21.0, 24.0, 15.0, 31.0, 19.0, 33.0, 36.0, 43.0, 34.0, 37.0, 42.0, 50.0, 32.0, 46.0, 40.0, 45.0, 45.0, 31.0, 52.0, 43.0, 31.0, 29.0, 38.0, 21.0, 15.0, 12.0, 15.0, 17.0, 12.0, 9.0, 7.0, 5.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.189453125, -1.15142822265625, -1.1134033203125, -1.07537841796875, -1.037353515625, -0.99932861328125, -0.9613037109375, -0.92327880859375, -0.88525390625, -0.84722900390625, -0.8092041015625, -0.77117919921875, -0.733154296875, -0.69512939453125, -0.6571044921875, -0.61907958984375, -0.5810546875, -0.54302978515625, -0.5050048828125, -0.46697998046875, -0.428955078125, -0.39093017578125, -0.3529052734375, -0.31488037109375, -0.27685546875, -0.23883056640625, -0.2008056640625, -0.16278076171875, -0.124755859375, -0.08673095703125, -0.0487060546875, -0.01068115234375, 0.02734375, 0.06536865234375, 0.1033935546875, 0.14141845703125, 0.179443359375, 0.21746826171875, 0.2554931640625, 0.29351806640625, 0.33154296875, 0.36956787109375, 0.4075927734375, 0.44561767578125, 0.483642578125, 0.52166748046875, 0.5596923828125, 0.59771728515625, 0.6357421875, 0.67376708984375, 0.7117919921875, 0.74981689453125, 0.787841796875, 0.82586669921875, 0.8638916015625, 0.90191650390625, 0.93994140625, 0.97796630859375, 1.0159912109375, 1.05401611328125, 1.092041015625, 1.13006591796875, 1.1680908203125, 1.20611572265625, 1.244140625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 10.0, 6.0, 13.0, 10.0, 17.0, 27.0, 38.0, 59.0, 77.0, 143.0, 227.0, 341.0, 617.0, 1369.0, 3312.0, 14811.0, 224938.0, 767605.0, 26739.0, 4681.0, 1675.0, 774.0, 419.0, 222.0, 157.0, 89.0, 51.0, 35.0, 26.0, 18.0, 15.0, 9.0, 4.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.6328125, -4.45556640625, -4.2783203125, -4.10107421875, -3.923828125, -3.74658203125, -3.5693359375, -3.39208984375, -3.21484375, -3.03759765625, -2.8603515625, -2.68310546875, -2.505859375, -2.32861328125, -2.1513671875, -1.97412109375, -1.796875, -1.61962890625, -1.4423828125, -1.26513671875, -1.087890625, -0.91064453125, -0.7333984375, -0.55615234375, -0.37890625, -0.20166015625, -0.0244140625, 0.15283203125, 0.330078125, 0.50732421875, 0.6845703125, 0.86181640625, 1.0390625, 1.21630859375, 1.3935546875, 1.57080078125, 1.748046875, 1.92529296875, 2.1025390625, 2.27978515625, 2.45703125, 2.63427734375, 2.8115234375, 2.98876953125, 3.166015625, 3.34326171875, 3.5205078125, 3.69775390625, 3.875, 4.05224609375, 4.2294921875, 4.40673828125, 4.583984375, 4.76123046875, 4.9384765625, 5.11572265625, 5.29296875, 5.47021484375, 5.6474609375, 5.82470703125, 6.001953125, 6.17919921875, 6.3564453125, 6.53369140625, 6.7109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 9.0, 10.0, 6.0, 12.0, 20.0, 26.0, 20.0, 34.0, 32.0, 46.0, 44.0, 63.0, 70.0, 72.0, 64.0, 70.0, 81.0, 55.0, 52.0, 46.0, 30.0, 28.0, 22.0, 15.0, 19.0, 13.0, 12.0, 11.0, 2.0, 7.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.5078125, -6.3343505859375, -6.160888671875, -5.9874267578125, -5.81396484375, -5.6405029296875, -5.467041015625, -5.2935791015625, -5.1201171875, -4.9466552734375, -4.773193359375, -4.5997314453125, -4.42626953125, -4.2528076171875, -4.079345703125, -3.9058837890625, -3.732421875, -3.5589599609375, -3.385498046875, -3.2120361328125, -3.03857421875, -2.8651123046875, -2.691650390625, -2.5181884765625, -2.3447265625, -2.1712646484375, -1.997802734375, -1.8243408203125, -1.65087890625, -1.4774169921875, -1.303955078125, -1.1304931640625, -0.95703125, -0.7835693359375, -0.610107421875, -0.4366455078125, -0.26318359375, -0.0897216796875, 0.083740234375, 0.2572021484375, 0.4306640625, 0.6041259765625, 0.777587890625, 0.9510498046875, 1.12451171875, 1.2979736328125, 1.471435546875, 1.6448974609375, 1.818359375, 1.9918212890625, 2.165283203125, 2.3387451171875, 2.51220703125, 2.6856689453125, 2.859130859375, 3.0325927734375, 3.2060546875, 3.3795166015625, 3.552978515625, 3.7264404296875, 3.89990234375, 4.0733642578125, 4.246826171875, 4.4202880859375, 4.59375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 5.0, 6.0, 15.0, 9.0, 7.0, 11.0, 15.0, 24.0, 34.0, 40.0, 63.0, 81.0, 164.0, 297.0, 661.0, 1819.0, 6903.0, 76001.0, 933609.0, 22663.0, 3870.0, 1127.0, 465.0, 226.0, 123.0, 76.0, 42.0, 45.0, 40.0, 26.0, 18.0, 14.0, 13.0, 13.0, 3.0, 11.0, 4.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.333984375, -2.248504638671875, -2.16302490234375, -2.077545166015625, -1.9920654296875, -1.906585693359375, -1.82110595703125, -1.735626220703125, -1.650146484375, -1.564666748046875, -1.47918701171875, -1.393707275390625, -1.3082275390625, -1.222747802734375, -1.13726806640625, -1.051788330078125, -0.96630859375, -0.880828857421875, -0.79534912109375, -0.709869384765625, -0.6243896484375, -0.538909912109375, -0.45343017578125, -0.367950439453125, -0.282470703125, -0.196990966796875, -0.11151123046875, -0.026031494140625, 0.0594482421875, 0.144927978515625, 0.23040771484375, 0.315887451171875, 0.4013671875, 0.486846923828125, 0.57232666015625, 0.657806396484375, 0.7432861328125, 0.828765869140625, 0.91424560546875, 0.999725341796875, 1.085205078125, 1.170684814453125, 1.25616455078125, 1.341644287109375, 1.4271240234375, 1.512603759765625, 1.59808349609375, 1.683563232421875, 1.76904296875, 1.854522705078125, 1.94000244140625, 2.025482177734375, 2.1109619140625, 2.196441650390625, 2.28192138671875, 2.367401123046875, 2.452880859375, 2.538360595703125, 2.62384033203125, 2.709320068359375, 2.7947998046875, 2.880279541015625, 2.96575927734375, 3.051239013671875, 3.13671875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 7.0, 7.0, 8.0, 14.0, 26.0, 52.0, 123.0, 334.0, 229.0, 87.0, 43.0, 23.0, 14.0, 2.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0009026527404785156, -0.0008820630609989166, -0.0008614733815193176, -0.0008408837020397186, -0.0008202940225601196, -0.0007997043430805206, -0.0007791146636009216, -0.0007585249841213226, -0.0007379353046417236, -0.0007173456251621246, -0.0006967559456825256, -0.0006761662662029266, -0.0006555765867233276, -0.0006349869072437286, -0.0006143972277641296, -0.0005938075482845306, -0.0005732178688049316, -0.0005526281893253326, -0.0005320385098457336, -0.0005114488303661346, -0.0004908591508865356, -0.00047026947140693665, -0.00044967979192733765, -0.00042909011244773865, -0.00040850043296813965, -0.00038791075348854065, -0.00036732107400894165, -0.00034673139452934265, -0.00032614171504974365, -0.00030555203557014465, -0.00028496235609054565, -0.00026437267661094666, -0.00024378299713134766, -0.00022319331765174866, -0.00020260363817214966, -0.00018201395869255066, -0.00016142427921295166, -0.00014083459973335266, -0.00012024492025375366, -9.965524077415466e-05, -7.906556129455566e-05, -5.8475881814956665e-05, -3.7886202335357666e-05, -1.7296522855758667e-05, 3.293156623840332e-06, 2.388283610343933e-05, 4.447251558303833e-05, 6.506219506263733e-05, 8.565187454223633e-05, 0.00010624155402183533, 0.00012683123350143433, 0.00014742091298103333, 0.00016801059246063232, 0.00018860027194023132, 0.00020918995141983032, 0.00022977963089942932, 0.0002503693103790283, 0.0002709589898586273, 0.0002915486693382263, 0.0003121383488178253, 0.0003327280282974243, 0.0003533177077770233, 0.0003739073872566223, 0.0003944970667362213, 0.0004150867462158203]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 7.0, 8.0, 9.0, 13.0, 23.0, 16.0, 31.0, 35.0, 61.0, 79.0, 158.0, 265.0, 483.0, 979.0, 2365.0, 6042.0, 22401.0, 217920.0, 744634.0, 38930.0, 8385.0, 3072.0, 1195.0, 608.0, 305.0, 155.0, 121.0, 55.0, 49.0, 41.0, 21.0, 19.0, 19.0, 8.0, 6.0, 7.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2080078125, -1.16351318359375, -1.1190185546875, -1.07452392578125, -1.030029296875, -0.98553466796875, -0.9410400390625, -0.89654541015625, -0.85205078125, -0.80755615234375, -0.7630615234375, -0.71856689453125, -0.674072265625, -0.62957763671875, -0.5850830078125, -0.54058837890625, -0.49609375, -0.45159912109375, -0.4071044921875, -0.36260986328125, -0.318115234375, -0.27362060546875, -0.2291259765625, -0.18463134765625, -0.14013671875, -0.09564208984375, -0.0511474609375, -0.00665283203125, 0.037841796875, 0.08233642578125, 0.1268310546875, 0.17132568359375, 0.2158203125, 0.26031494140625, 0.3048095703125, 0.34930419921875, 0.393798828125, 0.43829345703125, 0.4827880859375, 0.52728271484375, 0.57177734375, 0.61627197265625, 0.6607666015625, 0.70526123046875, 0.749755859375, 0.79425048828125, 0.8387451171875, 0.88323974609375, 0.927734375, 0.97222900390625, 1.0167236328125, 1.06121826171875, 1.105712890625, 1.15020751953125, 1.1947021484375, 1.23919677734375, 1.28369140625, 1.32818603515625, 1.3726806640625, 1.41717529296875, 1.461669921875, 1.50616455078125, 1.5506591796875, 1.59515380859375, 1.6396484375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 15.0, 10.0, 10.0, 30.0, 37.0, 52.0, 112.0, 180.0, 225.0, 127.0, 84.0, 36.0, 28.0, 23.0, 12.0, 7.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4892578125, -1.4345550537109375, -1.379852294921875, -1.3251495361328125, -1.27044677734375, -1.2157440185546875, -1.161041259765625, -1.1063385009765625, -1.0516357421875, -0.9969329833984375, -0.942230224609375, -0.8875274658203125, -0.83282470703125, -0.7781219482421875, -0.723419189453125, -0.6687164306640625, -0.614013671875, -0.5593109130859375, -0.504608154296875, -0.4499053955078125, -0.39520263671875, -0.3404998779296875, -0.285797119140625, -0.2310943603515625, -0.1763916015625, -0.1216888427734375, -0.066986083984375, -0.0122833251953125, 0.04241943359375, 0.0971221923828125, 0.151824951171875, 0.2065277099609375, 0.26123046875, 0.3159332275390625, 0.370635986328125, 0.4253387451171875, 0.48004150390625, 0.5347442626953125, 0.589447021484375, 0.6441497802734375, 0.6988525390625, 0.7535552978515625, 0.808258056640625, 0.8629608154296875, 0.91766357421875, 0.9723663330078125, 1.027069091796875, 1.0817718505859375, 1.136474609375, 1.1911773681640625, 1.245880126953125, 1.3005828857421875, 1.35528564453125, 1.4099884033203125, 1.464691162109375, 1.5193939208984375, 1.5740966796875, 1.6287994384765625, 1.683502197265625, 1.7382049560546875, 1.79290771484375, 1.8476104736328125, 1.902313232421875, 1.9570159912109375, 2.01171875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 10.0, 9.0, 20.0, 50.0, 90.0, 230.0, 358.0, 112.0, 56.0, 24.0, 9.0, 15.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.92510986328125, -23.748525619506836, -22.571941375732422, -21.395357131958008, -20.218772888183594, -19.042186737060547, -17.865602493286133, -16.68901824951172, -15.512434005737305, -14.33584976196289, -13.159265518188477, -11.982680320739746, -10.806096076965332, -9.629511833190918, -8.452926635742188, -7.276342391967773, -6.099758148193359, -4.923173904418945, -3.746589183807373, -2.57000470161438, -1.3934202194213867, -0.21683597564697266, 0.9597487449645996, 2.136333465576172, 3.312917709350586, 4.489501953125, 5.666086673736572, 6.8426713943481445, 8.019255638122559, 9.195839881896973, 10.372425079345703, 11.549009323120117, 12.725589752197266, 13.90217399597168, 15.078758239746094, 16.255342483520508, 17.431926727294922, 18.60851287841797, 19.785097122192383, 20.961681365966797, 22.13826560974121, 23.314849853515625, 24.49143409729004, 25.668018341064453, 26.8446044921875, 28.02118682861328, 29.197772979736328, 30.374357223510742, 31.550941467285156, 32.7275276184082, 33.904109954833984, 35.08069610595703, 36.25727844238281, 37.43386459350586, 38.61044692993164, 39.78703308105469, 40.96361541748047, 42.140201568603516, 43.3167839050293, 44.493370056152344, 45.669952392578125, 46.84653854370117, 48.02312088012695, 49.19970703125, 50.37629318237305]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 6.0, 4.0, 8.0, 7.0, 10.0, 10.0, 16.0, 7.0, 10.0, 21.0, 15.0, 14.0, 21.0, 34.0, 23.0, 30.0, 28.0, 47.0, 95.0, 122.0, 89.0, 46.0, 50.0, 29.0, 28.0, 24.0, 23.0, 17.0, 23.0, 19.0, 14.0, 8.0, 17.0, 8.0, 10.0, 13.0, 7.0, 6.0, 5.0, 6.0, 3.0, 3.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-14.337566375732422, -13.870434761047363, -13.403304100036621, -12.936172485351562, -12.46904182434082, -12.001910209655762, -11.534778594970703, -11.067647933959961, -10.600517272949219, -10.13338565826416, -9.666254997253418, -9.19912338256836, -8.731992721557617, -8.264861106872559, -7.797729969024658, -7.330598831176758, -6.863467216491699, -6.396336078643799, -5.929204940795898, -5.46207332611084, -4.994942665100098, -4.527811050415039, -4.060679912567139, -3.5935487747192383, -3.126417636871338, -2.6592864990234375, -2.192155361175537, -1.7250239849090576, -1.2578928470611572, -0.7907617092132568, -0.32363033294677734, 0.14350080490112305, 0.6106328964233398, 1.0777640342712402, 1.5448952913284302, 2.01202654838562, 2.4791576862335205, 2.946288824081421, 3.4134202003479004, 3.880551338195801, 4.347682476043701, 4.814813613891602, 5.281944751739502, 5.749075889587402, 6.216207504272461, 6.683338165283203, 7.150469779968262, 7.617600917816162, 8.084732055664062, 8.551863670349121, 9.018994331359863, 9.486125946044922, 9.953256607055664, 10.420388221740723, 10.887519836425781, 11.354650497436523, 11.821781158447266, 12.288912773132324, 12.756043434143066, 13.223175048828125, 13.690305709838867, 14.157437324523926, 14.624568939208984, 15.091699600219727, 15.558831214904785]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 8.0, 19.0, 19.0, 44.0, 75.0, 142.0, 330.0, 709.0, 1646.0, 4599.0, 17099.0, 137419.0, 1919539.0, 1938047.0, 149235.0, 17936.0, 4565.0, 1603.0, 628.0, 305.0, 124.0, 87.0, 44.0, 23.0, 10.0, 9.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.658203125, -3.550628662109375, -3.44305419921875, -3.335479736328125, -3.2279052734375, -3.120330810546875, -3.01275634765625, -2.905181884765625, -2.797607421875, -2.690032958984375, -2.58245849609375, -2.474884033203125, -2.3673095703125, -2.259735107421875, -2.15216064453125, -2.044586181640625, -1.93701171875, -1.829437255859375, -1.72186279296875, -1.614288330078125, -1.5067138671875, -1.399139404296875, -1.29156494140625, -1.183990478515625, -1.076416015625, -0.968841552734375, -0.86126708984375, -0.753692626953125, -0.6461181640625, -0.538543701171875, -0.43096923828125, -0.323394775390625, -0.2158203125, -0.108245849609375, -0.00067138671875, 0.106903076171875, 0.2144775390625, 0.322052001953125, 0.42962646484375, 0.537200927734375, 0.644775390625, 0.752349853515625, 0.85992431640625, 0.967498779296875, 1.0750732421875, 1.182647705078125, 1.29022216796875, 1.397796630859375, 1.50537109375, 1.612945556640625, 1.72052001953125, 1.828094482421875, 1.9356689453125, 2.043243408203125, 2.15081787109375, 2.258392333984375, 2.365966796875, 2.473541259765625, 2.58111572265625, 2.688690185546875, 2.7962646484375, 2.903839111328125, 3.01141357421875, 3.118988037109375, 3.2265625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 5.0, 6.0, 6.0, 10.0, 15.0, 15.0, 10.0, 20.0, 23.0, 27.0, 26.0, 38.0, 32.0, 35.0, 35.0, 42.0, 45.0, 55.0, 39.0, 47.0, 54.0, 52.0, 33.0, 30.0, 41.0, 47.0, 31.0, 26.0, 22.0, 26.0, 15.0, 21.0, 13.0, 13.0, 8.0, 10.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2470703125, -1.2110595703125, -1.175048828125, -1.1390380859375, -1.10302734375, -1.0670166015625, -1.031005859375, -0.9949951171875, -0.958984375, -0.9229736328125, -0.886962890625, -0.8509521484375, -0.81494140625, -0.7789306640625, -0.742919921875, -0.7069091796875, -0.6708984375, -0.6348876953125, -0.598876953125, -0.5628662109375, -0.52685546875, -0.4908447265625, -0.454833984375, -0.4188232421875, -0.3828125, -0.3468017578125, -0.310791015625, -0.2747802734375, -0.23876953125, -0.2027587890625, -0.166748046875, -0.1307373046875, -0.0947265625, -0.0587158203125, -0.022705078125, 0.0133056640625, 0.04931640625, 0.0853271484375, 0.121337890625, 0.1573486328125, 0.193359375, 0.2293701171875, 0.265380859375, 0.3013916015625, 0.33740234375, 0.3734130859375, 0.409423828125, 0.4454345703125, 0.4814453125, 0.5174560546875, 0.553466796875, 0.5894775390625, 0.62548828125, 0.6614990234375, 0.697509765625, 0.7335205078125, 0.76953125, 0.8055419921875, 0.841552734375, 0.8775634765625, 0.91357421875, 0.9495849609375, 0.985595703125, 1.0216064453125, 1.0576171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 2.0, 4.0, 23.0, 25.0, 50.0, 98.0, 184.0, 528.0, 1618.0, 8058.0, 1799151.0, 2373057.0, 8927.0, 1674.0, 499.0, 207.0, 79.0, 41.0, 15.0, 11.0, 10.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.984375, -13.616455078125, -13.24853515625, -12.880615234375, -12.5126953125, -12.144775390625, -11.77685546875, -11.408935546875, -11.041015625, -10.673095703125, -10.30517578125, -9.937255859375, -9.5693359375, -9.201416015625, -8.83349609375, -8.465576171875, -8.09765625, -7.729736328125, -7.36181640625, -6.993896484375, -6.6259765625, -6.258056640625, -5.89013671875, -5.522216796875, -5.154296875, -4.786376953125, -4.41845703125, -4.050537109375, -3.6826171875, -3.314697265625, -2.94677734375, -2.578857421875, -2.2109375, -1.843017578125, -1.47509765625, -1.107177734375, -0.7392578125, -0.371337890625, -0.00341796875, 0.364501953125, 0.732421875, 1.100341796875, 1.46826171875, 1.836181640625, 2.2041015625, 2.572021484375, 2.93994140625, 3.307861328125, 3.67578125, 4.043701171875, 4.41162109375, 4.779541015625, 5.1474609375, 5.515380859375, 5.88330078125, 6.251220703125, 6.619140625, 6.987060546875, 7.35498046875, 7.722900390625, 8.0908203125, 8.458740234375, 8.82666015625, 9.194580078125, 9.5625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 8.0, 5.0, 13.0, 28.0, 56.0, 81.0, 171.0, 264.0, 482.0, 825.0, 793.0, 534.0, 316.0, 213.0, 117.0, 65.0, 36.0, 28.0, 18.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.62109375, -7.4202880859375, -7.219482421875, -7.0186767578125, -6.81787109375, -6.6170654296875, -6.416259765625, -6.2154541015625, -6.0146484375, -5.8138427734375, -5.613037109375, -5.4122314453125, -5.21142578125, -5.0106201171875, -4.809814453125, -4.6090087890625, -4.408203125, -4.2073974609375, -4.006591796875, -3.8057861328125, -3.60498046875, -3.4041748046875, -3.203369140625, -3.0025634765625, -2.8017578125, -2.6009521484375, -2.400146484375, -2.1993408203125, -1.99853515625, -1.7977294921875, -1.596923828125, -1.3961181640625, -1.1953125, -0.9945068359375, -0.793701171875, -0.5928955078125, -0.39208984375, -0.1912841796875, 0.009521484375, 0.2103271484375, 0.4111328125, 0.6119384765625, 0.812744140625, 1.0135498046875, 1.21435546875, 1.4151611328125, 1.615966796875, 1.8167724609375, 2.017578125, 2.2183837890625, 2.419189453125, 2.6199951171875, 2.82080078125, 3.0216064453125, 3.222412109375, 3.4232177734375, 3.6240234375, 3.8248291015625, 4.025634765625, 4.2264404296875, 4.42724609375, 4.6280517578125, 4.828857421875, 5.0296630859375, 5.23046875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 10.0, 13.0, 22.0, 45.0, 78.0, 148.0, 255.0, 182.0, 113.0, 51.0, 30.0, 8.0, 10.0, 5.0, 3.0, 2.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.178932189941406, -47.244972229003906, -45.311012268066406, -43.377052307128906, -41.44308853149414, -39.50912857055664, -37.57516860961914, -35.64120864868164, -33.707244873046875, -31.773284912109375, -29.839323043823242, -27.905363082885742, -25.97140121459961, -24.03744125366211, -22.10348129272461, -20.16952133178711, -18.23556137084961, -16.30160140991211, -14.367639541625977, -12.433679580688477, -10.49971866607666, -8.565757751464844, -6.631797790527344, -4.697836875915527, -2.763875961303711, -0.8299152851104736, 1.1040453910827637, 3.038005828857422, 4.971966743469238, 6.905927658081055, 8.839887619018555, 10.773848533630371, 12.707809448242188, 14.641770362854004, 16.57573127746582, 18.50969123840332, 20.443653106689453, 22.377613067626953, 24.311573028564453, 26.245532989501953, 28.179494857788086, 30.113454818725586, 32.04741668701172, 33.98137664794922, 35.91533660888672, 37.84929656982422, 39.78325653076172, 41.717220306396484, 43.651180267333984, 45.585140228271484, 47.519100189208984, 49.45306396484375, 51.38702392578125, 53.32098388671875, 55.25494384765625, 57.18890380859375, 59.12286376953125, 61.05682373046875, 62.99078369140625, 64.92474365234375, 66.85870361328125, 68.79266357421875, 70.72662353515625, 72.66059112548828, 74.59455108642578]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 10.0, 14.0, 10.0, 20.0, 20.0, 17.0, 34.0, 36.0, 44.0, 52.0, 39.0, 52.0, 59.0, 61.0, 53.0, 73.0, 67.0, 47.0, 48.0, 39.0, 36.0, 28.0, 26.0, 23.0, 20.0, 17.0, 13.0, 9.0, 7.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.74528694152832, -26.797346115112305, -25.84940528869629, -24.901466369628906, -23.95352554321289, -23.005584716796875, -22.05764389038086, -21.109703063964844, -20.161762237548828, -19.213821411132812, -18.265880584716797, -17.31793975830078, -16.3700008392334, -15.422060012817383, -14.474119186401367, -13.526178359985352, -12.578239440917969, -11.630298614501953, -10.682358741760254, -9.734417915344238, -8.786478042602539, -7.838537216186523, -6.890596389770508, -5.94265604019165, -4.994715690612793, -4.0467753410339355, -3.098834753036499, -2.1508941650390625, -1.202953815460205, -0.25501346588134766, 0.692927360534668, 1.6408677101135254, 2.5888099670410156, 3.536750316619873, 4.4846906661987305, 5.432631492614746, 6.3805718421936035, 7.328512191772461, 8.276453018188477, 9.224393844604492, 10.172333717346191, 11.120274543762207, 12.068214416503906, 13.016155242919922, 13.964096069335938, 14.912035942077637, 15.859976768493652, 16.80791664123535, 17.755857467651367, 18.703798294067383, 19.6517391204834, 20.59967803955078, 21.547618865966797, 22.495559692382812, 23.443500518798828, 24.391441345214844, 25.33938217163086, 26.287322998046875, 27.23526382446289, 28.183204650878906, 29.13114356994629, 30.079084396362305, 31.02702522277832, 31.974966049194336, 32.92290496826172]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 12.0, 18.0, 39.0, 34.0, 54.0, 95.0, 173.0, 263.0, 493.0, 773.0, 1406.0, 2945.0, 6355.0, 16267.0, 50100.0, 222830.0, 584687.0, 111664.0, 30347.0, 10727.0, 4420.0, 2187.0, 1119.0, 596.0, 340.0, 230.0, 129.0, 80.0, 49.0, 34.0, 24.0, 22.0, 10.0, 7.0, 8.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.798828125, -1.73291015625, -1.6669921875, -1.60107421875, -1.53515625, -1.46923828125, -1.4033203125, -1.33740234375, -1.271484375, -1.20556640625, -1.1396484375, -1.07373046875, -1.0078125, -0.94189453125, -0.8759765625, -0.81005859375, -0.744140625, -0.67822265625, -0.6123046875, -0.54638671875, -0.48046875, -0.41455078125, -0.3486328125, -0.28271484375, -0.216796875, -0.15087890625, -0.0849609375, -0.01904296875, 0.046875, 0.11279296875, 0.1787109375, 0.24462890625, 0.310546875, 0.37646484375, 0.4423828125, 0.50830078125, 0.57421875, 0.64013671875, 0.7060546875, 0.77197265625, 0.837890625, 0.90380859375, 0.9697265625, 1.03564453125, 1.1015625, 1.16748046875, 1.2333984375, 1.29931640625, 1.365234375, 1.43115234375, 1.4970703125, 1.56298828125, 1.62890625, 1.69482421875, 1.7607421875, 1.82666015625, 1.892578125, 1.95849609375, 2.0244140625, 2.09033203125, 2.15625, 2.22216796875, 2.2880859375, 2.35400390625, 2.419921875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 5.0, 1.0, 5.0, 1.0, 4.0, 4.0, 4.0, 4.0, 5.0, 6.0, 10.0, 8.0, 18.0, 23.0, 20.0, 32.0, 29.0, 32.0, 28.0, 28.0, 41.0, 46.0, 43.0, 45.0, 44.0, 51.0, 41.0, 49.0, 47.0, 43.0, 39.0, 36.0, 42.0, 30.0, 23.0, 21.0, 19.0, 15.0, 15.0, 13.0, 12.0, 4.0, 4.0, 5.0, 1.0, 2.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.322265625, -1.27716064453125, -1.2320556640625, -1.18695068359375, -1.141845703125, -1.09674072265625, -1.0516357421875, -1.00653076171875, -0.96142578125, -0.91632080078125, -0.8712158203125, -0.82611083984375, -0.781005859375, -0.73590087890625, -0.6907958984375, -0.64569091796875, -0.6005859375, -0.55548095703125, -0.5103759765625, -0.46527099609375, -0.420166015625, -0.37506103515625, -0.3299560546875, -0.28485107421875, -0.23974609375, -0.19464111328125, -0.1495361328125, -0.10443115234375, -0.059326171875, -0.01422119140625, 0.0308837890625, 0.07598876953125, 0.12109375, 0.16619873046875, 0.2113037109375, 0.25640869140625, 0.301513671875, 0.34661865234375, 0.3917236328125, 0.43682861328125, 0.48193359375, 0.52703857421875, 0.5721435546875, 0.61724853515625, 0.662353515625, 0.70745849609375, 0.7525634765625, 0.79766845703125, 0.8427734375, 0.88787841796875, 0.9329833984375, 0.97808837890625, 1.023193359375, 1.06829833984375, 1.1134033203125, 1.15850830078125, 1.20361328125, 1.24871826171875, 1.2938232421875, 1.33892822265625, 1.384033203125, 1.42913818359375, 1.4742431640625, 1.51934814453125, 1.564453125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 3.0, 5.0, 2.0, 4.0, 11.0, 15.0, 24.0, 30.0, 37.0, 51.0, 120.0, 159.0, 293.0, 487.0, 1112.0, 4003.0, 35299.0, 950719.0, 49031.0, 4569.0, 1292.0, 527.0, 292.0, 147.0, 97.0, 63.0, 41.0, 41.0, 16.0, 23.0, 11.0, 14.0, 8.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05859375, -3.9212646484375, -3.783935546875, -3.6466064453125, -3.50927734375, -3.3719482421875, -3.234619140625, -3.0972900390625, -2.9599609375, -2.8226318359375, -2.685302734375, -2.5479736328125, -2.41064453125, -2.2733154296875, -2.135986328125, -1.9986572265625, -1.861328125, -1.7239990234375, -1.586669921875, -1.4493408203125, -1.31201171875, -1.1746826171875, -1.037353515625, -0.9000244140625, -0.7626953125, -0.6253662109375, -0.488037109375, -0.3507080078125, -0.21337890625, -0.0760498046875, 0.061279296875, 0.1986083984375, 0.3359375, 0.4732666015625, 0.610595703125, 0.7479248046875, 0.88525390625, 1.0225830078125, 1.159912109375, 1.2972412109375, 1.4345703125, 1.5718994140625, 1.709228515625, 1.8465576171875, 1.98388671875, 2.1212158203125, 2.258544921875, 2.3958740234375, 2.533203125, 2.6705322265625, 2.807861328125, 2.9451904296875, 3.08251953125, 3.2198486328125, 3.357177734375, 3.4945068359375, 3.6318359375, 3.7691650390625, 3.906494140625, 4.0438232421875, 4.18115234375, 4.3184814453125, 4.455810546875, 4.5931396484375, 4.73046875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 2.0, 2.0, 5.0, 9.0, 10.0, 10.0, 18.0, 21.0, 22.0, 19.0, 27.0, 33.0, 29.0, 39.0, 51.0, 60.0, 79.0, 74.0, 72.0, 69.0, 54.0, 35.0, 38.0, 35.0, 36.0, 29.0, 27.0, 12.0, 12.0, 12.0, 7.0, 11.0, 9.0, 6.0, 3.0, 6.0, 3.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90625, -5.7103271484375, -5.514404296875, -5.3184814453125, -5.12255859375, -4.9266357421875, -4.730712890625, -4.5347900390625, -4.3388671875, -4.1429443359375, -3.947021484375, -3.7510986328125, -3.55517578125, -3.3592529296875, -3.163330078125, -2.9674072265625, -2.771484375, -2.5755615234375, -2.379638671875, -2.1837158203125, -1.98779296875, -1.7918701171875, -1.595947265625, -1.4000244140625, -1.2041015625, -1.0081787109375, -0.812255859375, -0.6163330078125, -0.42041015625, -0.2244873046875, -0.028564453125, 0.1673583984375, 0.36328125, 0.5592041015625, 0.755126953125, 0.9510498046875, 1.14697265625, 1.3428955078125, 1.538818359375, 1.7347412109375, 1.9306640625, 2.1265869140625, 2.322509765625, 2.5184326171875, 2.71435546875, 2.9102783203125, 3.106201171875, 3.3021240234375, 3.498046875, 3.6939697265625, 3.889892578125, 4.0858154296875, 4.28173828125, 4.4776611328125, 4.673583984375, 4.8695068359375, 5.0654296875, 5.2613525390625, 5.457275390625, 5.6531982421875, 5.84912109375, 6.0450439453125, 6.240966796875, 6.4368896484375, 6.6328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 8.0, 5.0, 5.0, 7.0, 10.0, 8.0, 12.0, 24.0, 35.0, 42.0, 67.0, 84.0, 89.0, 165.0, 272.0, 560.0, 1156.0, 2457.0, 7215.0, 28987.0, 728758.0, 242001.0, 25275.0, 6538.0, 2353.0, 1016.0, 539.0, 278.0, 189.0, 104.0, 82.0, 55.0, 41.0, 28.0, 21.0, 19.0, 10.0, 12.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4755859375, -0.4607048034667969, -0.44582366943359375, -0.4309425354003906, -0.4160614013671875, -0.4011802673339844, -0.38629913330078125, -0.3714179992675781, -0.356536865234375, -0.3416557312011719, -0.32677459716796875, -0.3118934631347656, -0.2970123291015625, -0.2821311950683594, -0.26725006103515625, -0.2523689270019531, -0.23748779296875, -0.22260665893554688, -0.20772552490234375, -0.19284439086914062, -0.1779632568359375, -0.16308212280273438, -0.14820098876953125, -0.13331985473632812, -0.118438720703125, -0.10355758666992188, -0.08867645263671875, -0.07379531860351562, -0.0589141845703125, -0.044033050537109375, -0.02915191650390625, -0.014270782470703125, 0.0006103515625, 0.015491485595703125, 0.03037261962890625, 0.045253753662109375, 0.0601348876953125, 0.07501602172851562, 0.08989715576171875, 0.10477828979492188, 0.119659423828125, 0.13454055786132812, 0.14942169189453125, 0.16430282592773438, 0.1791839599609375, 0.19406509399414062, 0.20894622802734375, 0.22382736206054688, 0.23870849609375, 0.2535896301269531, 0.26847076416015625, 0.2833518981933594, 0.2982330322265625, 0.3131141662597656, 0.32799530029296875, 0.3428764343261719, 0.357757568359375, 0.3726387023925781, 0.38751983642578125, 0.4024009704589844, 0.4172821044921875, 0.4321632385253906, 0.44704437255859375, 0.4619255065917969, 0.476806640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 8.0, 8.0, 9.0, 14.0, 17.0, 23.0, 40.0, 59.0, 112.0, 154.0, 162.0, 121.0, 87.0, 52.0, 26.0, 18.0, 17.0, 22.0, 11.0, 7.0, 8.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012612342834472656, -0.00012169033288955688, -0.00011725723743438721, -0.00011282414197921753, -0.00010839104652404785, -0.00010395795106887817, -9.95248556137085e-05, -9.509176015853882e-05, -9.065866470336914e-05, -8.622556924819946e-05, -8.179247379302979e-05, -7.735937833786011e-05, -7.292628288269043e-05, -6.849318742752075e-05, -6.406009197235107e-05, -5.9626996517181396e-05, -5.519390106201172e-05, -5.076080560684204e-05, -4.632771015167236e-05, -4.1894614696502686e-05, -3.746151924133301e-05, -3.302842378616333e-05, -2.8595328330993652e-05, -2.4162232875823975e-05, -1.9729137420654297e-05, -1.529604196548462e-05, -1.0862946510314941e-05, -6.429851055145264e-06, -1.996755599975586e-06, 2.436339855194092e-06, 6.8694353103637695e-06, 1.1302530765533447e-05, 1.5735626220703125e-05, 2.0168721675872803e-05, 2.460181713104248e-05, 2.9034912586212158e-05, 3.3468008041381836e-05, 3.7901103496551514e-05, 4.233419895172119e-05, 4.676729440689087e-05, 5.120038986206055e-05, 5.5633485317230225e-05, 6.00665807723999e-05, 6.449967622756958e-05, 6.893277168273926e-05, 7.336586713790894e-05, 7.779896259307861e-05, 8.223205804824829e-05, 8.666515350341797e-05, 9.109824895858765e-05, 9.553134441375732e-05, 9.9964439868927e-05, 0.00010439753532409668, 0.00010883063077926636, 0.00011326372623443604, 0.00011769682168960571, 0.0001221299171447754, 0.00012656301259994507, 0.00013099610805511475, 0.00013542920351028442, 0.0001398622989654541, 0.00014429539442062378, 0.00014872848987579346, 0.00015316158533096313, 0.0001575946807861328]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 2.0, 10.0, 14.0, 14.0, 15.0, 30.0, 59.0, 78.0, 125.0, 240.0, 424.0, 865.0, 2101.0, 5250.0, 16276.0, 72814.0, 827439.0, 93246.0, 19318.0, 5957.0, 2196.0, 982.0, 472.0, 227.0, 147.0, 83.0, 53.0, 27.0, 24.0, 14.0, 11.0, 16.0, 8.0, 8.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.369384765625, -0.3559837341308594, -0.34258270263671875, -0.3291816711425781, -0.3157806396484375, -0.3023796081542969, -0.28897857666015625, -0.2755775451660156, -0.262176513671875, -0.24877548217773438, -0.23537445068359375, -0.22197341918945312, -0.2085723876953125, -0.19517135620117188, -0.18177032470703125, -0.16836929321289062, -0.15496826171875, -0.14156723022460938, -0.12816619873046875, -0.11476516723632812, -0.1013641357421875, -0.08796310424804688, -0.07456207275390625, -0.061161041259765625, -0.047760009765625, -0.034358978271484375, -0.02095794677734375, -0.007556915283203125, 0.0058441162109375, 0.019245147705078125, 0.03264617919921875, 0.046047210693359375, 0.0594482421875, 0.07284927368164062, 0.08625030517578125, 0.09965133666992188, 0.1130523681640625, 0.12645339965820312, 0.13985443115234375, 0.15325546264648438, 0.166656494140625, 0.18005752563476562, 0.19345855712890625, 0.20685958862304688, 0.2202606201171875, 0.23366165161132812, 0.24706268310546875, 0.2604637145996094, 0.27386474609375, 0.2872657775878906, 0.30066680908203125, 0.3140678405761719, 0.3274688720703125, 0.3408699035644531, 0.35427093505859375, 0.3676719665527344, 0.381072998046875, 0.3944740295410156, 0.40787506103515625, 0.4212760925292969, 0.4346771240234375, 0.4480781555175781, 0.46147918701171875, 0.4748802185058594, 0.48828125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 3.0, 7.0, 3.0, 6.0, 3.0, 7.0, 9.0, 13.0, 18.0, 21.0, 25.0, 36.0, 62.0, 83.0, 108.0, 116.0, 135.0, 85.0, 62.0, 42.0, 29.0, 24.0, 24.0, 16.0, 6.0, 8.0, 17.0, 8.0, 3.0, 5.0, 3.0, 5.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.490234375, -0.47313690185546875, -0.4560394287109375, -0.43894195556640625, -0.421844482421875, -0.40474700927734375, -0.3876495361328125, -0.37055206298828125, -0.35345458984375, -0.33635711669921875, -0.3192596435546875, -0.30216217041015625, -0.285064697265625, -0.26796722412109375, -0.2508697509765625, -0.23377227783203125, -0.2166748046875, -0.19957733154296875, -0.1824798583984375, -0.16538238525390625, -0.148284912109375, -0.13118743896484375, -0.1140899658203125, -0.09699249267578125, -0.07989501953125, -0.06279754638671875, -0.0457000732421875, -0.02860260009765625, -0.011505126953125, 0.00559234619140625, 0.0226898193359375, 0.03978729248046875, 0.056884765625, 0.07398223876953125, 0.0910797119140625, 0.10817718505859375, 0.125274658203125, 0.14237213134765625, 0.1594696044921875, 0.17656707763671875, 0.19366455078125, 0.21076202392578125, 0.2278594970703125, 0.24495697021484375, 0.262054443359375, 0.27915191650390625, 0.2962493896484375, 0.31334686279296875, 0.3304443359375, 0.34754180908203125, 0.3646392822265625, 0.38173675537109375, 0.398834228515625, 0.41593170166015625, 0.4330291748046875, 0.45012664794921875, 0.46722412109375, 0.48432159423828125, 0.5014190673828125, 0.5185165405273438, 0.535614013671875, 0.5527114868164062, 0.5698089599609375, 0.5869064331054688, 0.60400390625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 22.0, 93.0, 691.0, 139.0, 38.0, 14.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.21783447265625, -75.26878356933594, -73.31973266601562, -71.37068176269531, -69.42162322998047, -67.47257232666016, -65.52352142333984, -63.57447052001953, -61.62541580200195, -59.67636489868164, -57.72731018066406, -55.77825927734375, -53.82920837402344, -51.88015365600586, -49.93110275268555, -47.98204803466797, -46.032997131347656, -44.083946228027344, -42.134891510009766, -40.18584060668945, -38.23678970336914, -36.28773498535156, -34.33868408203125, -32.38963317871094, -30.440582275390625, -28.49152946472168, -26.542478561401367, -24.593425750732422, -22.644372940063477, -20.69532012939453, -18.74626922607422, -16.797216415405273, -14.848163604736328, -12.8991117477417, -10.950058937072754, -9.001007080078125, -7.051954746246338, -5.102902412414551, -3.153850555419922, -1.2047977447509766, 0.7442541122436523, 2.6933064460754395, 4.642358779907227, 6.5914106369018555, 8.540462493896484, 10.48951530456543, 12.438567161560059, 14.387619972229004, 16.336671829223633, 18.285724639892578, 20.23477554321289, 22.183828353881836, 24.13288116455078, 26.081932067871094, 28.03098487854004, 29.980037689208984, 31.929088592529297, 33.87813949584961, 35.82719421386719, 37.7762451171875, 39.72529602050781, 41.67435073852539, 43.6234016418457, 45.57245635986328, 47.521507263183594]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 5.0, 2.0, 2.0, 2.0, 5.0, 9.0, 8.0, 12.0, 16.0, 16.0, 22.0, 37.0, 29.0, 43.0, 48.0, 87.0, 332.0, 128.0, 35.0, 30.0, 21.0, 34.0, 18.0, 14.0, 13.0, 15.0, 7.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.53497886657715, -18.7392635345459, -17.943546295166016, -17.147830963134766, -16.352115631103516, -15.556398391723633, -14.760683059692383, -13.964966773986816, -13.16925048828125, -12.373534202575684, -11.577818870544434, -10.782102584838867, -9.9863862991333, -9.190670013427734, -8.394954681396484, -7.599238395690918, -6.803523063659668, -6.00780725479126, -5.212090969085693, -4.416375160217285, -3.620659112930298, -2.8249430656433105, -2.0292272567749023, -1.233510971069336, -0.43779516220092773, 0.3579208254814148, 1.1536368131637573, 1.949352741241455, 2.7450687885284424, 3.5407848358154297, 4.336500644683838, 5.132216930389404, 5.9279327392578125, 6.723648548126221, 7.519364833831787, 8.315080642700195, 9.110796928405762, 9.906513214111328, 10.702228546142578, 11.497944831848145, 12.293661117553711, 13.089377403259277, 13.885092735290527, 14.680809020996094, 15.47652530670166, 16.272241592407227, 17.067956924438477, 17.86367416381836, 18.65938949584961, 19.45510482788086, 20.250822067260742, 21.046537399291992, 21.842252731323242, 22.637969970703125, 23.433685302734375, 24.229400634765625, 25.025115966796875, 25.820831298828125, 26.616548538208008, 27.412263870239258, 28.207979202270508, 29.00369644165039, 29.79941177368164, 30.59512710571289, 31.390844345092773]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 17.0, 11.0, 13.0, 12.0, 18.0, 24.0, 15.0, 22.0, 29.0, 30.0, 36.0, 38.0, 71.0, 249.0, 122.0, 48.0, 25.0, 35.0, 29.0, 28.0, 28.0, 10.0, 17.0, 10.0, 13.0, 7.0, 8.0, 8.0, 4.0, 6.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5537109375, -1.5032958984375, -1.452880859375, -1.4024658203125, -1.35205078125, -1.3016357421875, -1.251220703125, -1.2008056640625, -1.150390625, -1.0999755859375, -1.049560546875, -0.9991455078125, -0.94873046875, -0.8983154296875, -0.847900390625, -0.7974853515625, -0.7470703125, -0.6966552734375, -0.646240234375, -0.5958251953125, -0.54541015625, -0.4949951171875, -0.444580078125, -0.3941650390625, -0.34375, -0.2933349609375, -0.242919921875, -0.1925048828125, -0.14208984375, -0.0916748046875, -0.041259765625, 0.0091552734375, 0.0595703125, 0.1099853515625, 0.160400390625, 0.2108154296875, 0.26123046875, 0.3116455078125, 0.362060546875, 0.4124755859375, 0.462890625, 0.5133056640625, 0.563720703125, 0.6141357421875, 0.66455078125, 0.7149658203125, 0.765380859375, 0.8157958984375, 0.8662109375, 0.9166259765625, 0.967041015625, 1.0174560546875, 1.06787109375, 1.1182861328125, 1.168701171875, 1.2191162109375, 1.26953125, 1.3199462890625, 1.370361328125, 1.4207763671875, 1.47119140625, 1.5216064453125, 1.572021484375, 1.6224365234375, 1.6728515625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 12.0, 5.0, 11.0, 20.0, 22.0, 17.0, 44.0, 92.0, 222.0, 538.0, 2195.0, 29759.0, 8348307.0, 5744.0, 985.0, 314.0, 122.0, 50.0, 29.0, 31.0, 15.0, 9.0, 3.0, 11.0, 9.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.087568283081055, -26.318666458129883, -25.549766540527344, -24.780864715576172, -24.011962890625, -23.24306297302246, -22.47416114807129, -21.70526123046875, -20.936359405517578, -20.167457580566406, -19.398557662963867, -18.629655838012695, -17.860755920410156, -17.091854095458984, -16.322952270507812, -15.554051399230957, -14.785150527954102, -14.016249656677246, -13.24734878540039, -12.478446960449219, -11.709546089172363, -10.940645217895508, -10.171743392944336, -9.40284252166748, -8.633941650390625, -7.8650407791137695, -7.096139430999756, -6.327238082885742, -5.558337211608887, -4.789436340332031, -4.020534992218018, -3.251633644104004, -2.4827327728271484, -1.7138316631317139, -0.9449305534362793, -0.17602944374084473, 0.5928716659545898, 1.3617727756500244, 2.130673885345459, 2.8995752334594727, 3.668476104736328, 4.437376976013184, 5.206278324127197, 5.975179672241211, 6.744080543518066, 7.512981414794922, 8.281883239746094, 9.05078411102295, 9.819684982299805, 10.58858585357666, 11.357486724853516, 12.126388549804688, 12.895289421081543, 13.664190292358398, 14.43309211730957, 15.201992988586426, 15.970893859863281, 16.739795684814453, 17.508695602416992, 18.277597427368164, 19.046497344970703, 19.815399169921875, 20.584300994873047, 21.35320281982422, 22.122102737426758]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 3.0, 2.0, 4.0, 1.0, 7.0, 8.0, 5.0, 5.0, 6.0, 1.0, 5.0, 1.0, 4.0, 5.0, 4.0, 3.0, 3.0, 6.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.20661163330078, -25.489341735839844, -24.772071838378906, -24.05480194091797, -23.33753204345703, -22.620262145996094, -21.902992248535156, -21.18572235107422, -20.46845245361328, -19.751182556152344, -19.033912658691406, -18.31664276123047, -17.59937286376953, -16.882102966308594, -16.164833068847656, -15.447564125061035, -14.730295181274414, -14.013025283813477, -13.295755386352539, -12.578485488891602, -11.861215591430664, -11.143945693969727, -10.426676750183105, -9.709406852722168, -8.99213695526123, -8.274867057800293, -7.5575971603393555, -6.840327739715576, -6.123057842254639, -5.405787944793701, -4.688518524169922, -3.9712486267089844, -3.253978729248047, -2.5367088317871094, -1.819439172744751, -1.1021695137023926, -0.3848996162414551, 0.3323702812194824, 1.0496397018432617, 1.7669095993041992, 2.4841794967651367, 3.201449394226074, 3.9187190532684326, 4.635988712310791, 5.3532586097717285, 6.070528507232666, 6.787797927856445, 7.505067825317383, 8.22233772277832, 8.939607620239258, 9.656877517700195, 10.374147415161133, 11.09141731262207, 11.808687210083008, 12.525956153869629, 13.243226051330566, 13.960495948791504, 14.677765846252441, 15.395035743713379, 16.1123046875, 16.829574584960938, 17.546844482421875, 18.264114379882812, 18.98138427734375, 19.698654174804688]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 9.0, 8.0, 11.0, 25.0, 23.0, 40.0, 41.0, 75.0, 117.0, 162.0, 247.0, 444.0, 978.0, 2383.0, 6784.0, 22236.0, 79559.0, 221622.0, 134231.0, 37455.0, 11177.0, 3706.0, 1397.0, 623.0, 325.0, 197.0, 121.0, 87.0, 40.0, 44.0, 20.0, 10.0, 20.0, 13.0, 11.0, 3.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-15.9140625, -15.48046875, -15.046875, -14.61328125, -14.1796875, -13.74609375, -13.3125, -12.87890625, -12.4453125, -12.01171875, -11.578125, -11.14453125, -10.7109375, -10.27734375, -9.84375, -9.41015625, -8.9765625, -8.54296875, -8.109375, -7.67578125, -7.2421875, -6.80859375, -6.375, -5.94140625, -5.5078125, -5.07421875, -4.640625, -4.20703125, -3.7734375, -3.33984375, -2.90625, -2.47265625, -2.0390625, -1.60546875, -1.171875, -0.73828125, -0.3046875, 0.12890625, 0.5625, 0.99609375, 1.4296875, 1.86328125, 2.296875, 2.73046875, 3.1640625, 3.59765625, 4.03125, 4.46484375, 4.8984375, 5.33203125, 5.765625, 6.19921875, 6.6328125, 7.06640625, 7.5, 7.93359375, 8.3671875, 8.80078125, 9.234375, 9.66796875, 10.1015625, 10.53515625, 10.96875, 11.40234375, 11.8359375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 8.0, 5.0, 12.0, 17.0, 20.0, 10.0, 32.0, 24.0, 29.0, 36.0, 35.0, 46.0, 38.0, 52.0, 42.0, 52.0, 55.0, 64.0, 56.0, 50.0, 46.0, 38.0, 40.0, 38.0, 22.0, 13.0, 18.0, 21.0, 11.0, 15.0, 8.0, 10.0, 8.0, 1.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2197265625, -1.1759033203125, -1.132080078125, -1.0882568359375, -1.04443359375, -1.0006103515625, -0.956787109375, -0.9129638671875, -0.869140625, -0.8253173828125, -0.781494140625, -0.7376708984375, -0.69384765625, -0.6500244140625, -0.606201171875, -0.5623779296875, -0.5185546875, -0.4747314453125, -0.430908203125, -0.3870849609375, -0.34326171875, -0.2994384765625, -0.255615234375, -0.2117919921875, -0.16796875, -0.1241455078125, -0.080322265625, -0.0364990234375, 0.00732421875, 0.0511474609375, 0.094970703125, 0.1387939453125, 0.1826171875, 0.2264404296875, 0.270263671875, 0.3140869140625, 0.35791015625, 0.4017333984375, 0.445556640625, 0.4893798828125, 0.533203125, 0.5770263671875, 0.620849609375, 0.6646728515625, 0.70849609375, 0.7523193359375, 0.796142578125, 0.8399658203125, 0.8837890625, 0.9276123046875, 0.971435546875, 1.0152587890625, 1.05908203125, 1.1029052734375, 1.146728515625, 1.1905517578125, 1.234375, 1.2781982421875, 1.322021484375, 1.3658447265625, 1.40966796875, 1.4534912109375, 1.497314453125, 1.5411376953125, 1.5849609375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 1.0, 2.0, 4.0, 6.0, 11.0, 21.0, 23.0, 31.0, 54.0, 59.0, 57.0, 52.0, 45.0, 36.0, 30.0, 13.0, 5.0, 7.0, 6.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.700535774230957, -10.33536148071289, -9.970187187194824, -9.605012893676758, -9.239838600158691, -8.874664306640625, -8.509490013122559, -8.144315719604492, -7.779141426086426, -7.413967132568359, -7.048792839050293, -6.683618545532227, -6.31844425201416, -5.953269958496094, -5.588095664978027, -5.222921371459961, -4.857747554779053, -4.492573261260986, -4.12739896774292, -3.7622246742248535, -3.397050380706787, -3.0318760871887207, -2.6667020320892334, -2.301527738571167, -1.9363534450531006, -1.5711791515350342, -1.2060048580169678, -0.8408306837081909, -0.4756563901901245, -0.1104820966720581, 0.25469207763671875, 0.6198663711547852, 0.9850406646728516, 1.350214958190918, 1.7153892517089844, 2.080563545227051, 2.445737838745117, 2.8109121322631836, 3.176086187362671, 3.5412604808807373, 3.9064347743988037, 4.271608829498291, 4.636783123016357, 5.001957416534424, 5.36713171005249, 5.732306003570557, 6.097480297088623, 6.4626545906066895, 6.827828884124756, 7.193003177642822, 7.558177471160889, 7.923351764678955, 8.288525581359863, 8.65369987487793, 9.018874168395996, 9.384048461914062, 9.749222755432129, 10.114397048950195, 10.479571342468262, 10.844745635986328, 11.209919929504395, 11.575094223022461, 11.940268516540527, 12.305442810058594, 12.67061710357666]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 3.0, 2.0, 6.0, 0.0, 3.0, 11.0, 3.0, 4.0, 11.0, 11.0, 14.0, 32.0, 55.0, 49.0, 68.0, 63.0, 54.0, 29.0, 23.0, 7.0, 5.0, 4.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.292442321777344, -8.072317123413086, -7.852191925048828, -7.63206672668457, -7.4119415283203125, -7.191816329956055, -6.971691131591797, -6.751565933227539, -6.531440734863281, -6.311315536499023, -6.091190338134766, -5.871065139770508, -5.65093994140625, -5.430814743041992, -5.210689544677734, -4.990564346313477, -4.770439147949219, -4.550313949584961, -4.330188751220703, -4.110063552856445, -3.8899383544921875, -3.6698131561279297, -3.449687957763672, -3.229562759399414, -3.009437084197998, -2.7893118858337402, -2.5691866874694824, -2.3490614891052246, -2.128936290740967, -1.9088109731674194, -1.6886857748031616, -1.4685605764389038, -1.2484354972839355, -1.0283102989196777, -0.8081851005554199, -0.5880598425865173, -0.3679346442222595, -0.14780938625335693, 0.07231581211090088, 0.2924410104751587, 0.5125662088394165, 0.7326914072036743, 0.9528166055679321, 1.1729419231414795, 1.3930671215057373, 1.6131923198699951, 1.833317518234253, 2.0534427165985107, 2.2735679149627686, 2.4936931133270264, 2.713818311691284, 2.933943510055542, 3.1540687084198, 3.3741941452026367, 3.5943193435668945, 3.8144445419311523, 4.03456974029541, 4.254694938659668, 4.474820137023926, 4.694945335388184, 4.915070533752441, 5.135195732116699, 5.355320930480957, 5.575446128845215, 5.795571327209473]}, "eval/loss": 5.412105083465576, "eval/wer": 1.2854224514081714, "eval/runtime": 687.2355, "eval/samples_per_second": 3.844, "eval/steps_per_second": 0.482} \ No newline at end of file