diff --git "a/wandb/run-20220310_205608-mf17w61i/files/wandb-summary.json" "b/wandb/run-20220310_205608-mf17w61i/files/wandb-summary.json" --- "a/wandb/run-20220310_205608-mf17w61i/files/wandb-summary.json" +++ "b/wandb/run-20220310_205608-mf17w61i/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 5.8157, "train/learning_rate": 2.4049881235154395e-06, "train/epoch": 18.5, "train/global_step": 16500, "_runtime": 112038, "_timestamp": 1647057806, "_step": 16510, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 93.0, 21.0, 9.0, 6.0, 5.0, 3.0, 30273.0, 61.0, 21.0, 4.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.84375, -39.2177734375, -37.591796875, -35.9658203125, -34.33984375, -32.7138671875, -31.087890625, -29.4619140625, -27.8359375, -26.2099609375, -24.583984375, -22.9580078125, -21.33203125, -19.7060546875, -18.080078125, -16.4541015625, -14.828125, -13.2021484375, -11.576171875, -9.9501953125, -8.32421875, -6.6982421875, -5.072265625, -3.4462890625, -1.8203125, -0.1943359375, 1.431640625, 3.0576171875, 4.68359375, 6.3095703125, 7.935546875, 9.5615234375, 11.1875, 12.8134765625, 14.439453125, 16.0654296875, 17.69140625, 19.3173828125, 20.943359375, 22.5693359375, 24.1953125, 25.8212890625, 27.447265625, 29.0732421875, 30.69921875, 32.3251953125, 33.951171875, 35.5771484375, 37.203125, 38.8291015625, 40.455078125, 42.0810546875, 43.70703125, 45.3330078125, 46.958984375, 48.5849609375, 50.2109375, 51.8369140625, 53.462890625, 55.0888671875, 56.71484375, 58.3408203125, 59.966796875, 61.5927734375, 63.21875]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 28.0, 74.0, 196.0, 347.0, 243.0, 90.0, 23.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.096628189086914, -14.212224960327148, -12.327821731567383, -10.4434175491333, -8.559014320373535, -6.6746110916137695, -4.7902069091796875, -2.905803680419922, -1.0214004516601562, 0.8630030155181885, 2.747406482696533, 4.631810188293457, 6.516213417053223, 8.400616645812988, 10.28502082824707, 12.169424057006836, 14.053827285766602, 15.938230514526367, 17.822633743286133, 19.70703887939453, 21.591442108154297, 23.475845336914062, 25.360248565673828, 27.244651794433594, 29.12905502319336, 31.013458251953125, 32.89786148071289, 34.782264709472656, 36.66666793823242, 38.55107116699219, 40.43547821044922, 42.31987762451172, 44.20428466796875, 46.088687896728516, 47.97309112548828, 49.85749435424805, 51.74189758300781, 53.62630081176758, 55.510704040527344, 57.395111083984375, 59.279510498046875, 61.16391372680664, 63.048316955566406, 64.93272399902344, 66.81712341308594, 68.70153045654297, 70.58592987060547, 72.4703369140625, 74.354736328125, 76.23914337158203, 78.12354278564453, 80.00794982910156, 81.89234924316406, 83.7767562866211, 85.6611557006836, 87.54556274414062, 89.42996978759766, 91.31437683105469, 93.19877624511719, 95.08318328857422, 96.96758270263672, 98.85198974609375, 100.73638916015625, 102.62079620361328, 104.50519561767578]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 12.0, 6.0, 3.0, 8.0, 3.0, 12.0, 13.0, 13.0, 22.0, 21.0, 16.0, 27.0, 37.0, 37.0, 28.0, 36.0, 35.0, 44.0, 49.0, 47.0, 43.0, 47.0, 42.0, 42.0, 31.0, 49.0, 37.0, 38.0, 35.0, 36.0, 21.0, 14.0, 20.0, 14.0, 21.0, 17.0, 7.0, 8.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.896860122680664, -17.388872146606445, -16.88088607788086, -16.37289810180664, -15.864911079406738, -15.356924057006836, -14.848937034606934, -14.340950012207031, -13.832962036132812, -13.32497501373291, -12.816987991333008, -12.309000015258789, -11.801012992858887, -11.293025970458984, -10.785038948059082, -10.27705192565918, -9.769064903259277, -9.261077880859375, -8.753090858459473, -8.24510383605957, -7.737115859985352, -7.229128837585449, -6.721141815185547, -6.2131547927856445, -5.705167293548584, -5.197180271148682, -4.689192771911621, -4.181205749511719, -3.6732184886932373, -3.165231227874756, -2.6572442054748535, -2.149256944656372, -1.6412696838378906, -1.1332824230194092, -0.6252952814102173, -0.11730813980102539, 0.39067912101745605, 0.8986663818359375, 1.4066534042358398, 1.9146406650543213, 2.4226279258728027, 2.930615186691284, 3.4386024475097656, 3.946589469909668, 4.45457649230957, 4.962563991546631, 5.470551013946533, 5.978538513183594, 6.486525535583496, 6.994512557983398, 7.502500057220459, 8.010486602783203, 8.518474578857422, 9.026461601257324, 9.534448623657227, 10.042435646057129, 10.550422668457031, 11.058409690856934, 11.566396713256836, 12.074384689331055, 12.582371711730957, 13.09035873413086, 13.598345756530762, 14.106332778930664, 14.614320755004883]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 10.0, 4.0, 9.0, 10.0, 14.0, 14.0, 22.0, 12.0, 33.0, 76.0, 108.0, 266.0, 615.0, 1720.0, 5063.0, 14832.0, 42896.0, 112035.0, 225670.0, 345035.0, 178506.0, 78149.0, 28556.0, 9449.0, 3457.0, 1153.0, 418.0, 177.0, 74.0, 45.0, 27.0, 21.0, 15.0, 14.0, 10.0, 8.0, 10.0, 3.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.65625, -47.14990234375, -45.6435546875, -44.13720703125, -42.630859375, -41.12451171875, -39.6181640625, -38.11181640625, -36.60546875, -35.09912109375, -33.5927734375, -32.08642578125, -30.580078125, -29.07373046875, -27.5673828125, -26.06103515625, -24.5546875, -23.04833984375, -21.5419921875, -20.03564453125, -18.529296875, -17.02294921875, -15.5166015625, -14.01025390625, -12.50390625, -10.99755859375, -9.4912109375, -7.98486328125, -6.478515625, -4.97216796875, -3.4658203125, -1.95947265625, -0.453125, 1.05322265625, 2.5595703125, 4.06591796875, 5.572265625, 7.07861328125, 8.5849609375, 10.09130859375, 11.59765625, 13.10400390625, 14.6103515625, 16.11669921875, 17.623046875, 19.12939453125, 20.6357421875, 22.14208984375, 23.6484375, 25.15478515625, 26.6611328125, 28.16748046875, 29.673828125, 31.18017578125, 32.6865234375, 34.19287109375, 35.69921875, 37.20556640625, 38.7119140625, 40.21826171875, 41.724609375, 43.23095703125, 44.7373046875, 46.24365234375, 47.75]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 2.0, 12.0, 3.0, 14.0, 20.0, 14.0, 14.0, 18.0, 23.0, 20.0, 26.0, 28.0, 35.0, 30.0, 41.0, 30.0, 38.0, 38.0, 59.0, 94.0, 39.0, 29.0, 46.0, 41.0, 37.0, 28.0, 25.0, 27.0, 32.0, 26.0, 24.0, 12.0, 14.0, 13.0, 13.0, 4.0, 13.0, 5.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.5078125, -13.08740234375, -12.6669921875, -12.24658203125, -11.826171875, -11.40576171875, -10.9853515625, -10.56494140625, -10.14453125, -9.72412109375, -9.3037109375, -8.88330078125, -8.462890625, -8.04248046875, -7.6220703125, -7.20166015625, -6.78125, -6.36083984375, -5.9404296875, -5.52001953125, -5.099609375, -4.67919921875, -4.2587890625, -3.83837890625, -3.41796875, -2.99755859375, -2.5771484375, -2.15673828125, -1.736328125, -1.31591796875, -0.8955078125, -0.47509765625, -0.0546875, 0.36572265625, 0.7861328125, 1.20654296875, 1.626953125, 2.04736328125, 2.4677734375, 2.88818359375, 3.30859375, 3.72900390625, 4.1494140625, 4.56982421875, 4.990234375, 5.41064453125, 5.8310546875, 6.25146484375, 6.671875, 7.09228515625, 7.5126953125, 7.93310546875, 8.353515625, 8.77392578125, 9.1943359375, 9.61474609375, 10.03515625, 10.45556640625, 10.8759765625, 11.29638671875, 11.716796875, 12.13720703125, 12.5576171875, 12.97802734375, 13.3984375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 1.0, 7.0, 14.0, 9.0, 14.0, 9.0, 17.0, 25.0, 25.0, 32.0, 30.0, 32.0, 39.0, 29.0, 45.0, 51.0, 72.0, 61.0, 57.0, 53.0, 58.0, 50.0, 50.0, 37.0, 33.0, 34.0, 29.0, 15.0, 14.0, 15.0, 5.0, 9.0, 10.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.938274383544922, -17.386890411376953, -16.835508346557617, -16.28412628173828, -15.732742309570312, -15.18135929107666, -14.629976272583008, -14.078593254089355, -13.527210235595703, -12.97582721710205, -12.424444198608398, -11.873061180114746, -11.321678161621094, -10.770295143127441, -10.218912124633789, -9.667529106140137, -9.116146087646484, -8.564763069152832, -8.01338005065918, -7.461997032165527, -6.910614013671875, -6.359230995178223, -5.80784797668457, -5.256464958190918, -4.705081939697266, -4.153698921203613, -3.602315902709961, -3.0509328842163086, -2.4995498657226562, -1.948166847229004, -1.3967838287353516, -0.8454008102416992, -0.29401588439941406, 0.2573671340942383, 0.8087501525878906, 1.360133171081543, 1.9115161895751953, 2.4628992080688477, 3.0142822265625, 3.5656652450561523, 4.117048263549805, 4.668431282043457, 5.219814300537109, 5.771197319030762, 6.322580337524414, 6.873963356018066, 7.425346374511719, 7.976729393005371, 8.528112411499023, 9.079495429992676, 9.630878448486328, 10.18226146697998, 10.733644485473633, 11.285027503967285, 11.836410522460938, 12.38779354095459, 12.939176559448242, 13.490559577941895, 14.041942596435547, 14.5933256149292, 15.144708633422852, 15.696091651916504, 16.247474670410156, 16.798858642578125, 17.35024070739746]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 7.0, 2.0, 3.0, 7.0, 10.0, 10.0, 6.0, 8.0, 14.0, 17.0, 18.0, 21.0, 16.0, 32.0, 18.0, 19.0, 27.0, 21.0, 27.0, 46.0, 40.0, 38.0, 44.0, 44.0, 38.0, 30.0, 31.0, 29.0, 36.0, 29.0, 32.0, 30.0, 32.0, 15.0, 25.0, 24.0, 17.0, 16.0, 16.0, 24.0, 16.0, 10.0, 9.0, 14.0, 5.0, 9.0, 7.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0], "bins": [-15.767623901367188, -15.255992889404297, -14.744361877441406, -14.2327299118042, -13.721098899841309, -13.209467887878418, -12.697835922241211, -12.18620491027832, -11.67457389831543, -11.162942886352539, -10.651311874389648, -10.139679908752441, -9.62804889678955, -9.11641788482666, -8.604785919189453, -8.093154907226562, -7.581523895263672, -7.069892883300781, -6.558261394500732, -6.046629905700684, -5.534998893737793, -5.023367881774902, -4.5117363929748535, -4.000104904174805, -3.488473892211914, -2.9768426418304443, -2.4652113914489746, -1.9535801410675049, -1.4419488906860352, -0.9303176403045654, -0.4186863899230957, 0.09294486045837402, 0.6045780181884766, 1.1162092685699463, 1.627840518951416, 2.1394717693328857, 2.6511030197143555, 3.162734270095825, 3.674365520477295, 4.185997009277344, 4.697628021240234, 5.209259033203125, 5.720890522003174, 6.232522010803223, 6.744153022766113, 7.255784034729004, 7.767415523529053, 8.279047012329102, 8.790678024291992, 9.302309036254883, 9.813940048217773, 10.32557201385498, 10.837203025817871, 11.348834037780762, 11.860466003417969, 12.37209701538086, 12.88372802734375, 13.39535903930664, 13.906990051269531, 14.418622016906738, 14.930253028869629, 15.44188404083252, 15.953516006469727, 16.465147018432617, 16.976778030395508]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 1.0, 8.0, 6.0, 8.0, 8.0, 16.0, 10.0, 22.0, 23.0, 28.0, 51.0, 58.0, 92.0, 152.0, 296.0, 533.0, 1112.0, 2372.0, 5479.0, 13994.0, 42343.0, 304005.0, 3570178.0, 196721.0, 35179.0, 12246.0, 4805.0, 2167.0, 1038.0, 527.0, 290.0, 163.0, 94.0, 68.0, 45.0, 31.0, 26.0, 18.0, 19.0, 8.0, 11.0, 2.0, 6.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-32.125, -31.10302734375, -30.0810546875, -29.05908203125, -28.037109375, -27.01513671875, -25.9931640625, -24.97119140625, -23.94921875, -22.92724609375, -21.9052734375, -20.88330078125, -19.861328125, -18.83935546875, -17.8173828125, -16.79541015625, -15.7734375, -14.75146484375, -13.7294921875, -12.70751953125, -11.685546875, -10.66357421875, -9.6416015625, -8.61962890625, -7.59765625, -6.57568359375, -5.5537109375, -4.53173828125, -3.509765625, -2.48779296875, -1.4658203125, -0.44384765625, 0.578125, 1.60009765625, 2.6220703125, 3.64404296875, 4.666015625, 5.68798828125, 6.7099609375, 7.73193359375, 8.75390625, 9.77587890625, 10.7978515625, 11.81982421875, 12.841796875, 13.86376953125, 14.8857421875, 15.90771484375, 16.9296875, 17.95166015625, 18.9736328125, 19.99560546875, 21.017578125, 22.03955078125, 23.0615234375, 24.08349609375, 25.10546875, 26.12744140625, 27.1494140625, 28.17138671875, 29.193359375, 30.21533203125, 31.2373046875, 32.25927734375, 33.28125]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 7.0, 6.0, 6.0, 5.0, 9.0, 9.0, 15.0, 13.0, 13.0, 18.0, 23.0, 26.0, 30.0, 28.0, 37.0, 33.0, 39.0, 23.0, 35.0, 40.0, 38.0, 37.0, 43.0, 42.0, 34.0, 37.0, 31.0, 29.0, 27.0, 28.0, 23.0, 31.0, 30.0, 21.0, 20.0, 19.0, 13.0, 16.0, 18.0, 8.0, 8.0, 6.0, 2.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-10.3359375, -9.995361328125, -9.65478515625, -9.314208984375, -8.9736328125, -8.633056640625, -8.29248046875, -7.951904296875, -7.611328125, -7.270751953125, -6.93017578125, -6.589599609375, -6.2490234375, -5.908447265625, -5.56787109375, -5.227294921875, -4.88671875, -4.546142578125, -4.20556640625, -3.864990234375, -3.5244140625, -3.183837890625, -2.84326171875, -2.502685546875, -2.162109375, -1.821533203125, -1.48095703125, -1.140380859375, -0.7998046875, -0.459228515625, -0.11865234375, 0.221923828125, 0.5625, 0.903076171875, 1.24365234375, 1.584228515625, 1.9248046875, 2.265380859375, 2.60595703125, 2.946533203125, 3.287109375, 3.627685546875, 3.96826171875, 4.308837890625, 4.6494140625, 4.989990234375, 5.33056640625, 5.671142578125, 6.01171875, 6.352294921875, 6.69287109375, 7.033447265625, 7.3740234375, 7.714599609375, 8.05517578125, 8.395751953125, 8.736328125, 9.076904296875, 9.41748046875, 9.758056640625, 10.0986328125, 10.439208984375, 10.77978515625, 11.120361328125, 11.4609375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 6.0, 15.0, 28.0, 53.0, 83.0, 202.0, 654.0, 22225.0, 4162711.0, 7446.0, 512.0, 154.0, 83.0, 42.0, 17.0, 16.0, 12.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-306.25, -299.5048828125, -292.759765625, -286.0146484375, -279.26953125, -272.5244140625, -265.779296875, -259.0341796875, -252.2890625, -245.5439453125, -238.798828125, -232.0537109375, -225.30859375, -218.5634765625, -211.818359375, -205.0732421875, -198.328125, -191.5830078125, -184.837890625, -178.0927734375, -171.34765625, -164.6025390625, -157.857421875, -151.1123046875, -144.3671875, -137.6220703125, -130.876953125, -124.1318359375, -117.38671875, -110.6416015625, -103.896484375, -97.1513671875, -90.40625, -83.6611328125, -76.916015625, -70.1708984375, -63.42578125, -56.6806640625, -49.935546875, -43.1904296875, -36.4453125, -29.7001953125, -22.955078125, -16.2099609375, -9.46484375, -2.7197265625, 4.025390625, 10.7705078125, 17.515625, 24.2607421875, 31.005859375, 37.7509765625, 44.49609375, 51.2412109375, 57.986328125, 64.7314453125, 71.4765625, 78.2216796875, 84.966796875, 91.7119140625, 98.45703125, 105.2021484375, 111.947265625, 118.6923828125, 125.4375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 3.0, 5.0, 16.0, 19.0, 31.0, 58.0, 82.0, 171.0, 400.0, 1575.0, 1085.0, 304.0, 137.0, 77.0, 40.0, 26.0, 18.0, 14.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.890625, -15.51995849609375, -15.1492919921875, -14.77862548828125, -14.407958984375, -14.03729248046875, -13.6666259765625, -13.29595947265625, -12.92529296875, -12.55462646484375, -12.1839599609375, -11.81329345703125, -11.442626953125, -11.07196044921875, -10.7012939453125, -10.33062744140625, -9.9599609375, -9.58929443359375, -9.2186279296875, -8.84796142578125, -8.477294921875, -8.10662841796875, -7.7359619140625, -7.36529541015625, -6.99462890625, -6.62396240234375, -6.2532958984375, -5.88262939453125, -5.511962890625, -5.14129638671875, -4.7706298828125, -4.39996337890625, -4.029296875, -3.65863037109375, -3.2879638671875, -2.91729736328125, -2.546630859375, -2.17596435546875, -1.8052978515625, -1.43463134765625, -1.06396484375, -0.69329833984375, -0.3226318359375, 0.04803466796875, 0.418701171875, 0.78936767578125, 1.1600341796875, 1.53070068359375, 1.9013671875, 2.27203369140625, 2.6427001953125, 3.01336669921875, 3.384033203125, 3.75469970703125, 4.1253662109375, 4.49603271484375, 4.86669921875, 5.23736572265625, 5.6080322265625, 5.97869873046875, 6.349365234375, 6.72003173828125, 7.0906982421875, 7.46136474609375, 7.83203125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 6.0, 12.0, 7.0, 14.0, 14.0, 11.0, 14.0, 13.0, 25.0, 16.0, 28.0, 33.0, 35.0, 39.0, 39.0, 49.0, 46.0, 43.0, 42.0, 36.0, 37.0, 43.0, 51.0, 31.0, 41.0, 31.0, 34.0, 31.0, 32.0, 20.0, 26.0, 8.0, 11.0, 16.0, 11.0, 8.0, 10.0, 4.0, 7.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.581073760986328, -9.288092613220215, -8.995112419128418, -8.702131271362305, -8.409150123596191, -8.116168975830078, -7.823188781738281, -7.530207633972168, -7.237226963043213, -6.944246292114258, -6.6512651443481445, -6.3582844734191895, -6.065303802490234, -5.772322654724121, -5.479341983795166, -5.186361312866211, -4.893380165100098, -4.600399494171143, -4.307418346405029, -4.014437675476074, -3.72145676612854, -3.428475856781006, -3.135495185852051, -2.8425142765045166, -2.5495333671569824, -2.2565524578094482, -1.9635716676712036, -1.670590877532959, -1.3776099681854248, -1.0846290588378906, -0.791648268699646, -0.49866747856140137, -0.20568561553955078, 0.08729523420333862, 0.380276083946228, 0.6732569336891174, 0.9662377834320068, 1.259218692779541, 1.5521994829177856, 1.8451802730560303, 2.1381611824035645, 2.4311420917510986, 2.724123001098633, 3.017103672027588, 3.310084581375122, 3.6030654907226562, 3.8960461616516113, 4.189026832580566, 4.48200798034668, 4.774988651275635, 5.067969799041748, 5.360950469970703, 5.653931617736816, 5.9469122886657715, 6.239892959594727, 6.53287410736084, 6.825854778289795, 7.11883544921875, 7.411816596984863, 7.704797267913818, 7.997777938842773, 8.290759086608887, 8.583740234375, 8.876720428466797, 9.16970157623291]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 4.0, 2.0, 4.0, 7.0, 8.0, 10.0, 14.0, 9.0, 4.0, 23.0, 20.0, 23.0, 18.0, 21.0, 22.0, 40.0, 37.0, 34.0, 38.0, 38.0, 37.0, 34.0, 42.0, 48.0, 45.0, 39.0, 52.0, 43.0, 37.0, 30.0, 29.0, 21.0, 29.0, 17.0, 26.0, 15.0, 18.0, 20.0, 13.0, 5.0, 5.0, 3.0, 7.0, 3.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.7284574508667, -11.350062370300293, -10.97166633605957, -10.593271255493164, -10.214875221252441, -9.836480140686035, -9.458084106445312, -9.079689025878906, -8.7012939453125, -8.322898864746094, -7.944502830505371, -7.566107749938965, -7.187711715698242, -6.809316635131836, -6.4309210777282715, -6.052525520324707, -5.674129486083984, -5.29573392868042, -4.9173383712768555, -4.538943290710449, -4.160547256469727, -3.782151937484741, -3.403756618499756, -3.0253610610961914, -2.646965503692627, -2.2685699462890625, -1.8901745080947876, -1.5117790699005127, -1.1333835124969482, -0.7549879550933838, -0.37659263610839844, 0.0018029212951660156, 0.38019752502441406, 0.7585930228233337, 1.1369885206222534, 1.5153839588165283, 1.8937795162200928, 2.2721750736236572, 2.6505703926086426, 3.028965950012207, 3.4073615074157715, 3.785757064819336, 4.1641526222229, 4.542548179626465, 4.920943260192871, 5.299339294433594, 5.677734375, 6.0561299324035645, 6.434525489807129, 6.812921047210693, 7.191316604614258, 7.569711685180664, 7.948107719421387, 8.326502799987793, 8.704898834228516, 9.083293914794922, 9.461688995361328, 9.840084075927734, 10.218480110168457, 10.596875190734863, 10.975271224975586, 11.353666305541992, 11.732061386108398, 12.110457420349121, 12.488853454589844]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 6.0, 11.0, 26.0, 26.0, 53.0, 88.0, 116.0, 168.0, 251.0, 348.0, 538.0, 856.0, 1237.0, 1875.0, 2950.0, 4523.0, 7155.0, 11365.0, 18852.0, 33673.0, 63181.0, 122789.0, 233218.0, 249569.0, 135287.0, 69307.0, 36901.0, 20754.0, 12104.0, 7462.0, 4810.0, 3098.0, 2049.0, 1289.0, 856.0, 607.0, 394.0, 248.0, 174.0, 112.0, 82.0, 56.0, 32.0, 16.0, 13.0, 14.0, 11.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.34375, -24.528076171875, -23.71240234375, -22.896728515625, -22.0810546875, -21.265380859375, -20.44970703125, -19.634033203125, -18.818359375, -18.002685546875, -17.18701171875, -16.371337890625, -15.5556640625, -14.739990234375, -13.92431640625, -13.108642578125, -12.29296875, -11.477294921875, -10.66162109375, -9.845947265625, -9.0302734375, -8.214599609375, -7.39892578125, -6.583251953125, -5.767578125, -4.951904296875, -4.13623046875, -3.320556640625, -2.5048828125, -1.689208984375, -0.87353515625, -0.057861328125, 0.7578125, 1.573486328125, 2.38916015625, 3.204833984375, 4.0205078125, 4.836181640625, 5.65185546875, 6.467529296875, 7.283203125, 8.098876953125, 8.91455078125, 9.730224609375, 10.5458984375, 11.361572265625, 12.17724609375, 12.992919921875, 13.80859375, 14.624267578125, 15.43994140625, 16.255615234375, 17.0712890625, 17.886962890625, 18.70263671875, 19.518310546875, 20.333984375, 21.149658203125, 21.96533203125, 22.781005859375, 23.5966796875, 24.412353515625, 25.22802734375, 26.043701171875, 26.859375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 7.0, 8.0, 7.0, 6.0, 10.0, 9.0, 31.0, 18.0, 18.0, 22.0, 25.0, 31.0, 25.0, 35.0, 26.0, 34.0, 36.0, 34.0, 52.0, 29.0, 45.0, 44.0, 28.0, 44.0, 42.0, 29.0, 37.0, 32.0, 29.0, 31.0, 27.0, 19.0, 16.0, 19.0, 11.0, 11.0, 13.0, 15.0, 7.0, 9.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.8515625, -9.5291748046875, -9.206787109375, -8.8843994140625, -8.56201171875, -8.2396240234375, -7.917236328125, -7.5948486328125, -7.2724609375, -6.9500732421875, -6.627685546875, -6.3052978515625, -5.98291015625, -5.6605224609375, -5.338134765625, -5.0157470703125, -4.693359375, -4.3709716796875, -4.048583984375, -3.7261962890625, -3.40380859375, -3.0814208984375, -2.759033203125, -2.4366455078125, -2.1142578125, -1.7918701171875, -1.469482421875, -1.1470947265625, -0.82470703125, -0.5023193359375, -0.179931640625, 0.1424560546875, 0.46484375, 0.7872314453125, 1.109619140625, 1.4320068359375, 1.75439453125, 2.0767822265625, 2.399169921875, 2.7215576171875, 3.0439453125, 3.3663330078125, 3.688720703125, 4.0111083984375, 4.33349609375, 4.6558837890625, 4.978271484375, 5.3006591796875, 5.623046875, 5.9454345703125, 6.267822265625, 6.5902099609375, 6.91259765625, 7.2349853515625, 7.557373046875, 7.8797607421875, 8.2021484375, 8.5245361328125, 8.846923828125, 9.1693115234375, 9.49169921875, 9.8140869140625, 10.136474609375, 10.4588623046875, 10.78125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 9.0, 16.0, 21.0, 27.0, 32.0, 30.0, 50.0, 59.0, 82.0, 129.0, 209.0, 252.0, 423.0, 600.0, 1004.0, 1916.0, 4231.0, 12062.0, 53128.0, 697902.0, 232249.0, 29006.0, 8054.0, 3037.0, 1487.0, 829.0, 519.0, 339.0, 241.0, 141.0, 120.0, 87.0, 88.0, 35.0, 28.0, 18.0, 15.0, 23.0, 17.0, 13.0, 8.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-53.6875, -51.7578125, -49.828125, -47.8984375, -45.96875, -44.0390625, -42.109375, -40.1796875, -38.25, -36.3203125, -34.390625, -32.4609375, -30.53125, -28.6015625, -26.671875, -24.7421875, -22.8125, -20.8828125, -18.953125, -17.0234375, -15.09375, -13.1640625, -11.234375, -9.3046875, -7.375, -5.4453125, -3.515625, -1.5859375, 0.34375, 2.2734375, 4.203125, 6.1328125, 8.0625, 9.9921875, 11.921875, 13.8515625, 15.78125, 17.7109375, 19.640625, 21.5703125, 23.5, 25.4296875, 27.359375, 29.2890625, 31.21875, 33.1484375, 35.078125, 37.0078125, 38.9375, 40.8671875, 42.796875, 44.7265625, 46.65625, 48.5859375, 50.515625, 52.4453125, 54.375, 56.3046875, 58.234375, 60.1640625, 62.09375, 64.0234375, 65.953125, 67.8828125, 69.8125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 11.0, 12.0, 8.0, 13.0, 19.0, 21.0, 29.0, 19.0, 33.0, 34.0, 27.0, 32.0, 33.0, 43.0, 48.0, 52.0, 41.0, 46.0, 50.0, 51.0, 44.0, 37.0, 33.0, 42.0, 26.0, 30.0, 30.0, 27.0, 19.0, 21.0, 13.0, 14.0, 9.0, 10.0, 7.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.108642578125, -7.85009765625, -7.591552734375, -7.3330078125, -7.074462890625, -6.81591796875, -6.557373046875, -6.298828125, -6.040283203125, -5.78173828125, -5.523193359375, -5.2646484375, -5.006103515625, -4.74755859375, -4.489013671875, -4.23046875, -3.971923828125, -3.71337890625, -3.454833984375, -3.1962890625, -2.937744140625, -2.67919921875, -2.420654296875, -2.162109375, -1.903564453125, -1.64501953125, -1.386474609375, -1.1279296875, -0.869384765625, -0.61083984375, -0.352294921875, -0.09375, 0.164794921875, 0.42333984375, 0.681884765625, 0.9404296875, 1.198974609375, 1.45751953125, 1.716064453125, 1.974609375, 2.233154296875, 2.49169921875, 2.750244140625, 3.0087890625, 3.267333984375, 3.52587890625, 3.784423828125, 4.04296875, 4.301513671875, 4.56005859375, 4.818603515625, 5.0771484375, 5.335693359375, 5.59423828125, 5.852783203125, 6.111328125, 6.369873046875, 6.62841796875, 6.886962890625, 7.1455078125, 7.404052734375, 7.66259765625, 7.921142578125, 8.1796875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 12.0, 17.0, 10.0, 17.0, 20.0, 28.0, 30.0, 50.0, 69.0, 66.0, 117.0, 142.0, 173.0, 200.0, 277.0, 395.0, 544.0, 801.0, 1219.0, 1837.0, 2947.0, 5162.0, 9763.0, 22359.0, 72449.0, 678153.0, 181896.0, 37482.0, 14262.0, 6907.0, 3877.0, 2316.0, 1442.0, 990.0, 663.0, 448.0, 348.0, 233.0, 180.0, 165.0, 115.0, 82.0, 74.0, 37.0, 45.0, 33.0, 21.0, 20.0, 19.0, 17.0, 7.0, 8.0, 6.0, 4.0, 2.0, 3.0], "bins": [-34.65625, -33.62939453125, -32.6025390625, -31.57568359375, -30.548828125, -29.52197265625, -28.4951171875, -27.46826171875, -26.44140625, -25.41455078125, -24.3876953125, -23.36083984375, -22.333984375, -21.30712890625, -20.2802734375, -19.25341796875, -18.2265625, -17.19970703125, -16.1728515625, -15.14599609375, -14.119140625, -13.09228515625, -12.0654296875, -11.03857421875, -10.01171875, -8.98486328125, -7.9580078125, -6.93115234375, -5.904296875, -4.87744140625, -3.8505859375, -2.82373046875, -1.796875, -0.77001953125, 0.2568359375, 1.28369140625, 2.310546875, 3.33740234375, 4.3642578125, 5.39111328125, 6.41796875, 7.44482421875, 8.4716796875, 9.49853515625, 10.525390625, 11.55224609375, 12.5791015625, 13.60595703125, 14.6328125, 15.65966796875, 16.6865234375, 17.71337890625, 18.740234375, 19.76708984375, 20.7939453125, 21.82080078125, 22.84765625, 23.87451171875, 24.9013671875, 25.92822265625, 26.955078125, 27.98193359375, 29.0087890625, 30.03564453125, 31.0625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 4.0, 15.0, 7.0, 14.0, 11.0, 19.0, 20.0, 37.0, 30.0, 72.0, 135.0, 212.0, 130.0, 69.0, 47.0, 43.0, 42.0, 23.0, 13.0, 10.0, 7.0, 3.0, 12.0, 6.0, 1.0, 3.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0028839111328125, -0.002800464630126953, -0.0027170181274414062, -0.0026335716247558594, -0.0025501251220703125, -0.0024666786193847656, -0.0023832321166992188, -0.002299785614013672, -0.002216339111328125, -0.002132892608642578, -0.0020494461059570312, -0.0019659996032714844, -0.0018825531005859375, -0.0017991065979003906, -0.0017156600952148438, -0.0016322135925292969, -0.00154876708984375, -0.0014653205871582031, -0.0013818740844726562, -0.0012984275817871094, -0.0012149810791015625, -0.0011315345764160156, -0.0010480880737304688, -0.0009646415710449219, -0.000881195068359375, -0.0007977485656738281, -0.0007143020629882812, -0.0006308555603027344, -0.0005474090576171875, -0.0004639625549316406, -0.00038051605224609375, -0.0002970695495605469, -0.000213623046875, -0.00013017654418945312, -4.673004150390625e-05, 3.6716461181640625e-05, 0.0001201629638671875, 0.00020360946655273438, 0.00028705596923828125, 0.0003705024719238281, 0.000453948974609375, 0.0005373954772949219, 0.0006208419799804688, 0.0007042884826660156, 0.0007877349853515625, 0.0008711814880371094, 0.0009546279907226562, 0.0010380744934082031, 0.00112152099609375, 0.0012049674987792969, 0.0012884140014648438, 0.0013718605041503906, 0.0014553070068359375, 0.0015387535095214844, 0.0016222000122070312, 0.0017056465148925781, 0.001789093017578125, 0.0018725395202636719, 0.0019559860229492188, 0.0020394325256347656, 0.0021228790283203125, 0.0022063255310058594, 0.0022897720336914062, 0.002373218536376953, 0.0024566650390625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 3.0, 6.0, 1.0, 7.0, 10.0, 17.0, 20.0, 23.0, 24.0, 37.0, 102.0, 661.0, 23950.0, 1010797.0, 12165.0, 476.0, 83.0, 38.0, 28.0, 16.0, 18.0, 12.0, 6.0, 6.0, 5.0, 9.0, 2.0, 4.0, 6.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-149.125, -144.6640625, -140.203125, -135.7421875, -131.28125, -126.8203125, -122.359375, -117.8984375, -113.4375, -108.9765625, -104.515625, -100.0546875, -95.59375, -91.1328125, -86.671875, -82.2109375, -77.75, -73.2890625, -68.828125, -64.3671875, -59.90625, -55.4453125, -50.984375, -46.5234375, -42.0625, -37.6015625, -33.140625, -28.6796875, -24.21875, -19.7578125, -15.296875, -10.8359375, -6.375, -1.9140625, 2.546875, 7.0078125, 11.46875, 15.9296875, 20.390625, 24.8515625, 29.3125, 33.7734375, 38.234375, 42.6953125, 47.15625, 51.6171875, 56.078125, 60.5390625, 65.0, 69.4609375, 73.921875, 78.3828125, 82.84375, 87.3046875, 91.765625, 96.2265625, 100.6875, 105.1484375, 109.609375, 114.0703125, 118.53125, 122.9921875, 127.453125, 131.9140625, 136.375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 5.0, 1.0, 6.0, 1.0, 2.0, 6.0, 6.0, 7.0, 7.0, 15.0, 14.0, 14.0, 20.0, 32.0, 38.0, 69.0, 82.0, 111.0, 132.0, 104.0, 83.0, 67.0, 44.0, 29.0, 19.0, 15.0, 12.0, 7.0, 10.0, 3.0, 5.0, 4.0, 5.0, 7.0, 3.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.34765625, -6.158203125, -5.96875, -5.779296875, -5.58984375, -5.400390625, -5.2109375, -5.021484375, -4.83203125, -4.642578125, -4.453125, -4.263671875, -4.07421875, -3.884765625, -3.6953125, -3.505859375, -3.31640625, -3.126953125, -2.9375, -2.748046875, -2.55859375, -2.369140625, -2.1796875, -1.990234375, -1.80078125, -1.611328125, -1.421875, -1.232421875, -1.04296875, -0.853515625, -0.6640625, -0.474609375, -0.28515625, -0.095703125, 0.09375, 0.283203125, 0.47265625, 0.662109375, 0.8515625, 1.041015625, 1.23046875, 1.419921875, 1.609375, 1.798828125, 1.98828125, 2.177734375, 2.3671875, 2.556640625, 2.74609375, 2.935546875, 3.125, 3.314453125, 3.50390625, 3.693359375, 3.8828125, 4.072265625, 4.26171875, 4.451171875, 4.640625, 4.830078125, 5.01953125, 5.208984375, 5.3984375, 5.587890625, 5.77734375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 4.0, 4.0, 10.0, 13.0, 15.0, 21.0, 19.0, 24.0, 28.0, 44.0, 41.0, 41.0, 53.0, 49.0, 58.0, 61.0, 54.0, 60.0, 70.0, 48.0, 40.0, 37.0, 52.0, 25.0, 31.0, 20.0, 17.0, 11.0, 17.0, 13.0, 6.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.13398551940918, -14.742134094238281, -14.350281715393066, -13.958430290222168, -13.566577911376953, -13.174726486206055, -12.782875061035156, -12.391022682189941, -11.999171257019043, -11.607319831848145, -11.21546745300293, -10.823616027832031, -10.431763648986816, -10.039912223815918, -9.648059844970703, -9.256208419799805, -8.864356994628906, -8.472505569458008, -8.080653190612793, -7.6888017654418945, -7.296949863433838, -6.905097961425781, -6.513246059417725, -6.121394157409668, -5.729541778564453, -5.3376898765563965, -4.94583797454834, -4.553986549377441, -4.162134647369385, -3.770282745361328, -3.3784308433532715, -2.986579179763794, -2.5947275161743164, -2.2028756141662598, -1.8110239505767822, -1.4191720485687256, -1.0273202657699585, -0.6354684829711914, -0.24361658096313477, 0.14823508262634277, 0.5400869846343994, 0.9319387674331665, 1.3237905502319336, 1.7156424522399902, 2.107494354248047, 2.4993460178375244, 2.891197919845581, 3.2830495834350586, 3.6749014854431152, 4.066753387451172, 4.4586052894592285, 4.850457191467285, 5.242308616638184, 5.63416051864624, 6.026012420654297, 6.417863845825195, 6.80971622467041, 7.201568126678467, 7.593420028686523, 7.985271453857422, 8.377123832702637, 8.768975257873535, 9.16082763671875, 9.552679061889648, 9.944530487060547]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 7.0, 10.0, 6.0, 15.0, 11.0, 17.0, 16.0, 16.0, 23.0, 34.0, 34.0, 32.0, 37.0, 27.0, 39.0, 38.0, 38.0, 49.0, 42.0, 29.0, 34.0, 36.0, 53.0, 43.0, 50.0, 39.0, 43.0, 30.0, 16.0, 28.0, 23.0, 13.0, 14.0, 11.0, 16.0, 4.0, 7.0, 5.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.904741287231445, -9.562287330627441, -9.219834327697754, -8.87738037109375, -8.534926414489746, -8.192472457885742, -7.850019454956055, -7.507565498352051, -7.165112018585205, -6.822658538818359, -6.4802045822143555, -6.13775110244751, -5.795297622680664, -5.45284366607666, -5.1103901863098145, -4.767936706542969, -4.425482749938965, -4.083029270172119, -3.7405753135681152, -3.3981218338012695, -3.0556681156158447, -2.71321439743042, -2.370760917663574, -2.0283071994781494, -1.6858534812927246, -1.3433997631072998, -1.0009461641311646, -0.6584925651550293, -0.3160388469696045, 0.026414871215820312, 0.368868350982666, 0.7113220691680908, 1.0537748336791992, 1.396228551864624, 1.7386821508407593, 2.0811357498168945, 2.4235894680023193, 2.766043186187744, 3.10849666595459, 3.4509503841400146, 3.7934041023254395, 4.135857582092285, 4.478311538696289, 4.820765018463135, 5.1632184982299805, 5.505672454833984, 5.84812593460083, 6.190579414367676, 6.53303337097168, 6.875486850738525, 7.217940807342529, 7.560394287109375, 7.902848243713379, 8.245302200317383, 8.58775520324707, 8.930209159851074, 9.272663116455078, 9.615117073059082, 9.95757007598877, 10.300024032592773, 10.642477989196777, 10.984931945800781, 11.327384948730469, 11.669838905334473, 12.01229190826416]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 8.0, 9.0, 16.0, 19.0, 23.0, 47.0, 53.0, 94.0, 143.0, 229.0, 384.0, 699.0, 1308.0, 2339.0, 4365.0, 8164.0, 14965.0, 27995.0, 50690.0, 85121.0, 131307.0, 171213.0, 177290.0, 144173.0, 96924.0, 58782.0, 32901.0, 18012.0, 9764.0, 5195.0, 2761.0, 1504.0, 849.0, 497.0, 267.0, 145.0, 111.0, 62.0, 39.0, 23.0, 23.0, 19.0, 8.0, 7.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.875, -12.43310546875, -11.9912109375, -11.54931640625, -11.107421875, -10.66552734375, -10.2236328125, -9.78173828125, -9.33984375, -8.89794921875, -8.4560546875, -8.01416015625, -7.572265625, -7.13037109375, -6.6884765625, -6.24658203125, -5.8046875, -5.36279296875, -4.9208984375, -4.47900390625, -4.037109375, -3.59521484375, -3.1533203125, -2.71142578125, -2.26953125, -1.82763671875, -1.3857421875, -0.94384765625, -0.501953125, -0.06005859375, 0.3818359375, 0.82373046875, 1.265625, 1.70751953125, 2.1494140625, 2.59130859375, 3.033203125, 3.47509765625, 3.9169921875, 4.35888671875, 4.80078125, 5.24267578125, 5.6845703125, 6.12646484375, 6.568359375, 7.01025390625, 7.4521484375, 7.89404296875, 8.3359375, 8.77783203125, 9.2197265625, 9.66162109375, 10.103515625, 10.54541015625, 10.9873046875, 11.42919921875, 11.87109375, 12.31298828125, 12.7548828125, 13.19677734375, 13.638671875, 14.08056640625, 14.5224609375, 14.96435546875, 15.40625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 12.0, 7.0, 9.0, 6.0, 12.0, 22.0, 13.0, 28.0, 26.0, 23.0, 20.0, 29.0, 36.0, 39.0, 28.0, 49.0, 29.0, 44.0, 38.0, 45.0, 40.0, 39.0, 33.0, 37.0, 42.0, 35.0, 37.0, 30.0, 36.0, 29.0, 14.0, 25.0, 19.0, 11.0, 15.0, 8.0, 7.0, 9.0, 7.0, 0.0, 7.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.6640625, -5.4593505859375, -5.254638671875, -5.0499267578125, -4.84521484375, -4.6405029296875, -4.435791015625, -4.2310791015625, -4.0263671875, -3.8216552734375, -3.616943359375, -3.4122314453125, -3.20751953125, -3.0028076171875, -2.798095703125, -2.5933837890625, -2.388671875, -2.1839599609375, -1.979248046875, -1.7745361328125, -1.56982421875, -1.3651123046875, -1.160400390625, -0.9556884765625, -0.7509765625, -0.5462646484375, -0.341552734375, -0.1368408203125, 0.06787109375, 0.2725830078125, 0.477294921875, 0.6820068359375, 0.88671875, 1.0914306640625, 1.296142578125, 1.5008544921875, 1.70556640625, 1.9102783203125, 2.114990234375, 2.3197021484375, 2.5244140625, 2.7291259765625, 2.933837890625, 3.1385498046875, 3.34326171875, 3.5479736328125, 3.752685546875, 3.9573974609375, 4.162109375, 4.3668212890625, 4.571533203125, 4.7762451171875, 4.98095703125, 5.1856689453125, 5.390380859375, 5.5950927734375, 5.7998046875, 6.0045166015625, 6.209228515625, 6.4139404296875, 6.61865234375, 6.8233642578125, 7.028076171875, 7.2327880859375, 7.4375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 5.0, 7.0, 4.0, 7.0, 7.0, 8.0, 8.0, 12.0, 17.0, 15.0, 21.0, 22.0, 28.0, 27.0, 23.0, 28.0, 21.0, 35.0, 46.0, 34.0, 147.0, 4708.0, 301022.0, 720895.0, 20546.0, 440.0, 57.0, 43.0, 36.0, 25.0, 32.0, 29.0, 26.0, 32.0, 7.0, 18.0, 17.0, 16.0, 11.0, 10.0, 16.0, 11.0, 3.0, 7.0, 3.0, 6.0, 6.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-90.5625, -87.5615234375, -84.560546875, -81.5595703125, -78.55859375, -75.5576171875, -72.556640625, -69.5556640625, -66.5546875, -63.5537109375, -60.552734375, -57.5517578125, -54.55078125, -51.5498046875, -48.548828125, -45.5478515625, -42.546875, -39.5458984375, -36.544921875, -33.5439453125, -30.54296875, -27.5419921875, -24.541015625, -21.5400390625, -18.5390625, -15.5380859375, -12.537109375, -9.5361328125, -6.53515625, -3.5341796875, -0.533203125, 2.4677734375, 5.46875, 8.4697265625, 11.470703125, 14.4716796875, 17.47265625, 20.4736328125, 23.474609375, 26.4755859375, 29.4765625, 32.4775390625, 35.478515625, 38.4794921875, 41.48046875, 44.4814453125, 47.482421875, 50.4833984375, 53.484375, 56.4853515625, 59.486328125, 62.4873046875, 65.48828125, 68.4892578125, 71.490234375, 74.4912109375, 77.4921875, 80.4931640625, 83.494140625, 86.4951171875, 89.49609375, 92.4970703125, 95.498046875, 98.4990234375, 101.5]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 6.0, 6.0, 5.0, 8.0, 7.0, 7.0, 8.0, 12.0, 14.0, 27.0, 17.0, 29.0, 24.0, 23.0, 30.0, 29.0, 30.0, 30.0, 40.0, 45.0, 46.0, 27.0, 36.0, 26.0, 41.0, 38.0, 49.0, 39.0, 35.0, 24.0, 28.0, 33.0, 21.0, 21.0, 21.0, 19.0, 17.0, 11.0, 14.0, 15.0, 5.0, 7.0, 6.0, 5.0, 3.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.265625, -6.0545654296875, -5.843505859375, -5.6324462890625, -5.42138671875, -5.2103271484375, -4.999267578125, -4.7882080078125, -4.5771484375, -4.3660888671875, -4.155029296875, -3.9439697265625, -3.73291015625, -3.5218505859375, -3.310791015625, -3.0997314453125, -2.888671875, -2.6776123046875, -2.466552734375, -2.2554931640625, -2.04443359375, -1.8333740234375, -1.622314453125, -1.4112548828125, -1.2001953125, -0.9891357421875, -0.778076171875, -0.5670166015625, -0.35595703125, -0.1448974609375, 0.066162109375, 0.2772216796875, 0.48828125, 0.6993408203125, 0.910400390625, 1.1214599609375, 1.33251953125, 1.5435791015625, 1.754638671875, 1.9656982421875, 2.1767578125, 2.3878173828125, 2.598876953125, 2.8099365234375, 3.02099609375, 3.2320556640625, 3.443115234375, 3.6541748046875, 3.865234375, 4.0762939453125, 4.287353515625, 4.4984130859375, 4.70947265625, 4.9205322265625, 5.131591796875, 5.3426513671875, 5.5537109375, 5.7647705078125, 5.975830078125, 6.1868896484375, 6.39794921875, 6.6090087890625, 6.820068359375, 7.0311279296875, 7.2421875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 7.0, 10.0, 30.0, 32.0, 60.0, 83.0, 121.0, 168.0, 329.0, 464.0, 671.0, 1060.0, 1735.0, 2769.0, 4627.0, 7498.0, 12947.0, 23331.0, 45777.0, 96536.0, 257522.0, 348675.0, 122978.0, 55074.0, 27969.0, 15264.0, 8798.0, 5342.0, 3180.0, 1916.0, 1261.0, 834.0, 558.0, 308.0, 180.0, 122.0, 95.0, 69.0, 48.0, 26.0, 21.0, 11.0, 13.0, 4.0, 7.0, 6.0, 3.0, 4.0, 3.0, 2.0], "bins": [-5.87890625, -5.71160888671875, -5.5443115234375, -5.37701416015625, -5.209716796875, -5.04241943359375, -4.8751220703125, -4.70782470703125, -4.54052734375, -4.37322998046875, -4.2059326171875, -4.03863525390625, -3.871337890625, -3.70404052734375, -3.5367431640625, -3.36944580078125, -3.2021484375, -3.03485107421875, -2.8675537109375, -2.70025634765625, -2.532958984375, -2.36566162109375, -2.1983642578125, -2.03106689453125, -1.86376953125, -1.69647216796875, -1.5291748046875, -1.36187744140625, -1.194580078125, -1.02728271484375, -0.8599853515625, -0.69268798828125, -0.525390625, -0.35809326171875, -0.1907958984375, -0.02349853515625, 0.143798828125, 0.31109619140625, 0.4783935546875, 0.64569091796875, 0.81298828125, 0.98028564453125, 1.1475830078125, 1.31488037109375, 1.482177734375, 1.64947509765625, 1.8167724609375, 1.98406982421875, 2.1513671875, 2.31866455078125, 2.4859619140625, 2.65325927734375, 2.820556640625, 2.98785400390625, 3.1551513671875, 3.32244873046875, 3.48974609375, 3.65704345703125, 3.8243408203125, 3.99163818359375, 4.158935546875, 4.32623291015625, 4.4935302734375, 4.66082763671875, 4.828125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 4.0, 9.0, 12.0, 11.0, 17.0, 16.0, 19.0, 29.0, 37.0, 51.0, 50.0, 63.0, 64.0, 94.0, 92.0, 80.0, 66.0, 47.0, 40.0, 40.0, 25.0, 22.0, 17.0, 22.0, 11.0, 7.0, 9.0, 8.0, 9.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0008687973022460938, -0.0008444711565971375, -0.0008201450109481812, -0.0007958188652992249, -0.0007714927196502686, -0.0007471665740013123, -0.000722840428352356, -0.0006985142827033997, -0.0006741881370544434, -0.0006498619914054871, -0.0006255358457565308, -0.0006012097001075745, -0.0005768835544586182, -0.0005525574088096619, -0.0005282312631607056, -0.0005039051175117493, -0.00047957897186279297, -0.00045525282621383667, -0.00043092668056488037, -0.00040660053491592407, -0.0003822743892669678, -0.0003579482436180115, -0.0003336220979690552, -0.0003092959523200989, -0.0002849698066711426, -0.0002606436610221863, -0.00023631751537322998, -0.00021199136972427368, -0.00018766522407531738, -0.00016333907842636108, -0.00013901293277740479, -0.00011468678712844849, -9.036064147949219e-05, -6.603449583053589e-05, -4.170835018157959e-05, -1.738220453262329e-05, 6.943941116333008e-06, 3.127008676528931e-05, 5.5596232414245605e-05, 7.99223780632019e-05, 0.0001042485237121582, 0.0001285746693611145, 0.0001529008150100708, 0.0001772269606590271, 0.0002015531063079834, 0.0002258792519569397, 0.000250205397605896, 0.0002745315432548523, 0.0002988576889038086, 0.0003231838345527649, 0.0003475099802017212, 0.0003718361258506775, 0.0003961622714996338, 0.0004204884171485901, 0.0004448145627975464, 0.0004691407084465027, 0.000493466854095459, 0.0005177929997444153, 0.0005421191453933716, 0.0005664452910423279, 0.0005907714366912842, 0.0006150975823402405, 0.0006394237279891968, 0.0006637498736381531, 0.0006880760192871094]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 7.0, 4.0, 12.0, 11.0, 10.0, 17.0, 13.0, 16.0, 29.0, 33.0, 43.0, 69.0, 189.0, 1032.0, 10360.0, 355760.0, 663286.0, 15744.0, 1413.0, 224.0, 66.0, 38.0, 24.0, 28.0, 24.0, 25.0, 13.0, 11.0, 14.0, 6.0, 6.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.84375, -23.076416015625, -22.30908203125, -21.541748046875, -20.7744140625, -20.007080078125, -19.23974609375, -18.472412109375, -17.705078125, -16.937744140625, -16.17041015625, -15.403076171875, -14.6357421875, -13.868408203125, -13.10107421875, -12.333740234375, -11.56640625, -10.799072265625, -10.03173828125, -9.264404296875, -8.4970703125, -7.729736328125, -6.96240234375, -6.195068359375, -5.427734375, -4.660400390625, -3.89306640625, -3.125732421875, -2.3583984375, -1.591064453125, -0.82373046875, -0.056396484375, 0.7109375, 1.478271484375, 2.24560546875, 3.012939453125, 3.7802734375, 4.547607421875, 5.31494140625, 6.082275390625, 6.849609375, 7.616943359375, 8.38427734375, 9.151611328125, 9.9189453125, 10.686279296875, 11.45361328125, 12.220947265625, 12.98828125, 13.755615234375, 14.52294921875, 15.290283203125, 16.0576171875, 16.824951171875, 17.59228515625, 18.359619140625, 19.126953125, 19.894287109375, 20.66162109375, 21.428955078125, 22.1962890625, 22.963623046875, 23.73095703125, 24.498291015625, 25.265625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 5.0, 10.0, 7.0, 7.0, 10.0, 11.0, 17.0, 11.0, 15.0, 24.0, 41.0, 32.0, 39.0, 42.0, 44.0, 58.0, 72.0, 70.0, 59.0, 77.0, 59.0, 35.0, 45.0, 32.0, 27.0, 23.0, 23.0, 15.0, 17.0, 19.0, 9.0, 11.0, 9.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5, -1.4529876708984375, -1.405975341796875, -1.3589630126953125, -1.31195068359375, -1.2649383544921875, -1.217926025390625, -1.1709136962890625, -1.1239013671875, -1.0768890380859375, -1.029876708984375, -0.9828643798828125, -0.93585205078125, -0.8888397216796875, -0.841827392578125, -0.7948150634765625, -0.747802734375, -0.7007904052734375, -0.653778076171875, -0.6067657470703125, -0.55975341796875, -0.5127410888671875, -0.465728759765625, -0.4187164306640625, -0.3717041015625, -0.3246917724609375, -0.277679443359375, -0.2306671142578125, -0.18365478515625, -0.1366424560546875, -0.089630126953125, -0.0426177978515625, 0.00439453125, 0.0514068603515625, 0.098419189453125, 0.1454315185546875, 0.19244384765625, 0.2394561767578125, 0.286468505859375, 0.3334808349609375, 0.3804931640625, 0.4275054931640625, 0.474517822265625, 0.5215301513671875, 0.56854248046875, 0.6155548095703125, 0.662567138671875, 0.7095794677734375, 0.756591796875, 0.8036041259765625, 0.850616455078125, 0.8976287841796875, 0.94464111328125, 0.9916534423828125, 1.038665771484375, 1.0856781005859375, 1.1326904296875, 1.1797027587890625, 1.226715087890625, 1.2737274169921875, 1.32073974609375, 1.3677520751953125, 1.414764404296875, 1.4617767333984375, 1.5087890625]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 18.0, 53.0, 120.0, 223.0, 274.0, 191.0, 91.0, 24.0, 11.0, 2.0, 2.0, 1.0], "bins": [-70.91986846923828, -69.6584701538086, -68.3970718383789, -67.13568115234375, -65.87428283691406, -64.61288452148438, -63.35148620605469, -62.090091705322266, -60.82869338989258, -59.56729507446289, -58.30590057373047, -57.04450225830078, -55.78310775756836, -54.52170944213867, -53.26031494140625, -51.99891662597656, -50.737518310546875, -49.47611999511719, -48.214725494384766, -46.95332717895508, -45.691932678222656, -44.43053436279297, -43.16913604736328, -41.90774154663086, -40.64634704589844, -39.38494873046875, -38.12355422973633, -36.86215591430664, -35.60076141357422, -34.33936309814453, -33.077964782714844, -31.816570281982422, -30.5551700592041, -29.293773651123047, -28.032377243041992, -26.770980834960938, -25.50958251953125, -24.248186111450195, -22.98678970336914, -21.725391387939453, -20.46399688720703, -19.202600479125977, -17.941204071044922, -16.679805755615234, -15.41840934753418, -14.157012939453125, -12.89561653137207, -11.6342191696167, -10.372821807861328, -9.111425399780273, -7.850028038024902, -6.588631629943848, -5.327234745025635, -4.065837860107422, -2.804441452026367, -1.543044090270996, -0.2816476821899414, 0.9797490835189819, 2.2411458492279053, 3.502542495727539, 4.763939380645752, 6.025336265563965, 7.2867326736450195, 8.54813003540039, 9.809526443481445]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 8.0, 5.0, 3.0, 7.0, 7.0, 9.0, 13.0, 17.0, 8.0, 13.0, 20.0, 20.0, 26.0, 27.0, 30.0, 27.0, 43.0, 31.0, 51.0, 33.0, 35.0, 33.0, 40.0, 31.0, 45.0, 33.0, 37.0, 31.0, 39.0, 36.0, 23.0, 27.0, 19.0, 28.0, 21.0, 21.0, 17.0, 14.0, 13.0, 11.0, 10.0, 14.0, 9.0, 10.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-10.352606773376465, -10.040038108825684, -9.727468490600586, -9.414899826049805, -9.102330207824707, -8.789761543273926, -8.477191925048828, -8.164623260498047, -7.852054119110107, -7.539484977722168, -7.2269158363342285, -6.914346694946289, -6.601778030395508, -6.28920841217041, -5.976639747619629, -5.6640706062316895, -5.35150146484375, -5.0389323234558105, -4.726363182067871, -4.413794040679932, -4.101224899291992, -3.788655996322632, -3.4760870933532715, -3.163517951965332, -2.8509488105773926, -2.538379669189453, -2.2258105278015137, -1.9132416248321533, -1.6006724834442139, -1.2881033420562744, -0.9755343198776245, -0.6629652976989746, -0.35039615631103516, -0.03782707452774048, 0.2747420072555542, 0.5873110890388489, 0.8998801708221436, 1.212449312210083, 1.525018334388733, 1.8375873565673828, 2.1501564979553223, 2.4627256393432617, 2.775294780731201, 3.0878636837005615, 3.400432825088501, 3.7130019664764404, 4.025570869445801, 4.33814001083374, 4.65070915222168, 4.963278293609619, 5.275847434997559, 5.588416576385498, 5.9009857177734375, 6.213554382324219, 6.526123523712158, 6.838692665100098, 7.151261806488037, 7.463830947875977, 7.776400089263916, 8.088969230651855, 8.401537895202637, 8.714107513427734, 9.026676177978516, 9.339244842529297, 9.651814460754395]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 6.0, 3.0, 8.0, 11.0, 7.0, 14.0, 27.0, 21.0, 32.0, 55.0, 72.0, 79.0, 126.0, 137.0, 220.0, 298.0, 392.0, 621.0, 835.0, 1210.0, 1706.0, 2613.0, 3751.0, 5776.0, 9081.0, 14469.0, 25488.0, 48833.0, 119670.0, 866640.0, 2577947.0, 342982.0, 79277.0, 36749.0, 20406.0, 12184.0, 7668.0, 4812.0, 3237.0, 2146.0, 1387.0, 990.0, 667.0, 460.0, 345.0, 255.0, 169.0, 136.0, 78.0, 53.0, 48.0, 39.0, 17.0, 11.0, 8.0, 8.0, 9.0, 3.0, 4.0, 0.0, 2.0], "bins": [-13.1015625, -12.7081298828125, -12.314697265625, -11.9212646484375, -11.52783203125, -11.1343994140625, -10.740966796875, -10.3475341796875, -9.9541015625, -9.5606689453125, -9.167236328125, -8.7738037109375, -8.38037109375, -7.9869384765625, -7.593505859375, -7.2000732421875, -6.806640625, -6.4132080078125, -6.019775390625, -5.6263427734375, -5.23291015625, -4.8394775390625, -4.446044921875, -4.0526123046875, -3.6591796875, -3.2657470703125, -2.872314453125, -2.4788818359375, -2.08544921875, -1.6920166015625, -1.298583984375, -0.9051513671875, -0.51171875, -0.1182861328125, 0.275146484375, 0.6685791015625, 1.06201171875, 1.4554443359375, 1.848876953125, 2.2423095703125, 2.6357421875, 3.0291748046875, 3.422607421875, 3.8160400390625, 4.20947265625, 4.6029052734375, 4.996337890625, 5.3897705078125, 5.783203125, 6.1766357421875, 6.570068359375, 6.9635009765625, 7.35693359375, 7.7503662109375, 8.143798828125, 8.5372314453125, 8.9306640625, 9.3240966796875, 9.717529296875, 10.1109619140625, 10.50439453125, 10.8978271484375, 11.291259765625, 11.6846923828125, 12.078125]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 7.0, 12.0, 9.0, 11.0, 11.0, 14.0, 21.0, 22.0, 30.0, 29.0, 23.0, 26.0, 47.0, 33.0, 34.0, 51.0, 36.0, 35.0, 48.0, 43.0, 45.0, 45.0, 29.0, 35.0, 34.0, 39.0, 33.0, 29.0, 14.0, 22.0, 12.0, 16.0, 25.0, 13.0, 11.0, 14.0, 8.0, 10.0, 6.0, 4.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.93359375, -6.72900390625, -6.5244140625, -6.31982421875, -6.115234375, -5.91064453125, -5.7060546875, -5.50146484375, -5.296875, -5.09228515625, -4.8876953125, -4.68310546875, -4.478515625, -4.27392578125, -4.0693359375, -3.86474609375, -3.66015625, -3.45556640625, -3.2509765625, -3.04638671875, -2.841796875, -2.63720703125, -2.4326171875, -2.22802734375, -2.0234375, -1.81884765625, -1.6142578125, -1.40966796875, -1.205078125, -1.00048828125, -0.7958984375, -0.59130859375, -0.38671875, -0.18212890625, 0.0224609375, 0.22705078125, 0.431640625, 0.63623046875, 0.8408203125, 1.04541015625, 1.25, 1.45458984375, 1.6591796875, 1.86376953125, 2.068359375, 2.27294921875, 2.4775390625, 2.68212890625, 2.88671875, 3.09130859375, 3.2958984375, 3.50048828125, 3.705078125, 3.90966796875, 4.1142578125, 4.31884765625, 4.5234375, 4.72802734375, 4.9326171875, 5.13720703125, 5.341796875, 5.54638671875, 5.7509765625, 5.95556640625, 6.16015625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 8.0, 3.0, 9.0, 10.0, 8.0, 12.0, 10.0, 22.0, 22.0, 44.0, 45.0, 53.0, 78.0, 122.0, 258.0, 2074.0, 570514.0, 3616750.0, 3508.0, 316.0, 116.0, 67.0, 63.0, 40.0, 40.0, 21.0, 13.0, 11.0, 5.0, 5.0, 10.0, 3.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-106.25, -102.830078125, -99.41015625, -95.990234375, -92.5703125, -89.150390625, -85.73046875, -82.310546875, -78.890625, -75.470703125, -72.05078125, -68.630859375, -65.2109375, -61.791015625, -58.37109375, -54.951171875, -51.53125, -48.111328125, -44.69140625, -41.271484375, -37.8515625, -34.431640625, -31.01171875, -27.591796875, -24.171875, -20.751953125, -17.33203125, -13.912109375, -10.4921875, -7.072265625, -3.65234375, -0.232421875, 3.1875, 6.607421875, 10.02734375, 13.447265625, 16.8671875, 20.287109375, 23.70703125, 27.126953125, 30.546875, 33.966796875, 37.38671875, 40.806640625, 44.2265625, 47.646484375, 51.06640625, 54.486328125, 57.90625, 61.326171875, 64.74609375, 68.166015625, 71.5859375, 75.005859375, 78.42578125, 81.845703125, 85.265625, 88.685546875, 92.10546875, 95.525390625, 98.9453125, 102.365234375, 105.78515625, 109.205078125, 112.625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 7.0, 6.0, 7.0, 8.0, 8.0, 13.0, 15.0, 22.0, 32.0, 39.0, 44.0, 67.0, 92.0, 162.0, 278.0, 724.0, 1081.0, 653.0, 326.0, 140.0, 81.0, 65.0, 58.0, 34.0, 28.0, 20.0, 9.0, 12.0, 5.0, 8.0, 4.0, 5.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.828125, -4.67010498046875, -4.5120849609375, -4.35406494140625, -4.196044921875, -4.03802490234375, -3.8800048828125, -3.72198486328125, -3.56396484375, -3.40594482421875, -3.2479248046875, -3.08990478515625, -2.931884765625, -2.77386474609375, -2.6158447265625, -2.45782470703125, -2.2998046875, -2.14178466796875, -1.9837646484375, -1.82574462890625, -1.667724609375, -1.50970458984375, -1.3516845703125, -1.19366455078125, -1.03564453125, -0.87762451171875, -0.7196044921875, -0.56158447265625, -0.403564453125, -0.24554443359375, -0.0875244140625, 0.07049560546875, 0.228515625, 0.38653564453125, 0.5445556640625, 0.70257568359375, 0.860595703125, 1.01861572265625, 1.1766357421875, 1.33465576171875, 1.49267578125, 1.65069580078125, 1.8087158203125, 1.96673583984375, 2.124755859375, 2.28277587890625, 2.4407958984375, 2.59881591796875, 2.7568359375, 2.91485595703125, 3.0728759765625, 3.23089599609375, 3.388916015625, 3.54693603515625, 3.7049560546875, 3.86297607421875, 4.02099609375, 4.17901611328125, 4.3370361328125, 4.49505615234375, 4.653076171875, 4.81109619140625, 4.9691162109375, 5.12713623046875, 5.28515625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 5.0, 10.0, 17.0, 39.0, 52.0, 84.0, 113.0, 123.0, 140.0, 144.0, 100.0, 65.0, 43.0, 32.0, 20.0, 11.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.640901565551758, -7.142813205718994, -6.644725322723389, -6.146636962890625, -5.6485490798950195, -5.150460720062256, -4.652372360229492, -4.154284477233887, -3.656196117401123, -3.1581079959869385, -2.660019874572754, -2.1619315147399902, -1.6638433933258057, -1.165755271911621, -0.6676669120788574, -0.16957879066467285, 0.3285093307495117, 0.8265975117683411, 1.3246856927871704, 1.8227739334106445, 2.320862054824829, 2.8189501762390137, 3.3170385360717773, 3.815126657485962, 4.3132147789001465, 4.81130313873291, 5.309391021728516, 5.807479381561279, 6.305567741394043, 6.803655624389648, 7.301743984222412, 7.799832344055176, 8.297920227050781, 8.796008110046387, 9.294096946716309, 9.792184829711914, 10.29027271270752, 10.788360595703125, 11.286449432373047, 11.784537315368652, 12.282625198364258, 12.780713081359863, 13.278801918029785, 13.77688980102539, 14.274977684020996, 14.773065567016602, 15.271154403686523, 15.769242286682129, 16.267330169677734, 16.765419006347656, 17.263505935668945, 17.761594772338867, 18.25968360900879, 18.757770538330078, 19.255859375, 19.753948211669922, 20.252037048339844, 20.750125885009766, 21.248212814331055, 21.746301651000977, 22.2443904876709, 22.742477416992188, 23.24056625366211, 23.73865509033203, 24.23674201965332]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 7.0, 5.0, 7.0, 6.0, 10.0, 20.0, 9.0, 16.0, 22.0, 20.0, 24.0, 23.0, 25.0, 32.0, 34.0, 31.0, 31.0, 31.0, 35.0, 38.0, 29.0, 27.0, 34.0, 35.0, 33.0, 47.0, 37.0, 29.0, 37.0, 30.0, 34.0, 25.0, 25.0, 19.0, 23.0, 12.0, 14.0, 12.0, 16.0, 12.0, 11.0, 7.0, 8.0, 4.0, 8.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0], "bins": [-7.735259056091309, -7.508742332458496, -7.282225608825684, -7.055708885192871, -6.829192161560059, -6.602675437927246, -6.376158714294434, -6.149641990661621, -5.923125267028809, -5.696608543395996, -5.470091819763184, -5.243575096130371, -5.017058372497559, -4.790541648864746, -4.564024925231934, -4.337508201599121, -4.11099100112915, -3.884474277496338, -3.6579575538635254, -3.431440830230713, -3.2049241065979004, -2.978407382965088, -2.7518904209136963, -2.525373697280884, -2.2988569736480713, -2.072340250015259, -1.8458235263824463, -1.6193066835403442, -1.3927899599075317, -1.1662732362747192, -0.9397563934326172, -0.7132396697998047, -0.4867229461669922, -0.2602061927318573, -0.03368943929672241, 0.19282734394073486, 0.41934406757354736, 0.6458607912063599, 0.8723776340484619, 1.0988943576812744, 1.325411081314087, 1.5519278049468994, 1.778444528579712, 2.0049614906311035, 2.231478214263916, 2.4579949378967285, 2.684511661529541, 2.9110283851623535, 3.137545108795166, 3.3640618324279785, 3.590578556060791, 3.8170952796936035, 4.043612003326416, 4.2701287269592285, 4.496645927429199, 4.723162651062012, 4.949679374694824, 5.176196098327637, 5.402712821960449, 5.629229545593262, 5.855746269226074, 6.082262992858887, 6.308779716491699, 6.535296440124512, 6.761813163757324]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 9.0, 16.0, 18.0, 19.0, 39.0, 52.0, 80.0, 114.0, 189.0, 275.0, 418.0, 698.0, 1179.0, 1988.0, 3309.0, 6140.0, 11489.0, 21691.0, 43468.0, 93510.0, 204522.0, 311411.0, 182321.0, 82912.0, 39299.0, 19684.0, 10268.0, 5644.0, 3130.0, 1781.0, 1101.0, 600.0, 409.0, 245.0, 174.0, 132.0, 79.0, 39.0, 29.0, 17.0, 14.0, 14.0, 6.0, 6.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.8203125, -15.3323974609375, -14.844482421875, -14.3565673828125, -13.86865234375, -13.3807373046875, -12.892822265625, -12.4049072265625, -11.9169921875, -11.4290771484375, -10.941162109375, -10.4532470703125, -9.96533203125, -9.4774169921875, -8.989501953125, -8.5015869140625, -8.013671875, -7.5257568359375, -7.037841796875, -6.5499267578125, -6.06201171875, -5.5740966796875, -5.086181640625, -4.5982666015625, -4.1103515625, -3.6224365234375, -3.134521484375, -2.6466064453125, -2.15869140625, -1.6707763671875, -1.182861328125, -0.6949462890625, -0.20703125, 0.2808837890625, 0.768798828125, 1.2567138671875, 1.74462890625, 2.2325439453125, 2.720458984375, 3.2083740234375, 3.6962890625, 4.1842041015625, 4.672119140625, 5.1600341796875, 5.64794921875, 6.1358642578125, 6.623779296875, 7.1116943359375, 7.599609375, 8.0875244140625, 8.575439453125, 9.0633544921875, 9.55126953125, 10.0391845703125, 10.527099609375, 11.0150146484375, 11.5029296875, 11.9908447265625, 12.478759765625, 12.9666748046875, 13.45458984375, 13.9425048828125, 14.430419921875, 14.9183349609375, 15.40625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 7.0, 7.0, 6.0, 17.0, 24.0, 16.0, 19.0, 32.0, 24.0, 27.0, 30.0, 34.0, 23.0, 33.0, 49.0, 36.0, 35.0, 33.0, 27.0, 35.0, 42.0, 32.0, 36.0, 47.0, 39.0, 33.0, 30.0, 24.0, 22.0, 26.0, 24.0, 25.0, 9.0, 16.0, 13.0, 9.0, 14.0, 6.0, 10.0, 5.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0390625, -5.8558349609375, -5.672607421875, -5.4893798828125, -5.30615234375, -5.1229248046875, -4.939697265625, -4.7564697265625, -4.5732421875, -4.3900146484375, -4.206787109375, -4.0235595703125, -3.84033203125, -3.6571044921875, -3.473876953125, -3.2906494140625, -3.107421875, -2.9241943359375, -2.740966796875, -2.5577392578125, -2.37451171875, -2.1912841796875, -2.008056640625, -1.8248291015625, -1.6416015625, -1.4583740234375, -1.275146484375, -1.0919189453125, -0.90869140625, -0.7254638671875, -0.542236328125, -0.3590087890625, -0.17578125, 0.0074462890625, 0.190673828125, 0.3739013671875, 0.55712890625, 0.7403564453125, 0.923583984375, 1.1068115234375, 1.2900390625, 1.4732666015625, 1.656494140625, 1.8397216796875, 2.02294921875, 2.2061767578125, 2.389404296875, 2.5726318359375, 2.755859375, 2.9390869140625, 3.122314453125, 3.3055419921875, 3.48876953125, 3.6719970703125, 3.855224609375, 4.0384521484375, 4.2216796875, 4.4049072265625, 4.588134765625, 4.7713623046875, 4.95458984375, 5.1378173828125, 5.321044921875, 5.5042724609375, 5.6875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 8.0, 7.0, 11.0, 22.0, 17.0, 17.0, 41.0, 54.0, 58.0, 75.0, 103.0, 133.0, 189.0, 268.0, 382.0, 552.0, 915.0, 1440.0, 2538.0, 4718.0, 9460.0, 21939.0, 61890.0, 358091.0, 468696.0, 70400.0, 24061.0, 10229.0, 5054.0, 2624.0, 1502.0, 1012.0, 620.0, 417.0, 271.0, 178.0, 143.0, 94.0, 78.0, 58.0, 56.0, 35.0, 24.0, 16.0, 25.0, 13.0, 5.0, 5.0, 2.0, 3.0, 7.0, 4.0, 3.0, 2.0, 2.0], "bins": [-20.9375, -20.303955078125, -19.67041015625, -19.036865234375, -18.4033203125, -17.769775390625, -17.13623046875, -16.502685546875, -15.869140625, -15.235595703125, -14.60205078125, -13.968505859375, -13.3349609375, -12.701416015625, -12.06787109375, -11.434326171875, -10.80078125, -10.167236328125, -9.53369140625, -8.900146484375, -8.2666015625, -7.633056640625, -6.99951171875, -6.365966796875, -5.732421875, -5.098876953125, -4.46533203125, -3.831787109375, -3.1982421875, -2.564697265625, -1.93115234375, -1.297607421875, -0.6640625, -0.030517578125, 0.60302734375, 1.236572265625, 1.8701171875, 2.503662109375, 3.13720703125, 3.770751953125, 4.404296875, 5.037841796875, 5.67138671875, 6.304931640625, 6.9384765625, 7.572021484375, 8.20556640625, 8.839111328125, 9.47265625, 10.106201171875, 10.73974609375, 11.373291015625, 12.0068359375, 12.640380859375, 13.27392578125, 13.907470703125, 14.541015625, 15.174560546875, 15.80810546875, 16.441650390625, 17.0751953125, 17.708740234375, 18.34228515625, 18.975830078125, 19.609375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 3.0, 7.0, 5.0, 5.0, 10.0, 12.0, 14.0, 16.0, 14.0, 22.0, 25.0, 31.0, 30.0, 40.0, 38.0, 34.0, 47.0, 45.0, 36.0, 37.0, 52.0, 43.0, 53.0, 52.0, 43.0, 38.0, 38.0, 39.0, 29.0, 22.0, 31.0, 22.0, 17.0, 13.0, 7.0, 11.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-6.0546875, -5.89349365234375, -5.7322998046875, -5.57110595703125, -5.409912109375, -5.24871826171875, -5.0875244140625, -4.92633056640625, -4.76513671875, -4.60394287109375, -4.4427490234375, -4.28155517578125, -4.120361328125, -3.95916748046875, -3.7979736328125, -3.63677978515625, -3.4755859375, -3.31439208984375, -3.1531982421875, -2.99200439453125, -2.830810546875, -2.66961669921875, -2.5084228515625, -2.34722900390625, -2.18603515625, -2.02484130859375, -1.8636474609375, -1.70245361328125, -1.541259765625, -1.38006591796875, -1.2188720703125, -1.05767822265625, -0.896484375, -0.73529052734375, -0.5740966796875, -0.41290283203125, -0.251708984375, -0.09051513671875, 0.0706787109375, 0.23187255859375, 0.39306640625, 0.55426025390625, 0.7154541015625, 0.87664794921875, 1.037841796875, 1.19903564453125, 1.3602294921875, 1.52142333984375, 1.6826171875, 1.84381103515625, 2.0050048828125, 2.16619873046875, 2.327392578125, 2.48858642578125, 2.6497802734375, 2.81097412109375, 2.97216796875, 3.13336181640625, 3.2945556640625, 3.45574951171875, 3.616943359375, 3.77813720703125, 3.9393310546875, 4.10052490234375, 4.26171875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 9.0, 11.0, 14.0, 15.0, 17.0, 27.0, 39.0, 54.0, 50.0, 76.0, 139.0, 162.0, 245.0, 366.0, 555.0, 902.0, 1570.0, 3412.0, 9445.0, 46898.0, 895502.0, 69131.0, 11387.0, 3869.0, 1759.0, 983.0, 563.0, 383.0, 291.0, 187.0, 139.0, 84.0, 60.0, 46.0, 42.0, 27.0, 23.0, 21.0, 17.0, 4.0, 10.0, 8.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-68.5, -66.3974609375, -64.294921875, -62.1923828125, -60.08984375, -57.9873046875, -55.884765625, -53.7822265625, -51.6796875, -49.5771484375, -47.474609375, -45.3720703125, -43.26953125, -41.1669921875, -39.064453125, -36.9619140625, -34.859375, -32.7568359375, -30.654296875, -28.5517578125, -26.44921875, -24.3466796875, -22.244140625, -20.1416015625, -18.0390625, -15.9365234375, -13.833984375, -11.7314453125, -9.62890625, -7.5263671875, -5.423828125, -3.3212890625, -1.21875, 0.8837890625, 2.986328125, 5.0888671875, 7.19140625, 9.2939453125, 11.396484375, 13.4990234375, 15.6015625, 17.7041015625, 19.806640625, 21.9091796875, 24.01171875, 26.1142578125, 28.216796875, 30.3193359375, 32.421875, 34.5244140625, 36.626953125, 38.7294921875, 40.83203125, 42.9345703125, 45.037109375, 47.1396484375, 49.2421875, 51.3447265625, 53.447265625, 55.5498046875, 57.65234375, 59.7548828125, 61.857421875, 63.9599609375, 66.0625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 4.0, 16.0, 16.0, 21.0, 20.0, 42.0, 59.0, 106.0, 202.0, 197.0, 107.0, 64.0, 44.0, 23.0, 19.0, 13.0, 13.0, 7.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000972747802734375, -0.0009286850690841675, -0.00088462233543396, -0.0008405596017837524, -0.0007964968681335449, -0.0007524341344833374, -0.0007083714008331299, -0.0006643086671829224, -0.0006202459335327148, -0.0005761831998825073, -0.0005321204662322998, -0.0004880577325820923, -0.00044399499893188477, -0.00039993226528167725, -0.0003558695316314697, -0.0003118067979812622, -0.0002677440643310547, -0.00022368133068084717, -0.00017961859703063965, -0.00013555586338043213, -9.149312973022461e-05, -4.743039608001709e-05, -3.3676624298095703e-06, 4.069507122039795e-05, 8.475780487060547e-05, 0.000128820538520813, 0.0001728832721710205, 0.00021694600582122803, 0.00026100873947143555, 0.00030507147312164307, 0.0003491342067718506, 0.0003931969404220581, 0.0004372596740722656, 0.00048132240772247314, 0.0005253851413726807, 0.0005694478750228882, 0.0006135106086730957, 0.0006575733423233032, 0.0007016360759735107, 0.0007456988096237183, 0.0007897615432739258, 0.0008338242769241333, 0.0008778870105743408, 0.0009219497442245483, 0.0009660124778747559, 0.0010100752115249634, 0.001054137945175171, 0.0010982006788253784, 0.001142263412475586, 0.0011863261461257935, 0.001230388879776001, 0.0012744516134262085, 0.001318514347076416, 0.0013625770807266235, 0.001406639814376831, 0.0014507025480270386, 0.001494765281677246, 0.0015388280153274536, 0.0015828907489776611, 0.0016269534826278687, 0.0016710162162780762, 0.0017150789499282837, 0.0017591416835784912, 0.0018032044172286987, 0.0018472671508789062]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 8.0, 14.0, 16.0, 26.0, 22.0, 32.0, 52.0, 144.0, 2713.0, 1035505.0, 9556.0, 231.0, 66.0, 39.0, 26.0, 17.0, 16.0, 9.0, 5.0, 9.0, 8.0, 3.0, 5.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.25, -195.423828125, -188.59765625, -181.771484375, -174.9453125, -168.119140625, -161.29296875, -154.466796875, -147.640625, -140.814453125, -133.98828125, -127.162109375, -120.3359375, -113.509765625, -106.68359375, -99.857421875, -93.03125, -86.205078125, -79.37890625, -72.552734375, -65.7265625, -58.900390625, -52.07421875, -45.248046875, -38.421875, -31.595703125, -24.76953125, -17.943359375, -11.1171875, -4.291015625, 2.53515625, 9.361328125, 16.1875, 23.013671875, 29.83984375, 36.666015625, 43.4921875, 50.318359375, 57.14453125, 63.970703125, 70.796875, 77.623046875, 84.44921875, 91.275390625, 98.1015625, 104.927734375, 111.75390625, 118.580078125, 125.40625, 132.232421875, 139.05859375, 145.884765625, 152.7109375, 159.537109375, 166.36328125, 173.189453125, 180.015625, 186.841796875, 193.66796875, 200.494140625, 207.3203125, 214.146484375, 220.97265625, 227.798828125, 234.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 7.0, 5.0, 11.0, 23.0, 27.0, 23.0, 29.0, 63.0, 86.0, 198.0, 206.0, 91.0, 68.0, 47.0, 26.0, 20.0, 12.0, 5.0, 6.0, 12.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0234375, -7.756591796875, -7.48974609375, -7.222900390625, -6.9560546875, -6.689208984375, -6.42236328125, -6.155517578125, -5.888671875, -5.621826171875, -5.35498046875, -5.088134765625, -4.8212890625, -4.554443359375, -4.28759765625, -4.020751953125, -3.75390625, -3.487060546875, -3.22021484375, -2.953369140625, -2.6865234375, -2.419677734375, -2.15283203125, -1.885986328125, -1.619140625, -1.352294921875, -1.08544921875, -0.818603515625, -0.5517578125, -0.284912109375, -0.01806640625, 0.248779296875, 0.515625, 0.782470703125, 1.04931640625, 1.316162109375, 1.5830078125, 1.849853515625, 2.11669921875, 2.383544921875, 2.650390625, 2.917236328125, 3.18408203125, 3.450927734375, 3.7177734375, 3.984619140625, 4.25146484375, 4.518310546875, 4.78515625, 5.052001953125, 5.31884765625, 5.585693359375, 5.8525390625, 6.119384765625, 6.38623046875, 6.653076171875, 6.919921875, 7.186767578125, 7.45361328125, 7.720458984375, 7.9873046875, 8.254150390625, 8.52099609375, 8.787841796875, 9.0546875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 6.0, 4.0, 6.0, 6.0, 5.0, 11.0, 15.0, 35.0, 35.0, 48.0, 58.0, 67.0, 89.0, 96.0, 83.0, 89.0, 75.0, 90.0, 54.0, 36.0, 31.0, 20.0, 17.0, 8.0, 12.0, 8.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.572351455688477, -5.2435760498046875, -4.914801120758057, -4.586026191711426, -4.257250785827637, -3.9284756183624268, -3.599700450897217, -3.270925283432007, -2.942150115966797, -2.613374948501587, -2.284599781036377, -1.955824613571167, -1.627049446105957, -1.298274278640747, -0.9694991111755371, -0.6407239437103271, -0.3119487762451172, 0.016826391220092773, 0.34560155868530273, 0.6743767261505127, 1.0031518936157227, 1.3319270610809326, 1.6607022285461426, 1.9894773960113525, 2.3182525634765625, 2.6470277309417725, 2.9758028984069824, 3.3045780658721924, 3.6333532333374023, 3.9621284008026123, 4.290903568267822, 4.619678497314453, 4.948453903198242, 5.277229309082031, 5.606004238128662, 5.934779167175293, 6.263554573059082, 6.592329978942871, 6.921104907989502, 7.249879837036133, 7.578655242919922, 7.907430648803711, 8.2362060546875, 8.564980506896973, 8.893755912780762, 9.22253131866455, 9.551305770874023, 9.880081176757812, 10.208856582641602, 10.53763198852539, 10.86640739440918, 11.195181846618652, 11.523957252502441, 11.85273265838623, 12.181507110595703, 12.510282516479492, 12.839057922363281, 13.16783332824707, 13.49660873413086, 13.825383186340332, 14.154158592224121, 14.48293399810791, 14.811708450317383, 15.140483856201172, 15.469259262084961]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 5.0, 8.0, 10.0, 8.0, 13.0, 20.0, 11.0, 15.0, 13.0, 25.0, 20.0, 23.0, 28.0, 32.0, 32.0, 35.0, 27.0, 31.0, 42.0, 40.0, 40.0, 33.0, 40.0, 41.0, 39.0, 45.0, 36.0, 30.0, 32.0, 29.0, 22.0, 30.0, 24.0, 19.0, 17.0, 13.0, 11.0, 11.0, 9.0, 11.0, 9.0, 7.0, 4.0, 2.0, 6.0, 4.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8455376625061035, -6.634451866149902, -6.423366069793701, -6.2122802734375, -6.001194953918457, -5.790108680725098, -5.579023361206055, -5.3679375648498535, -5.156851768493652, -4.945765972137451, -4.73468017578125, -4.523594379425049, -4.312508583068848, -4.101423263549805, -3.8903374671936035, -3.6792516708374023, -3.468165874481201, -3.257080078125, -3.045994281768799, -2.8349087238311768, -2.6238229274749756, -2.4127371311187744, -2.2016515731811523, -1.9905657768249512, -1.77947998046875, -1.5683941841125488, -1.3573085069656372, -1.1462228298187256, -0.9351370334625244, -0.7240512371063232, -0.5129655599594116, -0.3018798828125, -0.09079360961914062, 0.12029212713241577, 0.33137786388397217, 0.5424636006355286, 0.753549337387085, 0.9646351337432861, 1.1757208108901978, 1.3868064880371094, 1.5978922843933105, 1.8089780807495117, 2.020063877105713, 2.231149435043335, 2.442235231399536, 2.6533210277557373, 2.8644065856933594, 3.0754923820495605, 3.2865781784057617, 3.497663974761963, 3.708749771118164, 3.919835329055786, 4.130921363830566, 4.342006683349609, 4.5530924797058105, 4.764178276062012, 4.975264072418213, 5.186349868774414, 5.397435665130615, 5.608521461486816, 5.819606781005859, 6.030693054199219, 6.241778373718262, 6.452864170074463, 6.663949966430664]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 9.0, 12.0, 17.0, 21.0, 28.0, 53.0, 61.0, 84.0, 114.0, 149.0, 212.0, 257.0, 347.0, 466.0, 684.0, 885.0, 1350.0, 1893.0, 3122.0, 5788.0, 11131.0, 23476.0, 51917.0, 115249.0, 223418.0, 270713.0, 176684.0, 84308.0, 37341.0, 17500.0, 8459.0, 4506.0, 2550.0, 1697.0, 1102.0, 740.0, 558.0, 424.0, 339.0, 227.0, 174.0, 125.0, 124.0, 79.0, 38.0, 50.0, 23.0, 16.0, 16.0, 9.0, 10.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.6875, -15.186279296875, -14.68505859375, -14.183837890625, -13.6826171875, -13.181396484375, -12.68017578125, -12.178955078125, -11.677734375, -11.176513671875, -10.67529296875, -10.174072265625, -9.6728515625, -9.171630859375, -8.67041015625, -8.169189453125, -7.66796875, -7.166748046875, -6.66552734375, -6.164306640625, -5.6630859375, -5.161865234375, -4.66064453125, -4.159423828125, -3.658203125, -3.156982421875, -2.65576171875, -2.154541015625, -1.6533203125, -1.152099609375, -0.65087890625, -0.149658203125, 0.3515625, 0.852783203125, 1.35400390625, 1.855224609375, 2.3564453125, 2.857666015625, 3.35888671875, 3.860107421875, 4.361328125, 4.862548828125, 5.36376953125, 5.864990234375, 6.3662109375, 6.867431640625, 7.36865234375, 7.869873046875, 8.37109375, 8.872314453125, 9.37353515625, 9.874755859375, 10.3759765625, 10.877197265625, 11.37841796875, 11.879638671875, 12.380859375, 12.882080078125, 13.38330078125, 13.884521484375, 14.3857421875, 14.886962890625, 15.38818359375, 15.889404296875, 16.390625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 4.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 11.0, 19.0, 18.0, 14.0, 23.0, 25.0, 27.0, 25.0, 32.0, 35.0, 41.0, 47.0, 45.0, 41.0, 40.0, 43.0, 50.0, 47.0, 42.0, 40.0, 44.0, 37.0, 38.0, 26.0, 21.0, 27.0, 19.0, 25.0, 22.0, 14.0, 9.0, 8.0, 7.0, 4.0, 6.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.01171875, -5.77777099609375, -5.5438232421875, -5.30987548828125, -5.075927734375, -4.84197998046875, -4.6080322265625, -4.37408447265625, -4.14013671875, -3.90618896484375, -3.6722412109375, -3.43829345703125, -3.204345703125, -2.97039794921875, -2.7364501953125, -2.50250244140625, -2.2685546875, -2.03460693359375, -1.8006591796875, -1.56671142578125, -1.332763671875, -1.09881591796875, -0.8648681640625, -0.63092041015625, -0.39697265625, -0.16302490234375, 0.0709228515625, 0.30487060546875, 0.538818359375, 0.77276611328125, 1.0067138671875, 1.24066162109375, 1.474609375, 1.70855712890625, 1.9425048828125, 2.17645263671875, 2.410400390625, 2.64434814453125, 2.8782958984375, 3.11224365234375, 3.34619140625, 3.58013916015625, 3.8140869140625, 4.04803466796875, 4.281982421875, 4.51593017578125, 4.7498779296875, 4.98382568359375, 5.2177734375, 5.45172119140625, 5.6856689453125, 5.91961669921875, 6.153564453125, 6.38751220703125, 6.6214599609375, 6.85540771484375, 7.08935546875, 7.32330322265625, 7.5572509765625, 7.79119873046875, 8.025146484375, 8.25909423828125, 8.4930419921875, 8.72698974609375, 8.9609375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 9.0, 6.0, 14.0, 17.0, 21.0, 22.0, 26.0, 20.0, 36.0, 31.0, 31.0, 59.0, 202.0, 1124.0, 18245.0, 934229.0, 91066.0, 2633.0, 328.0, 87.0, 64.0, 52.0, 41.0, 28.0, 20.0, 21.0, 21.0, 13.0, 10.0, 13.0, 5.0, 11.0, 7.0, 4.0, 5.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-114.5, -110.884765625, -107.26953125, -103.654296875, -100.0390625, -96.423828125, -92.80859375, -89.193359375, -85.578125, -81.962890625, -78.34765625, -74.732421875, -71.1171875, -67.501953125, -63.88671875, -60.271484375, -56.65625, -53.041015625, -49.42578125, -45.810546875, -42.1953125, -38.580078125, -34.96484375, -31.349609375, -27.734375, -24.119140625, -20.50390625, -16.888671875, -13.2734375, -9.658203125, -6.04296875, -2.427734375, 1.1875, 4.802734375, 8.41796875, 12.033203125, 15.6484375, 19.263671875, 22.87890625, 26.494140625, 30.109375, 33.724609375, 37.33984375, 40.955078125, 44.5703125, 48.185546875, 51.80078125, 55.416015625, 59.03125, 62.646484375, 66.26171875, 69.876953125, 73.4921875, 77.107421875, 80.72265625, 84.337890625, 87.953125, 91.568359375, 95.18359375, 98.798828125, 102.4140625, 106.029296875, 109.64453125, 113.259765625, 116.875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 12.0, 9.0, 20.0, 26.0, 24.0, 22.0, 30.0, 41.0, 35.0, 40.0, 46.0, 48.0, 46.0, 51.0, 64.0, 64.0, 69.0, 55.0, 59.0, 45.0, 32.0, 25.0, 31.0, 18.0, 12.0, 10.0, 7.0, 7.0, 9.0, 3.0, 6.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.125, -11.7406005859375, -11.356201171875, -10.9718017578125, -10.58740234375, -10.2030029296875, -9.818603515625, -9.4342041015625, -9.0498046875, -8.6654052734375, -8.281005859375, -7.8966064453125, -7.51220703125, -7.1278076171875, -6.743408203125, -6.3590087890625, -5.974609375, -5.5902099609375, -5.205810546875, -4.8214111328125, -4.43701171875, -4.0526123046875, -3.668212890625, -3.2838134765625, -2.8994140625, -2.5150146484375, -2.130615234375, -1.7462158203125, -1.36181640625, -0.9774169921875, -0.593017578125, -0.2086181640625, 0.17578125, 0.5601806640625, 0.944580078125, 1.3289794921875, 1.71337890625, 2.0977783203125, 2.482177734375, 2.8665771484375, 3.2509765625, 3.6353759765625, 4.019775390625, 4.4041748046875, 4.78857421875, 5.1729736328125, 5.557373046875, 5.9417724609375, 6.326171875, 6.7105712890625, 7.094970703125, 7.4793701171875, 7.86376953125, 8.2481689453125, 8.632568359375, 9.0169677734375, 9.4013671875, 9.7857666015625, 10.170166015625, 10.5545654296875, 10.93896484375, 11.3233642578125, 11.707763671875, 12.0921630859375, 12.4765625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 10.0, 17.0, 28.0, 57.0, 97.0, 163.0, 322.0, 662.0, 1298.0, 2798.0, 7615.0, 28318.0, 162429.0, 707317.0, 106045.0, 20626.0, 6082.0, 2396.0, 1061.0, 530.0, 298.0, 171.0, 97.0, 39.0, 39.0, 14.0, 13.0, 5.0, 4.0, 5.0, 1.0], "bins": [-5.0546875, -4.94573974609375, -4.8367919921875, -4.72784423828125, -4.618896484375, -4.50994873046875, -4.4010009765625, -4.29205322265625, -4.18310546875, -4.07415771484375, -3.9652099609375, -3.85626220703125, -3.747314453125, -3.63836669921875, -3.5294189453125, -3.42047119140625, -3.3115234375, -3.20257568359375, -3.0936279296875, -2.98468017578125, -2.875732421875, -2.76678466796875, -2.6578369140625, -2.54888916015625, -2.43994140625, -2.33099365234375, -2.2220458984375, -2.11309814453125, -2.004150390625, -1.89520263671875, -1.7862548828125, -1.67730712890625, -1.568359375, -1.45941162109375, -1.3504638671875, -1.24151611328125, -1.132568359375, -1.02362060546875, -0.9146728515625, -0.80572509765625, -0.69677734375, -0.58782958984375, -0.4788818359375, -0.36993408203125, -0.260986328125, -0.15203857421875, -0.0430908203125, 0.06585693359375, 0.1748046875, 0.28375244140625, 0.3927001953125, 0.50164794921875, 0.610595703125, 0.71954345703125, 0.8284912109375, 0.93743896484375, 1.04638671875, 1.15533447265625, 1.2642822265625, 1.37322998046875, 1.482177734375, 1.59112548828125, 1.7000732421875, 1.80902099609375, 1.91796875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 6.0, 5.0, 7.0, 7.0, 6.0, 14.0, 30.0, 35.0, 37.0, 47.0, 74.0, 105.0, 123.0, 141.0, 106.0, 86.0, 53.0, 26.0, 18.0, 21.0, 13.0, 8.0, 8.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00022649765014648438, -0.0002174191176891327, -0.000208340585231781, -0.00019926205277442932, -0.00019018352031707764, -0.00018110498785972595, -0.00017202645540237427, -0.00016294792294502258, -0.0001538693904876709, -0.00014479085803031921, -0.00013571232557296753, -0.00012663379311561584, -0.00011755526065826416, -0.00010847672820091248, -9.939819574356079e-05, -9.03196632862091e-05, -8.124113082885742e-05, -7.216259837150574e-05, -6.308406591415405e-05, -5.400553345680237e-05, -4.4927000999450684e-05, -3.5848468542099e-05, -2.6769936084747314e-05, -1.769140362739563e-05, -8.612871170043945e-06, 4.6566128730773926e-07, 9.544193744659424e-06, 1.862272620201111e-05, 2.7701258659362793e-05, 3.677979111671448e-05, 4.585832357406616e-05, 5.493685603141785e-05, 6.401538848876953e-05, 7.309392094612122e-05, 8.21724534034729e-05, 9.125098586082458e-05, 0.00010032951831817627, 0.00010940805077552795, 0.00011848658323287964, 0.00012756511569023132, 0.000136643648147583, 0.0001457221806049347, 0.00015480071306228638, 0.00016387924551963806, 0.00017295777797698975, 0.00018203631043434143, 0.00019111484289169312, 0.0002001933753490448, 0.00020927190780639648, 0.00021835044026374817, 0.00022742897272109985, 0.00023650750517845154, 0.0002455860376358032, 0.0002546645700931549, 0.0002637431025505066, 0.0002728216350078583, 0.00028190016746520996, 0.00029097869992256165, 0.00030005723237991333, 0.000309135764837265, 0.0003182142972946167, 0.0003272928297519684, 0.00033637136220932007, 0.00034544989466667175, 0.00035452842712402344]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 10.0, 8.0, 10.0, 7.0, 8.0, 21.0, 24.0, 32.0, 45.0, 107.0, 966.0, 30969.0, 1005291.0, 10241.0, 558.0, 84.0, 36.0, 28.0, 15.0, 9.0, 13.0, 10.0, 3.0, 11.0, 9.0, 4.0, 3.0, 3.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.828125, -17.2939453125, -16.759765625, -16.2255859375, -15.69140625, -15.1572265625, -14.623046875, -14.0888671875, -13.5546875, -13.0205078125, -12.486328125, -11.9521484375, -11.41796875, -10.8837890625, -10.349609375, -9.8154296875, -9.28125, -8.7470703125, -8.212890625, -7.6787109375, -7.14453125, -6.6103515625, -6.076171875, -5.5419921875, -5.0078125, -4.4736328125, -3.939453125, -3.4052734375, -2.87109375, -2.3369140625, -1.802734375, -1.2685546875, -0.734375, -0.2001953125, 0.333984375, 0.8681640625, 1.40234375, 1.9365234375, 2.470703125, 3.0048828125, 3.5390625, 4.0732421875, 4.607421875, 5.1416015625, 5.67578125, 6.2099609375, 6.744140625, 7.2783203125, 7.8125, 8.3466796875, 8.880859375, 9.4150390625, 9.94921875, 10.4833984375, 11.017578125, 11.5517578125, 12.0859375, 12.6201171875, 13.154296875, 13.6884765625, 14.22265625, 14.7568359375, 15.291015625, 15.8251953125, 16.359375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 9.0, 11.0, 8.0, 8.0, 14.0, 22.0, 33.0, 34.0, 45.0, 59.0, 74.0, 216.0, 118.0, 92.0, 64.0, 39.0, 29.0, 26.0, 7.0, 11.0, 14.0, 6.0, 10.0, 9.0, 4.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1650390625, -1.129547119140625, -1.09405517578125, -1.058563232421875, -1.0230712890625, -0.987579345703125, -0.95208740234375, -0.916595458984375, -0.881103515625, -0.845611572265625, -0.81011962890625, -0.774627685546875, -0.7391357421875, -0.703643798828125, -0.66815185546875, -0.632659912109375, -0.59716796875, -0.561676025390625, -0.52618408203125, -0.490692138671875, -0.4552001953125, -0.419708251953125, -0.38421630859375, -0.348724365234375, -0.313232421875, -0.277740478515625, -0.24224853515625, -0.206756591796875, -0.1712646484375, -0.135772705078125, -0.10028076171875, -0.064788818359375, -0.029296875, 0.006195068359375, 0.04168701171875, 0.077178955078125, 0.1126708984375, 0.148162841796875, 0.18365478515625, 0.219146728515625, 0.254638671875, 0.290130615234375, 0.32562255859375, 0.361114501953125, 0.3966064453125, 0.432098388671875, 0.46759033203125, 0.503082275390625, 0.53857421875, 0.574066162109375, 0.60955810546875, 0.645050048828125, 0.6805419921875, 0.716033935546875, 0.75152587890625, 0.787017822265625, 0.822509765625, 0.858001708984375, 0.89349365234375, 0.928985595703125, 0.9644775390625, 0.999969482421875, 1.03546142578125, 1.070953369140625, 1.1064453125]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 13.0, 51.0, 125.0, 297.0, 267.0, 154.0, 68.0, 17.0, 9.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.72831916809082, -29.0510311126709, -28.373743057250977, -27.696455001831055, -27.019166946411133, -26.34187889099121, -25.664592742919922, -24.9873046875, -24.310016632080078, -23.632728576660156, -22.955440521240234, -22.278152465820312, -21.60086441040039, -20.92357635498047, -20.246288299560547, -19.569000244140625, -18.891712188720703, -18.21442413330078, -17.53713607788086, -16.859848022460938, -16.182559967041016, -15.505271911621094, -14.827984809875488, -14.150696754455566, -13.473408699035645, -12.796120643615723, -12.1188325881958, -11.441545486450195, -10.764257431030273, -10.086969375610352, -9.40968132019043, -8.732393264770508, -8.055107116699219, -7.377819061279297, -6.700531005859375, -6.023243427276611, -5.3459553718566895, -4.668667316436768, -3.991379737854004, -3.314091682434082, -2.63680362701416, -1.9595156908035278, -1.2822277545928955, -0.6049399375915527, 0.07234811782836914, 0.749636173248291, 1.4269237518310547, 2.1042118072509766, 2.7814998626708984, 3.4587879180908203, 4.136075973510742, 4.813363552093506, 5.490651607513428, 6.16793966293335, 6.845227241516113, 7.522515296936035, 8.199803352355957, 8.877091407775879, 9.5543794631958, 10.231666564941406, 10.908954620361328, 11.58624267578125, 12.263530731201172, 12.940818786621094, 13.618106842041016]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 5.0, 3.0, 3.0, 3.0, 5.0, 4.0, 3.0, 15.0, 11.0, 8.0, 9.0, 17.0, 18.0, 23.0, 32.0, 27.0, 29.0, 22.0, 26.0, 34.0, 35.0, 31.0, 39.0, 32.0, 47.0, 46.0, 39.0, 32.0, 29.0, 31.0, 42.0, 39.0, 30.0, 30.0, 28.0, 21.0, 21.0, 15.0, 22.0, 14.0, 13.0, 18.0, 14.0, 7.0, 8.0, 11.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.392449855804443, -7.142343521118164, -6.892237663269043, -6.642131328582764, -6.392024993896484, -6.141919136047363, -5.891812801361084, -5.641706466674805, -5.391600608825684, -5.141494274139404, -4.891388416290283, -4.641282081604004, -4.391176223754883, -4.1410698890686035, -3.890963554382324, -3.640857458114624, -3.390751361846924, -3.1406452655792236, -2.8905391693115234, -2.640432834625244, -2.390326738357544, -2.1402206420898438, -1.890114426612854, -1.6400082111358643, -1.389902114868164, -1.1397960186004639, -0.8896898031234741, -0.6395836472511292, -0.3894774913787842, -0.13937139511108398, 0.11073482036590576, 0.3608410358428955, 0.6109466552734375, 0.8610528111457825, 1.1111589670181274, 1.3612651824951172, 1.6113712787628174, 1.8614773750305176, 2.111583709716797, 2.361689805984497, 2.6117959022521973, 2.8619019985198975, 3.1120080947875977, 3.362114429473877, 3.612220525741577, 3.8623266220092773, 4.112432956695557, 4.362539291381836, 4.612645149230957, 4.862751483917236, 5.112857341766357, 5.362963676452637, 5.613069534301758, 5.863175868988037, 6.113282203674316, 6.3633880615234375, 6.613494396209717, 6.863600730895996, 7.113706588745117, 7.3638129234313965, 7.613919258117676, 7.864025115966797, 8.114130973815918, 8.364237785339355, 8.614343643188477]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 6.0, 5.0, 5.0, 5.0, 14.0, 18.0, 27.0, 40.0, 46.0, 65.0, 127.0, 163.0, 224.0, 307.0, 493.0, 796.0, 1302.0, 2064.0, 3804.0, 7271.0, 17615.0, 89634.0, 1079657.0, 2578514.0, 351897.0, 36168.0, 11246.0, 5122.0, 2843.0, 1684.0, 1059.0, 678.0, 446.0, 280.0, 205.0, 147.0, 96.0, 55.0, 50.0, 22.0, 19.0, 18.0, 18.0, 13.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.203125, -7.93212890625, -7.6611328125, -7.39013671875, -7.119140625, -6.84814453125, -6.5771484375, -6.30615234375, -6.03515625, -5.76416015625, -5.4931640625, -5.22216796875, -4.951171875, -4.68017578125, -4.4091796875, -4.13818359375, -3.8671875, -3.59619140625, -3.3251953125, -3.05419921875, -2.783203125, -2.51220703125, -2.2412109375, -1.97021484375, -1.69921875, -1.42822265625, -1.1572265625, -0.88623046875, -0.615234375, -0.34423828125, -0.0732421875, 0.19775390625, 0.46875, 0.73974609375, 1.0107421875, 1.28173828125, 1.552734375, 1.82373046875, 2.0947265625, 2.36572265625, 2.63671875, 2.90771484375, 3.1787109375, 3.44970703125, 3.720703125, 3.99169921875, 4.2626953125, 4.53369140625, 4.8046875, 5.07568359375, 5.3466796875, 5.61767578125, 5.888671875, 6.15966796875, 6.4306640625, 6.70166015625, 6.97265625, 7.24365234375, 7.5146484375, 7.78564453125, 8.056640625, 8.32763671875, 8.5986328125, 8.86962890625, 9.140625]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 9.0, 4.0, 10.0, 11.0, 12.0, 23.0, 24.0, 21.0, 38.0, 34.0, 29.0, 23.0, 44.0, 35.0, 42.0, 39.0, 42.0, 48.0, 29.0, 46.0, 41.0, 33.0, 41.0, 42.0, 32.0, 32.0, 25.0, 26.0, 26.0, 30.0, 17.0, 15.0, 15.0, 10.0, 11.0, 6.0, 9.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.84765625, -4.69232177734375, -4.5369873046875, -4.38165283203125, -4.226318359375, -4.07098388671875, -3.9156494140625, -3.76031494140625, -3.60498046875, -3.44964599609375, -3.2943115234375, -3.13897705078125, -2.983642578125, -2.82830810546875, -2.6729736328125, -2.51763916015625, -2.3623046875, -2.20697021484375, -2.0516357421875, -1.89630126953125, -1.740966796875, -1.58563232421875, -1.4302978515625, -1.27496337890625, -1.11962890625, -0.96429443359375, -0.8089599609375, -0.65362548828125, -0.498291015625, -0.34295654296875, -0.1876220703125, -0.03228759765625, 0.123046875, 0.27838134765625, 0.4337158203125, 0.58905029296875, 0.744384765625, 0.89971923828125, 1.0550537109375, 1.21038818359375, 1.36572265625, 1.52105712890625, 1.6763916015625, 1.83172607421875, 1.987060546875, 2.14239501953125, 2.2977294921875, 2.45306396484375, 2.6083984375, 2.76373291015625, 2.9190673828125, 3.07440185546875, 3.229736328125, 3.38507080078125, 3.5404052734375, 3.69573974609375, 3.85107421875, 4.00640869140625, 4.1617431640625, 4.31707763671875, 4.472412109375, 4.62774658203125, 4.7830810546875, 4.93841552734375, 5.09375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 3.0, 1.0, 5.0, 4.0, 8.0, 9.0, 6.0, 11.0, 14.0, 14.0, 19.0, 31.0, 31.0, 69.0, 83.0, 181.0, 320.0, 632.0, 5578.0, 4096434.0, 88556.0, 1284.0, 401.0, 221.0, 115.0, 63.0, 34.0, 34.0, 24.0, 17.0, 22.0, 12.0, 6.0, 5.0, 6.0, 4.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-52.9375, -51.32177734375, -49.7060546875, -48.09033203125, -46.474609375, -44.85888671875, -43.2431640625, -41.62744140625, -40.01171875, -38.39599609375, -36.7802734375, -35.16455078125, -33.548828125, -31.93310546875, -30.3173828125, -28.70166015625, -27.0859375, -25.47021484375, -23.8544921875, -22.23876953125, -20.623046875, -19.00732421875, -17.3916015625, -15.77587890625, -14.16015625, -12.54443359375, -10.9287109375, -9.31298828125, -7.697265625, -6.08154296875, -4.4658203125, -2.85009765625, -1.234375, 0.38134765625, 1.9970703125, 3.61279296875, 5.228515625, 6.84423828125, 8.4599609375, 10.07568359375, 11.69140625, 13.30712890625, 14.9228515625, 16.53857421875, 18.154296875, 19.77001953125, 21.3857421875, 23.00146484375, 24.6171875, 26.23291015625, 27.8486328125, 29.46435546875, 31.080078125, 32.69580078125, 34.3115234375, 35.92724609375, 37.54296875, 39.15869140625, 40.7744140625, 42.39013671875, 44.005859375, 45.62158203125, 47.2373046875, 48.85302734375, 50.46875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 4.0, 2.0, 7.0, 7.0, 11.0, 13.0, 8.0, 17.0, 16.0, 28.0, 33.0, 54.0, 72.0, 136.0, 248.0, 399.0, 601.0, 723.0, 603.0, 399.0, 255.0, 142.0, 66.0, 54.0, 36.0, 22.0, 22.0, 16.0, 21.0, 10.0, 4.0, 10.0, 3.0, 7.0, 0.0, 6.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.251953125, -2.18304443359375, -2.1141357421875, -2.04522705078125, -1.976318359375, -1.90740966796875, -1.8385009765625, -1.76959228515625, -1.70068359375, -1.63177490234375, -1.5628662109375, -1.49395751953125, -1.425048828125, -1.35614013671875, -1.2872314453125, -1.21832275390625, -1.1494140625, -1.08050537109375, -1.0115966796875, -0.94268798828125, -0.873779296875, -0.80487060546875, -0.7359619140625, -0.66705322265625, -0.59814453125, -0.52923583984375, -0.4603271484375, -0.39141845703125, -0.322509765625, -0.25360107421875, -0.1846923828125, -0.11578369140625, -0.046875, 0.02203369140625, 0.0909423828125, 0.15985107421875, 0.228759765625, 0.29766845703125, 0.3665771484375, 0.43548583984375, 0.50439453125, 0.57330322265625, 0.6422119140625, 0.71112060546875, 0.780029296875, 0.84893798828125, 0.9178466796875, 0.98675537109375, 1.0556640625, 1.12457275390625, 1.1934814453125, 1.26239013671875, 1.331298828125, 1.40020751953125, 1.4691162109375, 1.53802490234375, 1.60693359375, 1.67584228515625, 1.7447509765625, 1.81365966796875, 1.882568359375, 1.95147705078125, 2.0203857421875, 2.08929443359375, 2.158203125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 28.0, 120.0, 236.0, 313.0, 195.0, 84.0, 21.0, 4.0, 3.0, 4.0], "bins": [-34.89724349975586, -34.28702163696289, -33.67679977416992, -33.06657409667969, -32.45635223388672, -31.84613037109375, -31.23590660095215, -30.62568473815918, -30.015460968017578, -29.40523910522461, -28.795015335083008, -28.18479347229004, -27.574569702148438, -26.96434783935547, -26.354124069213867, -25.7439022064209, -25.13368034362793, -24.52345848083496, -23.91323471069336, -23.30301284790039, -22.69278907775879, -22.08256721496582, -21.47234344482422, -20.86212158203125, -20.25189971923828, -19.641677856445312, -19.03145408630371, -18.421232223510742, -17.81100845336914, -17.200786590576172, -16.59056282043457, -15.980340957641602, -15.3701171875, -14.759894371032715, -14.14967155456543, -13.539448738098145, -12.92922592163086, -12.31900405883789, -11.708781242370605, -11.09855842590332, -10.488334655761719, -9.878111839294434, -9.267889022827148, -8.657666206359863, -8.047443389892578, -7.437221050262451, -6.826998710632324, -6.216775894165039, -5.606553554534912, -4.996330738067627, -4.3861083984375, -3.775885581970215, -3.1656627655029297, -2.5554399490356445, -1.9452173709869385, -1.3349947929382324, -0.7247719764709473, -0.11454927921295166, 0.49567341804504395, 1.1058961153030396, 1.7161188125610352, 2.3263416290283203, 2.9365642070770264, 3.5467867851257324, 4.157009601593018]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 7.0, 7.0, 19.0, 11.0, 12.0, 14.0, 22.0, 21.0, 26.0, 24.0, 26.0, 24.0, 40.0, 31.0, 28.0, 38.0, 58.0, 42.0, 29.0, 44.0, 37.0, 38.0, 36.0, 32.0, 33.0, 38.0, 29.0, 29.0, 38.0, 21.0, 24.0, 21.0, 11.0, 18.0, 16.0, 11.0, 12.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.268026828765869, -5.104257106781006, -4.940487384796143, -4.776717662811279, -4.612947940826416, -4.449178218841553, -4.2854084968566895, -4.121638774871826, -3.957869052886963, -3.7940993309020996, -3.6303296089172363, -3.466559886932373, -3.3027901649475098, -3.1390204429626465, -2.975250720977783, -2.81148099899292, -2.6477110385894775, -2.4839413166046143, -2.320171594619751, -2.1564018726348877, -1.9926321506500244, -1.8288624286651611, -1.6650925874710083, -1.501322865486145, -1.3375531435012817, -1.1737834215164185, -1.0100136995315552, -0.8462439179420471, -0.6824741959571838, -0.5187044739723206, -0.3549346923828125, -0.19116497039794922, -0.027395248413085938, 0.13637448847293854, 0.300144225358963, 0.4639139771461487, 0.627683699131012, 0.7914534211158752, 0.9552232027053833, 1.1189929246902466, 1.2827626466751099, 1.4465323686599731, 1.6103020906448364, 1.7740719318389893, 1.9378416538238525, 2.101611375808716, 2.265381097793579, 2.4291508197784424, 2.5929205417633057, 2.756690263748169, 2.9204599857330322, 3.0842297077178955, 3.247999429702759, 3.411769151687622, 3.5755391120910645, 3.7393088340759277, 3.903078556060791, 4.066848278045654, 4.230618000030518, 4.394387722015381, 4.558157444000244, 4.721927165985107, 4.885696887969971, 5.049466609954834, 5.213236331939697]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 4.0, 9.0, 7.0, 12.0, 12.0, 19.0, 33.0, 47.0, 46.0, 102.0, 145.0, 230.0, 279.0, 415.0, 602.0, 831.0, 1267.0, 1896.0, 2957.0, 4453.0, 7027.0, 11523.0, 20875.0, 39426.0, 79221.0, 160529.0, 281272.0, 211336.0, 105984.0, 52264.0, 26876.0, 14443.0, 8539.0, 5300.0, 3451.0, 2158.0, 1623.0, 1046.0, 731.0, 506.0, 307.0, 243.0, 144.0, 133.0, 74.0, 57.0, 35.0, 26.0, 18.0, 15.0, 8.0, 7.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1484375, -7.883056640625, -7.61767578125, -7.352294921875, -7.0869140625, -6.821533203125, -6.55615234375, -6.290771484375, -6.025390625, -5.760009765625, -5.49462890625, -5.229248046875, -4.9638671875, -4.698486328125, -4.43310546875, -4.167724609375, -3.90234375, -3.636962890625, -3.37158203125, -3.106201171875, -2.8408203125, -2.575439453125, -2.31005859375, -2.044677734375, -1.779296875, -1.513916015625, -1.24853515625, -0.983154296875, -0.7177734375, -0.452392578125, -0.18701171875, 0.078369140625, 0.34375, 0.609130859375, 0.87451171875, 1.139892578125, 1.4052734375, 1.670654296875, 1.93603515625, 2.201416015625, 2.466796875, 2.732177734375, 2.99755859375, 3.262939453125, 3.5283203125, 3.793701171875, 4.05908203125, 4.324462890625, 4.58984375, 4.855224609375, 5.12060546875, 5.385986328125, 5.6513671875, 5.916748046875, 6.18212890625, 6.447509765625, 6.712890625, 6.978271484375, 7.24365234375, 7.509033203125, 7.7744140625, 8.039794921875, 8.30517578125, 8.570556640625, 8.8359375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 8.0, 16.0, 12.0, 9.0, 21.0, 16.0, 11.0, 16.0, 20.0, 27.0, 15.0, 26.0, 31.0, 30.0, 33.0, 40.0, 41.0, 35.0, 41.0, 31.0, 40.0, 44.0, 33.0, 29.0, 31.0, 33.0, 26.0, 39.0, 40.0, 33.0, 27.0, 19.0, 18.0, 12.0, 22.0, 11.0, 10.0, 4.0, 11.0, 8.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.349609375, -3.2415771484375, -3.133544921875, -3.0255126953125, -2.91748046875, -2.8094482421875, -2.701416015625, -2.5933837890625, -2.4853515625, -2.3773193359375, -2.269287109375, -2.1612548828125, -2.05322265625, -1.9451904296875, -1.837158203125, -1.7291259765625, -1.62109375, -1.5130615234375, -1.405029296875, -1.2969970703125, -1.18896484375, -1.0809326171875, -0.972900390625, -0.8648681640625, -0.7568359375, -0.6488037109375, -0.540771484375, -0.4327392578125, -0.32470703125, -0.2166748046875, -0.108642578125, -0.0006103515625, 0.107421875, 0.2154541015625, 0.323486328125, 0.4315185546875, 0.53955078125, 0.6475830078125, 0.755615234375, 0.8636474609375, 0.9716796875, 1.0797119140625, 1.187744140625, 1.2957763671875, 1.40380859375, 1.5118408203125, 1.619873046875, 1.7279052734375, 1.8359375, 1.9439697265625, 2.052001953125, 2.1600341796875, 2.26806640625, 2.3760986328125, 2.484130859375, 2.5921630859375, 2.7001953125, 2.8082275390625, 2.916259765625, 3.0242919921875, 3.13232421875, 3.2403564453125, 3.348388671875, 3.4564208984375, 3.564453125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 5.0, 6.0, 5.0, 14.0, 13.0, 20.0, 19.0, 31.0, 33.0, 33.0, 69.0, 94.0, 84.0, 127.0, 191.0, 248.0, 302.0, 442.0, 589.0, 879.0, 1244.0, 1738.0, 2599.0, 4021.0, 6481.0, 10891.0, 19172.0, 38869.0, 91085.0, 333497.0, 351626.0, 94342.0, 39191.0, 19895.0, 10937.0, 6529.0, 4011.0, 2770.0, 1821.0, 1208.0, 913.0, 594.0, 462.0, 374.0, 253.0, 193.0, 156.0, 111.0, 93.0, 71.0, 36.0, 43.0, 36.0, 22.0, 20.0, 15.0, 9.0, 11.0, 10.0, 11.0, 5.0, 1.0, 4.0], "bins": [-6.46484375, -6.25640869140625, -6.0479736328125, -5.83953857421875, -5.631103515625, -5.42266845703125, -5.2142333984375, -5.00579833984375, -4.79736328125, -4.58892822265625, -4.3804931640625, -4.17205810546875, -3.963623046875, -3.75518798828125, -3.5467529296875, -3.33831787109375, -3.1298828125, -2.92144775390625, -2.7130126953125, -2.50457763671875, -2.296142578125, -2.08770751953125, -1.8792724609375, -1.67083740234375, -1.46240234375, -1.25396728515625, -1.0455322265625, -0.83709716796875, -0.628662109375, -0.42022705078125, -0.2117919921875, -0.00335693359375, 0.205078125, 0.41351318359375, 0.6219482421875, 0.83038330078125, 1.038818359375, 1.24725341796875, 1.4556884765625, 1.66412353515625, 1.87255859375, 2.08099365234375, 2.2894287109375, 2.49786376953125, 2.706298828125, 2.91473388671875, 3.1231689453125, 3.33160400390625, 3.5400390625, 3.74847412109375, 3.9569091796875, 4.16534423828125, 4.373779296875, 4.58221435546875, 4.7906494140625, 4.99908447265625, 5.20751953125, 5.41595458984375, 5.6243896484375, 5.83282470703125, 6.041259765625, 6.24969482421875, 6.4581298828125, 6.66656494140625, 6.875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 8.0, 8.0, 5.0, 10.0, 23.0, 15.0, 29.0, 11.0, 11.0, 22.0, 17.0, 29.0, 42.0, 38.0, 30.0, 39.0, 36.0, 37.0, 38.0, 43.0, 42.0, 30.0, 34.0, 27.0, 43.0, 37.0, 31.0, 36.0, 25.0, 26.0, 18.0, 19.0, 20.0, 21.0, 19.0, 15.0, 12.0, 11.0, 5.0, 10.0, 9.0, 3.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.462890625, -2.386322021484375, -2.30975341796875, -2.233184814453125, -2.1566162109375, -2.080047607421875, -2.00347900390625, -1.926910400390625, -1.850341796875, -1.773773193359375, -1.69720458984375, -1.620635986328125, -1.5440673828125, -1.467498779296875, -1.39093017578125, -1.314361572265625, -1.23779296875, -1.161224365234375, -1.08465576171875, -1.008087158203125, -0.9315185546875, -0.854949951171875, -0.77838134765625, -0.701812744140625, -0.625244140625, -0.548675537109375, -0.47210693359375, -0.395538330078125, -0.3189697265625, -0.242401123046875, -0.16583251953125, -0.089263916015625, -0.0126953125, 0.063873291015625, 0.14044189453125, 0.217010498046875, 0.2935791015625, 0.370147705078125, 0.44671630859375, 0.523284912109375, 0.599853515625, 0.676422119140625, 0.75299072265625, 0.829559326171875, 0.9061279296875, 0.982696533203125, 1.05926513671875, 1.135833740234375, 1.21240234375, 1.288970947265625, 1.36553955078125, 1.442108154296875, 1.5186767578125, 1.595245361328125, 1.67181396484375, 1.748382568359375, 1.824951171875, 1.901519775390625, 1.97808837890625, 2.054656982421875, 2.1312255859375, 2.207794189453125, 2.28436279296875, 2.360931396484375, 2.4375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 5.0, 6.0, 5.0, 6.0, 9.0, 11.0, 10.0, 11.0, 25.0, 29.0, 33.0, 38.0, 42.0, 80.0, 117.0, 172.0, 225.0, 378.0, 597.0, 976.0, 1662.0, 3099.0, 6996.0, 19014.0, 89299.0, 843380.0, 55504.0, 14525.0, 5680.0, 2737.0, 1418.0, 805.0, 490.0, 320.0, 244.0, 159.0, 109.0, 92.0, 66.0, 43.0, 35.0, 25.0, 22.0, 18.0, 10.0, 10.0, 4.0, 3.0, 6.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-16.8125, -16.240234375, -15.66796875, -15.095703125, -14.5234375, -13.951171875, -13.37890625, -12.806640625, -12.234375, -11.662109375, -11.08984375, -10.517578125, -9.9453125, -9.373046875, -8.80078125, -8.228515625, -7.65625, -7.083984375, -6.51171875, -5.939453125, -5.3671875, -4.794921875, -4.22265625, -3.650390625, -3.078125, -2.505859375, -1.93359375, -1.361328125, -0.7890625, -0.216796875, 0.35546875, 0.927734375, 1.5, 2.072265625, 2.64453125, 3.216796875, 3.7890625, 4.361328125, 4.93359375, 5.505859375, 6.078125, 6.650390625, 7.22265625, 7.794921875, 8.3671875, 8.939453125, 9.51171875, 10.083984375, 10.65625, 11.228515625, 11.80078125, 12.373046875, 12.9453125, 13.517578125, 14.08984375, 14.662109375, 15.234375, 15.806640625, 16.37890625, 16.951171875, 17.5234375, 18.095703125, 18.66796875, 19.240234375, 19.8125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 0.0, 2.0, 9.0, 3.0, 6.0, 11.0, 18.0, 34.0, 29.0, 41.0, 69.0, 113.0, 173.0, 153.0, 111.0, 61.0, 46.0, 41.0, 13.0, 20.0, 11.0, 9.0, 3.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003237724304199219, -0.0003082677721977234, -0.0002927631139755249, -0.0002772584557533264, -0.00026175379753112793, -0.00024624913930892944, -0.00023074448108673096, -0.00021523982286453247, -0.00019973516464233398, -0.0001842305064201355, -0.000168725848197937, -0.00015322118997573853, -0.00013771653175354004, -0.00012221187353134155, -0.00010670721530914307, -9.120255708694458e-05, -7.56978988647461e-05, -6.019324064254761e-05, -4.468858242034912e-05, -2.9183924198150635e-05, -1.3679265975952148e-05, 1.8253922462463379e-06, 1.7330050468444824e-05, 3.283470869064331e-05, 4.83393669128418e-05, 6.384402513504028e-05, 7.934868335723877e-05, 9.485334157943726e-05, 0.00011035799980163574, 0.00012586265802383423, 0.00014136731624603271, 0.0001568719744682312, 0.0001723766326904297, 0.00018788129091262817, 0.00020338594913482666, 0.00021889060735702515, 0.00023439526557922363, 0.0002498999238014221, 0.0002654045820236206, 0.0002809092402458191, 0.0002964138984680176, 0.00031191855669021606, 0.00032742321491241455, 0.00034292787313461304, 0.0003584325313568115, 0.00037393718957901, 0.0003894418478012085, 0.000404946506023407, 0.00042045116424560547, 0.00043595582246780396, 0.00045146048069000244, 0.00046696513891220093, 0.0004824697971343994, 0.0004979744553565979, 0.0005134791135787964, 0.0005289837718009949, 0.0005444884300231934, 0.0005599930882453918, 0.0005754977464675903, 0.0005910024046897888, 0.0006065070629119873, 0.0006220117211341858, 0.0006375163793563843, 0.0006530210375785828, 0.0006685256958007812]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 16.0, 29.0, 45.0, 357.0, 1039975.0, 7908.0, 118.0, 33.0, 14.0, 10.0, 6.0, 8.0, 5.0, 1.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-359.5, -346.08203125, -332.6640625, -319.24609375, -305.828125, -292.41015625, -278.9921875, -265.57421875, -252.15625, -238.73828125, -225.3203125, -211.90234375, -198.484375, -185.06640625, -171.6484375, -158.23046875, -144.8125, -131.39453125, -117.9765625, -104.55859375, -91.140625, -77.72265625, -64.3046875, -50.88671875, -37.46875, -24.05078125, -10.6328125, 2.78515625, 16.203125, 29.62109375, 43.0390625, 56.45703125, 69.875, 83.29296875, 96.7109375, 110.12890625, 123.546875, 136.96484375, 150.3828125, 163.80078125, 177.21875, 190.63671875, 204.0546875, 217.47265625, 230.890625, 244.30859375, 257.7265625, 271.14453125, 284.5625, 297.98046875, 311.3984375, 324.81640625, 338.234375, 351.65234375, 365.0703125, 378.48828125, 391.90625, 405.32421875, 418.7421875, 432.16015625, 445.578125, 458.99609375, 472.4140625, 485.83203125, 499.25]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 15.0, 34.0, 84.0, 596.0, 148.0, 63.0, 18.0, 10.0, 3.0, 1.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3359375, -9.9498291015625, -9.563720703125, -9.1776123046875, -8.79150390625, -8.4053955078125, -8.019287109375, -7.6331787109375, -7.2470703125, -6.8609619140625, -6.474853515625, -6.0887451171875, -5.70263671875, -5.3165283203125, -4.930419921875, -4.5443115234375, -4.158203125, -3.7720947265625, -3.385986328125, -2.9998779296875, -2.61376953125, -2.2276611328125, -1.841552734375, -1.4554443359375, -1.0693359375, -0.6832275390625, -0.297119140625, 0.0889892578125, 0.47509765625, 0.8612060546875, 1.247314453125, 1.6334228515625, 2.01953125, 2.4056396484375, 2.791748046875, 3.1778564453125, 3.56396484375, 3.9500732421875, 4.336181640625, 4.7222900390625, 5.1083984375, 5.4945068359375, 5.880615234375, 6.2667236328125, 6.65283203125, 7.0389404296875, 7.425048828125, 7.8111572265625, 8.197265625, 8.5833740234375, 8.969482421875, 9.3555908203125, 9.74169921875, 10.1278076171875, 10.513916015625, 10.9000244140625, 11.2861328125, 11.6722412109375, 12.058349609375, 12.4444580078125, 12.83056640625, 13.2166748046875, 13.602783203125, 13.9888916015625, 14.375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 12.0, 39.0, 214.0, 619.0, 119.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.161507606506348, -11.581197738647461, -10.000887870788574, -8.420578002929688, -6.840267658233643, -5.259957790374756, -3.679647445678711, -2.099337577819824, -0.5190277099609375, 1.0612822771072388, 2.641592264175415, 4.221902370452881, 5.802212238311768, 7.382522106170654, 8.9628324508667, 10.543142318725586, 12.123452186584473, 13.70376205444336, 15.284071922302246, 16.864381790161133, 18.444692611694336, 20.025001525878906, 21.60531234741211, 23.185623168945312, 24.765932083129883, 26.346242904663086, 27.926551818847656, 29.50686264038086, 31.08717155456543, 32.66748046875, 34.2477912902832, 35.828102111816406, 37.40841293334961, 38.98872375488281, 40.569034576416016, 42.14934158325195, 43.729652404785156, 45.30996322631836, 46.89027404785156, 48.4705810546875, 50.0508918762207, 51.631202697753906, 53.21151351928711, 54.79182052612305, 56.37213134765625, 57.95244216918945, 59.532752990722656, 61.113059997558594, 62.69337463378906, 64.273681640625, 65.85399627685547, 67.4343032836914, 69.01461791992188, 70.59492492675781, 72.17523193359375, 73.75554656982422, 75.33585357666016, 76.9161605834961, 78.49647521972656, 80.0767822265625, 81.65709686279297, 83.2374038696289, 84.81771087646484, 86.39802551269531, 87.97833251953125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 3.0, 7.0, 9.0, 11.0, 14.0, 12.0, 13.0, 20.0, 24.0, 30.0, 25.0, 32.0, 30.0, 26.0, 46.0, 31.0, 30.0, 45.0, 41.0, 43.0, 52.0, 55.0, 51.0, 49.0, 34.0, 41.0, 26.0, 34.0, 27.0, 28.0, 17.0, 15.0, 11.0, 14.0, 5.0, 17.0, 7.0, 10.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.244912624359131, -5.088364601135254, -4.931816577911377, -4.7752685546875, -4.618720531463623, -4.462172508239746, -4.305624485015869, -4.149076461791992, -3.992528200149536, -3.835980176925659, -3.6794321537017822, -3.5228841304779053, -3.366335868835449, -3.2097878456115723, -3.0532398223876953, -2.8966917991638184, -2.7401437759399414, -2.5835957527160645, -2.4270477294921875, -2.2704997062683105, -2.1139516830444336, -1.957403540611267, -1.8008553981781006, -1.6443073749542236, -1.4877593517303467, -1.3312113285064697, -1.1746633052825928, -1.0181151628494263, -0.8615671396255493, -0.7050191164016724, -0.5484710335731506, -0.3919229507446289, -0.23537540435791016, -0.07882735133171082, 0.07772070169448853, 0.23426875472068787, 0.3908168077468872, 0.5473648309707642, 0.7039129137992859, 0.8604609966278076, 1.0170090198516846, 1.1735570430755615, 1.3301050662994385, 1.486653208732605, 1.643201231956482, 1.7997492551803589, 1.9562973976135254, 2.1128454208374023, 2.2693934440612793, 2.4259414672851562, 2.582489490509033, 2.73903751373291, 2.895585536956787, 3.052133560180664, 3.20868182182312, 3.365229845046997, 3.521777868270874, 3.678325891494751, 3.834873914718628, 3.991421937942505, 4.147970199584961, 4.304518222808838, 4.461066246032715, 4.617614269256592, 4.774162292480469]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 5.0, 9.0, 10.0, 21.0, 20.0, 32.0, 51.0, 103.0, 146.0, 303.0, 607.0, 1421.0, 3445.0, 9056.0, 27560.0, 98023.0, 353505.0, 391568.0, 113761.0, 31759.0, 10257.0, 3838.0, 1598.0, 722.0, 318.0, 173.0, 95.0, 40.0, 38.0, 19.0, 11.0, 11.0, 10.0, 4.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1484375, -14.6085205078125, -14.068603515625, -13.5286865234375, -12.98876953125, -12.4488525390625, -11.908935546875, -11.3690185546875, -10.8291015625, -10.2891845703125, -9.749267578125, -9.2093505859375, -8.66943359375, -8.1295166015625, -7.589599609375, -7.0496826171875, -6.509765625, -5.9698486328125, -5.429931640625, -4.8900146484375, -4.35009765625, -3.8101806640625, -3.270263671875, -2.7303466796875, -2.1904296875, -1.6505126953125, -1.110595703125, -0.5706787109375, -0.03076171875, 0.5091552734375, 1.049072265625, 1.5889892578125, 2.12890625, 2.6688232421875, 3.208740234375, 3.7486572265625, 4.28857421875, 4.8284912109375, 5.368408203125, 5.9083251953125, 6.4482421875, 6.9881591796875, 7.528076171875, 8.0679931640625, 8.60791015625, 9.1478271484375, 9.687744140625, 10.2276611328125, 10.767578125, 11.3074951171875, 11.847412109375, 12.3873291015625, 12.92724609375, 13.4671630859375, 14.007080078125, 14.5469970703125, 15.0869140625, 15.6268310546875, 16.166748046875, 16.7066650390625, 17.24658203125, 17.7864990234375, 18.326416015625, 18.8663330078125, 19.40625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 6.0, 3.0, 6.0, 7.0, 9.0, 13.0, 10.0, 26.0, 16.0, 31.0, 17.0, 31.0, 40.0, 30.0, 48.0, 42.0, 36.0, 50.0, 35.0, 52.0, 56.0, 57.0, 52.0, 52.0, 47.0, 33.0, 29.0, 28.0, 32.0, 23.0, 15.0, 13.0, 10.0, 9.0, 8.0, 8.0, 7.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.90625, -4.7279052734375, -4.549560546875, -4.3712158203125, -4.19287109375, -4.0145263671875, -3.836181640625, -3.6578369140625, -3.4794921875, -3.3011474609375, -3.122802734375, -2.9444580078125, -2.76611328125, -2.5877685546875, -2.409423828125, -2.2310791015625, -2.052734375, -1.8743896484375, -1.696044921875, -1.5177001953125, -1.33935546875, -1.1610107421875, -0.982666015625, -0.8043212890625, -0.6259765625, -0.4476318359375, -0.269287109375, -0.0909423828125, 0.08740234375, 0.2657470703125, 0.444091796875, 0.6224365234375, 0.80078125, 0.9791259765625, 1.157470703125, 1.3358154296875, 1.51416015625, 1.6925048828125, 1.870849609375, 2.0491943359375, 2.2275390625, 2.4058837890625, 2.584228515625, 2.7625732421875, 2.94091796875, 3.1192626953125, 3.297607421875, 3.4759521484375, 3.654296875, 3.8326416015625, 4.010986328125, 4.1893310546875, 4.36767578125, 4.5460205078125, 4.724365234375, 4.9027099609375, 5.0810546875, 5.2593994140625, 5.437744140625, 5.6160888671875, 5.79443359375, 5.9727783203125, 6.151123046875, 6.3294677734375, 6.5078125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 3.0, 5.0, 15.0, 8.0, 10.0, 9.0, 21.0, 21.0, 15.0, 30.0, 18.0, 29.0, 23.0, 42.0, 32.0, 53.0, 96.0, 286.0, 2083.0, 61531.0, 916227.0, 65076.0, 2169.0, 297.0, 108.0, 51.0, 45.0, 32.0, 27.0, 34.0, 28.0, 24.0, 20.0, 15.0, 6.0, 11.0, 12.0, 9.0, 8.0, 5.0, 10.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-57.34375, -55.63232421875, -53.9208984375, -52.20947265625, -50.498046875, -48.78662109375, -47.0751953125, -45.36376953125, -43.65234375, -41.94091796875, -40.2294921875, -38.51806640625, -36.806640625, -35.09521484375, -33.3837890625, -31.67236328125, -29.9609375, -28.24951171875, -26.5380859375, -24.82666015625, -23.115234375, -21.40380859375, -19.6923828125, -17.98095703125, -16.26953125, -14.55810546875, -12.8466796875, -11.13525390625, -9.423828125, -7.71240234375, -6.0009765625, -4.28955078125, -2.578125, -0.86669921875, 0.8447265625, 2.55615234375, 4.267578125, 5.97900390625, 7.6904296875, 9.40185546875, 11.11328125, 12.82470703125, 14.5361328125, 16.24755859375, 17.958984375, 19.67041015625, 21.3818359375, 23.09326171875, 24.8046875, 26.51611328125, 28.2275390625, 29.93896484375, 31.650390625, 33.36181640625, 35.0732421875, 36.78466796875, 38.49609375, 40.20751953125, 41.9189453125, 43.63037109375, 45.341796875, 47.05322265625, 48.7646484375, 50.47607421875, 52.1875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 8.0, 10.0, 9.0, 13.0, 18.0, 13.0, 15.0, 21.0, 28.0, 19.0, 19.0, 25.0, 26.0, 33.0, 36.0, 36.0, 31.0, 43.0, 33.0, 44.0, 35.0, 36.0, 40.0, 33.0, 26.0, 39.0, 45.0, 29.0, 31.0, 25.0, 29.0, 34.0, 16.0, 15.0, 9.0, 12.0, 14.0, 7.0, 8.0, 8.0, 7.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-5.546875, -5.3807373046875, -5.214599609375, -5.0484619140625, -4.88232421875, -4.7161865234375, -4.550048828125, -4.3839111328125, -4.2177734375, -4.0516357421875, -3.885498046875, -3.7193603515625, -3.55322265625, -3.3870849609375, -3.220947265625, -3.0548095703125, -2.888671875, -2.7225341796875, -2.556396484375, -2.3902587890625, -2.22412109375, -2.0579833984375, -1.891845703125, -1.7257080078125, -1.5595703125, -1.3934326171875, -1.227294921875, -1.0611572265625, -0.89501953125, -0.7288818359375, -0.562744140625, -0.3966064453125, -0.23046875, -0.0643310546875, 0.101806640625, 0.2679443359375, 0.43408203125, 0.6002197265625, 0.766357421875, 0.9324951171875, 1.0986328125, 1.2647705078125, 1.430908203125, 1.5970458984375, 1.76318359375, 1.9293212890625, 2.095458984375, 2.2615966796875, 2.427734375, 2.5938720703125, 2.760009765625, 2.9261474609375, 3.09228515625, 3.2584228515625, 3.424560546875, 3.5906982421875, 3.7568359375, 3.9229736328125, 4.089111328125, 4.2552490234375, 4.42138671875, 4.5875244140625, 4.753662109375, 4.9197998046875, 5.0859375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 8.0, 21.0, 19.0, 21.0, 46.0, 61.0, 95.0, 251.0, 999.0, 6866.0, 106310.0, 899347.0, 30649.0, 2904.0, 533.0, 167.0, 83.0, 55.0, 48.0, 23.0, 9.0, 13.0, 7.0, 4.0, 7.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.16796875, -3.0893707275390625, -3.010772705078125, -2.9321746826171875, -2.85357666015625, -2.7749786376953125, -2.696380615234375, -2.6177825927734375, -2.5391845703125, -2.4605865478515625, -2.381988525390625, -2.3033905029296875, -2.22479248046875, -2.1461944580078125, -2.067596435546875, -1.9889984130859375, -1.910400390625, -1.8318023681640625, -1.753204345703125, -1.6746063232421875, -1.59600830078125, -1.5174102783203125, -1.438812255859375, -1.3602142333984375, -1.2816162109375, -1.2030181884765625, -1.124420166015625, -1.0458221435546875, -0.96722412109375, -0.8886260986328125, -0.810028076171875, -0.7314300537109375, -0.65283203125, -0.5742340087890625, -0.495635986328125, -0.4170379638671875, -0.33843994140625, -0.2598419189453125, -0.181243896484375, -0.1026458740234375, -0.0240478515625, 0.0545501708984375, 0.133148193359375, 0.2117462158203125, 0.29034423828125, 0.3689422607421875, 0.447540283203125, 0.5261383056640625, 0.604736328125, 0.6833343505859375, 0.761932373046875, 0.8405303955078125, 0.91912841796875, 0.9977264404296875, 1.076324462890625, 1.1549224853515625, 1.2335205078125, 1.3121185302734375, 1.390716552734375, 1.4693145751953125, 1.54791259765625, 1.6265106201171875, 1.705108642578125, 1.7837066650390625, 1.8623046875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 12.0, 16.0, 20.0, 31.0, 51.0, 58.0, 91.0, 166.0, 212.0, 106.0, 66.0, 53.0, 34.0, 25.0, 15.0, 11.0, 16.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018215179443359375, -0.00017493963241577148, -0.00016772747039794922, -0.00016051530838012695, -0.0001533031463623047, -0.00014609098434448242, -0.00013887882232666016, -0.0001316666603088379, -0.00012445449829101562, -0.00011724233627319336, -0.0001100301742553711, -0.00010281801223754883, -9.560585021972656e-05, -8.83936882019043e-05, -8.118152618408203e-05, -7.396936416625977e-05, -6.67572021484375e-05, -5.9545040130615234e-05, -5.233287811279297e-05, -4.51207160949707e-05, -3.790855407714844e-05, -3.069639205932617e-05, -2.3484230041503906e-05, -1.627206802368164e-05, -9.059906005859375e-06, -1.8477439880371094e-06, 5.364418029785156e-06, 1.2576580047607422e-05, 1.9788742065429688e-05, 2.7000904083251953e-05, 3.421306610107422e-05, 4.1425228118896484e-05, 4.863739013671875e-05, 5.5849552154541016e-05, 6.306171417236328e-05, 7.027387619018555e-05, 7.748603820800781e-05, 8.469820022583008e-05, 9.191036224365234e-05, 9.912252426147461e-05, 0.00010633468627929688, 0.00011354684829711914, 0.0001207590103149414, 0.00012797117233276367, 0.00013518333435058594, 0.0001423954963684082, 0.00014960765838623047, 0.00015681982040405273, 0.000164031982421875, 0.00017124414443969727, 0.00017845630645751953, 0.0001856684684753418, 0.00019288063049316406, 0.00020009279251098633, 0.0002073049545288086, 0.00021451711654663086, 0.00022172927856445312, 0.0002289414405822754, 0.00023615360260009766, 0.00024336576461791992, 0.0002505779266357422, 0.00025779008865356445, 0.0002650022506713867, 0.000272214412689209, 0.00027942657470703125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 6.0, 6.0, 14.0, 14.0, 15.0, 34.0, 109.0, 886.0, 19013.0, 1012094.0, 15348.0, 766.0, 101.0, 60.0, 20.0, 16.0, 9.0, 6.0, 5.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7109375, -4.57427978515625, -4.4376220703125, -4.30096435546875, -4.164306640625, -4.02764892578125, -3.8909912109375, -3.75433349609375, -3.61767578125, -3.48101806640625, -3.3443603515625, -3.20770263671875, -3.071044921875, -2.93438720703125, -2.7977294921875, -2.66107177734375, -2.5244140625, -2.38775634765625, -2.2510986328125, -2.11444091796875, -1.977783203125, -1.84112548828125, -1.7044677734375, -1.56781005859375, -1.43115234375, -1.29449462890625, -1.1578369140625, -1.02117919921875, -0.884521484375, -0.74786376953125, -0.6112060546875, -0.47454833984375, -0.337890625, -0.20123291015625, -0.0645751953125, 0.07208251953125, 0.208740234375, 0.34539794921875, 0.4820556640625, 0.61871337890625, 0.75537109375, 0.89202880859375, 1.0286865234375, 1.16534423828125, 1.302001953125, 1.43865966796875, 1.5753173828125, 1.71197509765625, 1.8486328125, 1.98529052734375, 2.1219482421875, 2.25860595703125, 2.395263671875, 2.53192138671875, 2.6685791015625, 2.80523681640625, 2.94189453125, 3.07855224609375, 3.2152099609375, 3.35186767578125, 3.488525390625, 3.62518310546875, 3.7618408203125, 3.89849853515625, 4.03515625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 6.0, 6.0, 10.0, 14.0, 15.0, 30.0, 41.0, 81.0, 149.0, 318.0, 115.0, 70.0, 50.0, 22.0, 30.0, 11.0, 10.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.483154296875, -0.4690818786621094, -0.45500946044921875, -0.4409370422363281, -0.4268646240234375, -0.4127922058105469, -0.39871978759765625, -0.3846473693847656, -0.370574951171875, -0.3565025329589844, -0.34243011474609375, -0.3283576965332031, -0.3142852783203125, -0.3002128601074219, -0.28614044189453125, -0.2720680236816406, -0.25799560546875, -0.24392318725585938, -0.22985076904296875, -0.21577835083007812, -0.2017059326171875, -0.18763351440429688, -0.17356109619140625, -0.15948867797851562, -0.145416259765625, -0.13134384155273438, -0.11727142333984375, -0.10319900512695312, -0.0891265869140625, -0.07505416870117188, -0.06098175048828125, -0.046909332275390625, -0.0328369140625, -0.018764495849609375, -0.00469207763671875, 0.009380340576171875, 0.0234527587890625, 0.037525177001953125, 0.05159759521484375, 0.06567001342773438, 0.079742431640625, 0.09381484985351562, 0.10788726806640625, 0.12195968627929688, 0.1360321044921875, 0.15010452270507812, 0.16417694091796875, 0.17824935913085938, 0.19232177734375, 0.20639419555664062, 0.22046661376953125, 0.23453903198242188, 0.2486114501953125, 0.2626838684082031, 0.27675628662109375, 0.2908287048339844, 0.304901123046875, 0.3189735412597656, 0.33304595947265625, 0.3471183776855469, 0.3611907958984375, 0.3752632141113281, 0.38933563232421875, 0.4034080505371094, 0.41748046875]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 20.0, 939.0, 59.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.67070007324219, -77.39862823486328, -74.1265640258789, -70.8544921875, -67.58242797851562, -64.31035614013672, -61.03828811645508, -57.76622009277344, -54.4941520690918, -51.222084045410156, -47.950016021728516, -44.677947998046875, -41.40587615966797, -38.133811950683594, -34.86174011230469, -31.589672088623047, -28.317604064941406, -25.045536041259766, -21.773468017578125, -18.50139808654785, -15.229330062866211, -11.95726203918457, -8.685192108154297, -5.413124084472656, -2.1410560607910156, 1.1310124397277832, 4.403080940246582, 7.675149917602539, 10.94721794128418, 14.21928596496582, 17.491355895996094, 20.763423919677734, 24.035491943359375, 27.307559967041016, 30.579627990722656, 33.85169982910156, 37.12376403808594, 40.395835876464844, 43.667903900146484, 46.939971923828125, 50.212039947509766, 53.484107971191406, 56.75617599487305, 60.02824401855469, 63.300315856933594, 66.57238006591797, 69.84445190429688, 73.11651611328125, 76.38858795166016, 79.66065979003906, 82.93272399902344, 86.20479583740234, 89.47686004638672, 92.74893188476562, 96.02099609375, 99.2930679321289, 102.56513977050781, 105.83721160888672, 109.1092758178711, 112.38134765625, 115.65341186523438, 118.92548370361328, 122.19755554199219, 125.46961975097656, 128.74168395996094]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 8.0, 6.0, 6.0, 6.0, 11.0, 19.0, 13.0, 15.0, 14.0, 34.0, 36.0, 21.0, 37.0, 31.0, 37.0, 30.0, 31.0, 32.0, 47.0, 40.0, 40.0, 52.0, 47.0, 47.0, 39.0, 26.0, 42.0, 30.0, 27.0, 25.0, 24.0, 20.0, 19.0, 19.0, 18.0, 14.0, 15.0, 2.0, 10.0, 9.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.860681533813477, -6.655023574829102, -6.449366092681885, -6.24370813369751, -6.038050651550293, -5.832392692565918, -5.626734733581543, -5.421077251434326, -5.215419769287109, -5.009761810302734, -4.804104328155518, -4.598446369171143, -4.392788887023926, -4.187130928039551, -3.981473207473755, -3.775815486907959, -3.570157527923584, -3.364499807357788, -3.158842086791992, -2.953184127807617, -2.7475266456604004, -2.5418686866760254, -2.3362109661102295, -2.1305532455444336, -1.9248955249786377, -1.7192378044128418, -1.513580083847046, -1.3079222440719604, -1.1022645235061646, -0.8966068029403687, -0.6909489631652832, -0.4852912425994873, -0.2796330451965332, -0.07397529482841492, 0.13168245553970337, 0.33734023571014404, 0.5429979562759399, 0.7486556768417358, 0.9543135166168213, 1.1599712371826172, 1.365628957748413, 1.571286678314209, 1.7769443988800049, 1.9826022386550903, 2.188260078430176, 2.3939175605773926, 2.5995755195617676, 2.8052332401275635, 3.0108909606933594, 3.2165486812591553, 3.422206401824951, 3.627864360809326, 3.833521842956543, 4.039179801940918, 4.244837760925293, 4.45049524307251, 4.656152725219727, 4.861810684204102, 5.067468166351318, 5.273126125335693, 5.47878360748291, 5.684441566467285, 5.89009952545166, 6.095757007598877, 6.301414966583252]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 5.0, 7.0, 10.0, 10.0, 14.0, 23.0, 24.0, 20.0, 44.0, 60.0, 71.0, 93.0, 129.0, 183.0, 271.0, 346.0, 562.0, 1010.0, 1844.0, 3957.0, 11055.0, 108952.0, 3755733.0, 284514.0, 14955.0, 4933.0, 2186.0, 1167.0, 653.0, 421.0, 275.0, 192.0, 131.0, 100.0, 62.0, 52.0, 52.0, 50.0, 33.0, 21.0, 23.0, 14.0, 8.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.6640625, -9.3262939453125, -8.988525390625, -8.6507568359375, -8.31298828125, -7.9752197265625, -7.637451171875, -7.2996826171875, -6.9619140625, -6.6241455078125, -6.286376953125, -5.9486083984375, -5.61083984375, -5.2730712890625, -4.935302734375, -4.5975341796875, -4.259765625, -3.9219970703125, -3.584228515625, -3.2464599609375, -2.90869140625, -2.5709228515625, -2.233154296875, -1.8953857421875, -1.5576171875, -1.2198486328125, -0.882080078125, -0.5443115234375, -0.20654296875, 0.1312255859375, 0.468994140625, 0.8067626953125, 1.14453125, 1.4822998046875, 1.820068359375, 2.1578369140625, 2.49560546875, 2.8333740234375, 3.171142578125, 3.5089111328125, 3.8466796875, 4.1844482421875, 4.522216796875, 4.8599853515625, 5.19775390625, 5.5355224609375, 5.873291015625, 6.2110595703125, 6.548828125, 6.8865966796875, 7.224365234375, 7.5621337890625, 7.89990234375, 8.2376708984375, 8.575439453125, 8.9132080078125, 9.2509765625, 9.5887451171875, 9.926513671875, 10.2642822265625, 10.60205078125, 10.9398193359375, 11.277587890625, 11.6153564453125, 11.953125]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 5.0, 4.0, 12.0, 12.0, 14.0, 14.0, 25.0, 21.0, 30.0, 31.0, 28.0, 31.0, 30.0, 28.0, 46.0, 39.0, 41.0, 44.0, 54.0, 47.0, 48.0, 44.0, 32.0, 44.0, 38.0, 34.0, 28.0, 21.0, 24.0, 19.0, 15.0, 24.0, 17.0, 10.0, 15.0, 11.0, 4.0, 7.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.984375, -2.88970947265625, -2.7950439453125, -2.70037841796875, -2.605712890625, -2.51104736328125, -2.4163818359375, -2.32171630859375, -2.22705078125, -2.13238525390625, -2.0377197265625, -1.94305419921875, -1.848388671875, -1.75372314453125, -1.6590576171875, -1.56439208984375, -1.4697265625, -1.37506103515625, -1.2803955078125, -1.18572998046875, -1.091064453125, -0.99639892578125, -0.9017333984375, -0.80706787109375, -0.71240234375, -0.61773681640625, -0.5230712890625, -0.42840576171875, -0.333740234375, -0.23907470703125, -0.1444091796875, -0.04974365234375, 0.044921875, 0.13958740234375, 0.2342529296875, 0.32891845703125, 0.423583984375, 0.51824951171875, 0.6129150390625, 0.70758056640625, 0.80224609375, 0.89691162109375, 0.9915771484375, 1.08624267578125, 1.180908203125, 1.27557373046875, 1.3702392578125, 1.46490478515625, 1.5595703125, 1.65423583984375, 1.7489013671875, 1.84356689453125, 1.938232421875, 2.03289794921875, 2.1275634765625, 2.22222900390625, 2.31689453125, 2.41156005859375, 2.5062255859375, 2.60089111328125, 2.695556640625, 2.79022216796875, 2.8848876953125, 2.97955322265625, 3.07421875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 11.0, 16.0, 19.0, 29.0, 56.0, 114.0, 300.0, 2070.0, 3979733.0, 209965.0, 1398.0, 308.0, 114.0, 52.0, 31.0, 22.0, 14.0, 4.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.0625, -72.91357421875, -70.7646484375, -68.61572265625, -66.466796875, -64.31787109375, -62.1689453125, -60.02001953125, -57.87109375, -55.72216796875, -53.5732421875, -51.42431640625, -49.275390625, -47.12646484375, -44.9775390625, -42.82861328125, -40.6796875, -38.53076171875, -36.3818359375, -34.23291015625, -32.083984375, -29.93505859375, -27.7861328125, -25.63720703125, -23.48828125, -21.33935546875, -19.1904296875, -17.04150390625, -14.892578125, -12.74365234375, -10.5947265625, -8.44580078125, -6.296875, -4.14794921875, -1.9990234375, 0.14990234375, 2.298828125, 4.44775390625, 6.5966796875, 8.74560546875, 10.89453125, 13.04345703125, 15.1923828125, 17.34130859375, 19.490234375, 21.63916015625, 23.7880859375, 25.93701171875, 28.0859375, 30.23486328125, 32.3837890625, 34.53271484375, 36.681640625, 38.83056640625, 40.9794921875, 43.12841796875, 45.27734375, 47.42626953125, 49.5751953125, 51.72412109375, 53.873046875, 56.02197265625, 58.1708984375, 60.31982421875, 62.46875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 13.0, 10.0, 16.0, 23.0, 48.0, 81.0, 398.0, 1722.0, 1309.0, 262.0, 75.0, 40.0, 25.0, 19.0, 12.0, 7.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.046875, -3.930877685546875, -3.81488037109375, -3.698883056640625, -3.5828857421875, -3.466888427734375, -3.35089111328125, -3.234893798828125, -3.118896484375, -3.002899169921875, -2.88690185546875, -2.770904541015625, -2.6549072265625, -2.538909912109375, -2.42291259765625, -2.306915283203125, -2.19091796875, -2.074920654296875, -1.95892333984375, -1.842926025390625, -1.7269287109375, -1.610931396484375, -1.49493408203125, -1.378936767578125, -1.262939453125, -1.146942138671875, -1.03094482421875, -0.914947509765625, -0.7989501953125, -0.682952880859375, -0.56695556640625, -0.450958251953125, -0.3349609375, -0.218963623046875, -0.10296630859375, 0.013031005859375, 0.1290283203125, 0.245025634765625, 0.36102294921875, 0.477020263671875, 0.593017578125, 0.709014892578125, 0.82501220703125, 0.941009521484375, 1.0570068359375, 1.173004150390625, 1.28900146484375, 1.404998779296875, 1.52099609375, 1.636993408203125, 1.75299072265625, 1.868988037109375, 1.9849853515625, 2.100982666015625, 2.21697998046875, 2.332977294921875, 2.448974609375, 2.564971923828125, 2.68096923828125, 2.796966552734375, 2.9129638671875, 3.028961181640625, 3.14495849609375, 3.260955810546875, 3.376953125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 6.0, 24.0, 55.0, 284.0, 504.0, 100.0, 26.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.207728862762451, -6.501781463623047, -5.795834541320801, -5.089887619018555, -4.38394021987915, -3.677993059158325, -2.9720458984375, -2.2660984992980957, -1.5601515769958496, -0.8542044162750244, -0.14825725555419922, 0.557689905166626, 1.2636370658874512, 1.9695842266082764, 2.6755313873291016, 3.381478786468506, 4.087425708770752, 4.793373107910156, 5.499320030212402, 6.205266952514648, 6.911214351654053, 7.617161750793457, 8.323108673095703, 9.029056549072266, 9.735002517700195, 10.440949440002441, 11.146896362304688, 11.85284423828125, 12.558791160583496, 13.264738082885742, 13.970685958862305, 14.67663288116455, 15.382579803466797, 16.08852767944336, 16.79447364807129, 17.50042152404785, 18.20636749267578, 18.912315368652344, 19.618263244628906, 20.32421112060547, 21.0301570892334, 21.73610496520996, 22.44205093383789, 23.147998809814453, 23.853946685791016, 24.559892654418945, 25.265840530395508, 25.971786499023438, 26.677734375, 27.383682250976562, 28.089628219604492, 28.795576095581055, 29.501522064208984, 30.207469940185547, 30.91341781616211, 31.619365692138672, 32.32530975341797, 33.03125762939453, 33.737205505371094, 34.44314956665039, 35.14909744262695, 35.855045318603516, 36.56099319458008, 37.26694107055664, 37.9728889465332]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 10.0, 8.0, 9.0, 15.0, 18.0, 20.0, 18.0, 18.0, 27.0, 28.0, 24.0, 23.0, 22.0, 34.0, 45.0, 38.0, 29.0, 37.0, 31.0, 45.0, 47.0, 45.0, 41.0, 40.0, 34.0, 26.0, 31.0, 28.0, 21.0, 25.0, 18.0, 24.0, 16.0, 13.0, 11.0, 17.0, 12.0, 6.0, 4.0, 13.0, 2.0, 10.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.899132013320923, -2.804241895675659, -2.7093520164489746, -2.614461898803711, -2.5195717811584473, -2.4246816635131836, -2.329791784286499, -2.2349016666412354, -2.140011787414551, -2.045121669769287, -1.950231671333313, -1.8553416728973389, -1.7604515552520752, -1.665561556816101, -1.570671558380127, -1.4757814407348633, -1.3808913230895996, -1.2860013246536255, -1.1911112070083618, -1.0962212085723877, -1.001331090927124, -0.9064410924911499, -0.8115510940551758, -0.7166610360145569, -0.621770977973938, -0.5268809199333191, -0.4319908916950226, -0.3371008634567261, -0.24221080541610718, -0.14732074737548828, -0.05243074893951416, 0.042459309101104736, 0.13734936714172363, 0.23223941028118134, 0.32712945342063904, 0.42201948165893555, 0.5169095396995544, 0.6117995977401733, 0.7066895961761475, 0.8015796542167664, 0.8964697122573853, 0.9913597702980042, 1.086249828338623, 1.1811398267745972, 1.2760298252105713, 1.370919942855835, 1.465809941291809, 1.5606999397277832, 1.6555900573730469, 1.750480055809021, 1.8453701734542847, 1.9402601718902588, 2.0351502895355225, 2.130040168762207, 2.2249302864074707, 2.3198204040527344, 2.414710521697998, 2.5096006393432617, 2.6044905185699463, 2.69938063621521, 2.7942707538604736, 2.889160633087158, 2.984050750732422, 3.0789408683776855, 3.17383074760437]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 3.0, 3.0, 5.0, 4.0, 11.0, 8.0, 16.0, 27.0, 41.0, 73.0, 111.0, 251.0, 420.0, 806.0, 1629.0, 3390.0, 6907.0, 15326.0, 36792.0, 101327.0, 347545.0, 361194.0, 104802.0, 38016.0, 15780.0, 7094.0, 3448.0, 1683.0, 885.0, 432.0, 205.0, 124.0, 70.0, 35.0, 26.0, 17.0, 14.0, 12.0, 7.0, 8.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.703125, -12.23291015625, -11.7626953125, -11.29248046875, -10.822265625, -10.35205078125, -9.8818359375, -9.41162109375, -8.94140625, -8.47119140625, -8.0009765625, -7.53076171875, -7.060546875, -6.59033203125, -6.1201171875, -5.64990234375, -5.1796875, -4.70947265625, -4.2392578125, -3.76904296875, -3.298828125, -2.82861328125, -2.3583984375, -1.88818359375, -1.41796875, -0.94775390625, -0.4775390625, -0.00732421875, 0.462890625, 0.93310546875, 1.4033203125, 1.87353515625, 2.34375, 2.81396484375, 3.2841796875, 3.75439453125, 4.224609375, 4.69482421875, 5.1650390625, 5.63525390625, 6.10546875, 6.57568359375, 7.0458984375, 7.51611328125, 7.986328125, 8.45654296875, 8.9267578125, 9.39697265625, 9.8671875, 10.33740234375, 10.8076171875, 11.27783203125, 11.748046875, 12.21826171875, 12.6884765625, 13.15869140625, 13.62890625, 14.09912109375, 14.5693359375, 15.03955078125, 15.509765625, 15.97998046875, 16.4501953125, 16.92041015625, 17.390625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 7.0, 9.0, 13.0, 12.0, 29.0, 22.0, 30.0, 37.0, 36.0, 22.0, 53.0, 63.0, 64.0, 56.0, 70.0, 66.0, 55.0, 51.0, 54.0, 52.0, 37.0, 29.0, 36.0, 25.0, 15.0, 9.0, 14.0, 6.0, 13.0, 8.0, 3.0, 3.0, 8.0], "bins": [-3.724609375, -3.64312744140625, -3.5616455078125, -3.48016357421875, -3.398681640625, -3.31719970703125, -3.2357177734375, -3.15423583984375, -3.07275390625, -2.99127197265625, -2.9097900390625, -2.82830810546875, -2.746826171875, -2.66534423828125, -2.5838623046875, -2.50238037109375, -2.4208984375, -2.33941650390625, -2.2579345703125, -2.17645263671875, -2.094970703125, -2.01348876953125, -1.9320068359375, -1.85052490234375, -1.76904296875, -1.68756103515625, -1.6060791015625, -1.52459716796875, -1.443115234375, -1.36163330078125, -1.2801513671875, -1.19866943359375, -1.1171875, -1.03570556640625, -0.9542236328125, -0.87274169921875, -0.791259765625, -0.70977783203125, -0.6282958984375, -0.54681396484375, -0.46533203125, -0.38385009765625, -0.3023681640625, -0.22088623046875, -0.139404296875, -0.05792236328125, 0.0235595703125, 0.10504150390625, 0.1865234375, 0.26800537109375, 0.3494873046875, 0.43096923828125, 0.512451171875, 0.59393310546875, 0.6754150390625, 0.75689697265625, 0.83837890625, 0.91986083984375, 1.0013427734375, 1.08282470703125, 1.164306640625, 1.24578857421875, 1.3272705078125, 1.40875244140625, 1.490234375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 5.0, 4.0, 7.0, 10.0, 9.0, 22.0, 33.0, 40.0, 43.0, 79.0, 95.0, 153.0, 232.0, 304.0, 420.0, 548.0, 718.0, 1106.0, 1624.0, 2339.0, 3531.0, 5266.0, 7857.0, 12530.0, 20574.0, 38641.0, 103995.0, 654044.0, 99756.0, 38064.0, 20355.0, 12167.0, 7760.0, 5060.0, 3518.0, 2341.0, 1609.0, 1033.0, 778.0, 567.0, 365.0, 279.0, 211.0, 127.0, 94.0, 80.0, 46.0, 32.0, 28.0, 21.0, 12.0, 15.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0], "bins": [-10.90625, -10.5484619140625, -10.190673828125, -9.8328857421875, -9.47509765625, -9.1173095703125, -8.759521484375, -8.4017333984375, -8.0439453125, -7.6861572265625, -7.328369140625, -6.9705810546875, -6.61279296875, -6.2550048828125, -5.897216796875, -5.5394287109375, -5.181640625, -4.8238525390625, -4.466064453125, -4.1082763671875, -3.75048828125, -3.3927001953125, -3.034912109375, -2.6771240234375, -2.3193359375, -1.9615478515625, -1.603759765625, -1.2459716796875, -0.88818359375, -0.5303955078125, -0.172607421875, 0.1851806640625, 0.54296875, 0.9007568359375, 1.258544921875, 1.6163330078125, 1.97412109375, 2.3319091796875, 2.689697265625, 3.0474853515625, 3.4052734375, 3.7630615234375, 4.120849609375, 4.4786376953125, 4.83642578125, 5.1942138671875, 5.552001953125, 5.9097900390625, 6.267578125, 6.6253662109375, 6.983154296875, 7.3409423828125, 7.69873046875, 8.0565185546875, 8.414306640625, 8.7720947265625, 9.1298828125, 9.4876708984375, 9.845458984375, 10.2032470703125, 10.56103515625, 10.9188232421875, 11.276611328125, 11.6343994140625, 11.9921875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 9.0, 16.0, 15.0, 12.0, 18.0, 14.0, 23.0, 26.0, 24.0, 28.0, 37.0, 32.0, 34.0, 29.0, 33.0, 35.0, 37.0, 35.0, 43.0, 46.0, 38.0, 26.0, 38.0, 37.0, 37.0, 26.0, 25.0, 29.0, 29.0, 23.0, 18.0, 22.0, 20.0, 11.0, 9.0, 13.0, 4.0, 13.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.380859375, -1.3377227783203125, -1.294586181640625, -1.2514495849609375, -1.20831298828125, -1.1651763916015625, -1.122039794921875, -1.0789031982421875, -1.0357666015625, -0.9926300048828125, -0.949493408203125, -0.9063568115234375, -0.86322021484375, -0.8200836181640625, -0.776947021484375, -0.7338104248046875, -0.690673828125, -0.6475372314453125, -0.604400634765625, -0.5612640380859375, -0.51812744140625, -0.4749908447265625, -0.431854248046875, -0.3887176513671875, -0.3455810546875, -0.3024444580078125, -0.259307861328125, -0.2161712646484375, -0.17303466796875, -0.1298980712890625, -0.086761474609375, -0.0436248779296875, -0.00048828125, 0.0426483154296875, 0.085784912109375, 0.1289215087890625, 0.17205810546875, 0.2151947021484375, 0.258331298828125, 0.3014678955078125, 0.3446044921875, 0.3877410888671875, 0.430877685546875, 0.4740142822265625, 0.51715087890625, 0.5602874755859375, 0.603424072265625, 0.6465606689453125, 0.689697265625, 0.7328338623046875, 0.775970458984375, 0.8191070556640625, 0.86224365234375, 0.9053802490234375, 0.948516845703125, 0.9916534423828125, 1.0347900390625, 1.0779266357421875, 1.121063232421875, 1.1641998291015625, 1.20733642578125, 1.2504730224609375, 1.293609619140625, 1.3367462158203125, 1.3798828125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 7.0, 4.0, 12.0, 5.0, 12.0, 21.0, 29.0, 44.0, 48.0, 71.0, 92.0, 124.0, 227.0, 275.0, 407.0, 674.0, 1106.0, 1932.0, 3590.0, 8467.0, 35619.0, 951365.0, 28691.0, 7671.0, 3293.0, 1800.0, 999.0, 673.0, 418.0, 281.0, 177.0, 107.0, 80.0, 57.0, 46.0, 43.0, 28.0, 18.0, 8.0, 6.0, 7.0, 10.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-17.8125, -17.186279296875, -16.56005859375, -15.933837890625, -15.3076171875, -14.681396484375, -14.05517578125, -13.428955078125, -12.802734375, -12.176513671875, -11.55029296875, -10.924072265625, -10.2978515625, -9.671630859375, -9.04541015625, -8.419189453125, -7.79296875, -7.166748046875, -6.54052734375, -5.914306640625, -5.2880859375, -4.661865234375, -4.03564453125, -3.409423828125, -2.783203125, -2.156982421875, -1.53076171875, -0.904541015625, -0.2783203125, 0.347900390625, 0.97412109375, 1.600341796875, 2.2265625, 2.852783203125, 3.47900390625, 4.105224609375, 4.7314453125, 5.357666015625, 5.98388671875, 6.610107421875, 7.236328125, 7.862548828125, 8.48876953125, 9.114990234375, 9.7412109375, 10.367431640625, 10.99365234375, 11.619873046875, 12.24609375, 12.872314453125, 13.49853515625, 14.124755859375, 14.7509765625, 15.377197265625, 16.00341796875, 16.629638671875, 17.255859375, 17.882080078125, 18.50830078125, 19.134521484375, 19.7607421875, 20.386962890625, 21.01318359375, 21.639404296875, 22.265625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 1.0, 3.0, 6.0, 7.0, 15.0, 25.0, 104.0, 689.0, 89.0, 25.0, 9.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.00145721435546875, -0.0014271438121795654, -0.0013970732688903809, -0.0013670027256011963, -0.0013369321823120117, -0.0013068616390228271, -0.0012767910957336426, -0.001246720552444458, -0.0012166500091552734, -0.0011865794658660889, -0.0011565089225769043, -0.0011264383792877197, -0.0010963678359985352, -0.0010662972927093506, -0.001036226749420166, -0.0010061562061309814, -0.0009760856628417969, -0.0009460151195526123, -0.0009159445762634277, -0.0008858740329742432, -0.0008558034896850586, -0.000825732946395874, -0.0007956624031066895, -0.0007655918598175049, -0.0007355213165283203, -0.0007054507732391357, -0.0006753802299499512, -0.0006453096866607666, -0.000615239143371582, -0.0005851686000823975, -0.0005550980567932129, -0.0005250275135040283, -0.0004949569702148438, -0.0004648864269256592, -0.0004348158836364746, -0.00040474534034729004, -0.00037467479705810547, -0.0003446042537689209, -0.00031453371047973633, -0.00028446316719055176, -0.0002543926239013672, -0.00022432208061218262, -0.00019425153732299805, -0.00016418099403381348, -0.0001341104507446289, -0.00010403990745544434, -7.396936416625977e-05, -4.3898820877075195e-05, -1.3828277587890625e-05, 1.6242265701293945e-05, 4.6312808990478516e-05, 7.638335227966309e-05, 0.00010645389556884766, 0.00013652443885803223, 0.0001665949821472168, 0.00019666552543640137, 0.00022673606872558594, 0.0002568066120147705, 0.0002868771553039551, 0.00031694769859313965, 0.0003470182418823242, 0.0003770887851715088, 0.00040715932846069336, 0.00043722987174987793, 0.0004673004150390625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 9.0, 3.0, 7.0, 11.0, 18.0, 17.0, 32.0, 43.0, 88.0, 147.0, 328.0, 909.0, 3925.0, 1026207.0, 13797.0, 1947.0, 580.0, 209.0, 117.0, 49.0, 35.0, 14.0, 14.0, 20.0, 12.0, 5.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.5, -131.40234375, -126.3046875, -121.20703125, -116.109375, -111.01171875, -105.9140625, -100.81640625, -95.71875, -90.62109375, -85.5234375, -80.42578125, -75.328125, -70.23046875, -65.1328125, -60.03515625, -54.9375, -49.83984375, -44.7421875, -39.64453125, -34.546875, -29.44921875, -24.3515625, -19.25390625, -14.15625, -9.05859375, -3.9609375, 1.13671875, 6.234375, 11.33203125, 16.4296875, 21.52734375, 26.625, 31.72265625, 36.8203125, 41.91796875, 47.015625, 52.11328125, 57.2109375, 62.30859375, 67.40625, 72.50390625, 77.6015625, 82.69921875, 87.796875, 92.89453125, 97.9921875, 103.08984375, 108.1875, 113.28515625, 118.3828125, 123.48046875, 128.578125, 133.67578125, 138.7734375, 143.87109375, 148.96875, 154.06640625, 159.1640625, 164.26171875, 169.359375, 174.45703125, 179.5546875, 184.65234375, 189.75]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 10.0, 14.0, 113.0, 786.0, 25.0, 10.0, 6.0, 4.0, 2.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.10546875, -5.88909912109375, -5.6727294921875, -5.45635986328125, -5.239990234375, -5.02362060546875, -4.8072509765625, -4.59088134765625, -4.37451171875, -4.15814208984375, -3.9417724609375, -3.72540283203125, -3.509033203125, -3.29266357421875, -3.0762939453125, -2.85992431640625, -2.6435546875, -2.42718505859375, -2.2108154296875, -1.99444580078125, -1.778076171875, -1.56170654296875, -1.3453369140625, -1.12896728515625, -0.91259765625, -0.69622802734375, -0.4798583984375, -0.26348876953125, -0.047119140625, 0.16925048828125, 0.3856201171875, 0.60198974609375, 0.818359375, 1.03472900390625, 1.2510986328125, 1.46746826171875, 1.683837890625, 1.90020751953125, 2.1165771484375, 2.33294677734375, 2.54931640625, 2.76568603515625, 2.9820556640625, 3.19842529296875, 3.414794921875, 3.63116455078125, 3.8475341796875, 4.06390380859375, 4.2802734375, 4.49664306640625, 4.7130126953125, 4.92938232421875, 5.145751953125, 5.36212158203125, 5.5784912109375, 5.79486083984375, 6.01123046875, 6.22760009765625, 6.4439697265625, 6.66033935546875, 6.876708984375, 7.09307861328125, 7.3094482421875, 7.52581787109375, 7.7421875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 6.0, 15.0, 33.0, 172.0, 578.0, 137.0, 29.0, 18.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.072463989257812, -16.192249298095703, -15.312036514282227, -14.431821823120117, -13.55160903930664, -12.671394348144531, -11.791180610656738, -10.910966873168945, -10.030753135681152, -9.15053939819336, -8.270325660705566, -7.390111446380615, -6.509897708892822, -5.629683971405029, -4.749469757080078, -3.869256019592285, -2.989042282104492, -2.108828544616699, -1.2286145687103271, -0.3484005928039551, 0.5318131446838379, 1.4120268821716309, 2.292241096496582, 3.172454833984375, 4.052668571472168, 4.932882308959961, 5.813096046447754, 6.693310260772705, 7.573523998260498, 8.453737258911133, 9.333951950073242, 10.214165687561035, 11.094379425048828, 11.974593162536621, 12.854806900024414, 13.735021591186523, 14.615234375, 15.49544906616211, 16.37566375732422, 17.255876541137695, 18.136089324951172, 19.01630401611328, 19.896516799926758, 20.776731491088867, 21.656944274902344, 22.537158966064453, 23.417373657226562, 24.29758644104004, 25.17780113220215, 26.058015823364258, 26.938228607177734, 27.818443298339844, 28.69865608215332, 29.57887077331543, 30.459083557128906, 31.339298248291016, 32.219512939453125, 33.099727630615234, 33.979942321777344, 34.86015319824219, 35.7403678894043, 36.620582580566406, 37.500797271728516, 38.381011962890625, 39.26122283935547]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 4.0, 4.0, 9.0, 7.0, 11.0, 16.0, 13.0, 27.0, 26.0, 30.0, 22.0, 31.0, 27.0, 41.0, 33.0, 33.0, 48.0, 45.0, 41.0, 45.0, 35.0, 48.0, 38.0, 27.0, 50.0, 38.0, 45.0, 31.0, 31.0, 25.0, 24.0, 14.0, 11.0, 11.0, 10.0, 13.0, 6.0, 10.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.1880156993865967, -2.1060471534729004, -2.024078607559204, -1.9421099424362183, -1.860141396522522, -1.7781728506088257, -1.6962041854858398, -1.6142356395721436, -1.5322670936584473, -1.450298547744751, -1.3683300018310547, -1.2863613367080688, -1.2043927907943726, -1.1224242448806763, -1.0404555797576904, -0.9584870338439941, -0.8765184879302979, -0.7945499420166016, -0.7125813364982605, -0.6306127309799194, -0.5486441850662231, -0.46667560935020447, -0.3847070336341858, -0.3027384281158447, -0.22076988220214844, -0.13880130648612976, -0.056832730770111084, 0.025135844945907593, 0.10710442066192627, 0.18907299637794495, 0.2710415720939636, 0.3530101776123047, 0.434978723526001, 0.5169472694396973, 0.5989158749580383, 0.6808844804763794, 0.7628530263900757, 0.844821572303772, 0.926790177822113, 1.008758783340454, 1.0907273292541504, 1.1726958751678467, 1.254664421081543, 1.3366330862045288, 1.418601632118225, 1.5005701780319214, 1.5825388431549072, 1.6645073890686035, 1.7464759349822998, 1.828444480895996, 1.9104130268096924, 1.9923816919326782, 2.074350357055664, 2.1563189029693604, 2.2382874488830566, 2.320255994796753, 2.402224540710449, 2.4841930866241455, 2.566161632537842, 2.648130178451538, 2.7300987243652344, 2.8120675086975098, 2.894036054611206, 2.9760046005249023, 3.0579731464385986]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 8.0, 17.0, 25.0, 27.0, 42.0, 57.0, 89.0, 150.0, 229.0, 341.0, 524.0, 910.0, 1629.0, 3347.0, 8045.0, 23643.0, 114547.0, 676712.0, 169757.0, 30423.0, 9369.0, 3911.0, 2013.0, 1081.0, 628.0, 354.0, 221.0, 118.0, 94.0, 61.0, 51.0, 28.0, 26.0, 22.0, 7.0, 11.0, 3.0, 11.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.65625, -16.145263671875, -15.63427734375, -15.123291015625, -14.6123046875, -14.101318359375, -13.59033203125, -13.079345703125, -12.568359375, -12.057373046875, -11.54638671875, -11.035400390625, -10.5244140625, -10.013427734375, -9.50244140625, -8.991455078125, -8.48046875, -7.969482421875, -7.45849609375, -6.947509765625, -6.4365234375, -5.925537109375, -5.41455078125, -4.903564453125, -4.392578125, -3.881591796875, -3.37060546875, -2.859619140625, -2.3486328125, -1.837646484375, -1.32666015625, -0.815673828125, -0.3046875, 0.206298828125, 0.71728515625, 1.228271484375, 1.7392578125, 2.250244140625, 2.76123046875, 3.272216796875, 3.783203125, 4.294189453125, 4.80517578125, 5.316162109375, 5.8271484375, 6.338134765625, 6.84912109375, 7.360107421875, 7.87109375, 8.382080078125, 8.89306640625, 9.404052734375, 9.9150390625, 10.426025390625, 10.93701171875, 11.447998046875, 11.958984375, 12.469970703125, 12.98095703125, 13.491943359375, 14.0029296875, 14.513916015625, 15.02490234375, 15.535888671875, 16.046875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 6.0, 8.0, 11.0, 11.0, 17.0, 21.0, 37.0, 58.0, 75.0, 92.0, 91.0, 104.0, 108.0, 110.0, 84.0, 45.0, 34.0, 25.0, 14.0, 7.0, 11.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.4296875, -5.272216796875, -5.11474609375, -4.957275390625, -4.7998046875, -4.642333984375, -4.48486328125, -4.327392578125, -4.169921875, -4.012451171875, -3.85498046875, -3.697509765625, -3.5400390625, -3.382568359375, -3.22509765625, -3.067626953125, -2.91015625, -2.752685546875, -2.59521484375, -2.437744140625, -2.2802734375, -2.122802734375, -1.96533203125, -1.807861328125, -1.650390625, -1.492919921875, -1.33544921875, -1.177978515625, -1.0205078125, -0.863037109375, -0.70556640625, -0.548095703125, -0.390625, -0.233154296875, -0.07568359375, 0.081787109375, 0.2392578125, 0.396728515625, 0.55419921875, 0.711669921875, 0.869140625, 1.026611328125, 1.18408203125, 1.341552734375, 1.4990234375, 1.656494140625, 1.81396484375, 1.971435546875, 2.12890625, 2.286376953125, 2.44384765625, 2.601318359375, 2.7587890625, 2.916259765625, 3.07373046875, 3.231201171875, 3.388671875, 3.546142578125, 3.70361328125, 3.861083984375, 4.0185546875, 4.176025390625, 4.33349609375, 4.490966796875, 4.6484375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 12.0, 11.0, 6.0, 10.0, 19.0, 17.0, 21.0, 20.0, 31.0, 32.0, 30.0, 43.0, 53.0, 145.0, 398.0, 2058.0, 16789.0, 246098.0, 732419.0, 44744.0, 4338.0, 722.0, 164.0, 83.0, 43.0, 41.0, 24.0, 25.0, 28.0, 22.0, 17.0, 15.0, 16.0, 10.0, 7.0, 10.0, 7.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.015625, -18.385986328125, -17.75634765625, -17.126708984375, -16.4970703125, -15.867431640625, -15.23779296875, -14.608154296875, -13.978515625, -13.348876953125, -12.71923828125, -12.089599609375, -11.4599609375, -10.830322265625, -10.20068359375, -9.571044921875, -8.94140625, -8.311767578125, -7.68212890625, -7.052490234375, -6.4228515625, -5.793212890625, -5.16357421875, -4.533935546875, -3.904296875, -3.274658203125, -2.64501953125, -2.015380859375, -1.3857421875, -0.756103515625, -0.12646484375, 0.503173828125, 1.1328125, 1.762451171875, 2.39208984375, 3.021728515625, 3.6513671875, 4.281005859375, 4.91064453125, 5.540283203125, 6.169921875, 6.799560546875, 7.42919921875, 8.058837890625, 8.6884765625, 9.318115234375, 9.94775390625, 10.577392578125, 11.20703125, 11.836669921875, 12.46630859375, 13.095947265625, 13.7255859375, 14.355224609375, 14.98486328125, 15.614501953125, 16.244140625, 16.873779296875, 17.50341796875, 18.133056640625, 18.7626953125, 19.392333984375, 20.02197265625, 20.651611328125, 21.28125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 12.0, 11.0, 7.0, 11.0, 16.0, 17.0, 25.0, 19.0, 27.0, 18.0, 30.0, 31.0, 37.0, 33.0, 38.0, 54.0, 46.0, 43.0, 44.0, 32.0, 49.0, 45.0, 37.0, 27.0, 28.0, 36.0, 30.0, 20.0, 21.0, 25.0, 18.0, 15.0, 22.0, 19.0, 13.0, 6.0, 10.0, 1.0, 8.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.232421875, -2.149688720703125, -2.06695556640625, -1.984222412109375, -1.9014892578125, -1.818756103515625, -1.73602294921875, -1.653289794921875, -1.570556640625, -1.487823486328125, -1.40509033203125, -1.322357177734375, -1.2396240234375, -1.156890869140625, -1.07415771484375, -0.991424560546875, -0.90869140625, -0.825958251953125, -0.74322509765625, -0.660491943359375, -0.5777587890625, -0.495025634765625, -0.41229248046875, -0.329559326171875, -0.246826171875, -0.164093017578125, -0.08135986328125, 0.001373291015625, 0.0841064453125, 0.166839599609375, 0.24957275390625, 0.332305908203125, 0.4150390625, 0.497772216796875, 0.58050537109375, 0.663238525390625, 0.7459716796875, 0.828704833984375, 0.91143798828125, 0.994171142578125, 1.076904296875, 1.159637451171875, 1.24237060546875, 1.325103759765625, 1.4078369140625, 1.490570068359375, 1.57330322265625, 1.656036376953125, 1.73876953125, 1.821502685546875, 1.90423583984375, 1.986968994140625, 2.0697021484375, 2.152435302734375, 2.23516845703125, 2.317901611328125, 2.400634765625, 2.483367919921875, 2.56610107421875, 2.648834228515625, 2.7315673828125, 2.814300537109375, 2.89703369140625, 2.979766845703125, 3.0625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 8.0, 12.0, 14.0, 24.0, 24.0, 47.0, 54.0, 99.0, 184.0, 237.0, 454.0, 797.0, 1553.0, 3179.0, 7530.0, 22235.0, 115151.0, 782268.0, 83536.0, 18666.0, 6578.0, 2814.0, 1338.0, 666.0, 405.0, 235.0, 150.0, 88.0, 71.0, 43.0, 32.0, 15.0, 14.0, 13.0, 7.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40234375, -0.38767242431640625, -0.3730010986328125, -0.35832977294921875, -0.343658447265625, -0.32898712158203125, -0.3143157958984375, -0.29964447021484375, -0.28497314453125, -0.27030181884765625, -0.2556304931640625, -0.24095916748046875, -0.226287841796875, -0.21161651611328125, -0.1969451904296875, -0.18227386474609375, -0.1676025390625, -0.15293121337890625, -0.1382598876953125, -0.12358856201171875, -0.108917236328125, -0.09424591064453125, -0.0795745849609375, -0.06490325927734375, -0.05023193359375, -0.03556060791015625, -0.0208892822265625, -0.00621795654296875, 0.008453369140625, 0.02312469482421875, 0.0377960205078125, 0.05246734619140625, 0.067138671875, 0.08180999755859375, 0.0964813232421875, 0.11115264892578125, 0.125823974609375, 0.14049530029296875, 0.1551666259765625, 0.16983795166015625, 0.18450927734375, 0.19918060302734375, 0.2138519287109375, 0.22852325439453125, 0.243194580078125, 0.25786590576171875, 0.2725372314453125, 0.28720855712890625, 0.3018798828125, 0.31655120849609375, 0.3312225341796875, 0.34589385986328125, 0.360565185546875, 0.37523651123046875, 0.3899078369140625, 0.40457916259765625, 0.41925048828125, 0.43392181396484375, 0.4485931396484375, 0.46326446533203125, 0.477935791015625, 0.49260711669921875, 0.5072784423828125, 0.5219497680664062, 0.53662109375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 7.0, 5.0, 9.0, 5.0, 7.0, 9.0, 9.0, 13.0, 19.0, 32.0, 36.0, 62.0, 88.0, 145.0, 181.0, 111.0, 69.0, 34.0, 32.0, 28.0, 21.0, 16.0, 16.0, 12.0, 8.0, 4.0, 9.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014925003051757812, -0.00014415010809898376, -0.0001390501856803894, -0.00013395026326179504, -0.00012885034084320068, -0.00012375041842460632, -0.00011865049600601196, -0.0001135505735874176, -0.00010845065116882324, -0.00010335072875022888, -9.825080633163452e-05, -9.315088391304016e-05, -8.80509614944458e-05, -8.295103907585144e-05, -7.785111665725708e-05, -7.275119423866272e-05, -6.765127182006836e-05, -6.2551349401474e-05, -5.745142698287964e-05, -5.235150456428528e-05, -4.725158214569092e-05, -4.215165972709656e-05, -3.70517373085022e-05, -3.195181488990784e-05, -2.6851892471313477e-05, -2.1751970052719116e-05, -1.6652047634124756e-05, -1.1552125215530396e-05, -6.452202796936035e-06, -1.3522803783416748e-06, 3.7476420402526855e-06, 8.847564458847046e-06, 1.3947486877441406e-05, 1.9047409296035767e-05, 2.4147331714630127e-05, 2.9247254133224487e-05, 3.434717655181885e-05, 3.944709897041321e-05, 4.454702138900757e-05, 4.964694380760193e-05, 5.474686622619629e-05, 5.984678864479065e-05, 6.494671106338501e-05, 7.004663348197937e-05, 7.514655590057373e-05, 8.024647831916809e-05, 8.534640073776245e-05, 9.044632315635681e-05, 9.554624557495117e-05, 0.00010064616799354553, 0.00010574609041213989, 0.00011084601283073425, 0.00011594593524932861, 0.00012104585766792297, 0.00012614578008651733, 0.0001312457025051117, 0.00013634562492370605, 0.00014144554734230042, 0.00014654546976089478, 0.00015164539217948914, 0.0001567453145980835, 0.00016184523701667786, 0.00016694515943527222, 0.00017204508185386658, 0.00017714500427246094]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 8.0, 4.0, 3.0, 3.0, 8.0, 6.0, 11.0, 12.0, 13.0, 10.0, 20.0, 15.0, 26.0, 36.0, 36.0, 45.0, 82.0, 251.0, 1335.0, 10202.0, 135267.0, 851923.0, 43350.0, 4772.0, 676.0, 151.0, 77.0, 46.0, 34.0, 23.0, 14.0, 11.0, 14.0, 11.0, 11.0, 11.0, 7.0, 8.0, 6.0, 5.0, 1.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3720703125, -0.3605537414550781, -0.34903717041015625, -0.3375205993652344, -0.3260040283203125, -0.3144874572753906, -0.30297088623046875, -0.2914543151855469, -0.279937744140625, -0.2684211730957031, -0.25690460205078125, -0.24538803100585938, -0.2338714599609375, -0.22235488891601562, -0.21083831787109375, -0.19932174682617188, -0.18780517578125, -0.17628860473632812, -0.16477203369140625, -0.15325546264648438, -0.1417388916015625, -0.13022232055664062, -0.11870574951171875, -0.10718917846679688, -0.095672607421875, -0.08415603637695312, -0.07263946533203125, -0.061122894287109375, -0.0496063232421875, -0.038089752197265625, -0.02657318115234375, -0.015056610107421875, -0.0035400390625, 0.007976531982421875, 0.01949310302734375, 0.031009674072265625, 0.0425262451171875, 0.054042816162109375, 0.06555938720703125, 0.07707595825195312, 0.088592529296875, 0.10010910034179688, 0.11162567138671875, 0.12314224243164062, 0.1346588134765625, 0.14617538452148438, 0.15769195556640625, 0.16920852661132812, 0.18072509765625, 0.19224166870117188, 0.20375823974609375, 0.21527481079101562, 0.2267913818359375, 0.23830795288085938, 0.24982452392578125, 0.2613410949707031, 0.272857666015625, 0.2843742370605469, 0.29589080810546875, 0.3074073791503906, 0.3189239501953125, 0.3304405212402344, 0.34195709228515625, 0.3534736633300781, 0.364990234375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 9.0, 4.0, 3.0, 5.0, 9.0, 6.0, 6.0, 13.0, 8.0, 19.0, 19.0, 16.0, 23.0, 33.0, 32.0, 40.0, 42.0, 43.0, 54.0, 65.0, 62.0, 64.0, 56.0, 72.0, 46.0, 41.0, 36.0, 23.0, 35.0, 20.0, 14.0, 12.0, 8.0, 9.0, 12.0, 5.0, 11.0, 7.0, 3.0, 5.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.050384521484375, -0.04880523681640625, -0.0472259521484375, -0.04564666748046875, -0.0440673828125, -0.04248809814453125, -0.0409088134765625, -0.03932952880859375, -0.037750244140625, -0.03617095947265625, -0.0345916748046875, -0.03301239013671875, -0.03143310546875, -0.02985382080078125, -0.0282745361328125, -0.02669525146484375, -0.025115966796875, -0.02353668212890625, -0.0219573974609375, -0.02037811279296875, -0.018798828125, -0.01721954345703125, -0.0156402587890625, -0.01406097412109375, -0.012481689453125, -0.01090240478515625, -0.0093231201171875, -0.00774383544921875, -0.00616455078125, -0.00458526611328125, -0.0030059814453125, -0.00142669677734375, 0.000152587890625, 0.00173187255859375, 0.0033111572265625, 0.00489044189453125, 0.0064697265625, 0.00804901123046875, 0.0096282958984375, 0.01120758056640625, 0.012786865234375, 0.01436614990234375, 0.0159454345703125, 0.01752471923828125, 0.01910400390625, 0.02068328857421875, 0.0222625732421875, 0.02384185791015625, 0.025421142578125, 0.02700042724609375, 0.0285797119140625, 0.03015899658203125, 0.03173828125, 0.03331756591796875, 0.0348968505859375, 0.03647613525390625, 0.038055419921875, 0.03963470458984375, 0.0412139892578125, 0.04279327392578125, 0.04437255859375, 0.04595184326171875, 0.0475311279296875, 0.04911041259765625, 0.050689697265625]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 27.0, 148.0, 699.0, 117.0, 17.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.592079162597656, -25.74797821044922, -24.90387535095215, -24.059772491455078, -23.21567153930664, -22.371570587158203, -21.527467727661133, -20.683364868164062, -19.839263916015625, -18.995162963867188, -18.151060104370117, -17.306957244873047, -16.46285629272461, -15.618754386901855, -14.774652481079102, -13.930550575256348, -13.086448669433594, -12.24234676361084, -11.398244857788086, -10.554142951965332, -9.710041046142578, -8.865939140319824, -8.02183723449707, -7.177735328674316, -6.3336334228515625, -5.489531517028809, -4.645429611206055, -3.801327705383301, -2.957225799560547, -2.113123893737793, -1.269021987915039, -0.42492008209228516, 0.41918182373046875, 1.2632837295532227, 2.1073856353759766, 2.9514875411987305, 3.7955894470214844, 4.639691352844238, 5.483793258666992, 6.327895164489746, 7.1719970703125, 8.016098976135254, 8.860200881958008, 9.704302787780762, 10.548404693603516, 11.39250659942627, 12.236608505249023, 13.080710411071777, 13.924812316894531, 14.768914222717285, 15.613016128540039, 16.45711898803711, 17.301219940185547, 18.145320892333984, 18.989423751831055, 19.833526611328125, 20.677627563476562, 21.521728515625, 22.36583137512207, 23.20993423461914, 24.054035186767578, 24.898136138916016, 25.742238998413086, 26.586341857910156, 27.430442810058594]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 7.0, 12.0, 12.0, 16.0, 16.0, 21.0, 19.0, 32.0, 28.0, 41.0, 47.0, 42.0, 48.0, 49.0, 56.0, 26.0, 60.0, 49.0, 57.0, 38.0, 38.0, 34.0, 36.0, 24.0, 34.0, 35.0, 33.0, 9.0, 20.0, 11.0, 17.0, 10.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4972128868103027, -3.3730785846710205, -3.2489442825317383, -3.124809741973877, -3.0006754398345947, -2.8765411376953125, -2.7524068355560303, -2.628272533416748, -2.5041379928588867, -2.3800036907196045, -2.2558693885803223, -2.131734848022461, -2.0076005458831787, -1.8834662437438965, -1.7593319416046143, -1.635197639465332, -1.5110633373260498, -1.3869290351867676, -1.2627946138381958, -1.1386603116989136, -1.0145258903503418, -0.8903915882110596, -0.7662572860717773, -0.6421229243278503, -0.5179885625839233, -0.39385420083999634, -0.2697198688983917, -0.1455855369567871, -0.021451175212860107, 0.1026831865310669, 0.22681748867034912, 0.3509518504142761, 0.4750862121582031, 0.5992205739021301, 0.7233549356460571, 0.8474892377853394, 0.9716235995292664, 1.0957579612731934, 1.2198922634124756, 1.3440265655517578, 1.4681609869003296, 1.5922952890396118, 1.7164297103881836, 1.8405640125274658, 1.964698314666748, 2.0888328552246094, 2.2129669189453125, 2.337101459503174, 2.461235761642456, 2.5853700637817383, 2.7095043659210205, 2.8336386680603027, 2.957773208618164, 3.0819075107574463, 3.2060418128967285, 3.3301761150360107, 3.454310417175293, 3.578444719314575, 3.7025790214538574, 3.8267135620117188, 3.950847864151001, 4.074982166290283, 4.1991167068481445, 4.323250770568848, 4.447385311126709]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 6.0, 12.0, 21.0, 30.0, 34.0, 53.0, 94.0, 194.0, 383.0, 885.0, 3313.0, 3963093.0, 222027.0, 2662.0, 775.0, 311.0, 152.0, 76.0, 53.0, 34.0, 28.0, 15.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0], "bins": [-50.625, -49.446533203125, -48.26806640625, -47.089599609375, -45.9111328125, -44.732666015625, -43.55419921875, -42.375732421875, -41.197265625, -40.018798828125, -38.84033203125, -37.661865234375, -36.4833984375, -35.304931640625, -34.12646484375, -32.947998046875, -31.76953125, -30.591064453125, -29.41259765625, -28.234130859375, -27.0556640625, -25.877197265625, -24.69873046875, -23.520263671875, -22.341796875, -21.163330078125, -19.98486328125, -18.806396484375, -17.6279296875, -16.449462890625, -15.27099609375, -14.092529296875, -12.9140625, -11.735595703125, -10.55712890625, -9.378662109375, -8.2001953125, -7.021728515625, -5.84326171875, -4.664794921875, -3.486328125, -2.307861328125, -1.12939453125, 0.049072265625, 1.2275390625, 2.406005859375, 3.58447265625, 4.762939453125, 5.94140625, 7.119873046875, 8.29833984375, 9.476806640625, 10.6552734375, 11.833740234375, 13.01220703125, 14.190673828125, 15.369140625, 16.547607421875, 17.72607421875, 18.904541015625, 20.0830078125, 21.261474609375, 22.43994140625, 23.618408203125, 24.796875]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 4.0, 10.0, 16.0, 24.0, 16.0, 30.0, 46.0, 52.0, 64.0, 72.0, 80.0, 88.0, 96.0, 80.0, 61.0, 58.0, 50.0, 50.0, 29.0, 25.0, 14.0, 11.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0], "bins": [-3.392578125, -3.313568115234375, -3.23455810546875, -3.155548095703125, -3.0765380859375, -2.997528076171875, -2.91851806640625, -2.839508056640625, -2.760498046875, -2.681488037109375, -2.60247802734375, -2.523468017578125, -2.4444580078125, -2.365447998046875, -2.28643798828125, -2.207427978515625, -2.12841796875, -2.049407958984375, -1.97039794921875, -1.891387939453125, -1.8123779296875, -1.733367919921875, -1.65435791015625, -1.575347900390625, -1.496337890625, -1.417327880859375, -1.33831787109375, -1.259307861328125, -1.1802978515625, -1.101287841796875, -1.02227783203125, -0.943267822265625, -0.8642578125, -0.785247802734375, -0.70623779296875, -0.627227783203125, -0.5482177734375, -0.469207763671875, -0.39019775390625, -0.311187744140625, -0.232177734375, -0.153167724609375, -0.07415771484375, 0.004852294921875, 0.0838623046875, 0.162872314453125, 0.24188232421875, 0.320892333984375, 0.39990234375, 0.478912353515625, 0.55792236328125, 0.636932373046875, 0.7159423828125, 0.794952392578125, 0.87396240234375, 0.952972412109375, 1.031982421875, 1.110992431640625, 1.19000244140625, 1.269012451171875, 1.3480224609375, 1.427032470703125, 1.50604248046875, 1.585052490234375, 1.6640625]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 13.0, 14.0, 25.0, 57.0, 103.0, 264.0, 880.0, 8154.0, 4162942.0, 19877.0, 1300.0, 359.0, 128.0, 59.0, 33.0, 16.0, 8.0, 9.0, 5.0, 7.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.53125, -35.41162109375, -34.2919921875, -33.17236328125, -32.052734375, -30.93310546875, -29.8134765625, -28.69384765625, -27.57421875, -26.45458984375, -25.3349609375, -24.21533203125, -23.095703125, -21.97607421875, -20.8564453125, -19.73681640625, -18.6171875, -17.49755859375, -16.3779296875, -15.25830078125, -14.138671875, -13.01904296875, -11.8994140625, -10.77978515625, -9.66015625, -8.54052734375, -7.4208984375, -6.30126953125, -5.181640625, -4.06201171875, -2.9423828125, -1.82275390625, -0.703125, 0.41650390625, 1.5361328125, 2.65576171875, 3.775390625, 4.89501953125, 6.0146484375, 7.13427734375, 8.25390625, 9.37353515625, 10.4931640625, 11.61279296875, 12.732421875, 13.85205078125, 14.9716796875, 16.09130859375, 17.2109375, 18.33056640625, 19.4501953125, 20.56982421875, 21.689453125, 22.80908203125, 23.9287109375, 25.04833984375, 26.16796875, 27.28759765625, 28.4072265625, 29.52685546875, 30.646484375, 31.76611328125, 32.8857421875, 34.00537109375, 35.125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 8.0, 8.0, 6.0, 8.0, 9.0, 10.0, 16.0, 34.0, 98.0, 379.0, 2880.0, 387.0, 111.0, 45.0, 18.0, 11.0, 9.0, 9.0, 3.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.216796875, -1.1708526611328125, -1.124908447265625, -1.0789642333984375, -1.03302001953125, -0.9870758056640625, -0.941131591796875, -0.8951873779296875, -0.8492431640625, -0.8032989501953125, -0.757354736328125, -0.7114105224609375, -0.66546630859375, -0.6195220947265625, -0.573577880859375, -0.5276336669921875, -0.481689453125, -0.4357452392578125, -0.389801025390625, -0.3438568115234375, -0.29791259765625, -0.2519683837890625, -0.206024169921875, -0.1600799560546875, -0.1141357421875, -0.0681915283203125, -0.022247314453125, 0.0236968994140625, 0.06964111328125, 0.1155853271484375, 0.161529541015625, 0.2074737548828125, 0.25341796875, 0.2993621826171875, 0.345306396484375, 0.3912506103515625, 0.43719482421875, 0.4831390380859375, 0.529083251953125, 0.5750274658203125, 0.6209716796875, 0.6669158935546875, 0.712860107421875, 0.7588043212890625, 0.80474853515625, 0.8506927490234375, 0.896636962890625, 0.9425811767578125, 0.988525390625, 1.0344696044921875, 1.080413818359375, 1.1263580322265625, 1.17230224609375, 1.2182464599609375, 1.264190673828125, 1.3101348876953125, 1.3560791015625, 1.4020233154296875, 1.447967529296875, 1.4939117431640625, 1.53985595703125, 1.5858001708984375, 1.631744384765625, 1.6776885986328125, 1.7236328125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 11.0, 19.0, 65.0, 300.0, 513.0, 75.0, 17.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.319766521453857, -4.881290912628174, -4.44281530380249, -4.004339694976807, -3.565864086151123, -3.1273882389068604, -2.6889126300811768, -2.250437021255493, -1.8119614124298096, -1.373485803604126, -0.9350101351737976, -0.49653446674346924, -0.058058857917785645, 0.3804168701171875, 0.8188924789428711, 1.2573680877685547, 1.6958436965942383, 2.134319305419922, 2.5727949142456055, 3.011270523071289, 3.4497461318969727, 3.8882219791412354, 4.32669734954834, 4.765172958374023, 5.203648567199707, 5.642124176025391, 6.080599784851074, 6.519075393676758, 6.957551002502441, 7.396026611328125, 7.834502220153809, 8.272977828979492, 8.711453437805176, 9.14992904663086, 9.588404655456543, 10.026880264282227, 10.46535587310791, 10.903831481933594, 11.342307090759277, 11.780782699584961, 12.219258308410645, 12.657733917236328, 13.096209526062012, 13.534685134887695, 13.973160743713379, 14.411636352539062, 14.850111961364746, 15.28858757019043, 15.72706413269043, 16.16554069519043, 16.604015350341797, 17.042491912841797, 17.480966567993164, 17.919443130493164, 18.35791778564453, 18.79639434814453, 19.2348690032959, 19.6733455657959, 20.111820220947266, 20.550296783447266, 20.988771438598633, 21.427248001098633, 21.86572265625, 22.30419921875, 22.742673873901367]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 4.0, 3.0, 2.0, 7.0, 3.0, 6.0, 9.0, 7.0, 12.0, 13.0, 17.0, 10.0, 15.0, 12.0, 27.0, 28.0, 28.0, 33.0, 25.0, 31.0, 35.0, 43.0, 52.0, 41.0, 39.0, 32.0, 29.0, 33.0, 33.0, 46.0, 32.0, 21.0, 32.0, 29.0, 25.0, 18.0, 29.0, 21.0, 19.0, 24.0, 17.0, 9.0, 12.0, 10.0, 15.0, 6.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0150731801986694, -0.9798888564109802, -0.9447044730186462, -0.909520149230957, -0.874335765838623, -0.8391514420509338, -0.8039671182632446, -0.7687827348709106, -0.7335984110832214, -0.6984140872955322, -0.6632297039031982, -0.628045380115509, -0.5928610563278198, -0.5576766729354858, -0.5224923491477966, -0.48730799555778503, -0.45212364196777344, -0.41693928837776184, -0.38175493478775024, -0.34657061100006104, -0.31138625741004944, -0.27620190382003784, -0.24101756513118744, -0.20583322644233704, -0.17064887285232544, -0.13546451926231384, -0.10028018057346344, -0.06509583443403244, -0.02991148829460144, 0.005272865295410156, 0.04045720398426056, 0.07564154267311096, 0.11082589626312256, 0.14601024985313416, 0.18119458854198456, 0.21637892723083496, 0.25156328082084656, 0.28674763441085815, 0.32193195819854736, 0.35711631178855896, 0.39230066537857056, 0.42748501896858215, 0.46266937255859375, 0.49785369634628296, 0.5330380201339722, 0.5682224035263062, 0.6034067273139954, 0.6385910511016846, 0.6737754344940186, 0.7089597582817078, 0.7441441416740417, 0.779328465461731, 0.8145128488540649, 0.8496971726417542, 0.8848814964294434, 0.9200658798217773, 0.9552502036094666, 0.9904345273971558, 1.0256189107894897, 1.0608032941818237, 1.0959875583648682, 1.1311719417572021, 1.1663563251495361, 1.2015405893325806, 1.2367249727249146]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 7.0, 7.0, 8.0, 10.0, 21.0, 16.0, 30.0, 64.0, 78.0, 145.0, 268.0, 464.0, 1051.0, 2277.0, 6003.0, 17985.0, 76640.0, 528185.0, 338796.0, 53875.0, 14024.0, 4696.0, 1937.0, 889.0, 450.0, 255.0, 139.0, 85.0, 56.0, 33.0, 19.0, 8.0, 7.0, 7.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.984375, -10.6695556640625, -10.354736328125, -10.0399169921875, -9.72509765625, -9.4102783203125, -9.095458984375, -8.7806396484375, -8.4658203125, -8.1510009765625, -7.836181640625, -7.5213623046875, -7.20654296875, -6.8917236328125, -6.576904296875, -6.2620849609375, -5.947265625, -5.6324462890625, -5.317626953125, -5.0028076171875, -4.68798828125, -4.3731689453125, -4.058349609375, -3.7435302734375, -3.4287109375, -3.1138916015625, -2.799072265625, -2.4842529296875, -2.16943359375, -1.8546142578125, -1.539794921875, -1.2249755859375, -0.91015625, -0.5953369140625, -0.280517578125, 0.0343017578125, 0.34912109375, 0.6639404296875, 0.978759765625, 1.2935791015625, 1.6083984375, 1.9232177734375, 2.238037109375, 2.5528564453125, 2.86767578125, 3.1824951171875, 3.497314453125, 3.8121337890625, 4.126953125, 4.4417724609375, 4.756591796875, 5.0714111328125, 5.38623046875, 5.7010498046875, 6.015869140625, 6.3306884765625, 6.6455078125, 6.9603271484375, 7.275146484375, 7.5899658203125, 7.90478515625, 8.2196044921875, 8.534423828125, 8.8492431640625, 9.1640625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 7.0, 14.0, 22.0, 26.0, 52.0, 55.0, 67.0, 89.0, 96.0, 102.0, 94.0, 71.0, 77.0, 53.0, 60.0, 38.0, 27.0, 17.0, 8.0, 2.0, 4.0, 8.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.8310546875, -1.78717041015625, -1.7432861328125, -1.69940185546875, -1.655517578125, -1.61163330078125, -1.5677490234375, -1.52386474609375, -1.47998046875, -1.43609619140625, -1.3922119140625, -1.34832763671875, -1.304443359375, -1.26055908203125, -1.2166748046875, -1.17279052734375, -1.12890625, -1.08502197265625, -1.0411376953125, -0.99725341796875, -0.953369140625, -0.90948486328125, -0.8656005859375, -0.82171630859375, -0.77783203125, -0.73394775390625, -0.6900634765625, -0.64617919921875, -0.602294921875, -0.55841064453125, -0.5145263671875, -0.47064208984375, -0.4267578125, -0.38287353515625, -0.3389892578125, -0.29510498046875, -0.251220703125, -0.20733642578125, -0.1634521484375, -0.11956787109375, -0.07568359375, -0.03179931640625, 0.0120849609375, 0.05596923828125, 0.099853515625, 0.14373779296875, 0.1876220703125, 0.23150634765625, 0.275390625, 0.31927490234375, 0.3631591796875, 0.40704345703125, 0.450927734375, 0.49481201171875, 0.5386962890625, 0.58258056640625, 0.62646484375, 0.67034912109375, 0.7142333984375, 0.75811767578125, 0.802001953125, 0.84588623046875, 0.8897705078125, 0.93365478515625, 0.9775390625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 5.0, 2.0, 4.0, 8.0, 8.0, 18.0, 28.0, 39.0, 34.0, 55.0, 66.0, 108.0, 150.0, 169.0, 249.0, 359.0, 447.0, 574.0, 855.0, 1260.0, 1913.0, 2796.0, 4392.0, 6897.0, 11282.0, 19774.0, 36863.0, 83656.0, 619373.0, 143291.0, 49987.0, 25213.0, 14233.0, 8377.0, 5249.0, 3399.0, 2250.0, 1474.0, 1056.0, 735.0, 539.0, 369.0, 263.0, 186.0, 143.0, 102.0, 74.0, 61.0, 46.0, 29.0, 25.0, 18.0, 12.0, 14.0, 18.0, 5.0, 8.0, 4.0, 3.0, 0.0, 1.0], "bins": [-3.283203125, -3.179656982421875, -3.07611083984375, -2.972564697265625, -2.8690185546875, -2.765472412109375, -2.66192626953125, -2.558380126953125, -2.454833984375, -2.351287841796875, -2.24774169921875, -2.144195556640625, -2.0406494140625, -1.937103271484375, -1.83355712890625, -1.730010986328125, -1.62646484375, -1.522918701171875, -1.41937255859375, -1.315826416015625, -1.2122802734375, -1.108734130859375, -1.00518798828125, -0.901641845703125, -0.798095703125, -0.694549560546875, -0.59100341796875, -0.487457275390625, -0.3839111328125, -0.280364990234375, -0.17681884765625, -0.073272705078125, 0.0302734375, 0.133819580078125, 0.23736572265625, 0.340911865234375, 0.4444580078125, 0.548004150390625, 0.65155029296875, 0.755096435546875, 0.858642578125, 0.962188720703125, 1.06573486328125, 1.169281005859375, 1.2728271484375, 1.376373291015625, 1.47991943359375, 1.583465576171875, 1.68701171875, 1.790557861328125, 1.89410400390625, 1.997650146484375, 2.1011962890625, 2.204742431640625, 2.30828857421875, 2.411834716796875, 2.515380859375, 2.618927001953125, 2.72247314453125, 2.826019287109375, 2.9295654296875, 3.033111572265625, 3.13665771484375, 3.240203857421875, 3.34375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 6.0, 8.0, 12.0, 7.0, 5.0, 10.0, 14.0, 17.0, 12.0, 20.0, 27.0, 19.0, 28.0, 19.0, 24.0, 29.0, 30.0, 45.0, 36.0, 41.0, 33.0, 39.0, 47.0, 35.0, 42.0, 28.0, 36.0, 25.0, 29.0, 26.0, 24.0, 30.0, 23.0, 28.0, 16.0, 18.0, 23.0, 17.0, 15.0, 8.0, 9.0, 11.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 4.0], "bins": [-0.419189453125, -0.40625762939453125, -0.3933258056640625, -0.38039398193359375, -0.367462158203125, -0.35453033447265625, -0.3415985107421875, -0.32866668701171875, -0.31573486328125, -0.30280303955078125, -0.2898712158203125, -0.27693939208984375, -0.264007568359375, -0.25107574462890625, -0.2381439208984375, -0.22521209716796875, -0.2122802734375, -0.19934844970703125, -0.1864166259765625, -0.17348480224609375, -0.160552978515625, -0.14762115478515625, -0.1346893310546875, -0.12175750732421875, -0.10882568359375, -0.09589385986328125, -0.0829620361328125, -0.07003021240234375, -0.057098388671875, -0.04416656494140625, -0.0312347412109375, -0.01830291748046875, -0.00537109375, 0.00756072998046875, 0.0204925537109375, 0.03342437744140625, 0.046356201171875, 0.05928802490234375, 0.0722198486328125, 0.08515167236328125, 0.09808349609375, 0.11101531982421875, 0.1239471435546875, 0.13687896728515625, 0.149810791015625, 0.16274261474609375, 0.1756744384765625, 0.18860626220703125, 0.2015380859375, 0.21446990966796875, 0.2274017333984375, 0.24033355712890625, 0.253265380859375, 0.26619720458984375, 0.2791290283203125, 0.29206085205078125, 0.30499267578125, 0.31792449951171875, 0.3308563232421875, 0.34378814697265625, 0.356719970703125, 0.36965179443359375, 0.3825836181640625, 0.39551544189453125, 0.408447265625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 5.0, 7.0, 15.0, 17.0, 17.0, 30.0, 32.0, 53.0, 68.0, 103.0, 141.0, 197.0, 313.0, 476.0, 764.0, 1346.0, 2664.0, 6875.0, 39073.0, 949356.0, 34212.0, 6680.0, 2565.0, 1308.0, 780.0, 470.0, 329.0, 197.0, 146.0, 87.0, 55.0, 44.0, 38.0, 23.0, 15.0, 11.0, 8.0, 8.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.71923828125, -0.6970901489257812, -0.6749420166015625, -0.6527938842773438, -0.630645751953125, -0.6084976196289062, -0.5863494873046875, -0.5642013549804688, -0.54205322265625, -0.5199050903320312, -0.4977569580078125, -0.47560882568359375, -0.453460693359375, -0.43131256103515625, -0.4091644287109375, -0.38701629638671875, -0.3648681640625, -0.34272003173828125, -0.3205718994140625, -0.29842376708984375, -0.276275634765625, -0.25412750244140625, -0.2319793701171875, -0.20983123779296875, -0.18768310546875, -0.16553497314453125, -0.1433868408203125, -0.12123870849609375, -0.099090576171875, -0.07694244384765625, -0.0547943115234375, -0.03264617919921875, -0.010498046875, 0.01165008544921875, 0.0337982177734375, 0.05594635009765625, 0.078094482421875, 0.10024261474609375, 0.1223907470703125, 0.14453887939453125, 0.16668701171875, 0.18883514404296875, 0.2109832763671875, 0.23313140869140625, 0.255279541015625, 0.27742767333984375, 0.2995758056640625, 0.32172393798828125, 0.3438720703125, 0.36602020263671875, 0.3881683349609375, 0.41031646728515625, 0.432464599609375, 0.45461273193359375, 0.4767608642578125, 0.49890899658203125, 0.52105712890625, 0.5432052612304688, 0.5653533935546875, 0.5875015258789062, 0.609649658203125, 0.6317977905273438, 0.6539459228515625, 0.6760940551757812, 0.6982421875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 1.0, 5.0, 5.0, 9.0, 4.0, 2.0, 9.0, 5.0, 10.0, 16.0, 30.0, 28.0, 41.0, 72.0, 80.0, 195.0, 171.0, 97.0, 49.0, 37.0, 26.0, 21.0, 17.0, 12.0, 7.0, 15.0, 2.0, 5.0, 1.0, 4.0, 5.0, 7.0, 4.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6510486602783203e-05, -1.5897676348686218e-05, -1.5284866094589233e-05, -1.4672055840492249e-05, -1.4059245586395264e-05, -1.3446435332298279e-05, -1.2833625078201294e-05, -1.2220814824104309e-05, -1.1608004570007324e-05, -1.099519431591034e-05, -1.0382384061813354e-05, -9.76957380771637e-06, -9.156763553619385e-06, -8.5439532995224e-06, -7.931143045425415e-06, -7.31833279132843e-06, -6.705522537231445e-06, -6.0927122831344604e-06, -5.479902029037476e-06, -4.867091774940491e-06, -4.254281520843506e-06, -3.641471266746521e-06, -3.028661012649536e-06, -2.4158507585525513e-06, -1.8030405044555664e-06, -1.1902302503585815e-06, -5.774199962615967e-07, 3.5390257835388184e-08, 6.48200511932373e-07, 1.261010766029358e-06, 1.8738210201263428e-06, 2.4866312742233276e-06, 3.0994415283203125e-06, 3.7122517824172974e-06, 4.325062036514282e-06, 4.937872290611267e-06, 5.550682544708252e-06, 6.163492798805237e-06, 6.776303052902222e-06, 7.3891133069992065e-06, 8.001923561096191e-06, 8.614733815193176e-06, 9.227544069290161e-06, 9.840354323387146e-06, 1.0453164577484131e-05, 1.1065974831581116e-05, 1.16787850856781e-05, 1.2291595339775085e-05, 1.290440559387207e-05, 1.3517215847969055e-05, 1.413002610206604e-05, 1.4742836356163025e-05, 1.535564661026001e-05, 1.5968456864356995e-05, 1.658126711845398e-05, 1.7194077372550964e-05, 1.780688762664795e-05, 1.8419697880744934e-05, 1.903250813484192e-05, 1.9645318388938904e-05, 2.025812864303589e-05, 2.0870938897132874e-05, 2.148374915122986e-05, 2.2096559405326843e-05, 2.2709369659423828e-05]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 7.0, 3.0, 0.0, 3.0, 4.0, 6.0, 10.0, 10.0, 33.0, 41.0, 94.0, 284.0, 1353.0, 18496.0, 1023470.0, 3833.0, 620.0, 153.0, 38.0, 30.0, 16.0, 9.0, 12.0, 3.0, 5.0, 7.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.369140625, -1.326690673828125, -1.28424072265625, -1.241790771484375, -1.1993408203125, -1.156890869140625, -1.11444091796875, -1.071990966796875, -1.029541015625, -0.987091064453125, -0.94464111328125, -0.902191162109375, -0.8597412109375, -0.817291259765625, -0.77484130859375, -0.732391357421875, -0.68994140625, -0.647491455078125, -0.60504150390625, -0.562591552734375, -0.5201416015625, -0.477691650390625, -0.43524169921875, -0.392791748046875, -0.350341796875, -0.307891845703125, -0.26544189453125, -0.222991943359375, -0.1805419921875, -0.138092041015625, -0.09564208984375, -0.053192138671875, -0.0107421875, 0.031707763671875, 0.07415771484375, 0.116607666015625, 0.1590576171875, 0.201507568359375, 0.24395751953125, 0.286407470703125, 0.328857421875, 0.371307373046875, 0.41375732421875, 0.456207275390625, 0.4986572265625, 0.541107177734375, 0.58355712890625, 0.626007080078125, 0.66845703125, 0.710906982421875, 0.75335693359375, 0.795806884765625, 0.8382568359375, 0.880706787109375, 0.92315673828125, 0.965606689453125, 1.008056640625, 1.050506591796875, 1.09295654296875, 1.135406494140625, 1.1778564453125, 1.220306396484375, 1.26275634765625, 1.305206298828125, 1.34765625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 9.0, 2.0, 7.0, 22.0, 51.0, 157.0, 556.0, 113.0, 39.0, 13.0, 9.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0860595703125, -0.0834054946899414, -0.08075141906738281, -0.07809734344482422, -0.07544326782226562, -0.07278919219970703, -0.07013511657714844, -0.06748104095458984, -0.06482696533203125, -0.062172889709472656, -0.05951881408691406, -0.05686473846435547, -0.054210662841796875, -0.05155658721923828, -0.04890251159667969, -0.046248435974121094, -0.0435943603515625, -0.040940284729003906, -0.03828620910644531, -0.03563213348388672, -0.032978057861328125, -0.03032398223876953, -0.027669906616210938, -0.025015830993652344, -0.02236175537109375, -0.019707679748535156, -0.017053604125976562, -0.014399528503417969, -0.011745452880859375, -0.009091377258300781, -0.0064373016357421875, -0.0037832260131835938, -0.001129150390625, 0.0015249252319335938, 0.0041790008544921875, 0.006833076477050781, 0.009487152099609375, 0.012141227722167969, 0.014795303344726562, 0.017449378967285156, 0.02010345458984375, 0.022757530212402344, 0.025411605834960938, 0.02806568145751953, 0.030719757080078125, 0.03337383270263672, 0.03602790832519531, 0.038681983947753906, 0.0413360595703125, 0.043990135192871094, 0.04664421081542969, 0.04929828643798828, 0.051952362060546875, 0.05460643768310547, 0.05726051330566406, 0.059914588928222656, 0.06256866455078125, 0.06522274017333984, 0.06787681579589844, 0.07053089141845703, 0.07318496704101562, 0.07583904266357422, 0.07849311828613281, 0.0811471939086914, 0.08380126953125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 30.0, 128.0, 629.0, 160.0, 32.0, 8.0, 6.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6101734638214111, -1.4408358335494995, -1.2714980840682983, -1.1021604537963867, -0.9328227639198303, -0.7634850740432739, -0.5941474437713623, -0.42480969429016113, -0.2554720640182495, -0.08613438904285431, 0.0832032859325409, 0.2525409460067749, 0.4218786358833313, 0.5912163257598877, 0.7605539560317993, 0.9298917055130005, 1.099229335784912, 1.2685669660568237, 1.437904715538025, 1.6072423458099365, 1.7765800952911377, 1.9459177255630493, 2.115255355834961, 2.284593105316162, 2.4539308547973633, 2.6232686042785645, 2.7926061153411865, 2.9619438648223877, 3.131281614303589, 3.300619125366211, 3.469956874847412, 3.6392946243286133, 3.8086323738098145, 3.9779701232910156, 4.147307872772217, 4.316645622253418, 4.485982894897461, 4.655320644378662, 4.824658393859863, 4.9939961433410645, 5.163333892822266, 5.332671642303467, 5.502009391784668, 5.671346664428711, 5.840684413909912, 6.010022163391113, 6.1793599128723145, 6.348697662353516, 6.518034934997559, 6.68737268447876, 6.856710433959961, 7.026047706604004, 7.195385456085205, 7.364723205566406, 7.534060955047607, 7.703398704528809, 7.87273645401001, 8.042074203491211, 8.211411476135254, 8.380749702453613, 8.550086975097656, 8.719425201416016, 8.888762474060059, 9.058099746704102, 9.227437973022461]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 5.0, 1.0, 8.0, 8.0, 6.0, 7.0, 9.0, 16.0, 23.0, 23.0, 16.0, 18.0, 28.0, 27.0, 30.0, 39.0, 43.0, 38.0, 41.0, 42.0, 48.0, 39.0, 39.0, 44.0, 36.0, 44.0, 28.0, 34.0, 30.0, 24.0, 32.0, 21.0, 20.0, 18.0, 21.0, 25.0, 20.0, 10.0, 10.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.465716689825058, -0.450582355260849, -0.43544802069664, -0.42031365633010864, -0.40517932176589966, -0.3900449872016907, -0.3749106526374817, -0.3597763180732727, -0.3446419835090637, -0.32950764894485474, -0.31437331438064575, -0.29923897981643677, -0.2841046154499054, -0.2689702808856964, -0.2538359463214874, -0.23870161175727844, -0.22356724739074707, -0.20843291282653809, -0.1932985633611679, -0.17816422879695892, -0.16302987933158875, -0.14789554476737976, -0.13276121020317078, -0.1176268681883812, -0.10249252617359161, -0.08735818415880203, -0.07222384214401245, -0.05708950757980347, -0.041955165565013885, -0.026820823550224304, -0.01168648898601532, 0.0034478530287742615, 0.018582165241241455, 0.033716507256031036, 0.04885084554553032, 0.0639851838350296, 0.07911952584981918, 0.09425386786460876, 0.10938820242881775, 0.12452254444360733, 0.1396568864583969, 0.1547912210226059, 0.16992557048797607, 0.18505990505218506, 0.20019423961639404, 0.21532858908176422, 0.2304629236459732, 0.24559727311134338, 0.26073160767555237, 0.27586594223976135, 0.29100027680397034, 0.3061346411705017, 0.3212689757347107, 0.3364033102989197, 0.35153764486312866, 0.36667197942733765, 0.38180631399154663, 0.3969406485557556, 0.4120749831199646, 0.4272093176841736, 0.44234368205070496, 0.45747801661491394, 0.4726123511791229, 0.4877466857433319, 0.5028810501098633]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 9.0, 18.0, 10.0, 26.0, 53.0, 63.0, 97.0, 149.0, 233.0, 403.0, 701.0, 1209.0, 2400.0, 5425.0, 15760.0, 61331.0, 529371.0, 359366.0, 49302.0, 13153.0, 4655.0, 2152.0, 1096.0, 598.0, 367.0, 211.0, 116.0, 90.0, 60.0, 43.0, 26.0, 14.0, 7.0, 6.0, 7.0, 3.0, 0.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.423828125, -3.33355712890625, -3.2432861328125, -3.15301513671875, -3.062744140625, -2.97247314453125, -2.8822021484375, -2.79193115234375, -2.70166015625, -2.61138916015625, -2.5211181640625, -2.43084716796875, -2.340576171875, -2.25030517578125, -2.1600341796875, -2.06976318359375, -1.9794921875, -1.88922119140625, -1.7989501953125, -1.70867919921875, -1.618408203125, -1.52813720703125, -1.4378662109375, -1.34759521484375, -1.25732421875, -1.16705322265625, -1.0767822265625, -0.98651123046875, -0.896240234375, -0.80596923828125, -0.7156982421875, -0.62542724609375, -0.53515625, -0.44488525390625, -0.3546142578125, -0.26434326171875, -0.174072265625, -0.08380126953125, 0.0064697265625, 0.09674072265625, 0.18701171875, 0.27728271484375, 0.3675537109375, 0.45782470703125, 0.548095703125, 0.63836669921875, 0.7286376953125, 0.81890869140625, 0.9091796875, 0.99945068359375, 1.0897216796875, 1.17999267578125, 1.270263671875, 1.36053466796875, 1.4508056640625, 1.54107666015625, 1.63134765625, 1.72161865234375, 1.8118896484375, 1.90216064453125, 1.992431640625, 2.08270263671875, 2.1729736328125, 2.26324462890625, 2.353515625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 12.0, 11.0, 23.0, 36.0, 51.0, 60.0, 89.0, 102.0, 105.0, 107.0, 100.0, 81.0, 48.0, 46.0, 48.0, 22.0, 16.0, 9.0, 6.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2607421875, -0.24943923950195312, -0.23813629150390625, -0.22683334350585938, -0.2155303955078125, -0.20422744750976562, -0.19292449951171875, -0.18162155151367188, -0.170318603515625, -0.15901565551757812, -0.14771270751953125, -0.13640975952148438, -0.1251068115234375, -0.11380386352539062, -0.10250091552734375, -0.09119796752929688, -0.07989501953125, -0.06859207153320312, -0.05728912353515625, -0.045986175537109375, -0.0346832275390625, -0.023380279541015625, -0.01207733154296875, -0.000774383544921875, 0.010528564453125, 0.021831512451171875, 0.03313446044921875, 0.044437408447265625, 0.0557403564453125, 0.06704330444335938, 0.07834625244140625, 0.08964920043945312, 0.1009521484375, 0.11225509643554688, 0.12355804443359375, 0.13486099243164062, 0.1461639404296875, 0.15746688842773438, 0.16876983642578125, 0.18007278442382812, 0.191375732421875, 0.20267868041992188, 0.21398162841796875, 0.22528457641601562, 0.2365875244140625, 0.24789047241210938, 0.25919342041015625, 0.2704963684082031, 0.28179931640625, 0.2931022644042969, 0.30440521240234375, 0.3157081604003906, 0.3270111083984375, 0.3383140563964844, 0.34961700439453125, 0.3609199523925781, 0.372222900390625, 0.3835258483886719, 0.39482879638671875, 0.4061317443847656, 0.4174346923828125, 0.4287376403808594, 0.44004058837890625, 0.4513435363769531, 0.462646484375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 7.0, 10.0, 12.0, 22.0, 34.0, 33.0, 61.0, 105.0, 152.0, 292.0, 494.0, 912.0, 1789.0, 3610.0, 7550.0, 16821.0, 38695.0, 100107.0, 378769.0, 340377.0, 92731.0, 36284.0, 15570.0, 7091.0, 3299.0, 1654.0, 888.0, 469.0, 241.0, 171.0, 97.0, 70.0, 39.0, 26.0, 18.0, 19.0, 13.0, 5.0, 3.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.79638671875, -0.769805908203125, -0.74322509765625, -0.716644287109375, -0.6900634765625, -0.663482666015625, -0.63690185546875, -0.610321044921875, -0.583740234375, -0.557159423828125, -0.53057861328125, -0.503997802734375, -0.4774169921875, -0.450836181640625, -0.42425537109375, -0.397674560546875, -0.37109375, -0.344512939453125, -0.31793212890625, -0.291351318359375, -0.2647705078125, -0.238189697265625, -0.21160888671875, -0.185028076171875, -0.158447265625, -0.131866455078125, -0.10528564453125, -0.078704833984375, -0.0521240234375, -0.025543212890625, 0.00103759765625, 0.027618408203125, 0.05419921875, 0.080780029296875, 0.10736083984375, 0.133941650390625, 0.1605224609375, 0.187103271484375, 0.21368408203125, 0.240264892578125, 0.266845703125, 0.293426513671875, 0.32000732421875, 0.346588134765625, 0.3731689453125, 0.399749755859375, 0.42633056640625, 0.452911376953125, 0.4794921875, 0.506072998046875, 0.53265380859375, 0.559234619140625, 0.5858154296875, 0.612396240234375, 0.63897705078125, 0.665557861328125, 0.692138671875, 0.718719482421875, 0.74530029296875, 0.771881103515625, 0.7984619140625, 0.825042724609375, 0.85162353515625, 0.878204345703125, 0.90478515625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 11.0, 5.0, 10.0, 19.0, 17.0, 23.0, 26.0, 25.0, 28.0, 32.0, 36.0, 35.0, 41.0, 44.0, 41.0, 51.0, 38.0, 58.0, 48.0, 38.0, 37.0, 38.0, 37.0, 28.0, 32.0, 30.0, 27.0, 21.0, 16.0, 21.0, 15.0, 15.0, 10.0, 13.0, 7.0, 6.0, 7.0, 1.0, 1.0, 1.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1563720703125, -0.1510772705078125, -0.145782470703125, -0.1404876708984375, -0.13519287109375, -0.1298980712890625, -0.124603271484375, -0.1193084716796875, -0.114013671875, -0.1087188720703125, -0.103424072265625, -0.0981292724609375, -0.09283447265625, -0.0875396728515625, -0.082244873046875, -0.0769500732421875, -0.0716552734375, -0.0663604736328125, -0.061065673828125, -0.0557708740234375, -0.05047607421875, -0.0451812744140625, -0.039886474609375, -0.0345916748046875, -0.029296875, -0.0240020751953125, -0.018707275390625, -0.0134124755859375, -0.00811767578125, -0.0028228759765625, 0.002471923828125, 0.0077667236328125, 0.0130615234375, 0.0183563232421875, 0.023651123046875, 0.0289459228515625, 0.03424072265625, 0.0395355224609375, 0.044830322265625, 0.0501251220703125, 0.055419921875, 0.0607147216796875, 0.066009521484375, 0.0713043212890625, 0.07659912109375, 0.0818939208984375, 0.087188720703125, 0.0924835205078125, 0.0977783203125, 0.1030731201171875, 0.108367919921875, 0.1136627197265625, 0.11895751953125, 0.1242523193359375, 0.129547119140625, 0.1348419189453125, 0.14013671875, 0.1454315185546875, 0.150726318359375, 0.1560211181640625, 0.16131591796875, 0.1666107177734375, 0.171905517578125, 0.1772003173828125, 0.1824951171875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 6.0, 2.0, 4.0, 6.0, 9.0, 11.0, 19.0, 23.0, 31.0, 63.0, 71.0, 95.0, 163.0, 240.0, 396.0, 666.0, 1446.0, 3279.0, 9643.0, 58750.0, 907372.0, 50954.0, 8983.0, 3170.0, 1387.0, 700.0, 356.0, 251.0, 142.0, 94.0, 67.0, 48.0, 31.0, 23.0, 14.0, 14.0, 9.0, 5.0, 8.0, 4.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1787109375, -0.1738109588623047, -0.16891098022460938, -0.16401100158691406, -0.15911102294921875, -0.15421104431152344, -0.14931106567382812, -0.1444110870361328, -0.1395111083984375, -0.1346111297607422, -0.12971115112304688, -0.12481117248535156, -0.11991119384765625, -0.11501121520996094, -0.11011123657226562, -0.10521125793457031, -0.100311279296875, -0.09541130065917969, -0.09051132202148438, -0.08561134338378906, -0.08071136474609375, -0.07581138610839844, -0.07091140747070312, -0.06601142883300781, -0.0611114501953125, -0.05621147155761719, -0.051311492919921875, -0.04641151428222656, -0.04151153564453125, -0.03661155700683594, -0.031711578369140625, -0.026811599731445312, -0.02191162109375, -0.017011642456054688, -0.012111663818359375, -0.0072116851806640625, -0.00231170654296875, 0.0025882720947265625, 0.007488250732421875, 0.012388229370117188, 0.0172882080078125, 0.022188186645507812, 0.027088165283203125, 0.03198814392089844, 0.03688812255859375, 0.04178810119628906, 0.046688079833984375, 0.05158805847167969, 0.056488037109375, 0.06138801574707031, 0.06628799438476562, 0.07118797302246094, 0.07608795166015625, 0.08098793029785156, 0.08588790893554688, 0.09078788757324219, 0.0956878662109375, 0.10058784484863281, 0.10548782348632812, 0.11038780212402344, 0.11528778076171875, 0.12018775939941406, 0.12508773803710938, 0.1299877166748047, 0.1348876953125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 6.0, 5.0, 3.0, 5.0, 9.0, 11.0, 13.0, 19.0, 37.0, 58.0, 70.0, 130.0, 215.0, 174.0, 90.0, 46.0, 28.0, 19.0, 13.0, 16.0, 4.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.248453140258789e-05, -3.142375499010086e-05, -3.036297857761383e-05, -2.93022021651268e-05, -2.824142575263977e-05, -2.718064934015274e-05, -2.611987292766571e-05, -2.505909651517868e-05, -2.399832010269165e-05, -2.293754369020462e-05, -2.187676727771759e-05, -2.081599086523056e-05, -1.975521445274353e-05, -1.86944380402565e-05, -1.763366162776947e-05, -1.657288521528244e-05, -1.551210880279541e-05, -1.445133239030838e-05, -1.339055597782135e-05, -1.232977956533432e-05, -1.126900315284729e-05, -1.020822674036026e-05, -9.14745032787323e-06, -8.0866739153862e-06, -7.02589750289917e-06, -5.96512109041214e-06, -4.90434467792511e-06, -3.84356826543808e-06, -2.78279185295105e-06, -1.7220154404640198e-06, -6.612390279769897e-07, 3.995373845100403e-07, 1.4603137969970703e-06, 2.5210902094841003e-06, 3.5818666219711304e-06, 4.64264303445816e-06, 5.7034194469451904e-06, 6.7641958594322205e-06, 7.82497227191925e-06, 8.88574868440628e-06, 9.94652509689331e-06, 1.100730150938034e-05, 1.206807792186737e-05, 1.31288543343544e-05, 1.418963074684143e-05, 1.525040715932846e-05, 1.631118357181549e-05, 1.737195998430252e-05, 1.843273639678955e-05, 1.949351280927658e-05, 2.055428922176361e-05, 2.161506563425064e-05, 2.267584204673767e-05, 2.37366184592247e-05, 2.479739487171173e-05, 2.585817128419876e-05, 2.691894769668579e-05, 2.797972410917282e-05, 2.904050052165985e-05, 3.010127693414688e-05, 3.116205334663391e-05, 3.222282975912094e-05, 3.328360617160797e-05, 3.4344382584095e-05, 3.540515899658203e-05]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 8.0, 8.0, 10.0, 21.0, 36.0, 49.0, 91.0, 140.0, 250.0, 449.0, 848.0, 1603.0, 3056.0, 6492.0, 14699.0, 43050.0, 232456.0, 623107.0, 81606.0, 22638.0, 9085.0, 4166.0, 2108.0, 1099.0, 601.0, 320.0, 221.0, 129.0, 66.0, 40.0, 26.0, 25.0, 10.0, 15.0, 4.0, 7.0, 4.0, 2.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.041229248046875, -0.03990888595581055, -0.038588523864746094, -0.03726816177368164, -0.03594779968261719, -0.034627437591552734, -0.03330707550048828, -0.03198671340942383, -0.030666351318359375, -0.029345989227294922, -0.02802562713623047, -0.026705265045166016, -0.025384902954101562, -0.02406454086303711, -0.022744178771972656, -0.021423816680908203, -0.02010345458984375, -0.018783092498779297, -0.017462730407714844, -0.01614236831665039, -0.014822006225585938, -0.013501644134521484, -0.012181282043457031, -0.010860919952392578, -0.009540557861328125, -0.008220195770263672, -0.006899833679199219, -0.005579471588134766, -0.0042591094970703125, -0.0029387474060058594, -0.0016183853149414062, -0.0002980232238769531, 0.0010223388671875, 0.002342700958251953, 0.0036630630493164062, 0.004983425140380859, 0.0063037872314453125, 0.007624149322509766, 0.008944511413574219, 0.010264873504638672, 0.011585235595703125, 0.012905597686767578, 0.014225959777832031, 0.015546321868896484, 0.016866683959960938, 0.01818704605102539, 0.019507408142089844, 0.020827770233154297, 0.02214813232421875, 0.023468494415283203, 0.024788856506347656, 0.02610921859741211, 0.027429580688476562, 0.028749942779541016, 0.03007030487060547, 0.03139066696166992, 0.032711029052734375, 0.03403139114379883, 0.03535175323486328, 0.036672115325927734, 0.03799247741699219, 0.03931283950805664, 0.040633201599121094, 0.04195356369018555, 0.04327392578125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 5.0, 4.0, 3.0, 6.0, 9.0, 10.0, 7.0, 11.0, 18.0, 17.0, 31.0, 36.0, 54.0, 71.0, 84.0, 76.0, 87.0, 81.0, 85.0, 60.0, 52.0, 38.0, 35.0, 23.0, 12.0, 19.0, 10.0, 8.0, 8.0, 5.0, 5.0, 5.0, 8.0, 3.0, 3.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00815582275390625, -0.007896661758422852, -0.007637500762939453, -0.007378339767456055, -0.007119178771972656, -0.006860017776489258, -0.006600856781005859, -0.006341695785522461, -0.0060825347900390625, -0.005823373794555664, -0.005564212799072266, -0.005305051803588867, -0.005045890808105469, -0.00478672981262207, -0.004527568817138672, -0.0042684078216552734, -0.004009246826171875, -0.0037500858306884766, -0.003490924835205078, -0.0032317638397216797, -0.0029726028442382812, -0.002713441848754883, -0.0024542808532714844, -0.002195119857788086, -0.0019359588623046875, -0.001676797866821289, -0.0014176368713378906, -0.0011584758758544922, -0.0008993148803710938, -0.0006401538848876953, -0.0003809928894042969, -0.00012183189392089844, 0.0001373291015625, 0.00039649009704589844, 0.0006556510925292969, 0.0009148120880126953, 0.0011739730834960938, 0.0014331340789794922, 0.0016922950744628906, 0.001951456069946289, 0.0022106170654296875, 0.002469778060913086, 0.0027289390563964844, 0.002988100051879883, 0.0032472610473632812, 0.0035064220428466797, 0.003765583038330078, 0.0040247440338134766, 0.004283905029296875, 0.0045430660247802734, 0.004802227020263672, 0.00506138801574707, 0.005320549011230469, 0.005579710006713867, 0.005838871002197266, 0.006098031997680664, 0.0063571929931640625, 0.006616353988647461, 0.006875514984130859, 0.007134675979614258, 0.007393836975097656, 0.007652997970581055, 0.007912158966064453, 0.008171319961547852, 0.00843048095703125]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 5.0, 4.0, 11.0, 25.0, 25.0, 31.0, 43.0, 78.0, 131.0, 233.0, 156.0, 90.0, 67.0, 36.0, 27.0, 10.0, 15.0, 6.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.415453165769577, -0.3985787630081177, -0.3817043602466583, -0.364829957485199, -0.3479555547237396, -0.3310811519622803, -0.3142067790031433, -0.2973323464393616, -0.2804579734802246, -0.26358357071876526, -0.2467091679573059, -0.22983476519584656, -0.2129603624343872, -0.19608595967292786, -0.1792115718126297, -0.16233716905117035, -0.1454627513885498, -0.12858834862709045, -0.1117139458656311, -0.09483955055475235, -0.077965147793293, -0.06109074503183365, -0.044216349720954895, -0.027341946959495544, -0.010467544198036194, 0.0064068567007780075, 0.02328125759959221, 0.04015565663576126, 0.05703005939722061, 0.07390446215867996, 0.09077885746955872, 0.10765326023101807, 0.1245276927947998, 0.14140209555625916, 0.1582764983177185, 0.17515090107917786, 0.1920253038406372, 0.20889970660209656, 0.22577409446239471, 0.24264849722385406, 0.2595229148864746, 0.27639731764793396, 0.2932717204093933, 0.31014612317085266, 0.327020525932312, 0.34389492869377136, 0.3607693314552307, 0.3776437044143677, 0.394518107175827, 0.4113925099372864, 0.4282669126987457, 0.4451413154602051, 0.46201571822166443, 0.4788901209831238, 0.49576449394226074, 0.5126389265060425, 0.5295132994651794, 0.5463876724243164, 0.5632621049880981, 0.5801364779472351, 0.5970109105110168, 0.6138852834701538, 0.6307597160339355, 0.6476340889930725, 0.6645085215568542]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 9.0, 7.0, 12.0, 6.0, 10.0, 3.0, 7.0, 10.0, 16.0, 16.0, 17.0, 20.0, 31.0, 23.0, 23.0, 28.0, 27.0, 31.0, 43.0, 28.0, 29.0, 41.0, 32.0, 27.0, 44.0, 34.0, 40.0, 29.0, 35.0, 39.0, 29.0, 20.0, 20.0, 26.0, 27.0, 26.0, 25.0, 24.0, 16.0, 16.0, 10.0, 13.0, 9.0, 6.0, 3.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.16232359409332275, -0.1570339947938919, -0.15174439549446106, -0.1464548110961914, -0.14116521179676056, -0.1358756124973297, -0.13058601319789886, -0.12529641389846802, -0.12000681459903717, -0.11471721529960632, -0.10942762345075607, -0.10413802415132523, -0.09884842485189438, -0.09355883300304413, -0.08826923370361328, -0.08297963440418243, -0.07769004255533218, -0.07240044325590134, -0.06711085140705109, -0.06182125210762024, -0.05653165280818939, -0.05124205723404884, -0.045952461659908295, -0.04066286236047745, -0.0353732667863369, -0.0300836693495512, -0.024794071912765503, -0.019504476338624954, -0.014214878901839256, -0.008925281465053558, -0.0036356858909130096, 0.0016539134085178375, 0.006943508982658386, 0.012233106419444084, 0.017522703856229782, 0.02281229943037033, 0.02810189686715603, 0.03339149430394173, 0.038681089878082275, 0.04397068917751312, 0.04926028475165367, 0.05454988032579422, 0.05983947962522507, 0.06512907147407532, 0.07041867077350616, 0.07570827007293701, 0.08099786937236786, 0.0862874686717987, 0.09157706052064896, 0.0968666598200798, 0.10215625166893005, 0.1074458509683609, 0.11273545026779175, 0.1180250495672226, 0.12331464141607285, 0.1286042332649231, 0.13389383256435394, 0.1391834318637848, 0.14447303116321564, 0.14976263046264648, 0.15505221486091614, 0.16034181416034698, 0.16563141345977783, 0.17092101275920868, 0.17621061205863953]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 8.0, 9.0, 13.0, 26.0, 29.0, 33.0, 56.0, 94.0, 131.0, 241.0, 387.0, 676.0, 1219.0, 2354.0, 6739.0, 4123256.0, 50418.0, 4014.0, 1976.0, 1077.0, 627.0, 340.0, 212.0, 113.0, 70.0, 46.0, 30.0, 23.0, 15.0, 14.0, 9.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.134765625, -1.1030197143554688, -1.0712738037109375, -1.0395278930664062, -1.007781982421875, -0.9760360717773438, -0.9442901611328125, -0.9125442504882812, -0.88079833984375, -0.8490524291992188, -0.8173065185546875, -0.7855606079101562, -0.753814697265625, -0.7220687866210938, -0.6903228759765625, -0.6585769653320312, -0.6268310546875, -0.5950851440429688, -0.5633392333984375, -0.5315933227539062, -0.499847412109375, -0.46810150146484375, -0.4363555908203125, -0.40460968017578125, -0.37286376953125, -0.34111785888671875, -0.3093719482421875, -0.27762603759765625, -0.245880126953125, -0.21413421630859375, -0.1823883056640625, -0.15064239501953125, -0.118896484375, -0.08715057373046875, -0.0554046630859375, -0.02365875244140625, 0.008087158203125, 0.03983306884765625, 0.0715789794921875, 0.10332489013671875, 0.13507080078125, 0.16681671142578125, 0.1985626220703125, 0.23030853271484375, 0.262054443359375, 0.29380035400390625, 0.3255462646484375, 0.35729217529296875, 0.3890380859375, 0.42078399658203125, 0.4525299072265625, 0.48427581787109375, 0.516021728515625, 0.5477676391601562, 0.5795135498046875, 0.6112594604492188, 0.64300537109375, 0.6747512817382812, 0.7064971923828125, 0.7382431030273438, 0.769989013671875, 0.8017349243164062, 0.8334808349609375, 0.8652267456054688, 0.89697265625]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 13.0, 13.0, 13.0, 29.0, 28.0, 27.0, 35.0, 45.0, 55.0, 56.0, 60.0, 66.0, 70.0, 70.0, 55.0, 46.0, 50.0, 49.0, 49.0, 35.0, 31.0, 26.0, 22.0, 16.0, 11.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2763671875, -0.26875877380371094, -0.2611503601074219, -0.2535419464111328, -0.24593353271484375, -0.2383251190185547, -0.23071670532226562, -0.22310829162597656, -0.2154998779296875, -0.20789146423339844, -0.20028305053710938, -0.1926746368408203, -0.18506622314453125, -0.1774578094482422, -0.16984939575195312, -0.16224098205566406, -0.154632568359375, -0.14702415466308594, -0.13941574096679688, -0.1318073272705078, -0.12419891357421875, -0.11659049987792969, -0.10898208618164062, -0.10137367248535156, -0.0937652587890625, -0.08615684509277344, -0.07854843139648438, -0.07094001770019531, -0.06333160400390625, -0.05572319030761719, -0.048114776611328125, -0.04050636291503906, -0.03289794921875, -0.025289535522460938, -0.017681121826171875, -0.010072708129882812, -0.00246429443359375, 0.0051441192626953125, 0.012752532958984375, 0.020360946655273438, 0.0279693603515625, 0.03557777404785156, 0.043186187744140625, 0.05079460144042969, 0.05840301513671875, 0.06601142883300781, 0.07361984252929688, 0.08122825622558594, 0.088836669921875, 0.09644508361816406, 0.10405349731445312, 0.11166191101074219, 0.11927032470703125, 0.1268787384033203, 0.13448715209960938, 0.14209556579589844, 0.1497039794921875, 0.15731239318847656, 0.16492080688476562, 0.1725292205810547, 0.18013763427734375, 0.1877460479736328, 0.19535446166992188, 0.20296287536621094, 0.2105712890625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 9.0, 5.0, 12.0, 12.0, 19.0, 27.0, 23.0, 33.0, 60.0, 58.0, 113.0, 200.0, 345.0, 669.0, 1541.0, 3834.0, 17091.0, 4116574.0, 44331.0, 5393.0, 1941.0, 902.0, 440.0, 216.0, 145.0, 70.0, 52.0, 37.0, 33.0, 35.0, 13.0, 15.0, 12.0, 7.0, 4.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.111328125, -1.0801544189453125, -1.048980712890625, -1.0178070068359375, -0.98663330078125, -0.9554595947265625, -0.924285888671875, -0.8931121826171875, -0.8619384765625, -0.8307647705078125, -0.799591064453125, -0.7684173583984375, -0.73724365234375, -0.7060699462890625, -0.674896240234375, -0.6437225341796875, -0.612548828125, -0.5813751220703125, -0.550201416015625, -0.5190277099609375, -0.48785400390625, -0.4566802978515625, -0.425506591796875, -0.3943328857421875, -0.3631591796875, -0.3319854736328125, -0.300811767578125, -0.2696380615234375, -0.23846435546875, -0.2072906494140625, -0.176116943359375, -0.1449432373046875, -0.11376953125, -0.0825958251953125, -0.051422119140625, -0.0202484130859375, 0.01092529296875, 0.0420989990234375, 0.073272705078125, 0.1044464111328125, 0.1356201171875, 0.1667938232421875, 0.197967529296875, 0.2291412353515625, 0.26031494140625, 0.2914886474609375, 0.322662353515625, 0.3538360595703125, 0.385009765625, 0.4161834716796875, 0.447357177734375, 0.4785308837890625, 0.50970458984375, 0.5408782958984375, 0.572052001953125, 0.6032257080078125, 0.6343994140625, 0.6655731201171875, 0.696746826171875, 0.7279205322265625, 0.75909423828125, 0.7902679443359375, 0.821441650390625, 0.8526153564453125, 0.8837890625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 3.0, 8.0, 22.0, 82.0, 416.0, 3360.0, 117.0, 37.0, 4.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2332763671875, -0.22787094116210938, -0.22246551513671875, -0.21706008911132812, -0.2116546630859375, -0.20624923706054688, -0.20084381103515625, -0.19543838500976562, -0.190032958984375, -0.18462753295898438, -0.17922210693359375, -0.17381668090820312, -0.1684112548828125, -0.16300582885742188, -0.15760040283203125, -0.15219497680664062, -0.14678955078125, -0.14138412475585938, -0.13597869873046875, -0.13057327270507812, -0.1251678466796875, -0.11976242065429688, -0.11435699462890625, -0.10895156860351562, -0.103546142578125, -0.09814071655273438, -0.09273529052734375, -0.08732986450195312, -0.0819244384765625, -0.07651901245117188, -0.07111358642578125, -0.06570816040039062, -0.060302734375, -0.054897308349609375, -0.04949188232421875, -0.044086456298828125, -0.0386810302734375, -0.033275604248046875, -0.02787017822265625, -0.022464752197265625, -0.017059326171875, -0.011653900146484375, -0.00624847412109375, -0.000843048095703125, 0.0045623779296875, 0.009967803955078125, 0.01537322998046875, 0.020778656005859375, 0.02618408203125, 0.031589508056640625, 0.03699493408203125, 0.042400360107421875, 0.0478057861328125, 0.053211212158203125, 0.05861663818359375, 0.06402206420898438, 0.069427490234375, 0.07483291625976562, 0.08023834228515625, 0.08564376831054688, 0.0910491943359375, 0.09645462036132812, 0.10186004638671875, 0.10726547241210938, 0.1126708984375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 8.0, 16.0, 29.0, 41.0, 47.0, 65.0, 207.0, 282.0, 125.0, 71.0, 48.0, 26.0, 15.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42864012718200684, -0.4129214286804199, -0.397202730178833, -0.3814840614795685, -0.36576536297798157, -0.35004666447639465, -0.3343279957771301, -0.3186092972755432, -0.3028905987739563, -0.2871719002723694, -0.27145320177078247, -0.25573453307151794, -0.24001583456993103, -0.22429713606834412, -0.2085784524679184, -0.19285976886749268, -0.17714107036590576, -0.16142237186431885, -0.14570368826389313, -0.1299850046634674, -0.1142663061618805, -0.09854761511087418, -0.08282892405986786, -0.06711023300886154, -0.051391541957855225, -0.03567285090684891, -0.01995415985584259, -0.004235468804836273, 0.011483222246170044, 0.02720191329717636, 0.04292060434818268, 0.058639295399188995, 0.07435804605484009, 0.0900767371058464, 0.10579542815685272, 0.12151411920785904, 0.13723281025886536, 0.15295150876045227, 0.168670192360878, 0.1843888759613037, 0.20010757446289062, 0.21582627296447754, 0.23154495656490326, 0.24726364016532898, 0.2629823386669159, 0.2787010371685028, 0.29441970586776733, 0.31013840436935425, 0.32585710287094116, 0.3415758013725281, 0.357294499874115, 0.3730131685733795, 0.38873186707496643, 0.40445056557655334, 0.42016923427581787, 0.4358879327774048, 0.4516066312789917, 0.4673253297805786, 0.4830440282821655, 0.49876269698143005, 0.5144814252853394, 0.5302000641822815, 0.5459187626838684, 0.5616374611854553, 0.5773561596870422]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 8.0, 2.0, 10.0, 11.0, 14.0, 9.0, 8.0, 18.0, 11.0, 13.0, 18.0, 22.0, 24.0, 28.0, 27.0, 33.0, 38.0, 36.0, 32.0, 43.0, 41.0, 43.0, 30.0, 36.0, 29.0, 36.0, 32.0, 43.0, 33.0, 36.0, 23.0, 22.0, 30.0, 21.0, 32.0, 19.0, 19.0, 6.0, 20.0, 14.0, 7.0, 7.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12995807826519012, -0.12581567466259003, -0.12167328596115112, -0.11753088980913162, -0.11338849365711212, -0.10924609005451202, -0.10510369390249252, -0.10096129775047302, -0.09681890159845352, -0.09267650544643402, -0.08853410929441452, -0.08439171314239502, -0.08024930953979492, -0.07610692083835602, -0.07196451723575592, -0.06782212108373642, -0.06367972493171692, -0.05953732877969742, -0.05539493262767792, -0.05125253275036812, -0.04711013659834862, -0.04296774044632912, -0.03882534056901932, -0.03468294441699982, -0.030540548264980316, -0.026398152112960815, -0.022255754098296165, -0.018113356083631516, -0.013970959931612015, -0.009828563779592514, -0.005686165764927864, -0.0015437677502632141, 0.0025986284017562866, 0.006741025485098362, 0.010883422568440437, 0.015025819651782513, 0.019168216735124588, 0.02331061288714409, 0.02745301090180874, 0.03159540891647339, 0.03573780506849289, 0.03988020122051239, 0.04402259737253189, 0.04816499724984169, 0.05230739340186119, 0.05644978955388069, 0.06059218943119049, 0.06473458558320999, 0.06887698173522949, 0.07301937788724899, 0.0771617740392685, 0.081304170191288, 0.0854465663433075, 0.08958896994590759, 0.0937313660979271, 0.0978737622499466, 0.1020161584019661, 0.1061585545539856, 0.1103009507060051, 0.1144433468580246, 0.1185857504606247, 0.1227281391620636, 0.1268705427646637, 0.1310129463672638, 0.1351553350687027]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 4.0, 11.0, 10.0, 20.0, 15.0, 28.0, 46.0, 52.0, 73.0, 90.0, 160.0, 222.0, 345.0, 494.0, 766.0, 1222.0, 1907.0, 3474.0, 6280.0, 12255.0, 27218.0, 67660.0, 199003.0, 461032.0, 161165.0, 56487.0, 23659.0, 10957.0, 5720.0, 3220.0, 1711.0, 1075.0, 705.0, 445.0, 324.0, 198.0, 113.0, 124.0, 74.0, 51.0, 41.0, 30.0, 12.0, 15.0, 13.0, 11.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.6064453125, -0.5882949829101562, -0.5701446533203125, -0.5519943237304688, -0.533843994140625, -0.5156936645507812, -0.4975433349609375, -0.47939300537109375, -0.46124267578125, -0.44309234619140625, -0.4249420166015625, -0.40679168701171875, -0.388641357421875, -0.37049102783203125, -0.3523406982421875, -0.33419036865234375, -0.3160400390625, -0.29788970947265625, -0.2797393798828125, -0.26158905029296875, -0.243438720703125, -0.22528839111328125, -0.2071380615234375, -0.18898773193359375, -0.17083740234375, -0.15268707275390625, -0.1345367431640625, -0.11638641357421875, -0.098236083984375, -0.08008575439453125, -0.0619354248046875, -0.04378509521484375, -0.025634765625, -0.00748443603515625, 0.0106658935546875, 0.02881622314453125, 0.046966552734375, 0.06511688232421875, 0.0832672119140625, 0.10141754150390625, 0.11956787109375, 0.13771820068359375, 0.1558685302734375, 0.17401885986328125, 0.192169189453125, 0.21031951904296875, 0.2284698486328125, 0.24662017822265625, 0.2647705078125, 0.28292083740234375, 0.3010711669921875, 0.31922149658203125, 0.337371826171875, 0.35552215576171875, 0.3736724853515625, 0.39182281494140625, 0.40997314453125, 0.42812347412109375, 0.4462738037109375, 0.46442413330078125, 0.482574462890625, 0.5007247924804688, 0.5188751220703125, 0.5370254516601562, 0.55517578125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 7.0, 12.0, 9.0, 12.0, 9.0, 11.0, 22.0, 38.0, 34.0, 40.0, 34.0, 37.0, 56.0, 50.0, 58.0, 62.0, 61.0, 55.0, 43.0, 50.0, 55.0, 37.0, 46.0, 27.0, 29.0, 26.0, 16.0, 20.0, 7.0, 9.0, 6.0, 9.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10662841796875, -0.1034708023071289, -0.10031318664550781, -0.09715557098388672, -0.09399795532226562, -0.09084033966064453, -0.08768272399902344, -0.08452510833740234, -0.08136749267578125, -0.07820987701416016, -0.07505226135253906, -0.07189464569091797, -0.06873703002929688, -0.06557941436767578, -0.06242179870605469, -0.059264183044433594, -0.0561065673828125, -0.052948951721191406, -0.04979133605957031, -0.04663372039794922, -0.043476104736328125, -0.04031848907470703, -0.03716087341308594, -0.034003257751464844, -0.03084564208984375, -0.027688026428222656, -0.024530410766601562, -0.02137279510498047, -0.018215179443359375, -0.015057563781738281, -0.011899948120117188, -0.008742332458496094, -0.005584716796875, -0.0024271011352539062, 0.0007305145263671875, 0.0038881301879882812, 0.007045745849609375, 0.010203361511230469, 0.013360977172851562, 0.016518592834472656, 0.01967620849609375, 0.022833824157714844, 0.025991439819335938, 0.02914905548095703, 0.032306671142578125, 0.03546428680419922, 0.03862190246582031, 0.041779518127441406, 0.0449371337890625, 0.048094749450683594, 0.05125236511230469, 0.05440998077392578, 0.057567596435546875, 0.06072521209716797, 0.06388282775878906, 0.06704044342041016, 0.07019805908203125, 0.07335567474365234, 0.07651329040527344, 0.07967090606689453, 0.08282852172851562, 0.08598613739013672, 0.08914375305175781, 0.0923013687133789, 0.095458984375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 6.0, 14.0, 12.0, 21.0, 15.0, 17.0, 20.0, 26.0, 34.0, 73.0, 79.0, 88.0, 142.0, 176.0, 244.0, 344.0, 506.0, 705.0, 1001.0, 1535.0, 2234.0, 3615.0, 5790.0, 9712.0, 17662.0, 36073.0, 90411.0, 655938.0, 127145.0, 43705.0, 21107.0, 11282.0, 6639.0, 4030.0, 2481.0, 1715.0, 1141.0, 760.0, 520.0, 371.0, 292.0, 252.0, 167.0, 125.0, 83.0, 55.0, 58.0, 43.0, 26.0, 20.0, 13.0, 12.0, 10.0, 5.0, 8.0, 0.0, 3.0, 1.0, 2.0, 4.0], "bins": [-0.3857421875, -0.3735466003417969, -0.36135101318359375, -0.3491554260253906, -0.3369598388671875, -0.3247642517089844, -0.31256866455078125, -0.3003730773925781, -0.288177490234375, -0.2759819030761719, -0.26378631591796875, -0.2515907287597656, -0.2393951416015625, -0.22719955444335938, -0.21500396728515625, -0.20280838012695312, -0.19061279296875, -0.17841720581054688, -0.16622161865234375, -0.15402603149414062, -0.1418304443359375, -0.12963485717773438, -0.11743927001953125, -0.10524368286132812, -0.093048095703125, -0.08085250854492188, -0.06865692138671875, -0.056461334228515625, -0.0442657470703125, -0.032070159912109375, -0.01987457275390625, -0.007678985595703125, 0.0045166015625, 0.016712188720703125, 0.02890777587890625, 0.041103363037109375, 0.0532989501953125, 0.06549453735351562, 0.07769012451171875, 0.08988571166992188, 0.102081298828125, 0.11427688598632812, 0.12647247314453125, 0.13866806030273438, 0.1508636474609375, 0.16305923461914062, 0.17525482177734375, 0.18745040893554688, 0.19964599609375, 0.21184158325195312, 0.22403717041015625, 0.23623275756835938, 0.2484283447265625, 0.2606239318847656, 0.27281951904296875, 0.2850151062011719, 0.297210693359375, 0.3094062805175781, 0.32160186767578125, 0.3337974548339844, 0.3459930419921875, 0.3581886291503906, 0.37038421630859375, 0.3825798034667969, 0.394775390625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 9.0, 9.0, 9.0, 11.0, 19.0, 16.0, 28.0, 24.0, 24.0, 29.0, 23.0, 21.0, 39.0, 40.0, 39.0, 34.0, 34.0, 35.0, 38.0, 37.0, 43.0, 31.0, 45.0, 51.0, 31.0, 35.0, 17.0, 31.0, 25.0, 24.0, 25.0, 21.0, 22.0, 12.0, 4.0, 9.0, 12.0, 10.0, 3.0, 2.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.04888916015625, -0.047374725341796875, -0.04586029052734375, -0.044345855712890625, -0.0428314208984375, -0.041316986083984375, -0.03980255126953125, -0.038288116455078125, -0.036773681640625, -0.035259246826171875, -0.03374481201171875, -0.032230377197265625, -0.0307159423828125, -0.029201507568359375, -0.02768707275390625, -0.026172637939453125, -0.024658203125, -0.023143768310546875, -0.02162933349609375, -0.020114898681640625, -0.0186004638671875, -0.017086029052734375, -0.01557159423828125, -0.014057159423828125, -0.012542724609375, -0.011028289794921875, -0.00951385498046875, -0.007999420166015625, -0.0064849853515625, -0.004970550537109375, -0.00345611572265625, -0.001941680908203125, -0.00042724609375, 0.001087188720703125, 0.00260162353515625, 0.004116058349609375, 0.0056304931640625, 0.007144927978515625, 0.00865936279296875, 0.010173797607421875, 0.011688232421875, 0.013202667236328125, 0.01471710205078125, 0.016231536865234375, 0.0177459716796875, 0.019260406494140625, 0.02077484130859375, 0.022289276123046875, 0.0238037109375, 0.025318145751953125, 0.02683258056640625, 0.028347015380859375, 0.0298614501953125, 0.031375885009765625, 0.03289031982421875, 0.034404754638671875, 0.035919189453125, 0.037433624267578125, 0.03894805908203125, 0.040462493896484375, 0.0419769287109375, 0.043491363525390625, 0.04500579833984375, 0.046520233154296875, 0.04803466796875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 12.0, 6.0, 10.0, 14.0, 17.0, 34.0, 31.0, 39.0, 54.0, 61.0, 64.0, 73.0, 108.0, 130.0, 144.0, 204.0, 241.0, 322.0, 435.0, 559.0, 726.0, 912.0, 1354.0, 2166.0, 3512.0, 6447.0, 15198.0, 64513.0, 891092.0, 33690.0, 11208.0, 5248.0, 2912.0, 1923.0, 1214.0, 859.0, 632.0, 525.0, 400.0, 309.0, 246.0, 171.0, 139.0, 119.0, 101.0, 76.0, 59.0, 61.0, 47.0, 30.0, 35.0, 24.0, 20.0, 10.0, 10.0, 8.0, 6.0, 3.0, 2.0, 3.0], "bins": [-0.0628662109375, -0.060921669006347656, -0.05897712707519531, -0.05703258514404297, -0.055088043212890625, -0.05314350128173828, -0.05119895935058594, -0.049254417419433594, -0.04730987548828125, -0.045365333557128906, -0.04342079162597656, -0.04147624969482422, -0.039531707763671875, -0.03758716583251953, -0.03564262390136719, -0.033698081970214844, -0.0317535400390625, -0.029808998107910156, -0.027864456176757812, -0.02591991424560547, -0.023975372314453125, -0.02203083038330078, -0.020086288452148438, -0.018141746520996094, -0.01619720458984375, -0.014252662658691406, -0.012308120727539062, -0.010363578796386719, -0.008419036865234375, -0.006474494934082031, -0.0045299530029296875, -0.0025854110717773438, -0.000640869140625, 0.0013036727905273438, 0.0032482147216796875, 0.005192756652832031, 0.007137298583984375, 0.009081840515136719, 0.011026382446289062, 0.012970924377441406, 0.01491546630859375, 0.016860008239746094, 0.018804550170898438, 0.02074909210205078, 0.022693634033203125, 0.02463817596435547, 0.026582717895507812, 0.028527259826660156, 0.0304718017578125, 0.032416343688964844, 0.03436088562011719, 0.03630542755126953, 0.038249969482421875, 0.04019451141357422, 0.04213905334472656, 0.044083595275878906, 0.04602813720703125, 0.047972679138183594, 0.04991722106933594, 0.05186176300048828, 0.053806304931640625, 0.05575084686279297, 0.05769538879394531, 0.059639930725097656, 0.06158447265625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 8.0, 9.0, 5.0, 11.0, 15.0, 31.0, 43.0, 52.0, 81.0, 90.0, 181.0, 131.0, 105.0, 67.0, 42.0, 35.0, 30.0, 24.0, 14.0, 6.0, 6.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.662441253662109e-06, -5.484558641910553e-06, -5.306676030158997e-06, -5.12879341840744e-06, -4.950910806655884e-06, -4.773028194904327e-06, -4.595145583152771e-06, -4.417262971401215e-06, -4.239380359649658e-06, -4.061497747898102e-06, -3.883615136146545e-06, -3.705732524394989e-06, -3.5278499126434326e-06, -3.3499673008918762e-06, -3.17208468914032e-06, -2.9942020773887634e-06, -2.816319465637207e-06, -2.6384368538856506e-06, -2.4605542421340942e-06, -2.282671630382538e-06, -2.1047890186309814e-06, -1.926906406879425e-06, -1.7490237951278687e-06, -1.5711411833763123e-06, -1.3932585716247559e-06, -1.2153759598731995e-06, -1.037493348121643e-06, -8.596107363700867e-07, -6.817281246185303e-07, -5.038455128669739e-07, -3.259629011154175e-07, -1.4808028936386108e-07, 2.9802322387695312e-08, 2.076849341392517e-07, 3.855675458908081e-07, 5.634501576423645e-07, 7.413327693939209e-07, 9.192153811454773e-07, 1.0970979928970337e-06, 1.27498060464859e-06, 1.4528632164001465e-06, 1.6307458281517029e-06, 1.8086284399032593e-06, 1.9865110516548157e-06, 2.164393663406372e-06, 2.3422762751579285e-06, 2.520158886909485e-06, 2.6980414986610413e-06, 2.8759241104125977e-06, 3.053806722164154e-06, 3.2316893339157104e-06, 3.409571945667267e-06, 3.5874545574188232e-06, 3.7653371691703796e-06, 3.943219780921936e-06, 4.1211023926734924e-06, 4.298985004425049e-06, 4.476867616176605e-06, 4.654750227928162e-06, 4.832632839679718e-06, 5.010515451431274e-06, 5.188398063182831e-06, 5.366280674934387e-06, 5.544163286685944e-06, 5.7220458984375e-06]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 7.0, 7.0, 15.0, 15.0, 25.0, 27.0, 32.0, 35.0, 62.0, 111.0, 162.0, 291.0, 437.0, 780.0, 1457.0, 2844.0, 6515.0, 23201.0, 988412.0, 13589.0, 5112.0, 2486.0, 1206.0, 658.0, 391.0, 195.0, 139.0, 89.0, 61.0, 43.0, 34.0, 22.0, 15.0, 12.0, 9.0, 8.0, 8.0, 8.0, 7.0, 6.0, 5.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1783447265625, -0.17299842834472656, -0.16765213012695312, -0.1623058319091797, -0.15695953369140625, -0.1516132354736328, -0.14626693725585938, -0.14092063903808594, -0.1355743408203125, -0.13022804260253906, -0.12488174438476562, -0.11953544616699219, -0.11418914794921875, -0.10884284973144531, -0.10349655151367188, -0.09815025329589844, -0.092803955078125, -0.08745765686035156, -0.08211135864257812, -0.07676506042480469, -0.07141876220703125, -0.06607246398925781, -0.060726165771484375, -0.05537986755371094, -0.0500335693359375, -0.04468727111816406, -0.039340972900390625, -0.03399467468261719, -0.02864837646484375, -0.023302078247070312, -0.017955780029296875, -0.012609481811523438, -0.00726318359375, -0.0019168853759765625, 0.003429412841796875, 0.008775711059570312, 0.01412200927734375, 0.019468307495117188, 0.024814605712890625, 0.030160903930664062, 0.0355072021484375, 0.04085350036621094, 0.046199798583984375, 0.05154609680175781, 0.05689239501953125, 0.06223869323730469, 0.06758499145507812, 0.07293128967285156, 0.078277587890625, 0.08362388610839844, 0.08897018432617188, 0.09431648254394531, 0.09966278076171875, 0.10500907897949219, 0.11035537719726562, 0.11570167541503906, 0.1210479736328125, 0.12639427185058594, 0.13174057006835938, 0.1370868682861328, 0.14243316650390625, 0.1477794647216797, 0.15312576293945312, 0.15847206115722656, 0.163818359375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 13.0, 31.0, 160.0, 665.0, 44.0, 13.0, 11.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018463134765625, -0.017807483673095703, -0.017151832580566406, -0.01649618148803711, -0.015840530395507812, -0.015184879302978516, -0.014529228210449219, -0.013873577117919922, -0.013217926025390625, -0.012562274932861328, -0.011906623840332031, -0.011250972747802734, -0.010595321655273438, -0.00993967056274414, -0.009284019470214844, -0.008628368377685547, -0.00797271728515625, -0.007317066192626953, -0.006661415100097656, -0.006005764007568359, -0.0053501129150390625, -0.004694461822509766, -0.004038810729980469, -0.003383159637451172, -0.002727508544921875, -0.002071857452392578, -0.0014162063598632812, -0.0007605552673339844, -0.0001049041748046875, 0.0005507469177246094, 0.0012063980102539062, 0.0018620491027832031, 0.0025177001953125, 0.003173351287841797, 0.0038290023803710938, 0.004484653472900391, 0.0051403045654296875, 0.005795955657958984, 0.006451606750488281, 0.007107257843017578, 0.007762908935546875, 0.008418560028076172, 0.009074211120605469, 0.009729862213134766, 0.010385513305664062, 0.01104116439819336, 0.011696815490722656, 0.012352466583251953, 0.01300811767578125, 0.013663768768310547, 0.014319419860839844, 0.01497507095336914, 0.015630722045898438, 0.016286373138427734, 0.01694202423095703, 0.017597675323486328, 0.018253326416015625, 0.018908977508544922, 0.01956462860107422, 0.020220279693603516, 0.020875930786132812, 0.02153158187866211, 0.022187232971191406, 0.022842884063720703, 0.02349853515625]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 6.0, 8.0, 17.0, 9.0, 17.0, 22.0, 40.0, 72.0, 124.0, 207.0, 200.0, 110.0, 46.0, 44.0, 28.0, 12.0, 15.0, 9.0, 4.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2568246126174927, -0.250991553068161, -0.24515849351882935, -0.23932543396949768, -0.2334923893213272, -0.22765932977199554, -0.22182627022266388, -0.21599321067333221, -0.21016015112400055, -0.20432709157466888, -0.19849403202533722, -0.19266098737716675, -0.18682792782783508, -0.18099486827850342, -0.17516180872917175, -0.1693287491798401, -0.16349568963050842, -0.15766263008117676, -0.1518295705318451, -0.14599651098251343, -0.14016346633434296, -0.1343304067850113, -0.12849734723567963, -0.12266428768634796, -0.11683124303817749, -0.11099818348884583, -0.10516513139009476, -0.09933207184076309, -0.09349901229143143, -0.08766596019268036, -0.0818329006433487, -0.07599984109401703, -0.07016677409410477, -0.0643337145447731, -0.058500658720731735, -0.05266760289669037, -0.046834543347358704, -0.04100148752331734, -0.03516843169927597, -0.029335372149944305, -0.02350231632590294, -0.017669258639216423, -0.011836201883852482, -0.006003145128488541, -0.00017008744180202484, 0.005662970244884491, 0.011496026068925858, 0.017329085618257523, 0.02316214144229889, 0.028995199128985405, 0.03482825681567192, 0.04066131263971329, 0.04649437218904495, 0.05232742801308632, 0.058160483837127686, 0.06399354338645935, 0.06982660293579102, 0.07565966248512268, 0.08149271458387375, 0.08732577413320541, 0.09315883368253708, 0.09899188578128815, 0.10482494533061981, 0.11065800487995148, 0.11649105697870255]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 2.0, 10.0, 7.0, 9.0, 12.0, 12.0, 17.0, 1.0, 16.0, 20.0, 22.0, 18.0, 25.0, 25.0, 26.0, 26.0, 39.0, 36.0, 40.0, 33.0, 41.0, 42.0, 44.0, 35.0, 26.0, 39.0, 37.0, 24.0, 42.0, 27.0, 38.0, 28.0, 23.0, 21.0, 19.0, 19.0, 13.0, 18.0, 14.0, 12.0, 10.0, 7.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.054172586649656296, -0.05237709730863571, -0.05058160796761513, -0.04878611862659454, -0.04699062928557396, -0.045195139944553375, -0.04339965432882309, -0.04160416126251221, -0.03980867564678192, -0.03801318630576134, -0.03621769696474075, -0.03442220762372017, -0.032626718282699585, -0.030831228941679, -0.029035741463303566, -0.027240252122282982, -0.02544476091861725, -0.023649271577596664, -0.02185378223657608, -0.020058292895555496, -0.018262803554534912, -0.016467314213514328, -0.014671826735138893, -0.012876337394118309, -0.011080848053097725, -0.00928535871207714, -0.007489869836717844, -0.005694380961358547, -0.003898891620337963, -0.002103402279317379, -0.0003079138696193695, 0.0014875754714012146, 0.0032830610871315002, 0.005078550428152084, 0.006874039303511381, 0.008669528178870678, 0.010465017519891262, 0.012260506860911846, 0.014055995270609856, 0.01585148461163044, 0.017646973952651024, 0.019442463293671608, 0.021237952634692192, 0.023033440113067627, 0.02482892945408821, 0.026624418795108795, 0.02841990813612938, 0.030215397477149963, 0.03201088681817055, 0.03380637615919113, 0.035601865500211716, 0.0373973548412323, 0.039192844182252884, 0.04098833352327347, 0.042783819139003754, 0.044579312205314636, 0.04637479782104492, 0.048170287162065506, 0.04996577650308609, 0.051761265844106674, 0.05355675518512726, 0.05535224452614784, 0.057147733867168427, 0.05894321948289871, 0.060738712549209595]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 12.0, 16.0, 20.0, 23.0, 28.0, 31.0, 38.0, 64.0, 96.0, 262.0, 834.0, 4135.0, 33438.0, 729604.0, 259956.0, 16468.0, 2398.0, 560.0, 200.0, 92.0, 57.0, 42.0, 26.0, 29.0, 22.0, 20.0, 14.0, 8.0, 12.0, 12.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.62548828125, -0.6064453125, -0.58740234375, -0.568359375, -0.54931640625, -0.5302734375, -0.51123046875, -0.4921875, -0.47314453125, -0.4541015625, -0.43505859375, -0.416015625, -0.39697265625, -0.3779296875, -0.35888671875, -0.33984375, -0.32080078125, -0.3017578125, -0.28271484375, -0.263671875, -0.24462890625, -0.2255859375, -0.20654296875, -0.1875, -0.16845703125, -0.1494140625, -0.13037109375, -0.111328125, -0.09228515625, -0.0732421875, -0.05419921875, -0.03515625, -0.01611328125, 0.0029296875, 0.02197265625, 0.041015625, 0.06005859375, 0.0791015625, 0.09814453125, 0.1171875, 0.13623046875, 0.1552734375, 0.17431640625, 0.193359375, 0.21240234375, 0.2314453125, 0.25048828125, 0.26953125, 0.28857421875, 0.3076171875, 0.32666015625, 0.345703125, 0.36474609375, 0.3837890625, 0.40283203125, 0.421875, 0.44091796875, 0.4599609375, 0.47900390625, 0.498046875, 0.51708984375, 0.5361328125, 0.55517578125, 0.57421875, 0.59326171875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 18.0, 19.0, 54.0, 65.0, 96.0, 144.0, 140.0, 133.0, 123.0, 90.0, 54.0, 32.0, 17.0, 9.0, 10.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.125732421875, -0.12330293655395508, -0.12087345123291016, -0.11844396591186523, -0.11601448059082031, -0.11358499526977539, -0.11115550994873047, -0.10872602462768555, -0.10629653930664062, -0.1038670539855957, -0.10143756866455078, -0.09900808334350586, -0.09657859802246094, -0.09414911270141602, -0.0917196273803711, -0.08929014205932617, -0.08686065673828125, -0.08443117141723633, -0.0820016860961914, -0.07957220077514648, -0.07714271545410156, -0.07471323013305664, -0.07228374481201172, -0.0698542594909668, -0.06742477416992188, -0.06499528884887695, -0.06256580352783203, -0.06013631820678711, -0.05770683288574219, -0.055277347564697266, -0.052847862243652344, -0.05041837692260742, -0.0479888916015625, -0.04555940628051758, -0.043129920959472656, -0.040700435638427734, -0.03827095031738281, -0.03584146499633789, -0.03341197967529297, -0.030982494354248047, -0.028553009033203125, -0.026123523712158203, -0.02369403839111328, -0.02126455307006836, -0.018835067749023438, -0.016405582427978516, -0.013976097106933594, -0.011546611785888672, -0.00911712646484375, -0.006687641143798828, -0.004258155822753906, -0.0018286705017089844, 0.0006008148193359375, 0.0030303001403808594, 0.005459785461425781, 0.007889270782470703, 0.010318756103515625, 0.012748241424560547, 0.015177726745605469, 0.01760721206665039, 0.020036697387695312, 0.022466182708740234, 0.024895668029785156, 0.027325153350830078, 0.029754638671875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 11.0, 16.0, 17.0, 32.0, 65.0, 80.0, 149.0, 267.0, 454.0, 892.0, 1637.0, 3037.0, 5569.0, 11184.0, 22746.0, 49343.0, 121904.0, 371582.0, 284702.0, 95747.0, 40306.0, 18968.0, 9422.0, 4729.0, 2545.0, 1394.0, 742.0, 408.0, 234.0, 139.0, 73.0, 56.0, 27.0, 20.0, 8.0, 8.0, 7.0, 10.0, 6.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08990478515625, -0.0867910385131836, -0.08367729187011719, -0.08056354522705078, -0.07744979858398438, -0.07433605194091797, -0.07122230529785156, -0.06810855865478516, -0.06499481201171875, -0.061881065368652344, -0.05876731872558594, -0.05565357208251953, -0.052539825439453125, -0.04942607879638672, -0.04631233215332031, -0.043198585510253906, -0.0400848388671875, -0.036971092224121094, -0.03385734558105469, -0.03074359893798828, -0.027629852294921875, -0.02451610565185547, -0.021402359008789062, -0.018288612365722656, -0.01517486572265625, -0.012061119079589844, -0.008947372436523438, -0.005833625793457031, -0.002719879150390625, 0.00039386749267578125, 0.0035076141357421875, 0.006621360778808594, 0.009735107421875, 0.012848854064941406, 0.015962600708007812, 0.01907634735107422, 0.022190093994140625, 0.02530384063720703, 0.028417587280273438, 0.031531333923339844, 0.03464508056640625, 0.037758827209472656, 0.04087257385253906, 0.04398632049560547, 0.047100067138671875, 0.05021381378173828, 0.05332756042480469, 0.056441307067871094, 0.0595550537109375, 0.0626688003540039, 0.06578254699707031, 0.06889629364013672, 0.07201004028320312, 0.07512378692626953, 0.07823753356933594, 0.08135128021240234, 0.08446502685546875, 0.08757877349853516, 0.09069252014160156, 0.09380626678466797, 0.09692001342773438, 0.10003376007080078, 0.10314750671386719, 0.1062612533569336, 0.109375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 5.0, 9.0, 3.0, 12.0, 8.0, 22.0, 15.0, 19.0, 15.0, 25.0, 33.0, 31.0, 35.0, 34.0, 41.0, 34.0, 40.0, 50.0, 49.0, 40.0, 49.0, 46.0, 40.0, 42.0, 29.0, 39.0, 30.0, 30.0, 20.0, 22.0, 31.0, 22.0, 15.0, 13.0, 8.0, 5.0, 11.0, 5.0, 5.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0247650146484375, -0.02404618263244629, -0.023327350616455078, -0.022608518600463867, -0.021889686584472656, -0.021170854568481445, -0.020452022552490234, -0.019733190536499023, -0.019014358520507812, -0.0182955265045166, -0.01757669448852539, -0.01685786247253418, -0.01613903045654297, -0.015420198440551758, -0.014701366424560547, -0.013982534408569336, -0.013263702392578125, -0.012544870376586914, -0.011826038360595703, -0.011107206344604492, -0.010388374328613281, -0.00966954231262207, -0.00895071029663086, -0.008231878280639648, -0.0075130462646484375, -0.0067942142486572266, -0.006075382232666016, -0.005356550216674805, -0.004637718200683594, -0.003918886184692383, -0.003200054168701172, -0.002481222152709961, -0.00176239013671875, -0.001043558120727539, -0.0003247261047363281, 0.0003941059112548828, 0.0011129379272460938, 0.0018317699432373047, 0.0025506019592285156, 0.0032694339752197266, 0.0039882659912109375, 0.0047070980072021484, 0.005425930023193359, 0.00614476203918457, 0.006863594055175781, 0.007582426071166992, 0.008301258087158203, 0.009020090103149414, 0.009738922119140625, 0.010457754135131836, 0.011176586151123047, 0.011895418167114258, 0.012614250183105469, 0.01333308219909668, 0.01405191421508789, 0.014770746231079102, 0.015489578247070312, 0.016208410263061523, 0.016927242279052734, 0.017646074295043945, 0.018364906311035156, 0.019083738327026367, 0.019802570343017578, 0.02052140235900879, 0.021240234375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 6.0, 7.0, 10.0, 17.0, 26.0, 36.0, 48.0, 61.0, 91.0, 126.0, 226.0, 338.0, 608.0, 1012.0, 1949.0, 4202.0, 11124.0, 49954.0, 880630.0, 74517.0, 13754.0, 4866.0, 2113.0, 1120.0, 620.0, 385.0, 234.0, 140.0, 93.0, 78.0, 43.0, 32.0, 19.0, 16.0, 16.0, 8.0, 12.0, 3.0, 5.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.0192718505859375, -0.018745064735412598, -0.018218278884887695, -0.017691493034362793, -0.01716470718383789, -0.01663792133331299, -0.016111135482788086, -0.015584349632263184, -0.015057563781738281, -0.014530777931213379, -0.014003992080688477, -0.013477206230163574, -0.012950420379638672, -0.01242363452911377, -0.011896848678588867, -0.011370062828063965, -0.010843276977539062, -0.01031649112701416, -0.009789705276489258, -0.009262919425964355, -0.008736133575439453, -0.00820934772491455, -0.0076825618743896484, -0.007155776023864746, -0.006628990173339844, -0.006102204322814941, -0.005575418472290039, -0.005048632621765137, -0.004521846771240234, -0.003995060920715332, -0.0034682750701904297, -0.0029414892196655273, -0.002414703369140625, -0.0018879175186157227, -0.0013611316680908203, -0.000834345817565918, -0.0003075599670410156, 0.00021922588348388672, 0.0007460117340087891, 0.0012727975845336914, 0.0017995834350585938, 0.002326369285583496, 0.0028531551361083984, 0.0033799409866333008, 0.003906726837158203, 0.0044335126876831055, 0.004960298538208008, 0.00548708438873291, 0.0060138702392578125, 0.006540656089782715, 0.007067441940307617, 0.0075942277908325195, 0.008121013641357422, 0.008647799491882324, 0.009174585342407227, 0.009701371192932129, 0.010228157043457031, 0.010754942893981934, 0.011281728744506836, 0.011808514595031738, 0.01233530044555664, 0.012862086296081543, 0.013388872146606445, 0.013915657997131348, 0.01444244384765625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 3.0, 2.0, 7.0, 2.0, 8.0, 7.0, 10.0, 14.0, 12.0, 22.0, 28.0, 68.0, 91.0, 146.0, 138.0, 142.0, 81.0, 70.0, 44.0, 25.0, 20.0, 13.0, 6.0, 13.0, 3.0, 5.0, 9.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2218952178955078e-05, -1.189298927783966e-05, -1.1567026376724243e-05, -1.1241063475608826e-05, -1.0915100574493408e-05, -1.058913767337799e-05, -1.0263174772262573e-05, -9.937211871147156e-06, -9.611248970031738e-06, -9.28528606891632e-06, -8.959323167800903e-06, -8.633360266685486e-06, -8.307397365570068e-06, -7.981434464454651e-06, -7.655471563339233e-06, -7.329508662223816e-06, -7.0035457611083984e-06, -6.677582859992981e-06, -6.3516199588775635e-06, -6.025657057762146e-06, -5.6996941566467285e-06, -5.373731255531311e-06, -5.0477683544158936e-06, -4.721805453300476e-06, -4.395842552185059e-06, -4.069879651069641e-06, -3.7439167499542236e-06, -3.417953848838806e-06, -3.0919909477233887e-06, -2.766028046607971e-06, -2.4400651454925537e-06, -2.1141022443771362e-06, -1.7881393432617188e-06, -1.4621764421463013e-06, -1.1362135410308838e-06, -8.102506399154663e-07, -4.842877388000488e-07, -1.5832483768463135e-07, 1.6763806343078613e-07, 4.936009645462036e-07, 8.195638656616211e-07, 1.1455267667770386e-06, 1.471489667892456e-06, 1.7974525690078735e-06, 2.123415470123291e-06, 2.4493783712387085e-06, 2.775341272354126e-06, 3.1013041734695435e-06, 3.427267074584961e-06, 3.7532299757003784e-06, 4.079192876815796e-06, 4.405155777931213e-06, 4.731118679046631e-06, 5.057081580162048e-06, 5.383044481277466e-06, 5.709007382392883e-06, 6.034970283508301e-06, 6.360933184623718e-06, 6.686896085739136e-06, 7.012858986854553e-06, 7.338821887969971e-06, 7.664784789085388e-06, 7.990747690200806e-06, 8.316710591316223e-06, 8.64267349243164e-06]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 2.0, 3.0, 15.0, 11.0, 31.0, 44.0, 77.0, 126.0, 191.0, 290.0, 496.0, 877.0, 1506.0, 2767.0, 5522.0, 11705.0, 29383.0, 110481.0, 698985.0, 128295.0, 32131.0, 12844.0, 5912.0, 3097.0, 1556.0, 880.0, 532.0, 301.0, 165.0, 116.0, 74.0, 44.0, 27.0, 20.0, 11.0, 14.0, 9.0, 6.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00492095947265625, -0.004769742488861084, -0.004618525505065918, -0.004467308521270752, -0.004316091537475586, -0.00416487455368042, -0.004013657569885254, -0.003862440586090088, -0.003711223602294922, -0.003560006618499756, -0.00340878963470459, -0.003257572650909424, -0.003106355667114258, -0.002955138683319092, -0.0028039216995239258, -0.0026527047157287598, -0.0025014877319335938, -0.0023502707481384277, -0.0021990537643432617, -0.0020478367805480957, -0.0018966197967529297, -0.0017454028129577637, -0.0015941858291625977, -0.0014429688453674316, -0.0012917518615722656, -0.0011405348777770996, -0.0009893178939819336, -0.0008381009101867676, -0.0006868839263916016, -0.0005356669425964355, -0.00038444995880126953, -0.00023323297500610352, -8.20159912109375e-05, 6.920099258422852e-05, 0.00022041797637939453, 0.00037163496017456055, 0.0005228519439697266, 0.0006740689277648926, 0.0008252859115600586, 0.0009765028953552246, 0.0011277198791503906, 0.0012789368629455566, 0.0014301538467407227, 0.0015813708305358887, 0.0017325878143310547, 0.0018838047981262207, 0.0020350217819213867, 0.0021862387657165527, 0.0023374557495117188, 0.0024886727333068848, 0.0026398897171020508, 0.002791106700897217, 0.002942323684692383, 0.003093540668487549, 0.003244757652282715, 0.003395974636077881, 0.003547191619873047, 0.003698408603668213, 0.003849625587463379, 0.004000842571258545, 0.004152059555053711, 0.004303276538848877, 0.004454493522644043, 0.004605710506439209, 0.004756927490234375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 4.0, 1.0, 2.0, 7.0, 8.0, 4.0, 6.0, 7.0, 10.0, 8.0, 17.0, 18.0, 20.0, 20.0, 31.0, 56.0, 99.0, 123.0, 106.0, 115.0, 82.0, 67.0, 41.0, 24.0, 28.0, 18.0, 18.0, 15.0, 11.0, 7.0, 11.0, 4.0, 4.0, 1.0, 5.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011148452758789062, -0.0010794848203659058, -0.0010441243648529053, -0.0010087639093399048, -0.0009734034538269043, -0.0009380429983139038, -0.0009026825428009033, -0.0008673220872879028, -0.0008319616317749023, -0.0007966011762619019, -0.0007612407207489014, -0.0007258802652359009, -0.0006905198097229004, -0.0006551593542098999, -0.0006197988986968994, -0.0005844384431838989, -0.0005490779876708984, -0.000513717532157898, -0.00047835707664489746, -0.00044299662113189697, -0.0004076361656188965, -0.000372275710105896, -0.0003369152545928955, -0.000301554799079895, -0.00026619434356689453, -0.00023083388805389404, -0.00019547343254089355, -0.00016011297702789307, -0.00012475252151489258, -8.939206600189209e-05, -5.40316104888916e-05, -1.8671154975891113e-05, 1.6689300537109375e-05, 5.204975605010986e-05, 8.741021156311035e-05, 0.00012277066707611084, 0.00015813112258911133, 0.00019349157810211182, 0.0002288520336151123, 0.0002642124891281128, 0.0002995729446411133, 0.00033493340015411377, 0.00037029385566711426, 0.00040565431118011475, 0.00044101476669311523, 0.0004763752222061157, 0.0005117356777191162, 0.0005470961332321167, 0.0005824565887451172, 0.0006178170442581177, 0.0006531774997711182, 0.0006885379552841187, 0.0007238984107971191, 0.0007592588663101196, 0.0007946193218231201, 0.0008299797773361206, 0.0008653402328491211, 0.0009007006883621216, 0.0009360611438751221, 0.0009714215993881226, 0.001006782054901123, 0.0010421425104141235, 0.001077502965927124, 0.0011128634214401245, 0.001148223876953125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 11.0, 11.0, 20.0, 19.0, 34.0, 61.0, 96.0, 158.0, 212.0, 151.0, 82.0, 38.0, 37.0, 15.0, 23.0, 10.0, 5.0, 3.0, 6.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03994635492563248, -0.03764902055263519, -0.03535168245434761, -0.03305434808135033, -0.030757011845707893, -0.02845967561006546, -0.026162341237068176, -0.023865005001425743, -0.02156766876578331, -0.019270332530140877, -0.016972996294498444, -0.01467566192150116, -0.012378325685858727, -0.010080989450216293, -0.007783654145896435, -0.005486318841576576, -0.003188982605934143, -0.0008916468359529972, 0.0014056889340281487, 0.0037030247040092945, 0.00600036047399044, 0.008297696709632874, 0.010595032013952732, 0.01289236731827259, 0.015189703553915024, 0.017487039789557457, 0.01978437602519989, 0.022081710398197174, 0.024379046633839607, 0.02667638286948204, 0.028973717242479324, 0.03127105534076691, 0.033568382263183594, 0.03586571663618088, 0.03816305473446846, 0.040460389107465744, 0.042757727205753326, 0.04505506157875061, 0.047352395951747894, 0.04964973032474518, 0.05194706842303276, 0.054244402796030045, 0.05654174089431763, 0.05883907526731491, 0.061136409640312195, 0.06343375146389008, 0.06573108583688736, 0.06802842020988464, 0.07032575458288193, 0.07262308895587921, 0.0749204233288765, 0.07721776515245438, 0.07951509952545166, 0.08181243389844894, 0.08410976827144623, 0.08640710264444351, 0.0887044370174408, 0.09100177139043808, 0.09329910576343536, 0.09559644758701324, 0.09789378196001053, 0.10019111633300781, 0.1024884507060051, 0.10478578507900238, 0.10708312690258026]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 3.0, 2.0, 4.0, 6.0, 4.0, 6.0, 11.0, 11.0, 13.0, 14.0, 12.0, 30.0, 27.0, 28.0, 30.0, 32.0, 34.0, 47.0, 42.0, 41.0, 56.0, 44.0, 42.0, 40.0, 56.0, 39.0, 48.0, 32.0, 28.0, 40.0, 24.0, 18.0, 24.0, 16.0, 19.0, 14.0, 13.0, 7.0, 8.0, 9.0, 8.0, 9.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024606158956885338, -0.023748796433210373, -0.022891435772180557, -0.022034073248505592, -0.021176710724830627, -0.020319350063800812, -0.019461987540125847, -0.018604625016450882, -0.017747264355421066, -0.0168899018317461, -0.016032541170716286, -0.01517517864704132, -0.014317816123366356, -0.013460454531013966, -0.012603092938661575, -0.01174573041498661, -0.010888367891311646, -0.010031006298959255, -0.00917364377528429, -0.0083162821829319, -0.007458920124918222, -0.006601558066904545, -0.0057441964745521545, -0.004886834416538477, -0.004029472358524799, -0.0031721103005111217, -0.002314748475328088, -0.0014573866501450539, -0.0006000245921313763, 0.00025733746588230133, 0.0011146990582346916, 0.0019720611162483692, 0.0028294213116168976, 0.003686783369630575, 0.004544145427644253, 0.005401507019996643, 0.006258869078010321, 0.007116231136023998, 0.007973592728376389, 0.008830955252051353, 0.009688316844403744, 0.010545678436756134, 0.011403040960431099, 0.01226040255278349, 0.01311776414513588, 0.013975126668810844, 0.014832488261163235, 0.015689849853515625, 0.01654721237719059, 0.017404574900865555, 0.01826193556189537, 0.019119298085570335, 0.0199766606092453, 0.020834021270275116, 0.02169138379395008, 0.022548746317625046, 0.02340610697865486, 0.024263469502329826, 0.025120830163359642, 0.025978192687034607, 0.026835555210709572, 0.027692917734384537, 0.028550278395414352, 0.029407640919089317, 0.030265003442764282]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 6.0, 18.0, 19.0, 46.0, 210.0, 445.0, 1423.0, 13414.0, 4173506.0, 4033.0, 796.0, 211.0, 85.0, 39.0, 19.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07562255859375, -0.06949710845947266, -0.06337165832519531, -0.05724620819091797, -0.051120758056640625, -0.04499530792236328, -0.03886985778808594, -0.032744407653808594, -0.02661895751953125, -0.020493507385253906, -0.014368057250976562, -0.008242607116699219, -0.002117156982421875, 0.004008293151855469, 0.010133743286132812, 0.016259193420410156, 0.0223846435546875, 0.028510093688964844, 0.03463554382324219, 0.04076099395751953, 0.046886444091796875, 0.05301189422607422, 0.05913734436035156, 0.0652627944946289, 0.07138824462890625, 0.0775136947631836, 0.08363914489746094, 0.08976459503173828, 0.09589004516601562, 0.10201549530029297, 0.10814094543457031, 0.11426639556884766, 0.120391845703125, 0.12651729583740234, 0.1326427459716797, 0.13876819610595703, 0.14489364624023438, 0.15101909637451172, 0.15714454650878906, 0.1632699966430664, 0.16939544677734375, 0.1755208969116211, 0.18164634704589844, 0.18777179718017578, 0.19389724731445312, 0.20002269744873047, 0.2061481475830078, 0.21227359771728516, 0.2183990478515625, 0.22452449798583984, 0.2306499481201172, 0.23677539825439453, 0.24290084838867188, 0.24902629852294922, 0.25515174865722656, 0.2612771987915039, 0.26740264892578125, 0.2735280990600586, 0.27965354919433594, 0.2857789993286133, 0.2919044494628906, 0.29802989959716797, 0.3041553497314453, 0.31028079986572266, 0.31640625]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 7.0, 10.0, 12.0, 28.0, 49.0, 82.0, 126.0, 145.0, 158.0, 123.0, 117.0, 66.0, 44.0, 31.0, 12.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0303497314453125, -0.027678251266479492, -0.025006771087646484, -0.022335290908813477, -0.01966381072998047, -0.01699233055114746, -0.014320850372314453, -0.011649370193481445, -0.008977890014648438, -0.00630640983581543, -0.003634929656982422, -0.0009634494781494141, 0.0017080307006835938, 0.0043795108795166016, 0.007050991058349609, 0.009722471237182617, 0.012393951416015625, 0.015065431594848633, 0.01773691177368164, 0.02040839195251465, 0.023079872131347656, 0.025751352310180664, 0.028422832489013672, 0.03109431266784668, 0.03376579284667969, 0.036437273025512695, 0.0391087532043457, 0.04178023338317871, 0.04445171356201172, 0.04712319374084473, 0.049794673919677734, 0.05246615409851074, 0.05513763427734375, 0.05780911445617676, 0.060480594635009766, 0.06315207481384277, 0.06582355499267578, 0.06849503517150879, 0.0711665153503418, 0.0738379955291748, 0.07650947570800781, 0.07918095588684082, 0.08185243606567383, 0.08452391624450684, 0.08719539642333984, 0.08986687660217285, 0.09253835678100586, 0.09520983695983887, 0.09788131713867188, 0.10055279731750488, 0.10322427749633789, 0.1058957576751709, 0.1085672378540039, 0.11123871803283691, 0.11391019821166992, 0.11658167839050293, 0.11925315856933594, 0.12192463874816895, 0.12459611892700195, 0.12726759910583496, 0.12993907928466797, 0.13261055946350098, 0.13528203964233398, 0.137953519821167, 0.140625]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 17.0, 33.0, 49.0, 129.0, 246.0, 569.0, 1743.0, 9334.0, 4122285.0, 54156.0, 4019.0, 1034.0, 345.0, 174.0, 75.0, 30.0, 15.0, 12.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1656494140625, -0.16008377075195312, -0.15451812744140625, -0.14895248413085938, -0.1433868408203125, -0.13782119750976562, -0.13225555419921875, -0.12668991088867188, -0.121124267578125, -0.11555862426757812, -0.10999298095703125, -0.10442733764648438, -0.0988616943359375, -0.09329605102539062, -0.08773040771484375, -0.08216476440429688, -0.07659912109375, -0.07103347778320312, -0.06546783447265625, -0.059902191162109375, -0.0543365478515625, -0.048770904541015625, -0.04320526123046875, -0.037639617919921875, -0.032073974609375, -0.026508331298828125, -0.02094268798828125, -0.015377044677734375, -0.0098114013671875, -0.004245758056640625, 0.00131988525390625, 0.006885528564453125, 0.012451171875, 0.018016815185546875, 0.02358245849609375, 0.029148101806640625, 0.0347137451171875, 0.040279388427734375, 0.04584503173828125, 0.051410675048828125, 0.056976318359375, 0.06254196166992188, 0.06810760498046875, 0.07367324829101562, 0.0792388916015625, 0.08480453491210938, 0.09037017822265625, 0.09593582153320312, 0.10150146484375, 0.10706710815429688, 0.11263275146484375, 0.11819839477539062, 0.1237640380859375, 0.12932968139648438, 0.13489532470703125, 0.14046096801757812, 0.146026611328125, 0.15159225463867188, 0.15715789794921875, 0.16272354125976562, 0.1682891845703125, 0.17385482788085938, 0.17942047119140625, 0.18498611450195312, 0.1905517578125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 7.0, 20.0, 27.0, 54.0, 234.0, 3306.0, 284.0, 72.0, 27.0, 16.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0176544189453125, -0.017128944396972656, -0.016603469848632812, -0.01607799530029297, -0.015552520751953125, -0.015027046203613281, -0.014501571655273438, -0.013976097106933594, -0.01345062255859375, -0.012925148010253906, -0.012399673461914062, -0.011874198913574219, -0.011348724365234375, -0.010823249816894531, -0.010297775268554688, -0.009772300720214844, -0.009246826171875, -0.008721351623535156, -0.008195877075195312, -0.007670402526855469, -0.007144927978515625, -0.006619453430175781, -0.0060939788818359375, -0.005568504333496094, -0.00504302978515625, -0.004517555236816406, -0.0039920806884765625, -0.0034666061401367188, -0.002941131591796875, -0.0024156570434570312, -0.0018901824951171875, -0.0013647079467773438, -0.0008392333984375, -0.00031375885009765625, 0.0002117156982421875, 0.0007371902465820312, 0.001262664794921875, 0.0017881393432617188, 0.0023136138916015625, 0.0028390884399414062, 0.00336456298828125, 0.0038900375366210938, 0.0044155120849609375, 0.004940986633300781, 0.005466461181640625, 0.005991935729980469, 0.0065174102783203125, 0.007042884826660156, 0.007568359375, 0.008093833923339844, 0.008619308471679688, 0.009144783020019531, 0.009670257568359375, 0.010195732116699219, 0.010721206665039062, 0.011246681213378906, 0.01177215576171875, 0.012297630310058594, 0.012823104858398438, 0.013348579406738281, 0.013874053955078125, 0.014399528503417969, 0.014925003051757812, 0.015450477600097656, 0.0159759521484375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 8.0, 5.0, 10.0, 14.0, 14.0, 16.0, 20.0, 27.0, 40.0, 44.0, 68.0, 91.0, 127.0, 125.0, 110.0, 70.0, 42.0, 39.0, 23.0, 25.0, 8.0, 10.0, 15.0, 11.0, 8.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.033240869641304016, -0.032137662172317505, -0.031034456565976143, -0.02993125095963478, -0.02882804349064827, -0.027724837884306908, -0.026621632277965546, -0.025518424808979034, -0.024415219202637672, -0.02331201359629631, -0.0222088061273098, -0.021105600520968437, -0.020002394914627075, -0.018899187445640564, -0.017795981839299202, -0.01669277623295784, -0.015589568763971329, -0.014486362226307392, -0.013383155688643456, -0.012279950082302094, -0.011176743544638157, -0.01007353700697422, -0.008970331400632858, -0.007867124862968922, -0.006763918325304985, -0.005660711787641048, -0.004557505715638399, -0.003454299410805106, -0.002351093105971813, -0.0012478865683078766, -0.00014468049630522728, 0.000958525575697422, 0.0020617321133613586, 0.0031649384181946516, 0.0042681447230279446, 0.005371350795030594, 0.0064745573326945305, 0.007577763870358467, 0.008680969476699829, 0.009784176014363766, 0.010887382552027702, 0.011990589089691639, 0.013093795627355576, 0.014197001233696938, 0.015300207771360874, 0.01640341430902481, 0.017506619915366173, 0.018609825521707535, 0.019713032990694046, 0.020816238597035408, 0.02191944606602192, 0.02302265167236328, 0.024125859141349792, 0.025229064747691154, 0.026332270354032516, 0.027435477823019028, 0.02853868342936039, 0.02964188903570175, 0.030745096504688263, 0.031848303973674774, 0.03295150771737099, 0.0340547151863575, 0.03515792265534401, 0.03626112639904022, 0.03736433386802673]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 0.0, 3.0, 7.0, 2.0, 5.0, 3.0, 5.0, 6.0, 2.0, 14.0, 5.0, 14.0, 13.0, 26.0, 30.0, 32.0, 25.0, 23.0, 31.0, 48.0, 41.0, 50.0, 44.0, 59.0, 32.0, 53.0, 50.0, 46.0, 34.0, 36.0, 37.0, 37.0, 24.0, 25.0, 24.0, 15.0, 20.0, 15.0, 18.0, 14.0, 7.0, 13.0, 7.0, 5.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02007206901907921, -0.01937422901391983, -0.018676387146115303, -0.017978547140955925, -0.017280705273151398, -0.01658286526799202, -0.01588502526283264, -0.015187183395028114, -0.014489342458546162, -0.013791501522064209, -0.013093660585582256, -0.012395819649100304, -0.011697979643940926, -0.011000137776136398, -0.01030229777097702, -0.009604456834495068, -0.008906615898013115, -0.008208774961531162, -0.00751093402504921, -0.006813093554228544, -0.006115252617746592, -0.005417411681264639, -0.0047195712104439735, -0.004021730273962021, -0.003323889337480068, -0.0026260484009981155, -0.0019282076973468065, -0.0012303669936954975, -0.0005325260572135448, 0.00016531487926840782, 0.0008631553500890732, 0.0015609962865710258, 0.0022588353604078293, 0.002956676296889782, 0.003654517000541091, 0.0043523577041924, 0.005050198640674353, 0.005748039577156305, 0.006445880047976971, 0.007143720984458923, 0.007841561920940876, 0.008539402857422829, 0.009237243793904781, 0.009935084730386734, 0.010632924735546112, 0.01133076660335064, 0.012028606608510017, 0.01272644754499197, 0.013424288481473923, 0.014122129417955875, 0.014819970354437828, 0.015517810359597206, 0.016215652227401733, 0.01691349223256111, 0.01761133223772049, 0.018309174105525017, 0.019007015973329544, 0.019704855978488922, 0.02040269784629345, 0.021100537851452827, 0.021798379719257355, 0.022496219724416733, 0.02319405972957611, 0.023891901597380638, 0.024589741602540016]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 6.0, 12.0, 8.0, 13.0, 15.0, 24.0, 47.0, 67.0, 86.0, 129.0, 157.0, 261.0, 331.0, 482.0, 718.0, 990.0, 1493.0, 2119.0, 3026.0, 4545.0, 6835.0, 10404.0, 16152.0, 26181.0, 43906.0, 79192.0, 152192.0, 275236.0, 190107.0, 95994.0, 52779.0, 30449.0, 18574.0, 11820.0, 7827.0, 5259.0, 3492.0, 2343.0, 1672.0, 1086.0, 748.0, 505.0, 341.0, 279.0, 182.0, 133.0, 104.0, 74.0, 48.0, 42.0, 19.0, 20.0, 14.0, 6.0, 7.0, 2.0, 6.0, 2.0], "bins": [-0.05145263671875, -0.04992389678955078, -0.04839515686035156, -0.046866416931152344, -0.045337677001953125, -0.043808937072753906, -0.04228019714355469, -0.04075145721435547, -0.03922271728515625, -0.03769397735595703, -0.03616523742675781, -0.034636497497558594, -0.033107757568359375, -0.031579017639160156, -0.030050277709960938, -0.02852153778076172, -0.0269927978515625, -0.02546405792236328, -0.023935317993164062, -0.022406578063964844, -0.020877838134765625, -0.019349098205566406, -0.017820358276367188, -0.01629161834716797, -0.01476287841796875, -0.013234138488769531, -0.011705398559570312, -0.010176658630371094, -0.008647918701171875, -0.007119178771972656, -0.0055904388427734375, -0.004061698913574219, -0.002532958984375, -0.0010042190551757812, 0.0005245208740234375, 0.0020532608032226562, 0.003582000732421875, 0.005110740661621094, 0.0066394805908203125, 0.008168220520019531, 0.00969696044921875, 0.011225700378417969, 0.012754440307617188, 0.014283180236816406, 0.015811920166015625, 0.017340660095214844, 0.018869400024414062, 0.02039813995361328, 0.0219268798828125, 0.02345561981201172, 0.024984359741210938, 0.026513099670410156, 0.028041839599609375, 0.029570579528808594, 0.031099319458007812, 0.03262805938720703, 0.03415679931640625, 0.03568553924560547, 0.03721427917480469, 0.038743019104003906, 0.040271759033203125, 0.041800498962402344, 0.04332923889160156, 0.04485797882080078, 0.04638671875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 5.0, 4.0, 6.0, 6.0, 11.0, 6.0, 5.0, 12.0, 17.0, 14.0, 16.0, 26.0, 36.0, 28.0, 29.0, 38.0, 43.0, 52.0, 52.0, 59.0, 49.0, 47.0, 50.0, 36.0, 36.0, 49.0, 50.0, 23.0, 28.0, 21.0, 25.0, 27.0, 12.0, 15.0, 15.0, 13.0, 14.0, 6.0, 9.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0160980224609375, -0.015557050704956055, -0.01501607894897461, -0.014475107192993164, -0.013934135437011719, -0.013393163681030273, -0.012852191925048828, -0.012311220169067383, -0.011770248413085938, -0.011229276657104492, -0.010688304901123047, -0.010147333145141602, -0.009606361389160156, -0.009065389633178711, -0.008524417877197266, -0.00798344612121582, -0.007442474365234375, -0.00690150260925293, -0.006360530853271484, -0.005819559097290039, -0.005278587341308594, -0.0047376155853271484, -0.004196643829345703, -0.003655672073364258, -0.0031147003173828125, -0.002573728561401367, -0.002032756805419922, -0.0014917850494384766, -0.0009508132934570312, -0.00040984153747558594, 0.00013113021850585938, 0.0006721019744873047, 0.00121307373046875, 0.0017540454864501953, 0.0022950172424316406, 0.002835988998413086, 0.0033769607543945312, 0.0039179325103759766, 0.004458904266357422, 0.004999876022338867, 0.0055408477783203125, 0.006081819534301758, 0.006622791290283203, 0.0071637630462646484, 0.007704734802246094, 0.008245706558227539, 0.008786678314208984, 0.00932765007019043, 0.009868621826171875, 0.01040959358215332, 0.010950565338134766, 0.011491537094116211, 0.012032508850097656, 0.012573480606079102, 0.013114452362060547, 0.013655424118041992, 0.014196395874023438, 0.014737367630004883, 0.015278339385986328, 0.015819311141967773, 0.01636028289794922, 0.016901254653930664, 0.01744222640991211, 0.017983198165893555, 0.018524169921875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 9.0, 9.0, 6.0, 16.0, 18.0, 34.0, 37.0, 37.0, 82.0, 88.0, 97.0, 118.0, 204.0, 259.0, 439.0, 569.0, 788.0, 1163.0, 1819.0, 2867.0, 4775.0, 8102.0, 14908.0, 30231.0, 74574.0, 635550.0, 172195.0, 48870.0, 22153.0, 11290.0, 6274.0, 3818.0, 2236.0, 1480.0, 1003.0, 638.0, 480.0, 360.0, 259.0, 156.0, 139.0, 108.0, 78.0, 50.0, 39.0, 35.0, 21.0, 30.0, 21.0, 11.0, 9.0, 7.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.071044921875, -0.06848812103271484, -0.06593132019042969, -0.06337451934814453, -0.060817718505859375, -0.05826091766357422, -0.05570411682128906, -0.053147315979003906, -0.05059051513671875, -0.048033714294433594, -0.04547691345214844, -0.04292011260986328, -0.040363311767578125, -0.03780651092529297, -0.03524971008300781, -0.032692909240722656, -0.0301361083984375, -0.027579307556152344, -0.025022506713867188, -0.02246570587158203, -0.019908905029296875, -0.01735210418701172, -0.014795303344726562, -0.012238502502441406, -0.00968170166015625, -0.007124900817871094, -0.0045680999755859375, -0.0020112991333007812, 0.000545501708984375, 0.0031023025512695312, 0.0056591033935546875, 0.008215904235839844, 0.010772705078125, 0.013329505920410156, 0.015886306762695312, 0.01844310760498047, 0.020999908447265625, 0.02355670928955078, 0.026113510131835938, 0.028670310974121094, 0.03122711181640625, 0.033783912658691406, 0.03634071350097656, 0.03889751434326172, 0.041454315185546875, 0.04401111602783203, 0.04656791687011719, 0.049124717712402344, 0.0516815185546875, 0.054238319396972656, 0.05679512023925781, 0.05935192108154297, 0.061908721923828125, 0.06446552276611328, 0.06702232360839844, 0.0695791244506836, 0.07213592529296875, 0.0746927261352539, 0.07724952697753906, 0.07980632781982422, 0.08236312866210938, 0.08491992950439453, 0.08747673034667969, 0.09003353118896484, 0.09259033203125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 8.0, 10.0, 7.0, 10.0, 14.0, 11.0, 18.0, 13.0, 19.0, 21.0, 18.0, 23.0, 22.0, 29.0, 34.0, 30.0, 40.0, 31.0, 39.0, 49.0, 36.0, 41.0, 39.0, 39.0, 37.0, 40.0, 42.0, 26.0, 28.0, 30.0, 25.0, 26.0, 24.0, 13.0, 17.0, 16.0, 12.0, 7.0, 9.0, 17.0, 7.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 5.0, 0.0, 3.0], "bins": [-0.01068878173828125, -0.010386109352111816, -0.010083436965942383, -0.00978076457977295, -0.009478092193603516, -0.009175419807434082, -0.008872747421264648, -0.008570075035095215, -0.008267402648925781, -0.007964730262756348, -0.007662057876586914, -0.0073593854904174805, -0.007056713104248047, -0.006754040718078613, -0.00645136833190918, -0.006148695945739746, -0.0058460235595703125, -0.005543351173400879, -0.005240678787231445, -0.004938006401062012, -0.004635334014892578, -0.0043326616287231445, -0.004029989242553711, -0.0037273168563842773, -0.0034246444702148438, -0.00312197208404541, -0.0028192996978759766, -0.002516627311706543, -0.0022139549255371094, -0.0019112825393676758, -0.0016086101531982422, -0.0013059377670288086, -0.001003265380859375, -0.0007005929946899414, -0.0003979206085205078, -9.524822235107422e-05, 0.00020742416381835938, 0.000510096549987793, 0.0008127689361572266, 0.0011154413223266602, 0.0014181137084960938, 0.0017207860946655273, 0.002023458480834961, 0.0023261308670043945, 0.002628803253173828, 0.0029314756393432617, 0.0032341480255126953, 0.003536820411682129, 0.0038394927978515625, 0.004142165184020996, 0.00444483757019043, 0.004747509956359863, 0.005050182342529297, 0.0053528547286987305, 0.005655527114868164, 0.005958199501037598, 0.006260871887207031, 0.006563544273376465, 0.0068662166595458984, 0.007168889045715332, 0.007471561431884766, 0.007774233818054199, 0.008076906204223633, 0.008379578590393066, 0.0086822509765625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 8.0, 10.0, 10.0, 6.0, 18.0, 23.0, 29.0, 39.0, 39.0, 46.0, 79.0, 98.0, 139.0, 209.0, 267.0, 399.0, 552.0, 861.0, 1478.0, 2680.0, 9113.0, 1001123.0, 22611.0, 3751.0, 1719.0, 1036.0, 649.0, 444.0, 257.0, 237.0, 177.0, 111.0, 85.0, 45.0, 41.0, 51.0, 30.0, 22.0, 21.0, 13.0, 8.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.03466796875, -0.033573150634765625, -0.03247833251953125, -0.031383514404296875, -0.0302886962890625, -0.029193878173828125, -0.02809906005859375, -0.027004241943359375, -0.025909423828125, -0.024814605712890625, -0.02371978759765625, -0.022624969482421875, -0.0215301513671875, -0.020435333251953125, -0.01934051513671875, -0.018245697021484375, -0.01715087890625, -0.016056060791015625, -0.01496124267578125, -0.013866424560546875, -0.0127716064453125, -0.011676788330078125, -0.01058197021484375, -0.009487152099609375, -0.008392333984375, -0.007297515869140625, -0.00620269775390625, -0.005107879638671875, -0.0040130615234375, -0.002918243408203125, -0.00182342529296875, -0.000728607177734375, 0.0003662109375, 0.001461029052734375, 0.00255584716796875, 0.003650665283203125, 0.0047454833984375, 0.005840301513671875, 0.00693511962890625, 0.008029937744140625, 0.009124755859375, 0.010219573974609375, 0.01131439208984375, 0.012409210205078125, 0.0135040283203125, 0.014598846435546875, 0.01569366455078125, 0.016788482666015625, 0.01788330078125, 0.018978118896484375, 0.02007293701171875, 0.021167755126953125, 0.0222625732421875, 0.023357391357421875, 0.02445220947265625, 0.025547027587890625, 0.026641845703125, 0.027736663818359375, 0.02883148193359375, 0.029926300048828125, 0.0310211181640625, 0.032115936279296875, 0.03321075439453125, 0.034305572509765625, 0.035400390625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 10.0, 10.0, 6.0, 2.0, 4.0, 11.0, 6.0, 24.0, 11.0, 7.0, 16.0, 14.0, 44.0, 36.0, 42.0, 47.0, 63.0, 102.0, 69.0, 38.0, 54.0, 40.0, 45.0, 73.0, 27.0, 14.0, 22.0, 17.0, 36.0, 12.0, 13.0, 16.0, 7.0, 16.0, 9.0, 8.0, 5.0, 6.0, 3.0, 6.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9669532775878906e-06, -1.8961727619171143e-06, -1.8253922462463379e-06, -1.7546117305755615e-06, -1.6838312149047852e-06, -1.6130506992340088e-06, -1.5422701835632324e-06, -1.471489667892456e-06, -1.4007091522216797e-06, -1.3299286365509033e-06, -1.259148120880127e-06, -1.1883676052093506e-06, -1.1175870895385742e-06, -1.0468065738677979e-06, -9.760260581970215e-07, -9.052455425262451e-07, -8.344650268554688e-07, -7.636845111846924e-07, -6.92903995513916e-07, -6.221234798431396e-07, -5.513429641723633e-07, -4.805624485015869e-07, -4.0978193283081055e-07, -3.390014171600342e-07, -2.682209014892578e-07, -1.9744038581848145e-07, -1.2665987014770508e-07, -5.587935447692871e-08, 1.4901161193847656e-08, 8.568167686462402e-08, 1.564621925354004e-07, 2.2724270820617676e-07, 2.980232238769531e-07, 3.688037395477295e-07, 4.3958425521850586e-07, 5.103647708892822e-07, 5.811452865600586e-07, 6.51925802230835e-07, 7.227063179016113e-07, 7.934868335723877e-07, 8.642673492431641e-07, 9.350478649139404e-07, 1.0058283805847168e-06, 1.0766088962554932e-06, 1.1473894119262695e-06, 1.218169927597046e-06, 1.2889504432678223e-06, 1.3597309589385986e-06, 1.430511474609375e-06, 1.5012919902801514e-06, 1.5720725059509277e-06, 1.642853021621704e-06, 1.7136335372924805e-06, 1.7844140529632568e-06, 1.8551945686340332e-06, 1.9259750843048096e-06, 1.996755599975586e-06, 2.0675361156463623e-06, 2.1383166313171387e-06, 2.209097146987915e-06, 2.2798776626586914e-06, 2.3506581783294678e-06, 2.421438694000244e-06, 2.4922192096710205e-06, 2.562999725341797e-06]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 33.0, 69.0, 244.0, 731.0, 2537.0, 12446.0, 1013587.0, 14833.0, 2933.0, 755.0, 255.0, 72.0, 29.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0367431640625, -0.03545570373535156, -0.034168243408203125, -0.03288078308105469, -0.03159332275390625, -0.030305862426757812, -0.029018402099609375, -0.027730941772460938, -0.0264434814453125, -0.025156021118164062, -0.023868560791015625, -0.022581100463867188, -0.02129364013671875, -0.020006179809570312, -0.018718719482421875, -0.017431259155273438, -0.016143798828125, -0.014856338500976562, -0.013568878173828125, -0.012281417846679688, -0.01099395751953125, -0.009706497192382812, -0.008419036865234375, -0.0071315765380859375, -0.0058441162109375, -0.0045566558837890625, -0.003269195556640625, -0.0019817352294921875, -0.00069427490234375, 0.0005931854248046875, 0.001880645751953125, 0.0031681060791015625, 0.00445556640625, 0.0057430267333984375, 0.007030487060546875, 0.008317947387695312, 0.00960540771484375, 0.010892868041992188, 0.012180328369140625, 0.013467788696289062, 0.0147552490234375, 0.016042709350585938, 0.017330169677734375, 0.018617630004882812, 0.01990509033203125, 0.021192550659179688, 0.022480010986328125, 0.023767471313476562, 0.025054931640625, 0.026342391967773438, 0.027629852294921875, 0.028917312622070312, 0.03020477294921875, 0.03149223327636719, 0.032779693603515625, 0.03406715393066406, 0.0353546142578125, 0.03664207458496094, 0.037929534912109375, 0.03921699523925781, 0.04050445556640625, 0.04179191589355469, 0.043079376220703125, 0.04436683654785156, 0.045654296875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 26.0, 155.0, 675.0, 94.0, 17.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030727386474609375, -0.002986043691635132, -0.002899348735809326, -0.0028126537799835205, -0.002725958824157715, -0.002639263868331909, -0.0025525689125061035, -0.002465873956680298, -0.002379179000854492, -0.0022924840450286865, -0.002205789089202881, -0.002119094133377075, -0.0020323991775512695, -0.0019457042217254639, -0.0018590092658996582, -0.0017723143100738525, -0.0016856193542480469, -0.0015989243984222412, -0.0015122294425964355, -0.0014255344867706299, -0.0013388395309448242, -0.0012521445751190186, -0.0011654496192932129, -0.0010787546634674072, -0.0009920597076416016, -0.0009053647518157959, -0.0008186697959899902, -0.0007319748401641846, -0.0006452798843383789, -0.0005585849285125732, -0.0004718899726867676, -0.0003851950168609619, -0.00029850006103515625, -0.00021180510520935059, -0.00012511014938354492, -3.841519355773926e-05, 4.8279762268066406e-05, 0.00013497471809387207, 0.00022166967391967773, 0.0003083646297454834, 0.00039505958557128906, 0.0004817545413970947, 0.0005684494972229004, 0.0006551444530487061, 0.0007418394088745117, 0.0008285343647003174, 0.000915229320526123, 0.0010019242763519287, 0.0010886192321777344, 0.00117531418800354, 0.0012620091438293457, 0.0013487040996551514, 0.001435399055480957, 0.0015220940113067627, 0.0016087889671325684, 0.001695483922958374, 0.0017821788787841797, 0.0018688738346099854, 0.001955568790435791, 0.0020422637462615967, 0.0021289587020874023, 0.002215653657913208, 0.0023023486137390137, 0.0023890435695648193, 0.002475738525390625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 5.0, 8.0, 12.0, 9.0, 11.0, 16.0, 31.0, 27.0, 56.0, 88.0, 107.0, 159.0, 134.0, 83.0, 74.0, 32.0, 30.0, 35.0, 16.0, 14.0, 13.0, 6.0, 9.0, 6.0, 7.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01926487311720848, -0.018420526757836342, -0.017576180398464203, -0.016731834039092064, -0.015887487679719925, -0.015043141320347786, -0.014198794960975647, -0.013354448601603508, -0.012510102242231369, -0.01166575588285923, -0.010821409523487091, -0.009977063164114952, -0.009132716804742813, -0.008288370445370674, -0.007444023620337248, -0.006599677260965109, -0.005755330435931683, -0.004910984076559544, -0.004066637717187405, -0.003222291124984622, -0.002377944765612483, -0.0015335981734097004, -0.0006892518140375614, 0.00015509454533457756, 0.0009994409047067165, 0.0018437872640788555, 0.0026881336234509945, 0.003532480215653777, 0.00437682680785656, 0.005221173167228699, 0.006065519526600838, 0.006909865885972977, 0.007754212245345116, 0.008598558604717255, 0.009442904964089394, 0.010287251323461533, 0.011131597682833672, 0.01197594404220581, 0.01282029040157795, 0.013664636760950089, 0.014508983120322227, 0.015353329479694366, 0.016197675839066505, 0.017042022198438644, 0.017886368557810783, 0.018730714917182922, 0.01957506127655506, 0.0204194076359272, 0.02126375585794449, 0.022108102217316628, 0.022952448576688766, 0.023796794936060905, 0.024641141295433044, 0.025485487654805183, 0.026329834014177322, 0.02717418037354946, 0.0280185267329216, 0.02886287309229374, 0.02970721945166588, 0.030551565811038017, 0.031395912170410156, 0.032240260392427444, 0.033084604889154434, 0.03392895311117172, 0.03477329760789871]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 2.0, 3.0, 2.0, 7.0, 2.0, 9.0, 6.0, 6.0, 16.0, 15.0, 17.0, 27.0, 29.0, 29.0, 28.0, 31.0, 41.0, 41.0, 44.0, 46.0, 48.0, 56.0, 40.0, 37.0, 43.0, 40.0, 43.0, 45.0, 38.0, 25.0, 21.0, 18.0, 22.0, 20.0, 18.0, 26.0, 13.0, 8.0, 12.0, 6.0, 6.0, 9.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012227381579577923, -0.01179453730583191, -0.01136169396340847, -0.010928849689662457, -0.010496006347239017, -0.010063162073493004, -0.009630318731069565, -0.009197474457323551, -0.008764630183577538, -0.008331785909831524, -0.007898942567408085, -0.007466098293662071, -0.007033254485577345, -0.0066004106774926186, -0.006167566869407892, -0.005734723061323166, -0.0053018792532384396, -0.004869035445153713, -0.004436191637068987, -0.0040033478289842606, -0.003570503555238247, -0.0031376597471535206, -0.0027048159390687943, -0.0022719718981534243, -0.001839128090068698, -0.0014062841655686498, -0.0009734402992762625, -0.0005405964329838753, -0.00010775250848382711, 0.00032509141601622105, 0.0007579352241009474, 0.0011907792650163174, 0.0016236230731010437, 0.00205646688118577, 0.00248931092210114, 0.0029221547301858664, 0.0033549987711012363, 0.0037878425791859627, 0.004220686387270689, 0.004653530195355415, 0.005086374469101429, 0.005519218277186155, 0.005952062085270882, 0.006384906359016895, 0.006817750167101622, 0.007250593975186348, 0.007683437783271074, 0.0081162815913558, 0.008549125865101814, 0.008981970138847828, 0.009414813481271267, 0.00984765775501728, 0.01028050109744072, 0.010713345371186733, 0.011146189644932747, 0.011579032987356186, 0.012011876329779625, 0.012444720603525639, 0.012877563945949078, 0.013310408219695091, 0.01374325156211853, 0.014176095835864544, 0.014608940109610558, 0.015041783452033997, 0.01547462772578001]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 2.0, 7.0, 9.0, 13.0, 19.0, 37.0, 54.0, 92.0, 135.0, 242.0, 413.0, 688.0, 1190.0, 2388.0, 4769.0, 10253.0, 22505.0, 55724.0, 168923.0, 474122.0, 196810.0, 62878.0, 25340.0, 10967.0, 5313.0, 2535.0, 1329.0, 721.0, 421.0, 254.0, 143.0, 83.0, 57.0, 41.0, 22.0, 13.0, 12.0, 8.0, 8.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.046630859375, -0.045241355895996094, -0.04385185241699219, -0.04246234893798828, -0.041072845458984375, -0.03968334197998047, -0.03829383850097656, -0.036904335021972656, -0.03551483154296875, -0.034125328063964844, -0.03273582458496094, -0.03134632110595703, -0.029956817626953125, -0.02856731414794922, -0.027177810668945312, -0.025788307189941406, -0.0243988037109375, -0.023009300231933594, -0.021619796752929688, -0.02023029327392578, -0.018840789794921875, -0.01745128631591797, -0.016061782836914062, -0.014672279357910156, -0.01328277587890625, -0.011893272399902344, -0.010503768920898438, -0.009114265441894531, -0.007724761962890625, -0.006335258483886719, -0.0049457550048828125, -0.0035562515258789062, -0.002166748046875, -0.0007772445678710938, 0.0006122589111328125, 0.0020017623901367188, 0.003391265869140625, 0.004780769348144531, 0.0061702728271484375, 0.007559776306152344, 0.00894927978515625, 0.010338783264160156, 0.011728286743164062, 0.013117790222167969, 0.014507293701171875, 0.01589679718017578, 0.017286300659179688, 0.018675804138183594, 0.0200653076171875, 0.021454811096191406, 0.022844314575195312, 0.02423381805419922, 0.025623321533203125, 0.02701282501220703, 0.028402328491210938, 0.029791831970214844, 0.03118133544921875, 0.032570838928222656, 0.03396034240722656, 0.03534984588623047, 0.036739349365234375, 0.03812885284423828, 0.03951835632324219, 0.040907859802246094, 0.04229736328125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 7.0, 1.0, 7.0, 3.0, 7.0, 12.0, 10.0, 10.0, 23.0, 17.0, 23.0, 34.0, 33.0, 41.0, 42.0, 51.0, 55.0, 59.0, 53.0, 46.0, 50.0, 46.0, 60.0, 49.0, 38.0, 38.0, 23.0, 30.0, 24.0, 27.0, 30.0, 11.0, 12.0, 8.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00882720947265625, -0.008536100387573242, -0.008244991302490234, -0.007953882217407227, -0.007662773132324219, -0.007371664047241211, -0.007080554962158203, -0.006789445877075195, -0.0064983367919921875, -0.00620722770690918, -0.005916118621826172, -0.005625009536743164, -0.005333900451660156, -0.0050427913665771484, -0.004751682281494141, -0.004460573196411133, -0.004169464111328125, -0.003878355026245117, -0.0035872459411621094, -0.0032961368560791016, -0.0030050277709960938, -0.002713918685913086, -0.002422809600830078, -0.0021317005157470703, -0.0018405914306640625, -0.0015494823455810547, -0.0012583732604980469, -0.0009672641754150391, -0.0006761550903320312, -0.00038504600524902344, -9.393692016601562e-05, 0.0001971721649169922, 0.00048828125, 0.0007793903350830078, 0.0010704994201660156, 0.0013616085052490234, 0.0016527175903320312, 0.001943826675415039, 0.002234935760498047, 0.0025260448455810547, 0.0028171539306640625, 0.0031082630157470703, 0.003399372100830078, 0.003690481185913086, 0.003981590270996094, 0.0042726993560791016, 0.004563808441162109, 0.004854917526245117, 0.005146026611328125, 0.005437135696411133, 0.005728244781494141, 0.0060193538665771484, 0.006310462951660156, 0.006601572036743164, 0.006892681121826172, 0.00718379020690918, 0.0074748992919921875, 0.007766008377075195, 0.008057117462158203, 0.008348226547241211, 0.008639335632324219, 0.008930444717407227, 0.009221553802490234, 0.009512662887573242, 0.00980377197265625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 6.0, 4.0, 1.0, 4.0, 6.0, 8.0, 9.0, 7.0, 14.0, 15.0, 16.0, 12.0, 26.0, 16.0, 45.0, 85.0, 174.0, 367.0, 874.0, 2518.0, 7202.0, 20659.0, 63262.0, 258419.0, 512907.0, 125977.0, 36437.0, 12426.0, 4308.0, 1581.0, 580.0, 251.0, 89.0, 57.0, 38.0, 28.0, 33.0, 16.0, 20.0, 12.0, 16.0, 7.0, 12.0, 5.0, 5.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.03643798828125, -0.03514862060546875, -0.0338592529296875, -0.03256988525390625, -0.031280517578125, -0.02999114990234375, -0.0287017822265625, -0.02741241455078125, -0.026123046875, -0.02483367919921875, -0.0235443115234375, -0.02225494384765625, -0.020965576171875, -0.01967620849609375, -0.0183868408203125, -0.01709747314453125, -0.01580810546875, -0.01451873779296875, -0.0132293701171875, -0.01194000244140625, -0.010650634765625, -0.00936126708984375, -0.0080718994140625, -0.00678253173828125, -0.0054931640625, -0.00420379638671875, -0.0029144287109375, -0.00162506103515625, -0.000335693359375, 0.00095367431640625, 0.0022430419921875, 0.00353240966796875, 0.00482177734375, 0.00611114501953125, 0.0074005126953125, 0.00868988037109375, 0.009979248046875, 0.01126861572265625, 0.0125579833984375, 0.01384735107421875, 0.01513671875, 0.01642608642578125, 0.0177154541015625, 0.01900482177734375, 0.020294189453125, 0.02158355712890625, 0.0228729248046875, 0.02416229248046875, 0.02545166015625, 0.02674102783203125, 0.0280303955078125, 0.02931976318359375, 0.030609130859375, 0.03189849853515625, 0.0331878662109375, 0.03447723388671875, 0.0357666015625, 0.03705596923828125, 0.0383453369140625, 0.03963470458984375, 0.040924072265625, 0.04221343994140625, 0.0435028076171875, 0.04479217529296875, 0.04608154296875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 5.0, 10.0, 10.0, 10.0, 11.0, 17.0, 20.0, 24.0, 17.0, 28.0, 36.0, 25.0, 36.0, 30.0, 40.0, 35.0, 36.0, 58.0, 38.0, 43.0, 40.0, 31.0, 38.0, 45.0, 39.0, 34.0, 24.0, 29.0, 31.0, 22.0, 21.0, 18.0, 12.0, 15.0, 13.0, 13.0, 12.0, 6.0, 9.0, 6.0, 3.0, 5.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.007122039794921875, -0.006923973560333252, -0.006725907325744629, -0.006527841091156006, -0.006329774856567383, -0.00613170862197876, -0.005933642387390137, -0.005735576152801514, -0.005537509918212891, -0.005339443683624268, -0.0051413774490356445, -0.0049433112144470215, -0.0047452449798583984, -0.004547178745269775, -0.004349112510681152, -0.004151046276092529, -0.003952980041503906, -0.003754913806915283, -0.00355684757232666, -0.003358781337738037, -0.003160715103149414, -0.002962648868560791, -0.002764582633972168, -0.002566516399383545, -0.002368450164794922, -0.002170383930206299, -0.0019723176956176758, -0.0017742514610290527, -0.0015761852264404297, -0.0013781189918518066, -0.0011800527572631836, -0.0009819865226745605, -0.0007839202880859375, -0.0005858540534973145, -0.0003877878189086914, -0.00018972158432006836, 8.344650268554688e-06, 0.00020641088485717773, 0.0004044771194458008, 0.0006025433540344238, 0.0008006095886230469, 0.00099867582321167, 0.001196742057800293, 0.001394808292388916, 0.001592874526977539, 0.0017909407615661621, 0.001989006996154785, 0.002187073230743408, 0.0023851394653320312, 0.0025832056999206543, 0.0027812719345092773, 0.0029793381690979004, 0.0031774044036865234, 0.0033754706382751465, 0.0035735368728637695, 0.0037716031074523926, 0.003969669342041016, 0.004167735576629639, 0.004365801811218262, 0.004563868045806885, 0.004761934280395508, 0.004960000514984131, 0.005158066749572754, 0.005356132984161377, 0.00555419921875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 11.0, 8.0, 10.0, 19.0, 18.0, 24.0, 41.0, 54.0, 78.0, 111.0, 185.0, 225.0, 358.0, 543.0, 861.0, 1548.0, 2776.0, 5625.0, 14876.0, 61745.0, 826661.0, 99346.0, 19020.0, 6682.0, 3213.0, 1709.0, 1004.0, 593.0, 380.0, 246.0, 158.0, 125.0, 75.0, 62.0, 40.0, 37.0, 16.0, 17.0, 13.0, 10.0, 12.0, 2.0, 4.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0032939910888671875, -0.003189772367477417, -0.0030855536460876465, -0.002981334924697876, -0.0028771162033081055, -0.002772897481918335, -0.0026686787605285645, -0.002564460039138794, -0.0024602413177490234, -0.002356022596359253, -0.0022518038749694824, -0.002147585153579712, -0.0020433664321899414, -0.001939147710800171, -0.0018349289894104004, -0.0017307102680206299, -0.0016264915466308594, -0.0015222728252410889, -0.0014180541038513184, -0.0013138353824615479, -0.0012096166610717773, -0.0011053979396820068, -0.0010011792182922363, -0.0008969604969024658, -0.0007927417755126953, -0.0006885230541229248, -0.0005843043327331543, -0.0004800856113433838, -0.0003758668899536133, -0.0002716481685638428, -0.00016742944717407227, -6.321072578430176e-05, 4.100799560546875e-05, 0.00014522671699523926, 0.00024944543838500977, 0.0003536641597747803, 0.0004578828811645508, 0.0005621016025543213, 0.0006663203239440918, 0.0007705390453338623, 0.0008747577667236328, 0.0009789764881134033, 0.0010831952095031738, 0.0011874139308929443, 0.0012916326522827148, 0.0013958513736724854, 0.0015000700950622559, 0.0016042888164520264, 0.0017085075378417969, 0.0018127262592315674, 0.0019169449806213379, 0.0020211637020111084, 0.002125382423400879, 0.0022296011447906494, 0.00233381986618042, 0.0024380385875701904, 0.002542257308959961, 0.0026464760303497314, 0.002750694751739502, 0.0028549134731292725, 0.002959132194519043, 0.0030633509159088135, 0.003167569637298584, 0.0032717883586883545, 0.003376007080078125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 3.0, 6.0, 6.0, 8.0, 16.0, 14.0, 20.0, 26.0, 32.0, 36.0, 41.0, 60.0, 121.0, 173.0, 108.0, 85.0, 56.0, 37.0, 31.0, 23.0, 29.0, 12.0, 15.0, 6.0, 6.0, 2.0, 4.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2993812561035156e-05, -1.2627802789211273e-05, -1.226179301738739e-05, -1.1895783245563507e-05, -1.1529773473739624e-05, -1.1163763701915741e-05, -1.0797753930091858e-05, -1.0431744158267975e-05, -1.0065734386444092e-05, -9.699724614620209e-06, -9.333714842796326e-06, -8.967705070972443e-06, -8.60169529914856e-06, -8.235685527324677e-06, -7.869675755500793e-06, -7.50366598367691e-06, -7.137656211853027e-06, -6.771646440029144e-06, -6.405636668205261e-06, -6.039626896381378e-06, -5.673617124557495e-06, -5.307607352733612e-06, -4.941597580909729e-06, -4.575587809085846e-06, -4.209578037261963e-06, -3.84356826543808e-06, -3.4775584936141968e-06, -3.1115487217903137e-06, -2.7455389499664307e-06, -2.3795291781425476e-06, -2.0135194063186646e-06, -1.6475096344947815e-06, -1.2814998626708984e-06, -9.154900908470154e-07, -5.494803190231323e-07, -1.8347054719924927e-07, 1.825392246246338e-07, 5.485489964485168e-07, 9.145587682723999e-07, 1.280568540096283e-06, 1.646578311920166e-06, 2.012588083744049e-06, 2.378597855567932e-06, 2.744607627391815e-06, 3.1106173992156982e-06, 3.4766271710395813e-06, 3.842636942863464e-06, 4.208646714687347e-06, 4.5746564865112305e-06, 4.9406662583351135e-06, 5.306676030158997e-06, 5.67268580198288e-06, 6.038695573806763e-06, 6.404705345630646e-06, 6.770715117454529e-06, 7.136724889278412e-06, 7.502734661102295e-06, 7.868744432926178e-06, 8.234754204750061e-06, 8.600763976573944e-06, 8.966773748397827e-06, 9.33278352022171e-06, 9.698793292045593e-06, 1.0064803063869476e-05, 1.043081283569336e-05]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 4.0, 10.0, 16.0, 22.0, 45.0, 88.0, 177.0, 372.0, 831.0, 2147.0, 6693.0, 29278.0, 519067.0, 451509.0, 28145.0, 6570.0, 2049.0, 815.0, 354.0, 165.0, 75.0, 50.0, 30.0, 11.0, 8.0, 8.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0028667449951171875, -0.002779841423034668, -0.0026929378509521484, -0.002606034278869629, -0.0025191307067871094, -0.00243222713470459, -0.0023453235626220703, -0.0022584199905395508, -0.0021715164184570312, -0.0020846128463745117, -0.001997709274291992, -0.0019108057022094727, -0.0018239021301269531, -0.0017369985580444336, -0.001650094985961914, -0.0015631914138793945, -0.001476287841796875, -0.0013893842697143555, -0.001302480697631836, -0.0012155771255493164, -0.0011286735534667969, -0.0010417699813842773, -0.0009548664093017578, -0.0008679628372192383, -0.0007810592651367188, -0.0006941556930541992, -0.0006072521209716797, -0.0005203485488891602, -0.0004334449768066406, -0.0003465414047241211, -0.00025963783264160156, -0.00017273426055908203, -8.58306884765625e-05, 1.0728836059570312e-06, 8.797645568847656e-05, 0.0001748800277709961, 0.0002617835998535156, 0.00034868717193603516, 0.0004355907440185547, 0.0005224943161010742, 0.0006093978881835938, 0.0006963014602661133, 0.0007832050323486328, 0.0008701086044311523, 0.0009570121765136719, 0.0010439157485961914, 0.001130819320678711, 0.0012177228927612305, 0.00130462646484375, 0.0013915300369262695, 0.001478433609008789, 0.0015653371810913086, 0.0016522407531738281, 0.0017391443252563477, 0.0018260478973388672, 0.0019129514694213867, 0.0019998550415039062, 0.0020867586135864258, 0.0021736621856689453, 0.002260565757751465, 0.0023474693298339844, 0.002434372901916504, 0.0025212764739990234, 0.002608180046081543, 0.0026950836181640625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 7.0, 2.0, 7.0, 10.0, 6.0, 12.0, 20.0, 26.0, 39.0, 49.0, 72.0, 116.0, 135.0, 137.0, 99.0, 64.0, 64.0, 25.0, 25.0, 16.0, 17.0, 15.0, 8.0, 10.0, 4.0, 2.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041484832763671875, -0.0004014261066913605, -0.0003880038857460022, -0.0003745816648006439, -0.00036115944385528564, -0.00034773722290992737, -0.0003343150019645691, -0.0003208927810192108, -0.00030747056007385254, -0.00029404833912849426, -0.000280626118183136, -0.0002672038972377777, -0.00025378167629241943, -0.00024035945534706116, -0.00022693723440170288, -0.0002135150134563446, -0.00020009279251098633, -0.00018667057156562805, -0.00017324835062026978, -0.0001598261296749115, -0.00014640390872955322, -0.00013298168778419495, -0.00011955946683883667, -0.0001061372458934784, -9.271502494812012e-05, -7.929280400276184e-05, -6.587058305740356e-05, -5.244836211204529e-05, -3.902614116668701e-05, -2.5603920221328735e-05, -1.2181699275970459e-05, 1.2405216693878174e-06, 1.4662742614746094e-05, 2.808496356010437e-05, 4.1507184505462646e-05, 5.492940545082092e-05, 6.83516263961792e-05, 8.177384734153748e-05, 9.519606828689575e-05, 0.00010861828923225403, 0.0001220405101776123, 0.00013546273112297058, 0.00014888495206832886, 0.00016230717301368713, 0.0001757293939590454, 0.0001891516149044037, 0.00020257383584976196, 0.00021599605679512024, 0.00022941827774047852, 0.0002428404986858368, 0.00025626271963119507, 0.00026968494057655334, 0.0002831071615219116, 0.0002965293824672699, 0.0003099516034126282, 0.00032337382435798645, 0.0003367960453033447, 0.000350218266248703, 0.0003636404871940613, 0.00037706270813941956, 0.00039048492908477783, 0.0004039071500301361, 0.0004173293709754944, 0.00043075159192085266, 0.00044417381286621094]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 16.0, 11.0, 18.0, 28.0, 33.0, 72.0, 97.0, 146.0, 175.0, 128.0, 88.0, 49.0, 34.0, 29.0, 22.0, 15.0, 8.0, 11.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01949743926525116, -0.018876587972044945, -0.01825573667883873, -0.017634885385632515, -0.0170140340924263, -0.016393182799220085, -0.01577233150601387, -0.015151480212807655, -0.01453062891960144, -0.013909777626395226, -0.01328892633318901, -0.012668075039982796, -0.01204722374677658, -0.011426372453570366, -0.010805521160364151, -0.010184669867157936, -0.009563818573951721, -0.008942967280745506, -0.008322115987539291, -0.0077012646943330765, -0.007080413401126862, -0.006459562107920647, -0.005838710814714432, -0.005217859521508217, -0.004597008228302002, -0.003976156935095787, -0.003355305641889572, -0.0027344543486833572, -0.0021136030554771423, -0.0014927517622709274, -0.0008719004690647125, -0.0002510491758584976, 0.0003698021173477173, 0.0009906534105539322, 0.001611504703760147, 0.002232355996966362, 0.002853207290172577, 0.003474058583378792, 0.004094909876585007, 0.004715761169791222, 0.0053366124629974365, 0.005957463756203651, 0.006578315049409866, 0.007199166342616081, 0.007820017635822296, 0.008440868929028511, 0.009061720222234726, 0.00968257151544094, 0.010303422808647156, 0.01092427410185337, 0.011545125395059586, 0.0121659766882658, 0.012786827981472015, 0.01340767927467823, 0.014028530567884445, 0.01464938186109066, 0.015270233154296875, 0.01589108444750309, 0.016511935740709305, 0.01713278703391552, 0.017753638327121735, 0.01837448962032795, 0.018995340913534164, 0.01961619220674038, 0.020237043499946594]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 4.0, 7.0, 8.0, 8.0, 12.0, 14.0, 19.0, 18.0, 23.0, 29.0, 20.0, 23.0, 29.0, 34.0, 35.0, 44.0, 28.0, 37.0, 36.0, 37.0, 41.0, 45.0, 57.0, 36.0, 43.0, 40.0, 41.0, 30.0, 31.0, 23.0, 24.0, 24.0, 17.0, 11.0, 16.0, 13.0, 5.0, 9.0, 5.0, 13.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.007777445483952761, -0.007515905424952507, -0.007254365365952253, -0.006992825306952, -0.006731285247951746, -0.006469745188951492, -0.006208205595612526, -0.005946665070950985, -0.005685125477612019, -0.005423585418611765, -0.005162045359611511, -0.0049005053006112576, -0.004638965241611004, -0.00437742518261075, -0.0041158851236104965, -0.0038543452974408865, -0.003592805005609989, -0.0033312649466097355, -0.003069724887609482, -0.002808184828609228, -0.0025466447696089745, -0.0022851047106087208, -0.0020235648844391108, -0.001762024825438857, -0.0015004847664386034, -0.0012389447074383497, -0.000977404648438096, -0.0007158647058531642, -0.0004543246468529105, -0.00019278458785265684, 6.875535473227501e-05, 0.0003302954137325287, 0.0005918359383940697, 0.0008533759973943233, 0.001114916056394577, 0.0013764559989795089, 0.0016379960579797626, 0.0018995361169800162, 0.002161076059564948, 0.0024226161185652018, 0.0026841561775654554, 0.002945696236565709, 0.003207236295565963, 0.003468776121735573, 0.0037303161807358265, 0.00399185623973608, 0.004253396298736334, 0.0045149363577365875, 0.004776476416736841, 0.005038016475737095, 0.0052995565347373486, 0.005561096593737602, 0.005822636652737856, 0.00608417671173811, 0.006345716305077076, 0.006607256829738617, 0.006868796423077583, 0.007130336482077837, 0.007391876541078091, 0.007653416600078344, 0.007914956659078598, 0.008176496252417564, 0.008438036777079105, 0.008699576370418072, 0.008961116895079613]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 8.0, 12.0, 18.0, 23.0, 31.0, 48.0, 87.0, 139.0, 250.0, 471.0, 914.0, 2430.0, 11235.0, 2708881.0, 1454357.0, 10672.0, 2491.0, 1027.0, 516.0, 263.0, 157.0, 90.0, 64.0, 27.0, 19.0, 19.0, 10.0, 4.0, 7.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033477783203125, -0.03249311447143555, -0.031508445739746094, -0.03052377700805664, -0.029539108276367188, -0.028554439544677734, -0.02756977081298828, -0.026585102081298828, -0.025600433349609375, -0.024615764617919922, -0.02363109588623047, -0.022646427154541016, -0.021661758422851562, -0.02067708969116211, -0.019692420959472656, -0.018707752227783203, -0.01772308349609375, -0.016738414764404297, -0.015753746032714844, -0.01476907730102539, -0.013784408569335938, -0.012799739837646484, -0.011815071105957031, -0.010830402374267578, -0.009845733642578125, -0.008861064910888672, -0.007876396179199219, -0.006891727447509766, -0.0059070587158203125, -0.004922389984130859, -0.003937721252441406, -0.002953052520751953, -0.0019683837890625, -0.0009837150573730469, 9.5367431640625e-07, 0.0009856224060058594, 0.0019702911376953125, 0.0029549598693847656, 0.003939628601074219, 0.004924297332763672, 0.005908966064453125, 0.006893634796142578, 0.007878303527832031, 0.008862972259521484, 0.009847640991210938, 0.01083230972290039, 0.011816978454589844, 0.012801647186279297, 0.01378631591796875, 0.014770984649658203, 0.015755653381347656, 0.01674032211303711, 0.017724990844726562, 0.018709659576416016, 0.01969432830810547, 0.020678997039794922, 0.021663665771484375, 0.022648334503173828, 0.02363300323486328, 0.024617671966552734, 0.025602340698242188, 0.02658700942993164, 0.027571678161621094, 0.028556346893310547, 0.029541015625]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 6.0, 4.0, 16.0, 18.0, 23.0, 33.0, 52.0, 38.0, 66.0, 61.0, 68.0, 69.0, 75.0, 81.0, 77.0, 67.0, 59.0, 51.0, 34.0, 21.0, 25.0, 17.0, 10.0, 8.0, 10.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0164031982421875, -0.01591181755065918, -0.01542043685913086, -0.014929056167602539, -0.014437675476074219, -0.013946294784545898, -0.013454914093017578, -0.012963533401489258, -0.012472152709960938, -0.011980772018432617, -0.011489391326904297, -0.010998010635375977, -0.010506629943847656, -0.010015249252319336, -0.009523868560791016, -0.009032487869262695, -0.008541107177734375, -0.008049726486206055, -0.007558345794677734, -0.007066965103149414, -0.006575584411621094, -0.0060842037200927734, -0.005592823028564453, -0.005101442337036133, -0.0046100616455078125, -0.004118680953979492, -0.003627300262451172, -0.0031359195709228516, -0.0026445388793945312, -0.002153158187866211, -0.0016617774963378906, -0.0011703968048095703, -0.00067901611328125, -0.0001876354217529297, 0.0003037452697753906, 0.0007951259613037109, 0.0012865066528320312, 0.0017778873443603516, 0.002269268035888672, 0.002760648727416992, 0.0032520294189453125, 0.003743410110473633, 0.004234790802001953, 0.0047261714935302734, 0.005217552185058594, 0.005708932876586914, 0.006200313568115234, 0.006691694259643555, 0.007183074951171875, 0.007674455642700195, 0.008165836334228516, 0.008657217025756836, 0.009148597717285156, 0.009639978408813477, 0.010131359100341797, 0.010622739791870117, 0.011114120483398438, 0.011605501174926758, 0.012096881866455078, 0.012588262557983398, 0.013079643249511719, 0.013571023941040039, 0.01406240463256836, 0.01455378532409668, 0.015045166015625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 9.0, 4.0, 16.0, 40.0, 137.0, 694.0, 4630.0, 4164528.0, 22205.0, 1562.0, 344.0, 79.0, 16.0, 5.0, 4.0, 2.0, 0.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1304931640625, -0.12578773498535156, -0.12108230590820312, -0.11637687683105469, -0.11167144775390625, -0.10696601867675781, -0.10226058959960938, -0.09755516052246094, -0.0928497314453125, -0.08814430236816406, -0.08343887329101562, -0.07873344421386719, -0.07402801513671875, -0.06932258605957031, -0.06461715698242188, -0.05991172790527344, -0.055206298828125, -0.05050086975097656, -0.045795440673828125, -0.04109001159667969, -0.03638458251953125, -0.03167915344238281, -0.026973724365234375, -0.022268295288085938, -0.0175628662109375, -0.012857437133789062, -0.008152008056640625, -0.0034465789794921875, 0.00125885009765625, 0.0059642791748046875, 0.010669708251953125, 0.015375137329101562, 0.02008056640625, 0.024785995483398438, 0.029491424560546875, 0.03419685363769531, 0.03890228271484375, 0.04360771179199219, 0.048313140869140625, 0.05301856994628906, 0.0577239990234375, 0.06242942810058594, 0.06713485717773438, 0.07184028625488281, 0.07654571533203125, 0.08125114440917969, 0.08595657348632812, 0.09066200256347656, 0.095367431640625, 0.10007286071777344, 0.10477828979492188, 0.10948371887207031, 0.11418914794921875, 0.11889457702636719, 0.12360000610351562, 0.12830543518066406, 0.1330108642578125, 0.13771629333496094, 0.14242172241210938, 0.1471271514892578, 0.15183258056640625, 0.1565380096435547, 0.16124343872070312, 0.16594886779785156, 0.170654296875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 5.0, 9.0, 23.0, 80.0, 236.0, 2804.0, 711.0, 115.0, 41.0, 16.0, 9.0, 4.0, 2.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00899505615234375, -0.008729696273803711, -0.008464336395263672, -0.008198976516723633, -0.007933616638183594, -0.007668256759643555, -0.007402896881103516, -0.0071375370025634766, -0.0068721771240234375, -0.0066068172454833984, -0.006341457366943359, -0.00607609748840332, -0.005810737609863281, -0.005545377731323242, -0.005280017852783203, -0.005014657974243164, -0.004749298095703125, -0.004483938217163086, -0.004218578338623047, -0.003953218460083008, -0.0036878585815429688, -0.0034224987030029297, -0.0031571388244628906, -0.0028917789459228516, -0.0026264190673828125, -0.0023610591888427734, -0.0020956993103027344, -0.0018303394317626953, -0.0015649795532226562, -0.0012996196746826172, -0.0010342597961425781, -0.0007688999176025391, -0.0005035400390625, -0.00023818016052246094, 2.7179718017578125e-05, 0.0002925395965576172, 0.0005578994750976562, 0.0008232593536376953, 0.0010886192321777344, 0.0013539791107177734, 0.0016193389892578125, 0.0018846988677978516, 0.0021500587463378906, 0.0024154186248779297, 0.0026807785034179688, 0.002946138381958008, 0.003211498260498047, 0.003476858139038086, 0.003742218017578125, 0.004007577896118164, 0.004272937774658203, 0.004538297653198242, 0.004803657531738281, 0.00506901741027832, 0.005334377288818359, 0.0055997371673583984, 0.0058650970458984375, 0.0061304569244384766, 0.006395816802978516, 0.006661176681518555, 0.006926536560058594, 0.007191896438598633, 0.007457256317138672, 0.007722616195678711, 0.00798797607421875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 8.0, 8.0, 8.0, 10.0, 18.0, 20.0, 22.0, 38.0, 44.0, 79.0, 105.0, 125.0, 137.0, 92.0, 66.0, 44.0, 40.0, 35.0, 21.0, 20.0, 8.0, 10.0, 7.0, 11.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011617259122431278, -0.011213523335754871, -0.010809787549078465, -0.010406051762402058, -0.010002315044403076, -0.00959857925772667, -0.009194843471050262, -0.008791107684373856, -0.008387371897697449, -0.007983636111021042, -0.007579900324344635, -0.007176164072006941, -0.006772428285330534, -0.006368692498654127, -0.005964956246316433, -0.005561220459640026, -0.005157484672963619, -0.004753748886287212, -0.0043500130996108055, -0.003946276847273111, -0.0035425410605967045, -0.0031388052739202976, -0.002735069254413247, -0.0023313332349061966, -0.0019275974482297897, -0.001523861545138061, -0.0011201256420463324, -0.0007163897389546037, -0.000312653835862875, 9.108195081353188e-05, 0.0004948179703205824, 0.0008985539898276329, 0.0013022907078266144, 0.001706026610918343, 0.0021097625140100718, 0.0025134985335171223, 0.002917234320193529, 0.003320970106869936, 0.0037247061263769865, 0.004128442145884037, 0.004532177932560444, 0.004935913719236851, 0.005339649505913258, 0.005743385758250952, 0.006147121544927359, 0.0065508573316037655, 0.00695459358394146, 0.0073583293706178665, 0.007762065157294273, 0.00816580094397068, 0.008569536730647087, 0.008973272517323494, 0.0093770083039999, 0.009780744090676308, 0.01018448080867529, 0.010588216595351696, 0.010991952382028103, 0.01139568816870451, 0.011799423955380917, 0.012203159742057323, 0.012606896460056305, 0.013010632246732712, 0.013414368033409119, 0.013818103820085526, 0.014221839606761932]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 7.0, 8.0, 8.0, 8.0, 9.0, 19.0, 11.0, 16.0, 16.0, 18.0, 27.0, 33.0, 23.0, 31.0, 48.0, 40.0, 33.0, 42.0, 32.0, 47.0, 49.0, 35.0, 36.0, 43.0, 49.0, 40.0, 39.0, 25.0, 33.0, 25.0, 27.0, 23.0, 16.0, 16.0, 17.0, 6.0, 9.0, 9.0, 6.0, 7.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.008160150609910488, -0.007916451431810856, -0.007672752719372511, -0.007429054006934166, -0.007185354828834534, -0.006941656116396189, -0.006697957403957844, -0.0064542582258582115, -0.0062105595134198666, -0.005966860800981522, -0.005723161622881889, -0.005479462910443544, -0.005235764198005199, -0.004992065019905567, -0.004748366307467222, -0.004504667595028877, -0.004260968416929245, -0.0040172697044909, -0.0037735705263912678, -0.003529871813952923, -0.003286172868683934, -0.0030424739234149456, -0.0027987752109766006, -0.002555076265707612, -0.0023113773204386234, -0.002067678375169635, -0.001823979546315968, -0.0015802807174623013, -0.0013365817721933126, -0.001092882826924324, -0.0008491839980706573, -0.0006054851692169905, -0.00036178575828671455, -0.00011808687122538686, 0.00012561201583594084, 0.00036931090289726853, 0.0006130097899585962, 0.0008567087352275848, 0.0011004075640812516, 0.0013441063929349184, 0.001587805338203907, 0.0018315042834728956, 0.0020752032287418842, 0.002318901941180229, 0.002562600886449218, 0.0028062998317182064, 0.0030499985441565514, 0.00329369748942554, 0.0035373964346945286, 0.003781095379963517, 0.004024794325232506, 0.004268493037670851, 0.004512191750109196, 0.004755890928208828, 0.004999589640647173, 0.005243288353085518, 0.00548698753118515, 0.005730686243623495, 0.005974385421723127, 0.006218084134161472, 0.006461783312261105, 0.0067054820246994495, 0.0069491807371377945, 0.007192879915237427, 0.007436578627675772]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 10.0, 16.0, 22.0, 22.0, 33.0, 72.0, 92.0, 129.0, 215.0, 341.0, 558.0, 842.0, 1410.0, 2513.0, 4359.0, 8180.0, 16624.0, 35018.0, 80731.0, 218377.0, 407166.0, 154745.0, 60886.0, 27370.0, 13129.0, 6719.0, 3708.0, 2074.0, 1205.0, 740.0, 457.0, 268.0, 162.0, 128.0, 82.0, 42.0, 34.0, 17.0, 18.0, 17.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024993896484375, -0.024142026901245117, -0.023290157318115234, -0.02243828773498535, -0.02158641815185547, -0.020734548568725586, -0.019882678985595703, -0.01903080940246582, -0.018178939819335938, -0.017327070236206055, -0.016475200653076172, -0.015623331069946289, -0.014771461486816406, -0.013919591903686523, -0.01306772232055664, -0.012215852737426758, -0.011363983154296875, -0.010512113571166992, -0.00966024398803711, -0.008808374404907227, -0.007956504821777344, -0.007104635238647461, -0.006252765655517578, -0.005400896072387695, -0.0045490264892578125, -0.0036971569061279297, -0.002845287322998047, -0.001993417739868164, -0.0011415481567382812, -0.00028967857360839844, 0.0005621910095214844, 0.0014140605926513672, 0.00226593017578125, 0.003117799758911133, 0.003969669342041016, 0.0048215389251708984, 0.005673408508300781, 0.006525278091430664, 0.007377147674560547, 0.00822901725769043, 0.009080886840820312, 0.009932756423950195, 0.010784626007080078, 0.011636495590209961, 0.012488365173339844, 0.013340234756469727, 0.01419210433959961, 0.015043973922729492, 0.015895843505859375, 0.016747713088989258, 0.01759958267211914, 0.018451452255249023, 0.019303321838378906, 0.02015519142150879, 0.021007061004638672, 0.021858930587768555, 0.022710800170898438, 0.02356266975402832, 0.024414539337158203, 0.025266408920288086, 0.02611827850341797, 0.02697014808654785, 0.027822017669677734, 0.028673887252807617, 0.0295257568359375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 2.0, 7.0, 9.0, 16.0, 18.0, 13.0, 25.0, 23.0, 32.0, 28.0, 44.0, 36.0, 51.0, 48.0, 54.0, 50.0, 48.0, 46.0, 55.0, 62.0, 44.0, 49.0, 32.0, 46.0, 22.0, 33.0, 17.0, 18.0, 15.0, 15.0, 8.0, 12.0, 7.0, 2.0, 2.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006725311279296875, -0.006473243236541748, -0.006221175193786621, -0.005969107151031494, -0.005717039108276367, -0.00546497106552124, -0.005212903022766113, -0.004960834980010986, -0.004708766937255859, -0.004456698894500732, -0.0042046308517456055, -0.0039525628089904785, -0.0037004947662353516, -0.0034484267234802246, -0.0031963586807250977, -0.0029442906379699707, -0.0026922225952148438, -0.002440154552459717, -0.00218808650970459, -0.0019360184669494629, -0.001683950424194336, -0.001431882381439209, -0.001179814338684082, -0.0009277462959289551, -0.0006756782531738281, -0.00042361021041870117, -0.00017154216766357422, 8.052587509155273e-05, 0.0003325939178466797, 0.0005846619606018066, 0.0008367300033569336, 0.0010887980461120605, 0.0013408660888671875, 0.0015929341316223145, 0.0018450021743774414, 0.0020970702171325684, 0.0023491382598876953, 0.0026012063026428223, 0.0028532743453979492, 0.003105342388153076, 0.003357410430908203, 0.00360947847366333, 0.003861546516418457, 0.004113614559173584, 0.004365682601928711, 0.004617750644683838, 0.004869818687438965, 0.005121886730194092, 0.005373954772949219, 0.005626022815704346, 0.005878090858459473, 0.0061301589012146, 0.0063822269439697266, 0.0066342949867248535, 0.0068863630294799805, 0.007138431072235107, 0.007390499114990234, 0.007642567157745361, 0.007894635200500488, 0.008146703243255615, 0.008398771286010742, 0.00865083932876587, 0.008902907371520996, 0.009154975414276123, 0.00940704345703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 4.0, 1.0, 6.0, 9.0, 16.0, 17.0, 18.0, 24.0, 44.0, 40.0, 64.0, 100.0, 123.0, 164.0, 244.0, 395.0, 622.0, 944.0, 1757.0, 3350.0, 7034.0, 17438.0, 56236.0, 688897.0, 209602.0, 36655.0, 12676.0, 5443.0, 2684.0, 1456.0, 866.0, 498.0, 344.0, 223.0, 141.0, 107.0, 73.0, 53.0, 66.0, 20.0, 20.0, 25.0, 18.0, 9.0, 5.0, 7.0, 5.0, 4.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-0.04449462890625, -0.04309701919555664, -0.04169940948486328, -0.04030179977416992, -0.03890419006347656, -0.0375065803527832, -0.036108970642089844, -0.034711360931396484, -0.033313751220703125, -0.031916141510009766, -0.030518531799316406, -0.029120922088623047, -0.027723312377929688, -0.026325702667236328, -0.02492809295654297, -0.02353048324584961, -0.02213287353515625, -0.02073526382446289, -0.01933765411376953, -0.017940044403076172, -0.016542434692382812, -0.015144824981689453, -0.013747215270996094, -0.012349605560302734, -0.010951995849609375, -0.009554386138916016, -0.008156776428222656, -0.006759166717529297, -0.0053615570068359375, -0.003963947296142578, -0.0025663375854492188, -0.0011687278747558594, 0.0002288818359375, 0.0016264915466308594, 0.0030241012573242188, 0.004421710968017578, 0.0058193206787109375, 0.007216930389404297, 0.008614540100097656, 0.010012149810791016, 0.011409759521484375, 0.012807369232177734, 0.014204978942871094, 0.015602588653564453, 0.017000198364257812, 0.018397808074951172, 0.01979541778564453, 0.02119302749633789, 0.02259063720703125, 0.02398824691772461, 0.02538585662841797, 0.026783466339111328, 0.028181076049804688, 0.029578685760498047, 0.030976295471191406, 0.032373905181884766, 0.033771514892578125, 0.035169124603271484, 0.036566734313964844, 0.0379643440246582, 0.03936195373535156, 0.04075956344604492, 0.04215717315673828, 0.04355478286743164, 0.044952392578125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 2.0, 8.0, 5.0, 4.0, 4.0, 11.0, 11.0, 14.0, 12.0, 16.0, 26.0, 27.0, 25.0, 32.0, 32.0, 43.0, 51.0, 32.0, 37.0, 48.0, 41.0, 44.0, 35.0, 47.0, 51.0, 29.0, 45.0, 42.0, 31.0, 33.0, 22.0, 29.0, 21.0, 12.0, 13.0, 14.0, 9.0, 4.0, 9.0, 7.0, 7.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004535675048828125, -0.004392504692077637, -0.0042493343353271484, -0.00410616397857666, -0.003962993621826172, -0.0038198232650756836, -0.0036766529083251953, -0.003533482551574707, -0.0033903121948242188, -0.0032471418380737305, -0.003103971481323242, -0.002960801124572754, -0.0028176307678222656, -0.0026744604110717773, -0.002531290054321289, -0.0023881196975708008, -0.0022449493408203125, -0.0021017789840698242, -0.001958608627319336, -0.0018154382705688477, -0.0016722679138183594, -0.001529097557067871, -0.0013859272003173828, -0.0012427568435668945, -0.0010995864868164062, -0.000956416130065918, -0.0008132457733154297, -0.0006700754165649414, -0.0005269050598144531, -0.00038373470306396484, -0.00024056434631347656, -9.739398956298828e-05, 4.57763671875e-05, 0.00018894672393798828, 0.00033211708068847656, 0.00047528743743896484, 0.0006184577941894531, 0.0007616281509399414, 0.0009047985076904297, 0.001047968864440918, 0.0011911392211914062, 0.0013343095779418945, 0.0014774799346923828, 0.001620650291442871, 0.0017638206481933594, 0.0019069910049438477, 0.002050161361694336, 0.0021933317184448242, 0.0023365020751953125, 0.0024796724319458008, 0.002622842788696289, 0.0027660131454467773, 0.0029091835021972656, 0.003052353858947754, 0.003195524215698242, 0.0033386945724487305, 0.0034818649291992188, 0.003625035285949707, 0.0037682056427001953, 0.003911375999450684, 0.004054546356201172, 0.00419771671295166, 0.0043408870697021484, 0.004484057426452637, 0.004627227783203125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 10.0, 11.0, 12.0, 13.0, 29.0, 19.0, 48.0, 49.0, 65.0, 84.0, 153.0, 204.0, 296.0, 498.0, 798.0, 1252.0, 2315.0, 5383.0, 18420.0, 862346.0, 134157.0, 12865.0, 4328.0, 1966.0, 1132.0, 656.0, 432.0, 287.0, 219.0, 140.0, 109.0, 63.0, 54.0, 37.0, 29.0, 22.0, 20.0, 6.0, 9.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.13134765625, -0.12758255004882812, -0.12381744384765625, -0.12005233764648438, -0.1162872314453125, -0.11252212524414062, -0.10875701904296875, -0.10499191284179688, -0.101226806640625, -0.09746170043945312, -0.09369659423828125, -0.08993148803710938, -0.0861663818359375, -0.08240127563476562, -0.07863616943359375, -0.07487106323242188, -0.07110595703125, -0.06734085083007812, -0.06357574462890625, -0.059810638427734375, -0.0560455322265625, -0.052280426025390625, -0.04851531982421875, -0.044750213623046875, -0.040985107421875, -0.037220001220703125, -0.03345489501953125, -0.029689788818359375, -0.0259246826171875, -0.022159576416015625, -0.01839447021484375, -0.014629364013671875, -0.0108642578125, -0.007099151611328125, -0.00333404541015625, 0.000431060791015625, 0.0041961669921875, 0.007961273193359375, 0.01172637939453125, 0.015491485595703125, 0.019256591796875, 0.023021697998046875, 0.02678680419921875, 0.030551910400390625, 0.0343170166015625, 0.038082122802734375, 0.04184722900390625, 0.045612335205078125, 0.04937744140625, 0.053142547607421875, 0.05690765380859375, 0.060672760009765625, 0.0644378662109375, 0.06820297241210938, 0.07196807861328125, 0.07573318481445312, 0.079498291015625, 0.08326339721679688, 0.08702850341796875, 0.09079360961914062, 0.0945587158203125, 0.09832382202148438, 0.10208892822265625, 0.10585403442382812, 0.109619140625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 4.0, 6.0, 3.0, 2.0, 9.0, 14.0, 16.0, 21.0, 29.0, 42.0, 117.0, 195.0, 193.0, 148.0, 79.0, 19.0, 20.0, 15.0, 14.0, 5.0, 10.0, 11.0, 6.0, 7.0, 1.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8358230590820312e-05, -1.7787329852581024e-05, -1.7216429114341736e-05, -1.6645528376102448e-05, -1.607462763786316e-05, -1.550372689962387e-05, -1.4932826161384583e-05, -1.4361925423145294e-05, -1.3791024684906006e-05, -1.3220123946666718e-05, -1.264922320842743e-05, -1.2078322470188141e-05, -1.1507421731948853e-05, -1.0936520993709564e-05, -1.0365620255470276e-05, -9.794719517230988e-06, -9.2238187789917e-06, -8.652918040752411e-06, -8.082017302513123e-06, -7.511116564273834e-06, -6.940215826034546e-06, -6.3693150877952576e-06, -5.798414349555969e-06, -5.227513611316681e-06, -4.656612873077393e-06, -4.085712134838104e-06, -3.514811396598816e-06, -2.9439106583595276e-06, -2.3730099201202393e-06, -1.802109181880951e-06, -1.2312084436416626e-06, -6.603077054023743e-07, -8.940696716308594e-08, 4.814937710762024e-07, 1.0523945093154907e-06, 1.623295247554779e-06, 2.1941959857940674e-06, 2.7650967240333557e-06, 3.335997462272644e-06, 3.906898200511932e-06, 4.477798938751221e-06, 5.048699676990509e-06, 5.619600415229797e-06, 6.190501153469086e-06, 6.761401891708374e-06, 7.332302629947662e-06, 7.90320336818695e-06, 8.474104106426239e-06, 9.045004844665527e-06, 9.615905582904816e-06, 1.0186806321144104e-05, 1.0757707059383392e-05, 1.132860779762268e-05, 1.1899508535861969e-05, 1.2470409274101257e-05, 1.3041310012340546e-05, 1.3612210750579834e-05, 1.4183111488819122e-05, 1.475401222705841e-05, 1.53249129652977e-05, 1.5895813703536987e-05, 1.6466714441776276e-05, 1.7037615180015564e-05, 1.7608515918254852e-05, 1.817941665649414e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 4.0, 6.0, 6.0, 5.0, 7.0, 6.0, 10.0, 24.0, 19.0, 44.0, 138.0, 752.0, 5562.0, 877045.0, 159976.0, 4122.0, 597.0, 110.0, 42.0, 20.0, 16.0, 4.0, 11.0, 7.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1756591796875, -0.17063140869140625, -0.1656036376953125, -0.16057586669921875, -0.155548095703125, -0.15052032470703125, -0.1454925537109375, -0.14046478271484375, -0.13543701171875, -0.13040924072265625, -0.1253814697265625, -0.12035369873046875, -0.115325927734375, -0.11029815673828125, -0.1052703857421875, -0.10024261474609375, -0.09521484375, -0.09018707275390625, -0.0851593017578125, -0.08013153076171875, -0.075103759765625, -0.07007598876953125, -0.0650482177734375, -0.06002044677734375, -0.05499267578125, -0.04996490478515625, -0.0449371337890625, -0.03990936279296875, -0.034881591796875, -0.02985382080078125, -0.0248260498046875, -0.01979827880859375, -0.0147705078125, -0.00974273681640625, -0.0047149658203125, 0.00031280517578125, 0.005340576171875, 0.01036834716796875, 0.0153961181640625, 0.02042388916015625, 0.02545166015625, 0.03047943115234375, 0.0355072021484375, 0.04053497314453125, 0.045562744140625, 0.05059051513671875, 0.0556182861328125, 0.06064605712890625, 0.065673828125, 0.07070159912109375, 0.0757293701171875, 0.08075714111328125, 0.085784912109375, 0.09081268310546875, 0.0958404541015625, 0.10086822509765625, 0.10589599609375, 0.11092376708984375, 0.1159515380859375, 0.12097930908203125, 0.126007080078125, 0.13103485107421875, 0.1360626220703125, 0.14109039306640625, 0.1461181640625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 5.0, 5.0, 5.0, 4.0, 9.0, 17.0, 13.0, 27.0, 34.0, 55.0, 103.0, 387.0, 125.0, 50.0, 41.0, 22.0, 20.0, 14.0, 8.0, 13.0, 10.0, 3.0, 3.0, 8.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006618499755859375, -0.006401121616363525, -0.006183743476867676, -0.005966365337371826, -0.0057489871978759766, -0.005531609058380127, -0.005314230918884277, -0.005096852779388428, -0.004879474639892578, -0.0046620965003967285, -0.004444718360900879, -0.004227340221405029, -0.00400996208190918, -0.00379258394241333, -0.0035752058029174805, -0.003357827663421631, -0.0031404495239257812, -0.0029230713844299316, -0.002705693244934082, -0.0024883151054382324, -0.002270936965942383, -0.002053558826446533, -0.0018361806869506836, -0.001618802547454834, -0.0014014244079589844, -0.0011840462684631348, -0.0009666681289672852, -0.0007492899894714355, -0.0005319118499755859, -0.00031453371047973633, -9.715557098388672e-05, 0.00012022256851196289, 0.0003376007080078125, 0.0005549788475036621, 0.0007723569869995117, 0.0009897351264953613, 0.001207113265991211, 0.0014244914054870605, 0.0016418695449829102, 0.0018592476844787598, 0.0020766258239746094, 0.002294003963470459, 0.0025113821029663086, 0.002728760242462158, 0.002946138381958008, 0.0031635165214538574, 0.003380894660949707, 0.0035982728004455566, 0.0038156509399414062, 0.004033029079437256, 0.0042504072189331055, 0.004467785358428955, 0.004685163497924805, 0.004902541637420654, 0.005119919776916504, 0.0053372979164123535, 0.005554676055908203, 0.005772054195404053, 0.005989432334899902, 0.006206810474395752, 0.0064241886138916016, 0.006641566753387451, 0.006858944892883301, 0.00707632303237915, 0.007293701171875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 15.0, 16.0, 27.0, 41.0, 48.0, 124.0, 261.0, 224.0, 121.0, 58.0, 28.0, 19.0, 8.0, 10.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.035258278250694275, -0.03452237695455551, -0.03378647565841675, -0.033050574362277985, -0.03231467306613922, -0.03157877177000046, -0.030842868611216545, -0.03010696731507778, -0.02937106415629387, -0.028635162860155106, -0.027899261564016342, -0.02716336026787758, -0.026427457109093666, -0.025691555812954903, -0.02495565451681614, -0.024219753220677376, -0.023483851924538612, -0.02274795062839985, -0.022012049332261086, -0.021276146173477173, -0.02054024487733841, -0.019804343581199646, -0.019068442285060883, -0.01833254098892212, -0.017596639692783356, -0.016860738396644592, -0.01612483710050583, -0.01538893487304449, -0.014653032645583153, -0.01391713134944439, -0.013181230053305626, -0.012445328757166862, -0.011709426529705524, -0.010973525233566761, -0.010237623006105423, -0.00950172170996666, -0.008765820413827896, -0.008029918186366558, -0.007294016890227795, -0.006558115128427744, -0.005822213366627693, -0.0050863116048276424, -0.004350409843027592, -0.0036145085468888283, -0.0028786067850887775, -0.002142705023288727, -0.0014068037271499634, -0.0006709019653499126, 6.499979645013809e-05, 0.000800901441834867, 0.001536803087219596, 0.002272704616189003, 0.0030086063779890537, 0.0037445081397891045, 0.004480409435927868, 0.005216311197727919, 0.005952212959527969, 0.00668811472132802, 0.007424016483128071, 0.008159917779266834, 0.008895820006728172, 0.009631721302866936, 0.0103676225990057, 0.011103523895144463, 0.0118394261226058]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 3.0, 8.0, 9.0, 5.0, 5.0, 13.0, 18.0, 18.0, 18.0, 28.0, 23.0, 18.0, 25.0, 36.0, 34.0, 38.0, 43.0, 39.0, 36.0, 42.0, 39.0, 41.0, 45.0, 25.0, 44.0, 36.0, 30.0, 23.0, 34.0, 29.0, 33.0, 23.0, 11.0, 22.0, 18.0, 17.0, 16.0, 9.0, 16.0, 6.0, 3.0, 5.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.006002914160490036, -0.005821658298373222, -0.005640402436256409, -0.005459146574139595, -0.005277890712022781, -0.005096634849905968, -0.004915378987789154, -0.00473412312567234, -0.004552867263555527, -0.004371611401438713, -0.004190355539321899, -0.004009099677205086, -0.003827843815088272, -0.0036465879529714584, -0.0034653320908546448, -0.003284076228737831, -0.0031028203666210175, -0.002921564504504204, -0.00274030864238739, -0.0025590527802705765, -0.002377796918153763, -0.002196541056036949, -0.0020152851939201355, -0.0018340293318033218, -0.0016527734696865082, -0.0014715176075696945, -0.0012902617454528809, -0.0011090058833360672, -0.0009277500212192535, -0.0007464941591024399, -0.0005652382969856262, -0.00038398243486881256, -0.0002027261070907116, -2.1470244973897934e-05, 0.00015978561714291573, 0.0003410414792597294, 0.000522297341376543, 0.0007035532034933567, 0.0008848090656101704, 0.001066064927726984, 0.0012473207898437977, 0.0014285766519606113, 0.001609832514077425, 0.0017910883761942387, 0.0019723442383110523, 0.002153600100427866, 0.0023348559625446796, 0.0025161118246614933, 0.002697367686778307, 0.0028786235488951206, 0.0030598794110119343, 0.003241135273128748, 0.0034223911352455616, 0.0036036469973623753, 0.003784902859479189, 0.003966158721596003, 0.004147414583712816, 0.00432867044582963, 0.0045099263079464436, 0.004691182170063257, 0.004872438032180071, 0.0050536938942968845, 0.005234949756413698, 0.005416205618530512, 0.0055974614806473255]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 8.0, 8.0, 9.0, 19.0, 28.0, 44.0, 51.0, 86.0, 144.0, 186.0, 319.0, 462.0, 811.0, 1285.0, 2261.0, 3991.0, 7204.0, 13883.0, 28358.0, 63307.0, 169681.0, 431727.0, 191645.0, 69405.0, 30703.0, 15006.0, 7808.0, 4129.0, 2295.0, 1385.0, 864.0, 522.0, 316.0, 199.0, 138.0, 84.0, 54.0, 39.0, 28.0, 23.0, 14.0, 10.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.017974853515625, -0.01743912696838379, -0.016903400421142578, -0.016367673873901367, -0.015831947326660156, -0.015296220779418945, -0.014760494232177734, -0.014224767684936523, -0.013689041137695312, -0.013153314590454102, -0.01261758804321289, -0.01208186149597168, -0.011546134948730469, -0.011010408401489258, -0.010474681854248047, -0.009938955307006836, -0.009403228759765625, -0.008867502212524414, -0.008331775665283203, -0.007796049118041992, -0.007260322570800781, -0.00672459602355957, -0.006188869476318359, -0.0056531429290771484, -0.0051174163818359375, -0.0045816898345947266, -0.004045963287353516, -0.0035102367401123047, -0.0029745101928710938, -0.002438783645629883, -0.0019030570983886719, -0.001367330551147461, -0.00083160400390625, -0.00029587745666503906, 0.00023984909057617188, 0.0007755756378173828, 0.0013113021850585938, 0.0018470287322998047, 0.0023827552795410156, 0.0029184818267822266, 0.0034542083740234375, 0.0039899349212646484, 0.004525661468505859, 0.00506138801574707, 0.005597114562988281, 0.006132841110229492, 0.006668567657470703, 0.007204294204711914, 0.007740020751953125, 0.008275747299194336, 0.008811473846435547, 0.009347200393676758, 0.009882926940917969, 0.01041865348815918, 0.01095438003540039, 0.011490106582641602, 0.012025833129882812, 0.012561559677124023, 0.013097286224365234, 0.013633012771606445, 0.014168739318847656, 0.014704465866088867, 0.015240192413330078, 0.01577591896057129, 0.0163116455078125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 5.0, 5.0, 5.0, 10.0, 13.0, 25.0, 24.0, 29.0, 35.0, 34.0, 49.0, 47.0, 64.0, 59.0, 59.0, 59.0, 60.0, 58.0, 58.0, 52.0, 38.0, 34.0, 44.0, 32.0, 21.0, 18.0, 13.0, 13.0, 8.0, 7.0, 5.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004058837890625, -0.003920555114746094, -0.0037822723388671875, -0.0036439895629882812, -0.003505706787109375, -0.0033674240112304688, -0.0032291412353515625, -0.0030908584594726562, -0.00295257568359375, -0.0028142929077148438, -0.0026760101318359375, -0.0025377273559570312, -0.002399444580078125, -0.0022611618041992188, -0.0021228790283203125, -0.0019845962524414062, -0.0018463134765625, -0.0017080307006835938, -0.0015697479248046875, -0.0014314651489257812, -0.001293182373046875, -0.0011548995971679688, -0.0010166168212890625, -0.0008783340454101562, -0.00074005126953125, -0.0006017684936523438, -0.0004634857177734375, -0.00032520294189453125, -0.000186920166015625, -4.863739013671875e-05, 8.96453857421875e-05, 0.00022792816162109375, 0.0003662109375, 0.0005044937133789062, 0.0006427764892578125, 0.0007810592651367188, 0.000919342041015625, 0.0010576248168945312, 0.0011959075927734375, 0.0013341903686523438, 0.00147247314453125, 0.0016107559204101562, 0.0017490386962890625, 0.0018873214721679688, 0.002025604248046875, 0.0021638870239257812, 0.0023021697998046875, 0.0024404525756835938, 0.0025787353515625, 0.0027170181274414062, 0.0028553009033203125, 0.0029935836791992188, 0.003131866455078125, 0.0032701492309570312, 0.0034084320068359375, 0.0035467147827148438, 0.00368499755859375, 0.0038232803344726562, 0.0039615631103515625, 0.004099845886230469, 0.004238128662109375, 0.004376411437988281, 0.0045146942138671875, 0.004652976989746094, 0.004791259765625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 9.0, 10.0, 11.0, 13.0, 21.0, 22.0, 27.0, 38.0, 52.0, 58.0, 114.0, 216.0, 504.0, 1249.0, 3925.0, 13215.0, 49780.0, 233794.0, 586990.0, 118236.0, 28098.0, 7988.0, 2506.0, 905.0, 365.0, 139.0, 69.0, 46.0, 27.0, 21.0, 22.0, 16.0, 12.0, 16.0, 7.0, 6.0, 8.0, 4.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0197906494140625, -0.01913738250732422, -0.018484115600585938, -0.017830848693847656, -0.017177581787109375, -0.016524314880371094, -0.015871047973632812, -0.015217781066894531, -0.01456451416015625, -0.013911247253417969, -0.013257980346679688, -0.012604713439941406, -0.011951446533203125, -0.011298179626464844, -0.010644912719726562, -0.009991645812988281, -0.00933837890625, -0.008685111999511719, -0.008031845092773438, -0.007378578186035156, -0.006725311279296875, -0.006072044372558594, -0.0054187774658203125, -0.004765510559082031, -0.00411224365234375, -0.0034589767456054688, -0.0028057098388671875, -0.0021524429321289062, -0.001499176025390625, -0.0008459091186523438, -0.0001926422119140625, 0.00046062469482421875, 0.0011138916015625, 0.0017671585083007812, 0.0024204254150390625, 0.0030736923217773438, 0.003726959228515625, 0.004380226135253906, 0.0050334930419921875, 0.005686759948730469, 0.00634002685546875, 0.006993293762207031, 0.0076465606689453125, 0.008299827575683594, 0.008953094482421875, 0.009606361389160156, 0.010259628295898438, 0.010912895202636719, 0.011566162109375, 0.012219429016113281, 0.012872695922851562, 0.013525962829589844, 0.014179229736328125, 0.014832496643066406, 0.015485763549804688, 0.01613903045654297, 0.01679229736328125, 0.01744556427001953, 0.018098831176757812, 0.018752098083496094, 0.019405364990234375, 0.020058631896972656, 0.020711898803710938, 0.02136516571044922, 0.0220184326171875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 8.0, 11.0, 13.0, 18.0, 8.0, 24.0, 17.0, 27.0, 30.0, 34.0, 35.0, 31.0, 37.0, 37.0, 36.0, 38.0, 41.0, 44.0, 43.0, 41.0, 37.0, 46.0, 36.0, 34.0, 48.0, 33.0, 37.0, 30.0, 19.0, 19.0, 22.0, 9.0, 12.0, 11.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0030918121337890625, -0.003000020980834961, -0.0029082298278808594, -0.002816438674926758, -0.0027246475219726562, -0.0026328563690185547, -0.002541065216064453, -0.0024492740631103516, -0.00235748291015625, -0.0022656917572021484, -0.002173900604248047, -0.0020821094512939453, -0.0019903182983398438, -0.0018985271453857422, -0.0018067359924316406, -0.001714944839477539, -0.0016231536865234375, -0.001531362533569336, -0.0014395713806152344, -0.0013477802276611328, -0.0012559890747070312, -0.0011641979217529297, -0.0010724067687988281, -0.0009806156158447266, -0.000888824462890625, -0.0007970333099365234, -0.0007052421569824219, -0.0006134510040283203, -0.0005216598510742188, -0.0004298686981201172, -0.0003380775451660156, -0.00024628639221191406, -0.0001544952392578125, -6.270408630371094e-05, 2.9087066650390625e-05, 0.00012087821960449219, 0.00021266937255859375, 0.0003044605255126953, 0.0003962516784667969, 0.00048804283142089844, 0.000579833984375, 0.0006716251373291016, 0.0007634162902832031, 0.0008552074432373047, 0.0009469985961914062, 0.0010387897491455078, 0.0011305809020996094, 0.001222372055053711, 0.0013141632080078125, 0.001405954360961914, 0.0014977455139160156, 0.0015895366668701172, 0.0016813278198242188, 0.0017731189727783203, 0.0018649101257324219, 0.0019567012786865234, 0.002048492431640625, 0.0021402835845947266, 0.002232074737548828, 0.0023238658905029297, 0.0024156570434570312, 0.002507448196411133, 0.0025992393493652344, 0.002691030502319336, 0.0027828216552734375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 12.0, 12.0, 21.0, 16.0, 18.0, 33.0, 46.0, 67.0, 103.0, 124.0, 154.0, 273.0, 462.0, 696.0, 1191.0, 2089.0, 4046.0, 9024.0, 24654.0, 114064.0, 751213.0, 99793.0, 23253.0, 8436.0, 3793.0, 2029.0, 1080.0, 643.0, 418.0, 238.0, 152.0, 101.0, 84.0, 43.0, 34.0, 33.0, 27.0, 21.0, 9.0, 10.0, 4.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.0009403228759765625, -0.0009130388498306274, -0.0008857548236846924, -0.0008584707975387573, -0.0008311867713928223, -0.0008039027452468872, -0.0007766187191009521, -0.0007493346929550171, -0.000722050666809082, -0.000694766640663147, -0.0006674826145172119, -0.0006401985883712769, -0.0006129145622253418, -0.0005856305360794067, -0.0005583465099334717, -0.0005310624837875366, -0.0005037784576416016, -0.0004764944314956665, -0.00044921040534973145, -0.0004219263792037964, -0.00039464235305786133, -0.00036735832691192627, -0.0003400743007659912, -0.00031279027462005615, -0.0002855062484741211, -0.00025822222232818604, -0.00023093819618225098, -0.00020365417003631592, -0.00017637014389038086, -0.0001490861177444458, -0.00012180209159851074, -9.451806545257568e-05, -6.723403930664062e-05, -3.9950013160705566e-05, -1.2665987014770508e-05, 1.461803913116455e-05, 4.190206527709961e-05, 6.918609142303467e-05, 9.647011756896973e-05, 0.00012375414371490479, 0.00015103816986083984, 0.0001783221960067749, 0.00020560622215270996, 0.00023289024829864502, 0.0002601742744445801, 0.00028745830059051514, 0.0003147423267364502, 0.00034202635288238525, 0.0003693103790283203, 0.00039659440517425537, 0.00042387843132019043, 0.0004511624574661255, 0.00047844648361206055, 0.0005057305097579956, 0.0005330145359039307, 0.0005602985620498657, 0.0005875825881958008, 0.0006148666143417358, 0.0006421506404876709, 0.000669434666633606, 0.000696718692779541, 0.0007240027189254761, 0.0007512867450714111, 0.0007785707712173462, 0.0008058547973632812]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 2.0, 3.0, 9.0, 12.0, 20.0, 16.0, 31.0, 35.0, 61.0, 71.0, 116.0, 131.0, 124.0, 84.0, 76.0, 55.0, 30.0, 30.0, 14.0, 25.0, 12.0, 6.0, 8.0, 10.0, 4.0, 7.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.748603820800781e-06, -7.512979209423065e-06, -7.277354598045349e-06, -7.041729986667633e-06, -6.806105375289917e-06, -6.570480763912201e-06, -6.334856152534485e-06, -6.099231541156769e-06, -5.863606929779053e-06, -5.627982318401337e-06, -5.392357707023621e-06, -5.1567330956459045e-06, -4.9211084842681885e-06, -4.685483872890472e-06, -4.449859261512756e-06, -4.21423465013504e-06, -3.978610038757324e-06, -3.742985427379608e-06, -3.507360816001892e-06, -3.271736204624176e-06, -3.03611159324646e-06, -2.800486981868744e-06, -2.564862370491028e-06, -2.3292377591133118e-06, -2.0936131477355957e-06, -1.8579885363578796e-06, -1.6223639249801636e-06, -1.3867393136024475e-06, -1.1511147022247314e-06, -9.154900908470154e-07, -6.798654794692993e-07, -4.4424086809158325e-07, -2.086162567138672e-07, 2.7008354663848877e-08, 2.6263296604156494e-07, 4.98257577419281e-07, 7.338821887969971e-07, 9.695068001747131e-07, 1.2051314115524292e-06, 1.4407560229301453e-06, 1.6763806343078613e-06, 1.9120052456855774e-06, 2.1476298570632935e-06, 2.3832544684410095e-06, 2.6188790798187256e-06, 2.8545036911964417e-06, 3.0901283025741577e-06, 3.3257529139518738e-06, 3.56137752532959e-06, 3.797002136707306e-06, 4.032626748085022e-06, 4.268251359462738e-06, 4.503875970840454e-06, 4.73950058221817e-06, 4.975125193595886e-06, 5.210749804973602e-06, 5.446374416351318e-06, 5.6819990277290344e-06, 5.9176236391067505e-06, 6.1532482504844666e-06, 6.388872861862183e-06, 6.624497473239899e-06, 6.860122084617615e-06, 7.095746695995331e-06, 7.331371307373047e-06]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 8.0, 15.0, 22.0, 10.0, 33.0, 57.0, 113.0, 254.0, 554.0, 1577.0, 5509.0, 25227.0, 240767.0, 716199.0, 45705.0, 8770.0, 2326.0, 801.0, 284.0, 129.0, 62.0, 43.0, 27.0, 9.0, 12.0, 9.0, 6.0, 8.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006699562072753906, -0.0006461665034294128, -0.0006223767995834351, -0.0005985870957374573, -0.0005747973918914795, -0.0005510076880455017, -0.0005272179841995239, -0.0005034282803535461, -0.00047963857650756836, -0.0004558488726615906, -0.0004320591688156128, -0.000408269464969635, -0.0003844797611236572, -0.00036069005727767944, -0.00033690035343170166, -0.0003131106495857239, -0.0002893209457397461, -0.0002655312418937683, -0.00024174153804779053, -0.00021795183420181274, -0.00019416213035583496, -0.00017037242650985718, -0.0001465827226638794, -0.0001227930188179016, -9.900331497192383e-05, -7.521361112594604e-05, -5.142390727996826e-05, -2.763420343399048e-05, -3.844499588012695e-06, 1.9945204257965088e-05, 4.373490810394287e-05, 6.752461194992065e-05, 9.131431579589844e-05, 0.00011510401964187622, 0.000138893723487854, 0.0001626834273338318, 0.00018647313117980957, 0.00021026283502578735, 0.00023405253887176514, 0.0002578422427177429, 0.0002816319465637207, 0.0003054216504096985, 0.00032921135425567627, 0.00035300105810165405, 0.00037679076194763184, 0.0004005804657936096, 0.0004243701696395874, 0.0004481598734855652, 0.00047194957733154297, 0.0004957392811775208, 0.0005195289850234985, 0.0005433186888694763, 0.0005671083927154541, 0.0005908980965614319, 0.0006146878004074097, 0.0006384775042533875, 0.0006622672080993652, 0.000686056911945343, 0.0007098466157913208, 0.0007336363196372986, 0.0007574260234832764, 0.0007812157273292542, 0.0008050054311752319, 0.0008287951350212097, 0.0008525848388671875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 8.0, 10.0, 7.0, 9.0, 12.0, 11.0, 25.0, 22.0, 37.0, 42.0, 53.0, 75.0, 90.0, 89.0, 96.0, 89.0, 50.0, 58.0, 42.0, 46.0, 28.0, 23.0, 18.0, 10.0, 12.0, 9.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011622905731201172, -0.00011299550533294678, -0.00010976195335388184, -0.0001065284013748169, -0.00010329484939575195, -0.00010006129741668701, -9.682774543762207e-05, -9.359419345855713e-05, -9.036064147949219e-05, -8.712708950042725e-05, -8.38935375213623e-05, -8.065998554229736e-05, -7.742643356323242e-05, -7.419288158416748e-05, -7.095932960510254e-05, -6.77257776260376e-05, -6.449222564697266e-05, -6.125867366790771e-05, -5.8025121688842773e-05, -5.479156970977783e-05, -5.155801773071289e-05, -4.832446575164795e-05, -4.509091377258301e-05, -4.1857361793518066e-05, -3.8623809814453125e-05, -3.5390257835388184e-05, -3.215670585632324e-05, -2.89231538772583e-05, -2.568960189819336e-05, -2.2456049919128418e-05, -1.9222497940063477e-05, -1.5988945960998535e-05, -1.2755393981933594e-05, -9.521842002868652e-06, -6.288290023803711e-06, -3.0547380447387695e-06, 1.7881393432617188e-07, 3.4123659133911133e-06, 6.645917892456055e-06, 9.879469871520996e-06, 1.3113021850585938e-05, 1.634657382965088e-05, 1.958012580871582e-05, 2.2813677787780762e-05, 2.6047229766845703e-05, 2.9280781745910645e-05, 3.2514333724975586e-05, 3.574788570404053e-05, 3.898143768310547e-05, 4.221498966217041e-05, 4.544854164123535e-05, 4.868209362030029e-05, 5.1915645599365234e-05, 5.5149197578430176e-05, 5.838274955749512e-05, 6.161630153656006e-05, 6.4849853515625e-05, 6.808340549468994e-05, 7.131695747375488e-05, 7.455050945281982e-05, 7.778406143188477e-05, 8.101761341094971e-05, 8.425116539001465e-05, 8.748471736907959e-05, 9.071826934814453e-05]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 10.0, 28.0, 80.0, 230.0, 408.0, 154.0, 50.0, 28.0, 12.0, 7.0, 3.0, 1.0, 1.0], "bins": [-0.03759555518627167, -0.036915820091962814, -0.03623608499765396, -0.03555634990334511, -0.034876614809036255, -0.0341968834400177, -0.03351714834570885, -0.032837413251399994, -0.03215767815709114, -0.03147794306278229, -0.030798207968473434, -0.03011847473680973, -0.029438739642500877, -0.028759004548192024, -0.02807926945388317, -0.027399536222219467, -0.026719801127910614, -0.02604006603360176, -0.025360330939292908, -0.024680597707629204, -0.02400086261332035, -0.023321127519011497, -0.022641392424702644, -0.02196165919303894, -0.021281922236084938, -0.020602187141776085, -0.019922452047467232, -0.019242718815803528, -0.018562983721494675, -0.01788324862718582, -0.01720351353287697, -0.016523778438568115, -0.01584404706954956, -0.015164311975240707, -0.014484577812254429, -0.013804842717945576, -0.013125108554959297, -0.012445373460650444, -0.011765638366341591, -0.011085904203355312, -0.010406168177723885, -0.009726433083415031, -0.009046698920428753, -0.0083669638261199, -0.007687229663133621, -0.007007494568824768, -0.006327759940177202, -0.005648025311529636, -0.004968291148543358, -0.004288556519895792, -0.003608821891248226, -0.0029290870297700167, -0.002249352401122451, -0.001569617772474885, -0.0008898829109966755, -0.00021014828234910965, 0.0004695863462984562, 0.001149320974946022, 0.0018290557200089097, 0.0025087904650717974, 0.003188525093719363, 0.003868259722366929, 0.0045479945838451385, 0.005227729212492704, 0.00590746384114027]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 8.0, 7.0, 10.0, 9.0, 12.0, 21.0, 19.0, 20.0, 17.0, 24.0, 23.0, 38.0, 27.0, 30.0, 30.0, 39.0, 37.0, 50.0, 46.0, 42.0, 64.0, 42.0, 37.0, 39.0, 34.0, 40.0, 33.0, 32.0, 32.0, 27.0, 24.0, 15.0, 15.0, 13.0, 12.0, 7.0, 9.0, 5.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004030133131891489, -0.0039068590849637985, -0.003783585038036108, -0.0036603109911084175, -0.0035370371770113707, -0.00341376313008368, -0.0032904890831559896, -0.003167215036228299, -0.0030439412221312523, -0.0029206671752035618, -0.0027973931282758713, -0.0026741190813481808, -0.002550845267251134, -0.0024275712203234434, -0.002304297173395753, -0.0021810231264680624, -0.002057749079540372, -0.0019344750326126814, -0.0018112011021003127, -0.0016879270551726222, -0.0015646531246602535, -0.001441379077732563, -0.0013181050308048725, -0.001194830983877182, -0.0010715570533648133, -0.0009482830646447837, -0.0008250090759247541, -0.0007017350289970636, -0.000578461040277034, -0.00045518705155700445, -0.00033191300462931395, -0.00020863901590928435, -8.536502718925476e-05, 3.790897608269006e-05, 0.00016118297935463488, 0.00028445699717849493, 0.0004077309858985245, 0.0005310049746185541, 0.0006542790215462446, 0.0007775530102662742, 0.0009008269989863038, 0.0010241010459139943, 0.001147374976426363, 0.0012706490233540535, 0.001393923070281744, 0.0015171970007941127, 0.0016404710477218032, 0.0017637449782341719, 0.0018870190251618624, 0.002010293072089553, 0.0021335671190172434, 0.0022568409331142902, 0.0023801149800419807, 0.0025033890269696712, 0.0026266630738973618, 0.0027499371208250523, 0.0028732111677527428, 0.0029964852146804333, 0.0031197592616081238, 0.0032430333085358143, 0.003366307122632861, 0.0034895811695605516, 0.003612855216488242, 0.0037361292634159327, 0.0038594030775129795]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 5.0, 11.0, 17.0, 16.0, 19.0, 33.0, 43.0, 66.0, 74.0, 104.0, 152.0, 255.0, 364.0, 655.0, 1051.0, 1836.0, 3604.0, 12490.0, 3589068.0, 566340.0, 10091.0, 3496.0, 1742.0, 955.0, 625.0, 366.0, 260.0, 153.0, 108.0, 75.0, 62.0, 40.0, 32.0, 18.0, 24.0, 9.0, 9.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0121612548828125, -0.01170969009399414, -0.011258125305175781, -0.010806560516357422, -0.010354995727539062, -0.009903430938720703, -0.009451866149902344, -0.009000301361083984, -0.008548736572265625, -0.008097171783447266, -0.007645606994628906, -0.007194042205810547, -0.0067424774169921875, -0.006290912628173828, -0.005839347839355469, -0.005387783050537109, -0.00493621826171875, -0.004484653472900391, -0.004033088684082031, -0.003581523895263672, -0.0031299591064453125, -0.002678394317626953, -0.0022268295288085938, -0.0017752647399902344, -0.001323699951171875, -0.0008721351623535156, -0.00042057037353515625, 3.0994415283203125e-05, 0.0004825592041015625, 0.0009341239929199219, 0.0013856887817382812, 0.0018372535705566406, 0.002288818359375, 0.0027403831481933594, 0.0031919479370117188, 0.003643512725830078, 0.0040950775146484375, 0.004546642303466797, 0.004998207092285156, 0.005449771881103516, 0.005901336669921875, 0.006352901458740234, 0.006804466247558594, 0.007256031036376953, 0.0077075958251953125, 0.008159160614013672, 0.008610725402832031, 0.00906229019165039, 0.00951385498046875, 0.00996541976928711, 0.010416984558105469, 0.010868549346923828, 0.011320114135742188, 0.011771678924560547, 0.012223243713378906, 0.012674808502197266, 0.013126373291015625, 0.013577938079833984, 0.014029502868652344, 0.014481067657470703, 0.014932632446289062, 0.015384197235107422, 0.01583576202392578, 0.01628732681274414, 0.0167388916015625]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 9.0, 11.0, 8.0, 9.0, 19.0, 21.0, 16.0, 19.0, 29.0, 21.0, 38.0, 34.0, 26.0, 44.0, 47.0, 51.0, 47.0, 48.0, 55.0, 45.0, 44.0, 50.0, 40.0, 37.0, 46.0, 36.0, 15.0, 30.0, 23.0, 18.0, 16.0, 12.0, 8.0, 10.0, 9.0, 6.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030231475830078125, -0.0029136240482330322, -0.002804100513458252, -0.0026945769786834717, -0.0025850534439086914, -0.002475529909133911, -0.002366006374359131, -0.0022564828395843506, -0.0021469593048095703, -0.00203743577003479, -0.0019279122352600098, -0.0018183887004852295, -0.0017088651657104492, -0.001599341630935669, -0.0014898180961608887, -0.0013802945613861084, -0.0012707710266113281, -0.0011612474918365479, -0.0010517239570617676, -0.0009422004222869873, -0.000832676887512207, -0.0007231533527374268, -0.0006136298179626465, -0.0005041062831878662, -0.00039458274841308594, -0.00028505921363830566, -0.0001755356788635254, -6.601214408874512e-05, 4.3511390686035156e-05, 0.00015303492546081543, 0.0002625584602355957, 0.000372081995010376, 0.00048160552978515625, 0.0005911290645599365, 0.0007006525993347168, 0.0008101761341094971, 0.0009196996688842773, 0.0010292232036590576, 0.0011387467384338379, 0.0012482702732086182, 0.0013577938079833984, 0.0014673173427581787, 0.001576840877532959, 0.0016863644123077393, 0.0017958879470825195, 0.0019054114818572998, 0.00201493501663208, 0.0021244585514068604, 0.0022339820861816406, 0.002343505620956421, 0.002453029155731201, 0.0025625526905059814, 0.0026720762252807617, 0.002781599760055542, 0.0028911232948303223, 0.0030006468296051025, 0.003110170364379883, 0.003219693899154663, 0.0033292174339294434, 0.0034387409687042236, 0.003548264503479004, 0.003657788038253784, 0.0037673115730285645, 0.0038768351078033447, 0.003986358642578125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 15.0, 34.0, 53.0, 146.0, 524.0, 2045.0, 12489.0, 4090055.0, 82076.0, 5326.0, 1032.0, 273.0, 101.0, 41.0, 16.0, 8.0, 14.0, 5.0, 6.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.047821044921875, -0.04661893844604492, -0.045416831970214844, -0.044214725494384766, -0.04301261901855469, -0.04181051254272461, -0.04060840606689453, -0.03940629959106445, -0.038204193115234375, -0.0370020866394043, -0.03579998016357422, -0.03459787368774414, -0.03339576721191406, -0.032193660736083984, -0.030991554260253906, -0.029789447784423828, -0.02858734130859375, -0.027385234832763672, -0.026183128356933594, -0.024981021881103516, -0.023778915405273438, -0.02257680892944336, -0.02137470245361328, -0.020172595977783203, -0.018970489501953125, -0.017768383026123047, -0.01656627655029297, -0.01536417007446289, -0.014162063598632812, -0.012959957122802734, -0.011757850646972656, -0.010555744171142578, -0.0093536376953125, -0.008151531219482422, -0.006949424743652344, -0.005747318267822266, -0.0045452117919921875, -0.0033431053161621094, -0.0021409988403320312, -0.0009388923645019531, 0.000263214111328125, 0.0014653205871582031, 0.0026674270629882812, 0.0038695335388183594, 0.0050716400146484375, 0.006273746490478516, 0.007475852966308594, 0.008677959442138672, 0.00988006591796875, 0.011082172393798828, 0.012284278869628906, 0.013486385345458984, 0.014688491821289062, 0.01589059829711914, 0.01709270477294922, 0.018294811248779297, 0.019496917724609375, 0.020699024200439453, 0.02190113067626953, 0.02310323715209961, 0.024305343627929688, 0.025507450103759766, 0.026709556579589844, 0.027911663055419922, 0.02911376953125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 7.0, 5.0, 5.0, 7.0, 8.0, 9.0, 27.0, 72.0, 201.0, 742.0, 2536.0, 273.0, 85.0, 33.0, 16.0, 9.0, 9.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025119781494140625, -0.0024159252643585205, -0.0023198723793029785, -0.0022238194942474365, -0.0021277666091918945, -0.0020317137241363525, -0.0019356608390808105, -0.0018396079540252686, -0.0017435550689697266, -0.0016475021839141846, -0.0015514492988586426, -0.0014553964138031006, -0.0013593435287475586, -0.0012632906436920166, -0.0011672377586364746, -0.0010711848735809326, -0.0009751319885253906, -0.0008790791034698486, -0.0007830262184143066, -0.0006869733333587646, -0.0005909204483032227, -0.0004948675632476807, -0.00039881467819213867, -0.0003027617931365967, -0.0002067089080810547, -0.0001106560230255127, -1.4603137969970703e-05, 8.144974708557129e-05, 0.00017750263214111328, 0.0002735555171966553, 0.00036960840225219727, 0.00046566128730773926, 0.0005617141723632812, 0.0006577670574188232, 0.0007538199424743652, 0.0008498728275299072, 0.0009459257125854492, 0.0010419785976409912, 0.0011380314826965332, 0.0012340843677520752, 0.0013301372528076172, 0.0014261901378631592, 0.0015222430229187012, 0.0016182959079742432, 0.0017143487930297852, 0.0018104016780853271, 0.0019064545631408691, 0.002002507448196411, 0.002098560333251953, 0.002194613218307495, 0.002290666103363037, 0.002386718988418579, 0.002482771873474121, 0.002578824758529663, 0.002674877643585205, 0.002770930528640747, 0.002866983413696289, 0.002963036298751831, 0.003059089183807373, 0.003155142068862915, 0.003251194953918457, 0.003347247838973999, 0.003443300724029541, 0.003539353609085083, 0.003635406494140625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 9.0, 9.0, 20.0, 32.0, 47.0, 68.0, 99.0, 166.0, 171.0, 139.0, 70.0, 47.0, 33.0, 26.0, 18.0, 15.0, 10.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00956909079104662, -0.009362020529806614, -0.009154950268566608, -0.008947880007326603, -0.008740808814764023, -0.008533738553524017, -0.008326668292284012, -0.008119598031044006, -0.007912527769804, -0.007705457508563995, -0.00749838724732399, -0.007291316520422697, -0.007084246259182692, -0.006877175997942686, -0.006670105271041393, -0.006463035009801388, -0.006255964748561382, -0.006048894487321377, -0.005841824226081371, -0.0056347534991800785, -0.005427683237940073, -0.0052206129767000675, -0.005013542249798775, -0.004806471988558769, -0.004599401727318764, -0.004392331466078758, -0.004185261204838753, -0.00397819047793746, -0.0037711202166974545, -0.003564049955457449, -0.0033569794613868, -0.0031499089673161507, -0.0029428384732455015, -0.0027357679791748524, -0.002528697717934847, -0.0023216274566948414, -0.0021145569626241922, -0.001907486584968865, -0.0017004162073135376, -0.0014933458296582103, -0.001286275452002883, -0.0010792050743475556, -0.0008721346966922283, -0.000665064319036901, -0.0004579939413815737, -0.00025092356372624636, -4.385318607091904e-05, 0.00016321719158440828, 0.0003702875692397356, 0.0005773579468950629, 0.0007844283245503902, 0.0009914987022057176, 0.0011985690798610449, 0.0014056394575163722, 0.0016127098351716995, 0.0018197802128270268, 0.002026850590482354, 0.0022339210845530033, 0.002440991345793009, 0.0026480616070330143, 0.0028551321011036634, 0.0030622025951743126, 0.003269272856414318, 0.0034763431176543236, 0.0036834136117249727]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 4.0, 11.0, 14.0, 7.0, 24.0, 7.0, 10.0, 16.0, 26.0, 32.0, 23.0, 39.0, 33.0, 29.0, 31.0, 32.0, 55.0, 53.0, 36.0, 47.0, 46.0, 29.0, 41.0, 34.0, 32.0, 31.0, 38.0, 30.0, 39.0, 31.0, 22.0, 21.0, 17.0, 15.0, 12.0, 12.0, 5.0, 3.0, 2.0, 8.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0028635147027671337, -0.0027722229715436697, -0.0026809314731508493, -0.0025896397419273853, -0.002498348243534565, -0.002407056512311101, -0.002315764781087637, -0.0022244732826948166, -0.0021331815514713526, -0.0020418898202478886, -0.0019505983218550682, -0.0018593065906316042, -0.001768014975823462, -0.0016767233610153198, -0.0015854316297918558, -0.0014941400149837136, -0.0014028484001755714, -0.0013115567853674293, -0.001220265170559287, -0.001128973439335823, -0.0010376818245276809, -0.0009463902097195387, -0.0008550985367037356, -0.0007638068636879325, -0.0006725152488797903, -0.0005812236340716481, -0.000489931961055845, -0.0003986403171438724, -0.00030734867323189974, -0.0002160570293199271, -0.00012476538540795445, -3.3473712392151356e-05, 5.7817669585347176e-05, 0.00014910931349731982, 0.00024040095740929246, 0.0003316926013212651, 0.00042298424523323774, 0.0005142758600413799, 0.000605567533057183, 0.0006968592060729861, 0.0007881508208811283, 0.0008794424356892705, 0.0009707341087050736, 0.0010620257817208767, 0.0011533173965290189, 0.001244609011337161, 0.001335900742560625, 0.0014271923573687673, 0.0015184839721769094, 0.0016097755869850516, 0.0017010672017931938, 0.0017923589330166578, 0.0018836505478248, 0.001974942162632942, 0.002066233893856406, 0.0021575256250798702, 0.0022488171234726906, 0.0023401088546961546, 0.002431400353088975, 0.002522692084312439, 0.0026139835827052593, 0.0027052753139287233, 0.0027965670451521873, 0.0028878585435450077, 0.0029791502747684717]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 10.0, 7.0, 12.0, 24.0, 23.0, 39.0, 49.0, 74.0, 110.0, 184.0, 253.0, 438.0, 784.0, 1359.0, 2372.0, 4274.0, 7796.0, 15812.0, 34622.0, 86566.0, 280484.0, 407329.0, 119037.0, 45513.0, 20120.0, 9716.0, 4902.0, 2722.0, 1560.0, 878.0, 531.0, 313.0, 197.0, 146.0, 95.0, 72.0, 43.0, 30.0, 24.0, 7.0, 10.0, 4.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0082855224609375, -0.00801074504852295, -0.0077359676361083984, -0.007461190223693848, -0.007186412811279297, -0.006911635398864746, -0.006636857986450195, -0.0063620805740356445, -0.006087303161621094, -0.005812525749206543, -0.005537748336791992, -0.005262970924377441, -0.004988193511962891, -0.00471341609954834, -0.004438638687133789, -0.004163861274719238, -0.0038890838623046875, -0.0036143064498901367, -0.003339529037475586, -0.003064751625061035, -0.0027899742126464844, -0.0025151968002319336, -0.002240419387817383, -0.001965641975402832, -0.0016908645629882812, -0.0014160871505737305, -0.0011413097381591797, -0.0008665323257446289, -0.0005917549133300781, -0.00031697750091552734, -4.220008850097656e-05, 0.00023257732391357422, 0.000507354736328125, 0.0007821321487426758, 0.0010569095611572266, 0.0013316869735717773, 0.0016064643859863281, 0.001881241798400879, 0.0021560192108154297, 0.0024307966232299805, 0.0027055740356445312, 0.002980351448059082, 0.003255128860473633, 0.0035299062728881836, 0.0038046836853027344, 0.004079461097717285, 0.004354238510131836, 0.004629015922546387, 0.0049037933349609375, 0.005178570747375488, 0.005453348159790039, 0.00572812557220459, 0.006002902984619141, 0.006277680397033691, 0.006552457809448242, 0.006827235221862793, 0.007102012634277344, 0.0073767900466918945, 0.007651567459106445, 0.007926344871520996, 0.008201122283935547, 0.008475899696350098, 0.008750677108764648, 0.0090254545211792, 0.00930023193359375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 6.0, 9.0, 12.0, 12.0, 15.0, 12.0, 19.0, 31.0, 24.0, 31.0, 33.0, 41.0, 34.0, 38.0, 48.0, 51.0, 52.0, 51.0, 52.0, 44.0, 41.0, 34.0, 40.0, 44.0, 34.0, 38.0, 28.0, 25.0, 13.0, 19.0, 18.0, 13.0, 12.0, 6.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027675628662109375, -0.00266951322555542, -0.0025714635848999023, -0.0024734139442443848, -0.002375364303588867, -0.0022773146629333496, -0.002179265022277832, -0.0020812153816223145, -0.001983165740966797, -0.0018851161003112793, -0.0017870664596557617, -0.0016890168190002441, -0.0015909671783447266, -0.001492917537689209, -0.0013948678970336914, -0.0012968182563781738, -0.0011987686157226562, -0.0011007189750671387, -0.001002669334411621, -0.0009046196937561035, -0.0008065700531005859, -0.0007085204124450684, -0.0006104707717895508, -0.0005124211311340332, -0.0004143714904785156, -0.00031632184982299805, -0.00021827220916748047, -0.00012022256851196289, -2.2172927856445312e-05, 7.587671279907227e-05, 0.00017392635345458984, 0.0002719759941101074, 0.000370025634765625, 0.0004680752754211426, 0.0005661249160766602, 0.0006641745567321777, 0.0007622241973876953, 0.0008602738380432129, 0.0009583234786987305, 0.001056373119354248, 0.0011544227600097656, 0.0012524724006652832, 0.0013505220413208008, 0.0014485716819763184, 0.001546621322631836, 0.0016446709632873535, 0.001742720603942871, 0.0018407702445983887, 0.0019388198852539062, 0.002036869525909424, 0.0021349191665649414, 0.002232968807220459, 0.0023310184478759766, 0.002429068088531494, 0.0025271177291870117, 0.0026251673698425293, 0.002723217010498047, 0.0028212666511535645, 0.002919316291809082, 0.0030173659324645996, 0.003115415573120117, 0.0032134652137756348, 0.0033115148544311523, 0.00340956449508667, 0.0035076141357421875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 7.0, 3.0, 7.0, 12.0, 9.0, 15.0, 11.0, 26.0, 33.0, 44.0, 85.0, 111.0, 174.0, 314.0, 490.0, 948.0, 1911.0, 3935.0, 9848.0, 32608.0, 271257.0, 658199.0, 46356.0, 12617.0, 4673.0, 2195.0, 1137.0, 598.0, 315.0, 204.0, 147.0, 92.0, 47.0, 25.0, 23.0, 22.0, 21.0, 14.0, 8.0, 2.0, 5.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.01493072509765625, -0.014479875564575195, -0.01402902603149414, -0.013578176498413086, -0.013127326965332031, -0.012676477432250977, -0.012225627899169922, -0.011774778366088867, -0.011323928833007812, -0.010873079299926758, -0.010422229766845703, -0.009971380233764648, -0.009520530700683594, -0.009069681167602539, -0.008618831634521484, -0.00816798210144043, -0.007717132568359375, -0.00726628303527832, -0.006815433502197266, -0.006364583969116211, -0.005913734436035156, -0.0054628849029541016, -0.005012035369873047, -0.004561185836791992, -0.0041103363037109375, -0.003659486770629883, -0.003208637237548828, -0.0027577877044677734, -0.0023069381713867188, -0.001856088638305664, -0.0014052391052246094, -0.0009543895721435547, -0.0005035400390625, -5.269050598144531e-05, 0.0003981590270996094, 0.0008490085601806641, 0.0012998580932617188, 0.0017507076263427734, 0.002201557159423828, 0.002652406692504883, 0.0031032562255859375, 0.003554105758666992, 0.004004955291748047, 0.0044558048248291016, 0.004906654357910156, 0.005357503890991211, 0.005808353424072266, 0.00625920295715332, 0.006710052490234375, 0.00716090202331543, 0.007611751556396484, 0.008062601089477539, 0.008513450622558594, 0.008964300155639648, 0.009415149688720703, 0.009865999221801758, 0.010316848754882812, 0.010767698287963867, 0.011218547821044922, 0.011669397354125977, 0.012120246887207031, 0.012571096420288086, 0.01302194595336914, 0.013472795486450195, 0.01392364501953125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 1.0, 2.0, 4.0, 8.0, 18.0, 14.0, 22.0, 20.0, 24.0, 22.0, 20.0, 25.0, 40.0, 41.0, 30.0, 37.0, 26.0, 52.0, 42.0, 42.0, 53.0, 38.0, 41.0, 47.0, 34.0, 40.0, 32.0, 46.0, 23.0, 16.0, 26.0, 23.0, 20.0, 17.0, 20.0, 11.0, 4.0, 5.0, 7.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.0022373199462890625, -0.0021764934062957764, -0.0021156668663024902, -0.002054840326309204, -0.001994013786315918, -0.0019331872463226318, -0.0018723607063293457, -0.0018115341663360596, -0.0017507076263427734, -0.0016898810863494873, -0.0016290545463562012, -0.001568228006362915, -0.001507401466369629, -0.0014465749263763428, -0.0013857483863830566, -0.0013249218463897705, -0.0012640953063964844, -0.0012032687664031982, -0.0011424422264099121, -0.001081615686416626, -0.0010207891464233398, -0.0009599626064300537, -0.0008991360664367676, -0.0008383095264434814, -0.0007774829864501953, -0.0007166564464569092, -0.000655829906463623, -0.0005950033664703369, -0.0005341768264770508, -0.00047335028648376465, -0.0004125237464904785, -0.0003516972064971924, -0.00029087066650390625, -0.00023004412651062012, -0.00016921758651733398, -0.00010839104652404785, -4.756450653076172e-05, 1.3262033462524414e-05, 7.408857345581055e-05, 0.00013491511344909668, 0.0001957416534423828, 0.00025656819343566895, 0.0003173947334289551, 0.0003782212734222412, 0.00043904781341552734, 0.0004998743534088135, 0.0005607008934020996, 0.0006215274333953857, 0.0006823539733886719, 0.000743180513381958, 0.0008040070533752441, 0.0008648335933685303, 0.0009256601333618164, 0.0009864866733551025, 0.0010473132133483887, 0.0011081397533416748, 0.001168966293334961, 0.001229792833328247, 0.0012906193733215332, 0.0013514459133148193, 0.0014122724533081055, 0.0014730989933013916, 0.0015339255332946777, 0.0015947520732879639, 0.00165557861328125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 6.0, 2.0, 4.0, 4.0, 6.0, 6.0, 9.0, 10.0, 10.0, 19.0, 24.0, 34.0, 30.0, 60.0, 82.0, 118.0, 188.0, 238.0, 402.0, 679.0, 1096.0, 2141.0, 4577.0, 12796.0, 61501.0, 859038.0, 80255.0, 14730.0, 5043.0, 2206.0, 1255.0, 670.0, 425.0, 276.0, 160.0, 123.0, 88.0, 68.0, 35.0, 38.0, 24.0, 17.0, 15.0, 15.0, 15.0, 5.0, 6.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.017425537109375, -0.01687335968017578, -0.016321182250976562, -0.015769004821777344, -0.015216827392578125, -0.014664649963378906, -0.014112472534179688, -0.013560295104980469, -0.01300811767578125, -0.012455940246582031, -0.011903762817382812, -0.011351585388183594, -0.010799407958984375, -0.010247230529785156, -0.009695053100585938, -0.009142875671386719, -0.0085906982421875, -0.008038520812988281, -0.0074863433837890625, -0.006934165954589844, -0.006381988525390625, -0.005829811096191406, -0.0052776336669921875, -0.004725456237792969, -0.00417327880859375, -0.0036211013793945312, -0.0030689239501953125, -0.0025167465209960938, -0.001964569091796875, -0.0014123916625976562, -0.0008602142333984375, -0.00030803680419921875, 0.000244140625, 0.0007963180541992188, 0.0013484954833984375, 0.0019006729125976562, 0.002452850341796875, 0.0030050277709960938, 0.0035572052001953125, 0.004109382629394531, 0.00466156005859375, 0.005213737487792969, 0.0057659149169921875, 0.006318092346191406, 0.006870269775390625, 0.007422447204589844, 0.007974624633789062, 0.008526802062988281, 0.0090789794921875, 0.009631156921386719, 0.010183334350585938, 0.010735511779785156, 0.011287689208984375, 0.011839866638183594, 0.012392044067382812, 0.012944221496582031, 0.01349639892578125, 0.014048576354980469, 0.014600753784179688, 0.015152931213378906, 0.015705108642578125, 0.016257286071777344, 0.016809463500976562, 0.01736164093017578, 0.017913818359375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 6.0, 7.0, 6.0, 7.0, 12.0, 20.0, 25.0, 28.0, 51.0, 62.0, 78.0, 137.0, 208.0, 87.0, 62.0, 45.0, 40.0, 31.0, 13.0, 10.0, 17.0, 9.0, 5.0, 8.0, 8.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.092123031616211e-05, -2.0308420062065125e-05, -1.969560980796814e-05, -1.9082799553871155e-05, -1.846998929977417e-05, -1.7857179045677185e-05, -1.72443687915802e-05, -1.6631558537483215e-05, -1.601874828338623e-05, -1.5405938029289246e-05, -1.479312777519226e-05, -1.4180317521095276e-05, -1.3567507266998291e-05, -1.2954697012901306e-05, -1.2341886758804321e-05, -1.1729076504707336e-05, -1.1116266250610352e-05, -1.0503455996513367e-05, -9.890645742416382e-06, -9.277835488319397e-06, -8.665025234222412e-06, -8.052214980125427e-06, -7.439404726028442e-06, -6.8265944719314575e-06, -6.213784217834473e-06, -5.600973963737488e-06, -4.988163709640503e-06, -4.375353455543518e-06, -3.762543201446533e-06, -3.1497329473495483e-06, -2.5369226932525635e-06, -1.9241124391555786e-06, -1.3113021850585938e-06, -6.984919309616089e-07, -8.568167686462402e-08, 5.271285772323608e-07, 1.1399388313293457e-06, 1.7527490854263306e-06, 2.3655593395233154e-06, 2.9783695936203003e-06, 3.591179847717285e-06, 4.20399010181427e-06, 4.816800355911255e-06, 5.42961061000824e-06, 6.042420864105225e-06, 6.6552311182022095e-06, 7.268041372299194e-06, 7.88085162639618e-06, 8.493661880493164e-06, 9.106472134590149e-06, 9.719282388687134e-06, 1.0332092642784119e-05, 1.0944902896881104e-05, 1.1557713150978088e-05, 1.2170523405075073e-05, 1.2783333659172058e-05, 1.3396143913269043e-05, 1.4008954167366028e-05, 1.4621764421463013e-05, 1.5234574675559998e-05, 1.5847384929656982e-05, 1.6460195183753967e-05, 1.7073005437850952e-05, 1.7685815691947937e-05, 1.8298625946044922e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 9.0, 10.0, 16.0, 18.0, 49.0, 116.0, 278.0, 713.0, 2189.0, 8954.0, 105882.0, 904694.0, 19798.0, 3910.0, 1136.0, 443.0, 164.0, 75.0, 36.0, 18.0, 14.0, 7.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023529052734375, -0.02263164520263672, -0.021734237670898438, -0.020836830139160156, -0.019939422607421875, -0.019042015075683594, -0.018144607543945312, -0.01724720001220703, -0.01634979248046875, -0.015452384948730469, -0.014554977416992188, -0.013657569885253906, -0.012760162353515625, -0.011862754821777344, -0.010965347290039062, -0.010067939758300781, -0.0091705322265625, -0.008273124694824219, -0.0073757171630859375, -0.006478309631347656, -0.005580902099609375, -0.004683494567871094, -0.0037860870361328125, -0.0028886795043945312, -0.00199127197265625, -0.0010938644409179688, -0.0001964569091796875, 0.0007009506225585938, 0.001598358154296875, 0.0024957656860351562, 0.0033931732177734375, 0.004290580749511719, 0.00518798828125, 0.006085395812988281, 0.0069828033447265625, 0.007880210876464844, 0.008777618408203125, 0.009675025939941406, 0.010572433471679688, 0.011469841003417969, 0.01236724853515625, 0.013264656066894531, 0.014162063598632812, 0.015059471130371094, 0.015956878662109375, 0.016854286193847656, 0.017751693725585938, 0.01864910125732422, 0.0195465087890625, 0.02044391632080078, 0.021341323852539062, 0.022238731384277344, 0.023136138916015625, 0.024033546447753906, 0.024930953979492188, 0.02582836151123047, 0.02672576904296875, 0.02762317657470703, 0.028520584106445312, 0.029417991638183594, 0.030315399169921875, 0.031212806701660156, 0.03211021423339844, 0.03300762176513672, 0.033905029296875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 5.0, 3.0, 3.0, 4.0, 3.0, 10.0, 10.0, 14.0, 26.0, 36.0, 78.0, 103.0, 247.0, 182.0, 93.0, 55.0, 45.0, 21.0, 18.0, 7.0, 8.0, 5.0, 6.0, 3.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0026035308837890625, -0.002534627914428711, -0.0024657249450683594, -0.002396821975708008, -0.0023279190063476562, -0.0022590160369873047, -0.002190113067626953, -0.0021212100982666016, -0.00205230712890625, -0.0019834041595458984, -0.0019145011901855469, -0.0018455982208251953, -0.0017766952514648438, -0.0017077922821044922, -0.0016388893127441406, -0.001569986343383789, -0.0015010833740234375, -0.001432180404663086, -0.0013632774353027344, -0.0012943744659423828, -0.0012254714965820312, -0.0011565685272216797, -0.0010876655578613281, -0.0010187625885009766, -0.000949859619140625, -0.0008809566497802734, -0.0008120536804199219, -0.0007431507110595703, -0.0006742477416992188, -0.0006053447723388672, -0.0005364418029785156, -0.00046753883361816406, -0.0003986358642578125, -0.00032973289489746094, -0.0002608299255371094, -0.0001919269561767578, -0.00012302398681640625, -5.412101745605469e-05, 1.4781951904296875e-05, 8.368492126464844e-05, 0.000152587890625, 0.00022149085998535156, 0.0002903938293457031, 0.0003592967987060547, 0.00042819976806640625, 0.0004971027374267578, 0.0005660057067871094, 0.0006349086761474609, 0.0007038116455078125, 0.0007727146148681641, 0.0008416175842285156, 0.0009105205535888672, 0.0009794235229492188, 0.0010483264923095703, 0.0011172294616699219, 0.0011861324310302734, 0.001255035400390625, 0.0013239383697509766, 0.0013928413391113281, 0.0014617443084716797, 0.0015306472778320312, 0.0015995502471923828, 0.0016684532165527344, 0.001737356185913086, 0.0018062591552734375]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 4.0, 5.0, 9.0, 7.0, 6.0, 8.0, 16.0, 22.0, 27.0, 31.0, 44.0, 58.0, 73.0, 128.0, 140.0, 141.0, 76.0, 60.0, 34.0, 24.0, 20.0, 13.0, 14.0, 8.0, 4.0, 3.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.005680849310010672, -0.0055295974016189575, -0.005378345027565956, -0.005227093119174242, -0.005075841210782528, -0.0049245888367295265, -0.004773336928337812, -0.004622085019946098, -0.004470832645893097, -0.004319580737501383, -0.004168328363448381, -0.004017076455056667, -0.0038658245466649532, -0.0037145724054425955, -0.0035633202642202377, -0.0034120683558285236, -0.0032608164474368095, -0.003109564306214452, -0.0029583123978227377, -0.00280706025660038, -0.002655808348208666, -0.002504556206986308, -0.0023533040657639503, -0.0022020521573722363, -0.0020508000161498785, -0.0018995479913428426, -0.0017482959665358067, -0.001597043825313449, -0.001445791800506413, -0.001294539775699377, -0.0011432876344770193, -0.0009920356096699834, -0.0008407831192016602, -0.0006895310943946242, -0.0005382790113799274, -0.000387026957469061, -0.00023577490355819464, -8.452287875115871e-05, 6.672920426353812e-05, 0.00021798128727823496, 0.0003692333120852709, 0.0005204853368923068, 0.0006717374199070036, 0.0008229895029217005, 0.0009742415277287364, 0.0011254935525357723, 0.00127674569375813, 0.001427997718565166, 0.001579249743372202, 0.0017305017681792378, 0.0018817537929862738, 0.0020330059342086315, 0.0021842578426003456, 0.0023355099838227034, 0.002486762125045061, 0.002638014033436775, 0.002789266174659133, 0.0029405183158814907, 0.003091770224273205, 0.0032430223654955626, 0.0033942745067179203, 0.0035455264151096344, 0.003696778556331992, 0.00384803069755435, 0.003999282605946064]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 7.0, 6.0, 7.0, 3.0, 11.0, 16.0, 12.0, 13.0, 14.0, 14.0, 15.0, 28.0, 27.0, 33.0, 19.0, 49.0, 41.0, 29.0, 37.0, 38.0, 40.0, 49.0, 28.0, 41.0, 25.0, 35.0, 31.0, 47.0, 47.0, 32.0, 28.0, 26.0, 29.0, 24.0, 17.0, 12.0, 17.0, 15.0, 17.0, 3.0, 3.0, 5.0, 8.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0022868276573717594, -0.0022104852832853794, -0.002134143142029643, -0.002057800767943263, -0.0019814586266875267, -0.0019051162526011467, -0.0018287739949300885, -0.0017524317372590303, -0.0016760894795879722, -0.001599747221916914, -0.0015234049642458558, -0.0014470627065747976, -0.0013707203324884176, -0.0012943781912326813, -0.0012180358171463013, -0.001141693559475243, -0.001065351301804185, -0.0009890090441331267, -0.0009126667864620686, -0.0008363244705833495, -0.0007599822129122913, -0.0006836399552412331, -0.000607297639362514, -0.0005309553816914558, -0.00045461312402039766, -0.0003782708663493395, -0.00030192857957445085, -0.00022558630735147744, -0.00014924403512850404, -7.290177745744586e-05, 3.4405093174427748e-06, 7.978279609233141e-05, 0.00015612528659403324, 0.00023246755881700665, 0.00030880983103998005, 0.0003851521178148687, 0.00046149437548592687, 0.000537836633156985, 0.0006141789490357041, 0.0006905212067067623, 0.0007668634643778205, 0.0008432057220488787, 0.0009195479797199368, 0.000995890237390995, 0.001072232611477375, 0.0011485747527331114, 0.0012249171268194914, 0.0013012593844905496, 0.0013776016421616077, 0.001453943899832666, 0.001530286157503724, 0.0016066284151747823, 0.0016829706728458405, 0.0017593130469322205, 0.0018356553046032786, 0.0019119975622743368, 0.001988339703530073, 0.002064682077616453, 0.0021410242188721895, 0.0022173665929585695, 0.002293708734214306, 0.002370051108300686, 0.0024463932495564222, 0.0025227356236428022, 0.0025990779977291822]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 2.0, 11.0, 8.0, 10.0, 11.0, 17.0, 32.0, 26.0, 48.0, 119.0, 121.0, 226.0, 339.0, 452.0, 720.0, 1209.0, 1924.0, 3118.0, 4944.0, 8083.0, 13072.0, 21854.0, 37331.0, 67257.0, 134149.0, 289494.0, 227550.0, 103494.0, 54548.0, 31100.0, 18032.0, 11097.0, 6768.0, 4230.0, 2623.0, 1601.0, 1054.0, 641.0, 421.0, 266.0, 189.0, 110.0, 89.0, 58.0, 47.0, 22.0, 23.0, 9.0, 5.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.005107879638671875, -0.004936635494232178, -0.0047653913497924805, -0.004594147205352783, -0.004422903060913086, -0.004251658916473389, -0.004080414772033691, -0.003909170627593994, -0.003737926483154297, -0.0035666823387145996, -0.0033954381942749023, -0.003224194049835205, -0.003052949905395508, -0.0028817057609558105, -0.0027104616165161133, -0.002539217472076416, -0.0023679733276367188, -0.0021967291831970215, -0.0020254850387573242, -0.001854240894317627, -0.0016829967498779297, -0.0015117526054382324, -0.0013405084609985352, -0.0011692643165588379, -0.0009980201721191406, -0.0008267760276794434, -0.0006555318832397461, -0.00048428773880004883, -0.00031304359436035156, -0.0001417994499206543, 2.944469451904297e-05, 0.00020068883895874023, 0.0003719329833984375, 0.0005431771278381348, 0.000714421272277832, 0.0008856654167175293, 0.0010569095611572266, 0.0012281537055969238, 0.001399397850036621, 0.0015706419944763184, 0.0017418861389160156, 0.0019131302833557129, 0.00208437442779541, 0.0022556185722351074, 0.0024268627166748047, 0.002598106861114502, 0.0027693510055541992, 0.0029405951499938965, 0.0031118392944335938, 0.003283083438873291, 0.0034543275833129883, 0.0036255717277526855, 0.003796815872192383, 0.00396806001663208, 0.004139304161071777, 0.004310548305511475, 0.004481792449951172, 0.004653036594390869, 0.004824280738830566, 0.004995524883270264, 0.005166769027709961, 0.005338013172149658, 0.0055092573165893555, 0.005680501461029053, 0.00585174560546875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 14.0, 10.0, 15.0, 16.0, 23.0, 8.0, 23.0, 17.0, 30.0, 34.0, 28.0, 25.0, 39.0, 48.0, 41.0, 42.0, 41.0, 44.0, 50.0, 51.0, 41.0, 41.0, 34.0, 42.0, 32.0, 32.0, 29.0, 20.0, 22.0, 19.0, 17.0, 10.0, 17.0, 7.0, 9.0, 6.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0012645721435546875, -0.0012200921773910522, -0.001175612211227417, -0.0011311322450637817, -0.0010866522789001465, -0.0010421723127365112, -0.000997692346572876, -0.0009532123804092407, -0.0009087324142456055, -0.0008642524480819702, -0.000819772481918335, -0.0007752925157546997, -0.0007308125495910645, -0.0006863325834274292, -0.0006418526172637939, -0.0005973726511001587, -0.0005528926849365234, -0.0005084127187728882, -0.00046393275260925293, -0.0004194527864456177, -0.0003749728202819824, -0.00033049285411834717, -0.0002860128879547119, -0.00024153292179107666, -0.0001970529556274414, -0.00015257298946380615, -0.0001080930233001709, -6.361305713653564e-05, -1.913309097290039e-05, 2.5346875190734863e-05, 6.982684135437012e-05, 0.00011430680751800537, 0.00015878677368164062, 0.00020326673984527588, 0.00024774670600891113, 0.0002922266721725464, 0.00033670663833618164, 0.0003811866044998169, 0.00042566657066345215, 0.0004701465368270874, 0.0005146265029907227, 0.0005591064691543579, 0.0006035864353179932, 0.0006480664014816284, 0.0006925463676452637, 0.0007370263338088989, 0.0007815062999725342, 0.0008259862661361694, 0.0008704662322998047, 0.0009149461984634399, 0.0009594261646270752, 0.0010039061307907104, 0.0010483860969543457, 0.001092866063117981, 0.0011373460292816162, 0.0011818259954452515, 0.0012263059616088867, 0.001270785927772522, 0.0013152658939361572, 0.0013597458600997925, 0.0014042258262634277, 0.001448705792427063, 0.0014931857585906982, 0.0015376657247543335, 0.0015821456909179688]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 12.0, 14.0, 23.0, 22.0, 37.0, 50.0, 73.0, 113.0, 161.0, 245.0, 373.0, 548.0, 876.0, 1384.0, 2154.0, 3412.0, 5509.0, 8856.0, 14523.0, 24405.0, 44018.0, 84395.0, 183703.0, 332346.0, 164617.0, 77367.0, 40714.0, 22772.0, 13578.0, 8148.0, 5134.0, 3211.0, 2005.0, 1301.0, 823.0, 562.0, 346.0, 232.0, 165.0, 106.0, 79.0, 50.0, 35.0, 19.0, 16.0, 7.0, 6.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.00440216064453125, -0.004270493984222412, -0.004138827323913574, -0.004007160663604736, -0.0038754940032958984, -0.0037438273429870605, -0.0036121606826782227, -0.0034804940223693848, -0.003348827362060547, -0.003217160701751709, -0.003085494041442871, -0.002953827381134033, -0.0028221607208251953, -0.0026904940605163574, -0.0025588274002075195, -0.0024271607398986816, -0.0022954940795898438, -0.002163827419281006, -0.002032160758972168, -0.00190049409866333, -0.0017688274383544922, -0.0016371607780456543, -0.0015054941177368164, -0.0013738274574279785, -0.0012421607971191406, -0.0011104941368103027, -0.0009788274765014648, -0.000847160816192627, -0.0007154941558837891, -0.0005838274955749512, -0.0004521608352661133, -0.0003204941749572754, -0.0001888275146484375, -5.716085433959961e-05, 7.450580596923828e-05, 0.00020617246627807617, 0.00033783912658691406, 0.00046950578689575195, 0.0006011724472045898, 0.0007328391075134277, 0.0008645057678222656, 0.0009961724281311035, 0.0011278390884399414, 0.0012595057487487793, 0.0013911724090576172, 0.001522839069366455, 0.001654505729675293, 0.0017861723899841309, 0.0019178390502929688, 0.0020495057106018066, 0.0021811723709106445, 0.0023128390312194824, 0.0024445056915283203, 0.002576172351837158, 0.002707839012145996, 0.002839505672454834, 0.002971172332763672, 0.0031028389930725098, 0.0032345056533813477, 0.0033661723136901855, 0.0034978389739990234, 0.0036295056343078613, 0.0037611722946166992, 0.003892838954925537, 0.004024505615234375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 2.0, 6.0, 4.0, 6.0, 7.0, 9.0, 14.0, 16.0, 15.0, 19.0, 27.0, 21.0, 21.0, 20.0, 26.0, 33.0, 37.0, 23.0, 33.0, 33.0, 31.0, 43.0, 36.0, 46.0, 36.0, 39.0, 24.0, 34.0, 33.0, 36.0, 40.0, 27.0, 20.0, 26.0, 30.0, 14.0, 19.0, 15.0, 7.0, 9.0, 11.0, 15.0, 7.0, 4.0, 10.0, 6.0, 8.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010662078857421875, -0.001030057668685913, -0.0009939074516296387, -0.0009577572345733643, -0.0009216070175170898, -0.0008854568004608154, -0.000849306583404541, -0.0008131563663482666, -0.0007770061492919922, -0.0007408559322357178, -0.0007047057151794434, -0.0006685554981231689, -0.0006324052810668945, -0.0005962550640106201, -0.0005601048469543457, -0.0005239546298980713, -0.0004878044128417969, -0.00045165419578552246, -0.00041550397872924805, -0.00037935376167297363, -0.0003432035446166992, -0.0003070533275604248, -0.0002709031105041504, -0.00023475289344787598, -0.00019860267639160156, -0.00016245245933532715, -0.00012630224227905273, -9.015202522277832e-05, -5.4001808166503906e-05, -1.7851591110229492e-05, 1.8298625946044922e-05, 5.4448843002319336e-05, 9.059906005859375e-05, 0.00012674927711486816, 0.00016289949417114258, 0.000199049711227417, 0.0002351999282836914, 0.0002713501453399658, 0.00030750036239624023, 0.00034365057945251465, 0.00037980079650878906, 0.0004159510135650635, 0.0004521012306213379, 0.0004882514476776123, 0.0005244016647338867, 0.0005605518817901611, 0.0005967020988464355, 0.00063285231590271, 0.0006690025329589844, 0.0007051527500152588, 0.0007413029670715332, 0.0007774531841278076, 0.000813603401184082, 0.0008497536182403564, 0.0008859038352966309, 0.0009220540523529053, 0.0009582042694091797, 0.000994354486465454, 0.0010305047035217285, 0.001066654920578003, 0.0011028051376342773, 0.0011389553546905518, 0.0011751055717468262, 0.0012112557888031006, 0.001247406005859375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 6.0, 9.0, 16.0, 17.0, 18.0, 40.0, 74.0, 110.0, 157.0, 285.0, 513.0, 1030.0, 2315.0, 6047.0, 20839.0, 185017.0, 778787.0, 37961.0, 9144.0, 3116.0, 1440.0, 679.0, 384.0, 221.0, 105.0, 67.0, 53.0, 31.0, 16.0, 21.0, 13.0, 3.0, 3.0, 6.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005421638488769531, -0.0005275830626487732, -0.0005130022764205933, -0.0004984214901924133, -0.0004838407039642334, -0.00046925991773605347, -0.00045467913150787354, -0.0004400983452796936, -0.00042551755905151367, -0.00041093677282333374, -0.0003963559865951538, -0.0003817752003669739, -0.00036719441413879395, -0.000352613627910614, -0.0003380328416824341, -0.00032345205545425415, -0.0003088712692260742, -0.0002942904829978943, -0.00027970969676971436, -0.0002651289105415344, -0.0002505481243133545, -0.00023596733808517456, -0.00022138655185699463, -0.0002068057656288147, -0.00019222497940063477, -0.00017764419317245483, -0.0001630634069442749, -0.00014848262071609497, -0.00013390183448791504, -0.00011932104825973511, -0.00010474026203155518, -9.015947580337524e-05, -7.557868957519531e-05, -6.099790334701538e-05, -4.641711711883545e-05, -3.183633089065552e-05, -1.7255544662475586e-05, -2.6747584342956543e-06, 1.1906027793884277e-05, 2.648681402206421e-05, 4.106760025024414e-05, 5.564838647842407e-05, 7.0229172706604e-05, 8.480995893478394e-05, 9.939074516296387e-05, 0.0001139715313911438, 0.00012855231761932373, 0.00014313310384750366, 0.0001577138900756836, 0.00017229467630386353, 0.00018687546253204346, 0.0002014562487602234, 0.00021603703498840332, 0.00023061782121658325, 0.0002451986074447632, 0.0002597793936729431, 0.00027436017990112305, 0.000288940966129303, 0.0003035217523574829, 0.00031810253858566284, 0.0003326833248138428, 0.0003472641110420227, 0.00036184489727020264, 0.00037642568349838257, 0.0003910064697265625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 8.0, 15.0, 13.0, 20.0, 26.0, 64.0, 52.0, 87.0, 108.0, 199.0, 118.0, 65.0, 66.0, 46.0, 36.0, 17.0, 16.0, 22.0, 4.0, 3.0, 5.0, 5.0, 1.0, 1.0, 0.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.887580871582031e-06, -4.753470420837402e-06, -4.6193599700927734e-06, -4.4852495193481445e-06, -4.351139068603516e-06, -4.217028617858887e-06, -4.082918167114258e-06, -3.948807716369629e-06, -3.814697265625e-06, -3.680586814880371e-06, -3.546476364135742e-06, -3.4123659133911133e-06, -3.2782554626464844e-06, -3.1441450119018555e-06, -3.0100345611572266e-06, -2.8759241104125977e-06, -2.7418136596679688e-06, -2.60770320892334e-06, -2.473592758178711e-06, -2.339482307434082e-06, -2.205371856689453e-06, -2.0712614059448242e-06, -1.9371509552001953e-06, -1.8030405044555664e-06, -1.6689300537109375e-06, -1.5348196029663086e-06, -1.4007091522216797e-06, -1.2665987014770508e-06, -1.1324882507324219e-06, -9.98377799987793e-07, -8.642673492431641e-07, -7.301568984985352e-07, -5.960464477539062e-07, -4.6193599700927734e-07, -3.2782554626464844e-07, -1.9371509552001953e-07, -5.960464477539063e-08, 7.450580596923828e-08, 2.086162567138672e-07, 3.427267074584961e-07, 4.76837158203125e-07, 6.109476089477539e-07, 7.450580596923828e-07, 8.791685104370117e-07, 1.0132789611816406e-06, 1.1473894119262695e-06, 1.2814998626708984e-06, 1.4156103134155273e-06, 1.5497207641601562e-06, 1.6838312149047852e-06, 1.817941665649414e-06, 1.952052116394043e-06, 2.086162567138672e-06, 2.2202730178833008e-06, 2.3543834686279297e-06, 2.4884939193725586e-06, 2.6226043701171875e-06, 2.7567148208618164e-06, 2.8908252716064453e-06, 3.0249357223510742e-06, 3.159046173095703e-06, 3.293156623840332e-06, 3.427267074584961e-06, 3.56137752532959e-06, 3.6954879760742188e-06]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 10.0, 22.0, 23.0, 38.0, 51.0, 83.0, 140.0, 205.0, 281.0, 480.0, 806.0, 1260.0, 2264.0, 4099.0, 7740.0, 16609.0, 45138.0, 197070.0, 616075.0, 100809.0, 29538.0, 12102.0, 5864.0, 3148.0, 1840.0, 1062.0, 644.0, 416.0, 242.0, 154.0, 110.0, 73.0, 54.0, 29.0, 21.0, 13.0, 12.0, 9.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00014483928680419922, -0.00014005973935127258, -0.00013528019189834595, -0.0001305006444454193, -0.00012572109699249268, -0.00012094154953956604, -0.0001161620020866394, -0.00011138245463371277, -0.00010660290718078613, -0.0001018233597278595, -9.704381227493286e-05, -9.226426482200623e-05, -8.748471736907959e-05, -8.270516991615295e-05, -7.792562246322632e-05, -7.314607501029968e-05, -6.836652755737305e-05, -6.358698010444641e-05, -5.8807432651519775e-05, -5.402788519859314e-05, -4.9248337745666504e-05, -4.446879029273987e-05, -3.968924283981323e-05, -3.49096953868866e-05, -3.013014793395996e-05, -2.5350600481033325e-05, -2.057105302810669e-05, -1.5791505575180054e-05, -1.1011958122253418e-05, -6.232410669326782e-06, -1.4528632164001465e-06, 3.3266842365264893e-06, 8.106231689453125e-06, 1.288577914237976e-05, 1.7665326595306396e-05, 2.2444874048233032e-05, 2.7224421501159668e-05, 3.2003968954086304e-05, 3.678351640701294e-05, 4.1563063859939575e-05, 4.634261131286621e-05, 5.112215876579285e-05, 5.590170621871948e-05, 6.068125367164612e-05, 6.546080112457275e-05, 7.024034857749939e-05, 7.501989603042603e-05, 7.979944348335266e-05, 8.45789909362793e-05, 8.935853838920593e-05, 9.413808584213257e-05, 9.89176332950592e-05, 0.00010369718074798584, 0.00010847672820091248, 0.00011325627565383911, 0.00011803582310676575, 0.00012281537055969238, 0.00012759491801261902, 0.00013237446546554565, 0.0001371540129184723, 0.00014193356037139893, 0.00014671310782432556, 0.0001514926552772522, 0.00015627220273017883, 0.00016105175018310547]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 6.0, 7.0, 8.0, 13.0, 17.0, 13.0, 26.0, 28.0, 59.0, 59.0, 86.0, 94.0, 119.0, 106.0, 60.0, 62.0, 52.0, 42.0, 28.0, 18.0, 18.0, 13.0, 8.0, 7.0, 3.0, 7.0, 3.0, 7.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.1365623474121094e-05, -4.012882709503174e-05, -3.889203071594238e-05, -3.765523433685303e-05, -3.641843795776367e-05, -3.5181641578674316e-05, -3.394484519958496e-05, -3.2708048820495605e-05, -3.147125244140625e-05, -3.0234456062316895e-05, -2.899765968322754e-05, -2.7760863304138184e-05, -2.6524066925048828e-05, -2.5287270545959473e-05, -2.4050474166870117e-05, -2.2813677787780762e-05, -2.1576881408691406e-05, -2.034008502960205e-05, -1.9103288650512695e-05, -1.786649227142334e-05, -1.6629695892333984e-05, -1.539289951324463e-05, -1.4156103134155273e-05, -1.2919306755065918e-05, -1.1682510375976562e-05, -1.0445713996887207e-05, -9.208917617797852e-06, -7.972121238708496e-06, -6.735324859619141e-06, -5.498528480529785e-06, -4.26173210144043e-06, -3.0249357223510742e-06, -1.7881393432617188e-06, -5.513429641723633e-07, 6.854534149169922e-07, 1.9222497940063477e-06, 3.159046173095703e-06, 4.395842552185059e-06, 5.632638931274414e-06, 6.8694353103637695e-06, 8.106231689453125e-06, 9.34302806854248e-06, 1.0579824447631836e-05, 1.1816620826721191e-05, 1.3053417205810547e-05, 1.4290213584899902e-05, 1.5527009963989258e-05, 1.6763806343078613e-05, 1.800060272216797e-05, 1.9237399101257324e-05, 2.047419548034668e-05, 2.1710991859436035e-05, 2.294778823852539e-05, 2.4184584617614746e-05, 2.54213809967041e-05, 2.6658177375793457e-05, 2.7894973754882812e-05, 2.9131770133972168e-05, 3.0368566513061523e-05, 3.160536289215088e-05, 3.2842159271240234e-05, 3.407895565032959e-05, 3.5315752029418945e-05, 3.65525484085083e-05, 3.7789344787597656e-05]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 5.0, 8.0, 6.0, 10.0, 13.0, 18.0, 30.0, 36.0, 43.0, 93.0, 117.0, 156.0, 138.0, 81.0, 62.0, 47.0, 32.0, 23.0, 14.0, 13.0, 15.0, 9.0, 9.0, 6.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002863997593522072, -0.002764544216915965, -0.0026650908403098583, -0.0025656374637037516, -0.002466184087097645, -0.0023667304776608944, -0.0022672771010547876, -0.002167823724448681, -0.002068370347842574, -0.0019689169712364674, -0.0018694635946303606, -0.001770010101608932, -0.0016705567250028253, -0.0015711033483967185, -0.00147164985537529, -0.0013721964787691832, -0.0012727431021630764, -0.0011732897255569696, -0.0010738363489508629, -0.0009743828559294343, -0.0008749294793233275, -0.0007754761027172208, -0.0006760226679034531, -0.0005765692330896854, -0.0004771158564835787, -0.00037766245077364147, -0.00027820904506370425, -0.00017875563935376704, -7.930223364382982e-05, 2.0151142962276936e-05, 0.00011960457777604461, 0.00021905801258981228, 0.0003185116220265627, 0.0004179650277364999, 0.0005174184334464371, 0.0006168718682602048, 0.0007163252448663116, 0.0008157786214724183, 0.000915232056286186, 0.0010146854910999537, 0.0011141388677060604, 0.0012135922443121672, 0.001313045620918274, 0.0014124991139397025, 0.0015119524905458093, 0.001611405867151916, 0.0017108593601733446, 0.0018103127367794514, 0.0019097661133855581, 0.002009219489991665, 0.0021086728665977716, 0.0022081262432038784, 0.002307579852640629, 0.002407032996416092, 0.0025064866058528423, 0.002605939982458949, 0.002705393359065056, 0.0028048467356711626, 0.0029043001122772694, 0.003003753488883376, 0.003103206865489483, 0.0032026604749262333, 0.00330211385153234, 0.003401567228138447, 0.0035010206047445536]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 9.0, 5.0, 7.0, 24.0, 16.0, 17.0, 22.0, 20.0, 23.0, 26.0, 27.0, 48.0, 34.0, 35.0, 52.0, 45.0, 55.0, 47.0, 45.0, 43.0, 44.0, 37.0, 36.0, 38.0, 40.0, 27.0, 24.0, 31.0, 22.0, 20.0, 19.0, 13.0, 10.0, 12.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0016782114980742335, -0.0016249845502898097, -0.0015717576025053859, -0.0015185305383056402, -0.0014653035905212164, -0.0014120766427367926, -0.0013588496949523687, -0.001305622747167945, -0.0012523956829681993, -0.0011991687351837754, -0.0011459417873993516, -0.001092714723199606, -0.0010394877754151821, -0.0009862608276307583, -0.0009330338798463345, -0.0008798068738542497, -0.0008265799260698259, -0.0007733529782854021, -0.0007201259722933173, -0.0006668990245088935, -0.0006136720185168087, -0.0005604450707323849, -0.0005072180647403002, -0.00045399111695587635, -0.00040076414006762207, -0.0003475371631793678, -0.0002943101862911135, -0.00024108322395477444, -0.00018785624706652015, -0.0001346292847301811, -8.140230784192681e-05, -2.8175330953672528e-05, 2.5051645934581757e-05, 7.827862282283604e-05, 0.00013150559971109033, 0.00018473256204742938, 0.00023795953893568367, 0.0002911865012720227, 0.000344413478160277, 0.0003976404550485313, 0.0004508674319367856, 0.0005040944088250399, 0.0005573213566094637, 0.0006105483626015484, 0.0006637753103859723, 0.000717002316378057, 0.0007702292641624808, 0.0008234562119469047, 0.0008766832179389894, 0.0009299101657234132, 0.000983137171715498, 0.0010363641194999218, 0.0010895910672843456, 0.0011428180150687695, 0.0011960450792685151, 0.001249272027052939, 0.0013024989748373628, 0.0013557259226217866, 0.0014089528704062104, 0.001462179934605956, 0.00151540688239038, 0.0015686338301748037, 0.0016218607779592276, 0.0016750877257436514, 0.001728314789943397]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 8.0, 7.0, 14.0, 24.0, 33.0, 39.0, 45.0, 84.0, 114.0, 180.0, 290.0, 425.0, 604.0, 980.0, 1622.0, 2496.0, 4315.0, 7534.0, 13891.0, 28673.0, 105773.0, 3866606.0, 104085.0, 26878.0, 12820.0, 6709.0, 3917.0, 2198.0, 1354.0, 887.0, 537.0, 344.0, 250.0, 168.0, 109.0, 79.0, 54.0, 38.0, 32.0, 13.0, 16.0, 14.0, 6.0, 10.0, 1.0, 2.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0054779052734375, -0.005292177200317383, -0.005106449127197266, -0.0049207210540771484, -0.004734992980957031, -0.004549264907836914, -0.004363536834716797, -0.00417780876159668, -0.0039920806884765625, -0.0038063526153564453, -0.003620624542236328, -0.003434896469116211, -0.0032491683959960938, -0.0030634403228759766, -0.0028777122497558594, -0.002691984176635742, -0.002506256103515625, -0.002320528030395508, -0.0021347999572753906, -0.0019490718841552734, -0.0017633438110351562, -0.001577615737915039, -0.0013918876647949219, -0.0012061595916748047, -0.0010204315185546875, -0.0008347034454345703, -0.0006489753723144531, -0.00046324729919433594, -0.00027751922607421875, -9.179115295410156e-05, 9.393692016601562e-05, 0.0002796649932861328, 0.00046539306640625, 0.0006511211395263672, 0.0008368492126464844, 0.0010225772857666016, 0.0012083053588867188, 0.001394033432006836, 0.0015797615051269531, 0.0017654895782470703, 0.0019512176513671875, 0.0021369457244873047, 0.002322673797607422, 0.002508401870727539, 0.0026941299438476562, 0.0028798580169677734, 0.0030655860900878906, 0.003251314163208008, 0.003437042236328125, 0.003622770309448242, 0.0038084983825683594, 0.0039942264556884766, 0.004179954528808594, 0.004365682601928711, 0.004551410675048828, 0.004737138748168945, 0.0049228668212890625, 0.00510859489440918, 0.005294322967529297, 0.005480051040649414, 0.005665779113769531, 0.0058515071868896484, 0.006037235260009766, 0.006222963333129883, 0.00640869140625]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 8.0, 8.0, 6.0, 14.0, 19.0, 28.0, 19.0, 30.0, 33.0, 34.0, 38.0, 42.0, 32.0, 57.0, 51.0, 51.0, 43.0, 52.0, 56.0, 47.0, 38.0, 42.0, 35.0, 40.0, 29.0, 20.0, 18.0, 25.0, 22.0, 15.0, 10.0, 4.0, 3.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009517669677734375, -0.0009194314479827881, -0.0008870959281921387, -0.0008547604084014893, -0.0008224248886108398, -0.0007900893688201904, -0.000757753849029541, -0.0007254183292388916, -0.0006930828094482422, -0.0006607472896575928, -0.0006284117698669434, -0.0005960762500762939, -0.0005637407302856445, -0.0005314052104949951, -0.0004990696907043457, -0.0004667341709136963, -0.0004343986511230469, -0.00040206313133239746, -0.00036972761154174805, -0.00033739209175109863, -0.0003050565719604492, -0.0002727210521697998, -0.0002403855323791504, -0.00020805001258850098, -0.00017571449279785156, -0.00014337897300720215, -0.00011104345321655273, -7.870793342590332e-05, -4.6372413635253906e-05, -1.4036893844604492e-05, 1.8298625946044922e-05, 5.0634145736694336e-05, 8.296966552734375e-05, 0.00011530518531799316, 0.00014764070510864258, 0.000179976224899292, 0.0002123117446899414, 0.0002446472644805908, 0.00027698278427124023, 0.00030931830406188965, 0.00034165382385253906, 0.0003739893436431885, 0.0004063248634338379, 0.0004386603832244873, 0.0004709959030151367, 0.0005033314228057861, 0.0005356669425964355, 0.000568002462387085, 0.0006003379821777344, 0.0006326735019683838, 0.0006650090217590332, 0.0006973445415496826, 0.000729680061340332, 0.0007620155811309814, 0.0007943511009216309, 0.0008266866207122803, 0.0008590221405029297, 0.0008913576602935791, 0.0009236931800842285, 0.0009560286998748779, 0.0009883642196655273, 0.0010206997394561768, 0.0010530352592468262, 0.0010853707790374756, 0.001117706298828125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 4.0, 7.0, 16.0, 16.0, 22.0, 42.0, 44.0, 76.0, 105.0, 150.0, 209.0, 318.0, 441.0, 627.0, 956.0, 1429.0, 2068.0, 3269.0, 5178.0, 8798.0, 15975.0, 32033.0, 80225.0, 487766.0, 3298539.0, 154619.0, 48985.0, 21992.0, 11930.0, 6679.0, 4057.0, 2570.0, 1648.0, 1093.0, 721.0, 506.0, 335.0, 224.0, 188.0, 117.0, 89.0, 82.0, 40.0, 28.0, 18.0, 21.0, 14.0, 5.0, 8.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036640167236328125, -0.003542870283126831, -0.0034217238426208496, -0.003300577402114868, -0.0031794309616088867, -0.0030582845211029053, -0.002937138080596924, -0.0028159916400909424, -0.002694845199584961, -0.0025736987590789795, -0.002452552318572998, -0.0023314058780670166, -0.002210259437561035, -0.0020891129970550537, -0.0019679665565490723, -0.0018468201160430908, -0.0017256736755371094, -0.001604527235031128, -0.0014833807945251465, -0.001362234354019165, -0.0012410879135131836, -0.0011199414730072021, -0.0009987950325012207, -0.0008776485919952393, -0.0007565021514892578, -0.0006353557109832764, -0.0005142092704772949, -0.0003930628299713135, -0.00027191638946533203, -0.00015076994895935059, -2.962350845336914e-05, 9.15229320526123e-05, 0.00021266937255859375, 0.0003338158130645752, 0.00045496225357055664, 0.0005761086940765381, 0.0006972551345825195, 0.000818401575088501, 0.0009395480155944824, 0.0010606944561004639, 0.0011818408966064453, 0.0013029873371124268, 0.0014241337776184082, 0.0015452802181243896, 0.001666426658630371, 0.0017875730991363525, 0.001908719539642334, 0.0020298659801483154, 0.002151012420654297, 0.0022721588611602783, 0.0023933053016662598, 0.002514451742172241, 0.0026355981826782227, 0.002756744623184204, 0.0028778910636901855, 0.002999037504196167, 0.0031201839447021484, 0.00324133038520813, 0.0033624768257141113, 0.0034836232662200928, 0.0036047697067260742, 0.0037259161472320557, 0.003847062587738037, 0.0039682090282440186, 0.00408935546875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 5.0, 5.0, 1.0, 3.0, 5.0, 2.0, 3.0, 9.0, 9.0, 8.0, 9.0, 11.0, 10.0, 24.0, 24.0, 33.0, 45.0, 53.0, 107.0, 247.0, 601.0, 1850.0, 478.0, 176.0, 99.0, 53.0, 38.0, 41.0, 23.0, 21.0, 22.0, 11.0, 12.0, 10.0, 8.0, 8.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00106048583984375, -0.0010297074913978577, -0.0009989291429519653, -0.000968150794506073, -0.0009373724460601807, -0.0009065940976142883, -0.000875815749168396, -0.0008450374007225037, -0.0008142590522766113, -0.000783480703830719, -0.0007527023553848267, -0.0007219240069389343, -0.000691145658493042, -0.0006603673100471497, -0.0006295889616012573, -0.000598810613155365, -0.0005680322647094727, -0.0005372539162635803, -0.000506475567817688, -0.00047569721937179565, -0.0004449188709259033, -0.000414140522480011, -0.00038336217403411865, -0.0003525838255882263, -0.000321805477142334, -0.00029102712869644165, -0.0002602487802505493, -0.00022947043180465698, -0.00019869208335876465, -0.00016791373491287231, -0.00013713538646697998, -0.00010635703802108765, -7.557868957519531e-05, -4.480034112930298e-05, -1.4021992683410645e-05, 1.675635576248169e-05, 4.7534704208374023e-05, 7.831305265426636e-05, 0.00010909140110015869, 0.00013986974954605103, 0.00017064809799194336, 0.0002014264464378357, 0.00023220479488372803, 0.00026298314332962036, 0.0002937614917755127, 0.00032453984022140503, 0.00035531818866729736, 0.0003860965371131897, 0.00041687488555908203, 0.00044765323400497437, 0.0004784315824508667, 0.000509209930896759, 0.0005399882793426514, 0.0005707666277885437, 0.000601544976234436, 0.0006323233246803284, 0.0006631016731262207, 0.000693880021572113, 0.0007246583700180054, 0.0007554367184638977, 0.00078621506690979, 0.0008169934153556824, 0.0008477717638015747, 0.000878550112247467, 0.0009093284606933594]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 7.0, 2.0, 7.0, 7.0, 11.0, 10.0, 14.0, 18.0, 38.0, 49.0, 78.0, 94.0, 156.0, 141.0, 107.0, 74.0, 47.0, 41.0, 21.0, 27.0, 9.0, 12.0, 3.0, 6.0, 5.0, 10.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001782490755431354, -0.0017057457007467747, -0.0016290006460621953, -0.001552255591377616, -0.0014755104202777147, -0.0013987653655931354, -0.001322020310908556, -0.0012452751398086548, -0.0011685302015393972, -0.0010917851468548179, -0.0010150400921702385, -0.0009382949792779982, -0.0008615498663857579, -0.0007848048117011786, -0.0007080597570165992, -0.0006313146441243589, -0.0005545695312321186, -0.0004778244474437088, -0.00040107936365529895, -0.0003243343089707196, -0.00024758922518230975, -0.00017084414139389992, -9.409908670932055e-05, -1.735397381708026e-05, 5.939108086749911e-05, 0.00013613616465590894, 0.00021288123389240354, 0.00028962630312889814, 0.000366371386917308, 0.0004431164707057178, 0.0005198615253902972, 0.0005966066382825375, 0.000673351576551795, 0.0007500966312363744, 0.0008268417441286147, 0.000903586798813194, 0.0009803319117054343, 0.0010570769663900137, 0.001133822021074593, 0.0012105670757591724, 0.0012873122468590736, 0.001364057301543653, 0.0014408023562282324, 0.0015175475273281336, 0.001594292582012713, 0.0016710376366972923, 0.0017477826913818717, 0.001824527746066451, 0.0019012728007510304, 0.00197801785543561, 0.002054763026535511, 0.0021315079648047686, 0.0022082531359046698, 0.0022849980741739273, 0.0023617432452738285, 0.0024384884163737297, 0.0025152333546429873, 0.0025919785257428885, 0.002668723464012146, 0.002745468635112047, 0.0028222135733813047, 0.002898958744481206, 0.0029757036827504635, 0.0030524488538503647, 0.003129194024950266]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 4.0, 6.0, 7.0, 9.0, 11.0, 11.0, 11.0, 14.0, 17.0, 15.0, 21.0, 26.0, 24.0, 20.0, 26.0, 27.0, 29.0, 38.0, 32.0, 31.0, 44.0, 35.0, 38.0, 33.0, 31.0, 30.0, 30.0, 23.0, 31.0, 29.0, 33.0, 22.0, 18.0, 27.0, 27.0, 16.0, 24.0, 18.0, 11.0, 13.0, 9.0, 13.0, 10.0, 13.0, 5.0, 4.0, 7.0, 6.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0], "bins": [-0.0009247217676602304, -0.0008943264838308096, -0.0008639312582090497, -0.0008335359743796289, -0.000803140748757869, -0.0007727454649284482, -0.0007423502393066883, -0.0007119549554772675, -0.0006815596716478467, -0.0006511643878184259, -0.000620769162196666, -0.0005903738783672452, -0.0005599786527454853, -0.0005295833689160645, -0.0004991880850866437, -0.0004687928594648838, -0.0004383976338431239, -0.00040800237911753356, -0.0003776071243919432, -0.0003472118405625224, -0.0003168166149407625, -0.0002864213311113417, -0.00025602607638575137, -0.00022563082166016102, -0.00019523556693457067, -0.00016484031220898032, -0.00013444505748338997, -0.0001040497882058844, -7.365453348029405e-05, -4.32592787547037e-05, -1.2864009477198124e-05, 1.7531245248392224e-05, 4.792644176632166e-05, 7.832169649191201e-05, 0.00010871695849345997, 0.00013911222049500793, 0.00016950747522059828, 0.00019990272994618863, 0.0002302979992236942, 0.00026069325394928455, 0.0002910885086748749, 0.00032148376340046525, 0.0003518790181260556, 0.00038227427285164595, 0.00041266955668106675, 0.00044306478230282664, 0.00047346006613224745, 0.0005038552917540073, 0.0005342505755834281, 0.000564645859412849, 0.0005950410850346088, 0.0006254363688640296, 0.0006558315944857895, 0.0006862268783152103, 0.0007166221039369702, 0.000747017387766391, 0.0007774126715958118, 0.0008078079554252326, 0.0008382031810469925, 0.0008685984648764133, 0.0008989936904981732, 0.000929388974327594, 0.0009597842581570148, 0.0009901794837787747, 0.0010205747094005346]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 11.0, 8.0, 8.0, 21.0, 20.0, 17.0, 28.0, 49.0, 100.0, 147.0, 238.0, 433.0, 659.0, 1222.0, 2175.0, 4148.0, 8099.0, 16667.0, 35373.0, 84269.0, 249577.0, 422740.0, 126852.0, 50127.0, 22578.0, 11086.0, 5362.0, 2909.0, 1561.0, 845.0, 501.0, 274.0, 152.0, 84.0, 60.0, 44.0, 28.0, 11.0, 19.0, 9.0, 10.0, 6.0, 5.0, 6.0, 5.0, 5.0, 1.0, 4.0, 0.0, 2.0, 4.0], "bins": [-0.00304412841796875, -0.002955138683319092, -0.0028661489486694336, -0.0027771592140197754, -0.002688169479370117, -0.002599179744720459, -0.0025101900100708008, -0.0024212002754211426, -0.0023322105407714844, -0.002243220806121826, -0.002154231071472168, -0.0020652413368225098, -0.0019762516021728516, -0.0018872618675231934, -0.0017982721328735352, -0.001709282398223877, -0.0016202926635742188, -0.0015313029289245605, -0.0014423131942749023, -0.0013533234596252441, -0.001264333724975586, -0.0011753439903259277, -0.0010863542556762695, -0.0009973645210266113, -0.0009083747863769531, -0.0008193850517272949, -0.0007303953170776367, -0.0006414055824279785, -0.0005524158477783203, -0.0004634261131286621, -0.0003744363784790039, -0.0002854466438293457, -0.0001964569091796875, -0.0001074671745300293, -1.8477439880371094e-05, 7.051229476928711e-05, 0.0001595020294189453, 0.0002484917640686035, 0.0003374814987182617, 0.0004264712333679199, 0.0005154609680175781, 0.0006044507026672363, 0.0006934404373168945, 0.0007824301719665527, 0.0008714199066162109, 0.0009604096412658691, 0.0010493993759155273, 0.0011383891105651855, 0.0012273788452148438, 0.001316368579864502, 0.0014053583145141602, 0.0014943480491638184, 0.0015833377838134766, 0.0016723275184631348, 0.001761317253112793, 0.0018503069877624512, 0.0019392967224121094, 0.0020282864570617676, 0.0021172761917114258, 0.002206265926361084, 0.002295255661010742, 0.0023842453956604004, 0.0024732351303100586, 0.002562224864959717, 0.002651214599609375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 2.0, 1.0, 5.0, 7.0, 4.0, 4.0, 11.0, 10.0, 10.0, 14.0, 15.0, 15.0, 22.0, 30.0, 20.0, 30.0, 35.0, 36.0, 29.0, 48.0, 43.0, 49.0, 46.0, 44.0, 41.0, 30.0, 28.0, 32.0, 34.0, 45.0, 30.0, 28.0, 27.0, 20.0, 17.0, 25.0, 14.0, 11.0, 15.0, 9.0, 8.0, 15.0, 9.0, 7.0, 6.0, 5.0, 5.0, 4.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.0011653900146484375, -0.0011304020881652832, -0.001095414161682129, -0.0010604262351989746, -0.0010254383087158203, -0.000990450382232666, -0.0009554624557495117, -0.0009204745292663574, -0.0008854866027832031, -0.0008504986763000488, -0.0008155107498168945, -0.0007805228233337402, -0.0007455348968505859, -0.0007105469703674316, -0.0006755590438842773, -0.000640571117401123, -0.0006055831909179688, -0.0005705952644348145, -0.0005356073379516602, -0.0005006194114685059, -0.00046563148498535156, -0.00043064355850219727, -0.00039565563201904297, -0.00036066770553588867, -0.0003256797790527344, -0.0002906918525695801, -0.0002557039260864258, -0.00022071599960327148, -0.0001857280731201172, -0.0001507401466369629, -0.0001157522201538086, -8.07642936706543e-05, -4.57763671875e-05, -1.0788440704345703e-05, 2.4199485778808594e-05, 5.918741226196289e-05, 9.417533874511719e-05, 0.00012916326522827148, 0.00016415119171142578, 0.00019913911819458008, 0.00023412704467773438, 0.00026911497116088867, 0.00030410289764404297, 0.00033909082412719727, 0.00037407875061035156, 0.00040906667709350586, 0.00044405460357666016, 0.00047904253005981445, 0.0005140304565429688, 0.000549018383026123, 0.0005840063095092773, 0.0006189942359924316, 0.0006539821624755859, 0.0006889700889587402, 0.0007239580154418945, 0.0007589459419250488, 0.0007939338684082031, 0.0008289217948913574, 0.0008639097213745117, 0.000898897647857666, 0.0009338855743408203, 0.0009688735008239746, 0.001003861427307129, 0.0010388493537902832, 0.0010738372802734375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 10.0, 8.0, 8.0, 13.0, 15.0, 33.0, 42.0, 47.0, 64.0, 101.0, 155.0, 280.0, 453.0, 887.0, 2144.0, 5696.0, 18602.0, 89065.0, 789734.0, 109155.0, 21235.0, 6187.0, 2273.0, 972.0, 512.0, 250.0, 175.0, 121.0, 75.0, 46.0, 28.0, 38.0, 28.0, 28.0, 18.0, 7.0, 5.0, 6.0, 4.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.004344940185546875, -0.004197895526885986, -0.004050850868225098, -0.003903806209564209, -0.0037567615509033203, -0.0036097168922424316, -0.003462672233581543, -0.0033156275749206543, -0.0031685829162597656, -0.003021538257598877, -0.0028744935989379883, -0.0027274489402770996, -0.002580404281616211, -0.0024333596229553223, -0.0022863149642944336, -0.002139270305633545, -0.0019922256469726562, -0.0018451809883117676, -0.001698136329650879, -0.0015510916709899902, -0.0014040470123291016, -0.0012570023536682129, -0.0011099576950073242, -0.0009629130363464355, -0.0008158683776855469, -0.0006688237190246582, -0.0005217790603637695, -0.00037473440170288086, -0.0002276897430419922, -8.064508438110352e-05, 6.639957427978516e-05, 0.00021344423294067383, 0.0003604888916015625, 0.0005075335502624512, 0.0006545782089233398, 0.0008016228675842285, 0.0009486675262451172, 0.0010957121849060059, 0.0012427568435668945, 0.0013898015022277832, 0.0015368461608886719, 0.0016838908195495605, 0.0018309354782104492, 0.001977980136871338, 0.0021250247955322266, 0.0022720694541931152, 0.002419114112854004, 0.0025661587715148926, 0.0027132034301757812, 0.00286024808883667, 0.0030072927474975586, 0.0031543374061584473, 0.003301382064819336, 0.0034484267234802246, 0.0035954713821411133, 0.003742516040802002, 0.0038895606994628906, 0.004036605358123779, 0.004183650016784668, 0.004330694675445557, 0.004477739334106445, 0.004624783992767334, 0.004771828651428223, 0.004918873310089111, 0.00506591796875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 9.0, 5.0, 10.0, 9.0, 12.0, 11.0, 10.0, 19.0, 16.0, 23.0, 31.0, 29.0, 32.0, 29.0, 30.0, 32.0, 44.0, 37.0, 56.0, 49.0, 45.0, 48.0, 48.0, 35.0, 37.0, 50.0, 30.0, 35.0, 35.0, 25.0, 19.0, 19.0, 20.0, 14.0, 9.0, 9.0, 9.0, 4.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007252693176269531, -0.0006995871663093567, -0.0006739050149917603, -0.0006482228636741638, -0.0006225407123565674, -0.000596858561038971, -0.0005711764097213745, -0.0005454942584037781, -0.0005198121070861816, -0.0004941299557685852, -0.00046844780445098877, -0.00044276565313339233, -0.0004170835018157959, -0.00039140135049819946, -0.00036571919918060303, -0.0003400370478630066, -0.00031435489654541016, -0.0002886727452278137, -0.0002629905939102173, -0.00023730844259262085, -0.00021162629127502441, -0.00018594413995742798, -0.00016026198863983154, -0.0001345798373222351, -0.00010889768600463867, -8.321553468704224e-05, -5.75333833694458e-05, -3.1851232051849365e-05, -6.16908073425293e-06, 1.9513070583343506e-05, 4.519522190093994e-05, 7.087737321853638e-05, 9.655952453613281e-05, 0.00012224167585372925, 0.00014792382717132568, 0.00017360597848892212, 0.00019928812980651855, 0.000224970281124115, 0.0002506524324417114, 0.00027633458375930786, 0.0003020167350769043, 0.00032769888639450073, 0.00035338103771209717, 0.0003790631890296936, 0.00040474534034729004, 0.0004304274916648865, 0.0004561096429824829, 0.00048179179430007935, 0.0005074739456176758, 0.0005331560969352722, 0.0005588382482528687, 0.0005845203995704651, 0.0006102025508880615, 0.000635884702205658, 0.0006615668535232544, 0.0006872490048408508, 0.0007129311561584473, 0.0007386133074760437, 0.0007642954587936401, 0.0007899776101112366, 0.000815659761428833, 0.0008413419127464294, 0.0008670240640640259, 0.0008927062153816223, 0.0009183883666992188]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 9.0, 12.0, 14.0, 23.0, 15.0, 42.0, 41.0, 51.0, 68.0, 87.0, 121.0, 177.0, 256.0, 364.0, 591.0, 950.0, 1549.0, 3061.0, 6497.0, 17800.0, 89063.0, 823263.0, 75055.0, 16062.0, 6126.0, 2935.0, 1575.0, 926.0, 592.0, 392.0, 231.0, 168.0, 121.0, 97.0, 57.0, 40.0, 18.0, 29.0, 14.0, 14.0, 8.0, 9.0, 10.0, 2.0, 4.0, 0.0, 0.0, 5.0, 0.0, 1.0, 2.0], "bins": [-0.0010919570922851562, -0.0010602697730064392, -0.0010285824537277222, -0.0009968951344490051, -0.0009652078151702881, -0.000933520495891571, -0.000901833176612854, -0.000870145857334137, -0.0008384585380554199, -0.0008067712187767029, -0.0007750838994979858, -0.0007433965802192688, -0.0007117092609405518, -0.0006800219416618347, -0.0006483346223831177, -0.0006166473031044006, -0.0005849599838256836, -0.0005532726645469666, -0.0005215853452682495, -0.0004898980259895325, -0.00045821070671081543, -0.0004265233874320984, -0.00039483606815338135, -0.0003631487488746643, -0.00033146142959594727, -0.0002997741103172302, -0.0002680867910385132, -0.00023639947175979614, -0.0002047121524810791, -0.00017302483320236206, -0.00014133751392364502, -0.00010965019464492798, -7.796287536621094e-05, -4.6275556087493896e-05, -1.4588236808776855e-05, 1.7099082469940186e-05, 4.8786401748657227e-05, 8.047372102737427e-05, 0.00011216104030609131, 0.00014384835958480835, 0.0001755356788635254, 0.00020722299814224243, 0.00023891031742095947, 0.0002705976366996765, 0.00030228495597839355, 0.0003339722752571106, 0.00036565959453582764, 0.0003973469138145447, 0.0004290342330932617, 0.00046072155237197876, 0.0004924088716506958, 0.0005240961909294128, 0.0005557835102081299, 0.0005874708294868469, 0.000619158148765564, 0.000650845468044281, 0.000682532787322998, 0.0007142201066017151, 0.0007459074258804321, 0.0007775947451591492, 0.0008092820644378662, 0.0008409693837165833, 0.0008726567029953003, 0.0009043440222740173, 0.0009360313415527344]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 3.0, 8.0, 1.0, 6.0, 23.0, 13.0, 15.0, 37.0, 28.0, 24.0, 47.0, 42.0, 54.0, 64.0, 54.0, 89.0, 95.0, 48.0, 48.0, 62.0, 38.0, 30.0, 44.0, 23.0, 19.0, 24.0, 13.0, 12.0, 11.0, 6.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6954879760742188e-06, -3.5567209124565125e-06, -3.417953848838806e-06, -3.2791867852211e-06, -3.1404197216033936e-06, -3.0016526579856873e-06, -2.862885594367981e-06, -2.7241185307502747e-06, -2.5853514671325684e-06, -2.446584403514862e-06, -2.3078173398971558e-06, -2.1690502762794495e-06, -2.030283212661743e-06, -1.8915161490440369e-06, -1.7527490854263306e-06, -1.6139820218086243e-06, -1.475214958190918e-06, -1.3364478945732117e-06, -1.1976808309555054e-06, -1.058913767337799e-06, -9.201467037200928e-07, -7.813796401023865e-07, -6.426125764846802e-07, -5.038455128669739e-07, -3.650784492492676e-07, -2.2631138563156128e-07, -8.754432201385498e-08, 5.122274160385132e-08, 1.8998980522155762e-07, 3.287568688392639e-07, 4.675239324569702e-07, 6.062909960746765e-07, 7.450580596923828e-07, 8.838251233100891e-07, 1.0225921869277954e-06, 1.1613592505455017e-06, 1.300126314163208e-06, 1.4388933777809143e-06, 1.5776604413986206e-06, 1.716427505016327e-06, 1.8551945686340332e-06, 1.9939616322517395e-06, 2.132728695869446e-06, 2.271495759487152e-06, 2.4102628231048584e-06, 2.5490298867225647e-06, 2.687796950340271e-06, 2.8265640139579773e-06, 2.9653310775756836e-06, 3.10409814119339e-06, 3.242865204811096e-06, 3.3816322684288025e-06, 3.520399332046509e-06, 3.659166395664215e-06, 3.7979334592819214e-06, 3.936700522899628e-06, 4.075467586517334e-06, 4.21423465013504e-06, 4.353001713752747e-06, 4.491768777370453e-06, 4.630535840988159e-06, 4.7693029046058655e-06, 4.908069968223572e-06, 5.046837031841278e-06, 5.185604095458984e-06]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 8.0, 7.0, 6.0, 13.0, 15.0, 26.0, 38.0, 57.0, 77.0, 139.0, 195.0, 364.0, 573.0, 962.0, 1746.0, 3186.0, 6154.0, 12656.0, 31118.0, 117393.0, 651399.0, 156069.0, 37071.0, 14280.0, 6800.0, 3532.0, 1962.0, 1053.0, 627.0, 393.0, 237.0, 133.0, 99.0, 63.0, 38.0, 21.0, 18.0, 13.0, 10.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007371902465820312, -0.0007145628333091736, -0.0006919354200363159, -0.0006693080067634583, -0.0006466805934906006, -0.0006240531802177429, -0.0006014257669448853, -0.0005787983536720276, -0.0005561709403991699, -0.0005335435271263123, -0.0005109161138534546, -0.0004882887005805969, -0.00046566128730773926, -0.0004430338740348816, -0.0004204064607620239, -0.00039777904748916626, -0.0003751516342163086, -0.00035252422094345093, -0.00032989680767059326, -0.0003072693943977356, -0.00028464198112487793, -0.00026201456785202026, -0.0002393871545791626, -0.00021675974130630493, -0.00019413232803344727, -0.0001715049147605896, -0.00014887750148773193, -0.00012625008821487427, -0.0001036226749420166, -8.099526166915894e-05, -5.836784839630127e-05, -3.5740435123443604e-05, -1.3113021850585938e-05, 9.514391422271729e-06, 3.2141804695129395e-05, 5.476921796798706e-05, 7.739663124084473e-05, 0.00010002404451370239, 0.00012265145778656006, 0.00014527887105941772, 0.0001679062843322754, 0.00019053369760513306, 0.00021316111087799072, 0.0002357885241508484, 0.00025841593742370605, 0.0002810433506965637, 0.0003036707639694214, 0.00032629817724227905, 0.0003489255905151367, 0.0003715530037879944, 0.00039418041706085205, 0.0004168078303337097, 0.0004394352436065674, 0.00046206265687942505, 0.0004846900701522827, 0.0005073174834251404, 0.000529944896697998, 0.0005525723099708557, 0.0005751997232437134, 0.000597827136516571, 0.0006204545497894287, 0.0006430819630622864, 0.000665709376335144, 0.0006883367896080017, 0.0007109642028808594]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 6.0, 10.0, 12.0, 6.0, 7.0, 12.0, 14.0, 36.0, 49.0, 51.0, 81.0, 111.0, 109.0, 99.0, 101.0, 75.0, 47.0, 44.0, 22.0, 19.0, 8.0, 11.0, 9.0, 7.0, 10.0, 5.0, 8.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001621246337890625, -0.00015703216195106506, -0.00015193969011306763, -0.0001468472182750702, -0.00014175474643707275, -0.00013666227459907532, -0.00013156980276107788, -0.00012647733092308044, -0.00012138485908508301, -0.00011629238724708557, -0.00011119991540908813, -0.0001061074435710907, -0.00010101497173309326, -9.592249989509583e-05, -9.083002805709839e-05, -8.573755621910095e-05, -8.064508438110352e-05, -7.555261254310608e-05, -7.046014070510864e-05, -6.53676688671112e-05, -6.027519702911377e-05, -5.518272519111633e-05, -5.0090253353118896e-05, -4.499778151512146e-05, -3.9905309677124023e-05, -3.481283783912659e-05, -2.972036600112915e-05, -2.4627894163131714e-05, -1.9535422325134277e-05, -1.444295048713684e-05, -9.350478649139404e-06, -4.258006811141968e-06, 8.344650268554688e-07, 5.926936864852905e-06, 1.1019408702850342e-05, 1.611188054084778e-05, 2.1204352378845215e-05, 2.629682421684265e-05, 3.138929605484009e-05, 3.6481767892837524e-05, 4.157423973083496e-05, 4.66667115688324e-05, 5.1759183406829834e-05, 5.685165524482727e-05, 6.194412708282471e-05, 6.703659892082214e-05, 7.212907075881958e-05, 7.722154259681702e-05, 8.231401443481445e-05, 8.740648627281189e-05, 9.249895811080933e-05, 9.759142994880676e-05, 0.0001026839017868042, 0.00010777637362480164, 0.00011286884546279907, 0.00011796131730079651, 0.00012305378913879395, 0.00012814626097679138, 0.00013323873281478882, 0.00013833120465278625, 0.0001434236764907837, 0.00014851614832878113, 0.00015360862016677856, 0.000158701092004776, 0.00016379356384277344]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 7.0, 11.0, 18.0, 19.0, 36.0, 51.0, 68.0, 74.0, 131.0, 151.0, 119.0, 61.0, 51.0, 51.0, 30.0, 22.0, 24.0, 12.0, 12.0, 6.0, 5.0, 4.0, 1.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019107961561530828, -0.0018462104490026832, -0.0017816247418522835, -0.0017170390347018838, -0.001652453327551484, -0.0015878675039857626, -0.001523281796835363, -0.0014586960896849632, -0.0013941103825345635, -0.0013295246753841639, -0.0012649389682337642, -0.0012003532610833645, -0.001135767437517643, -0.0010711818467825651, -0.0010065960232168436, -0.0009420103160664439, -0.0008774246089160442, -0.0008128389017656446, -0.0007482531946152449, -0.0006836674292571843, -0.0006190817221067846, -0.0005544960149563849, -0.0004899102495983243, -0.0004253245424479246, -0.00036073883529752493, -0.00029615312814712524, -0.0002315673918928951, -0.0001669816701905802, -0.00010239594848826528, -3.781024133786559e-05, 2.677549491636455e-05, 9.136123117059469e-05, 0.00015594717115163803, 0.00022053289285395294, 0.00028511861455626786, 0.000349704350810498, 0.0004142900579608977, 0.00047887576511129737, 0.000543461530469358, 0.0006080472376197577, 0.0006726329447701573, 0.000737218651920557, 0.0008018043590709567, 0.0008663901244290173, 0.000930975831579417, 0.0009955614805221558, 0.0010601473040878773, 0.001124733011238277, 0.0011893187183886766, 0.0012539044255390763, 0.001318490132689476, 0.0013830758398398757, 0.0014476615469902754, 0.001512247370555997, 0.0015768330777063966, 0.0016414187848567963, 0.001706004492007196, 0.0017705901991575956, 0.0018351759063079953, 0.001899761613458395, 0.0019643474370241165, 0.0020289330277591944, 0.002093518851324916, 0.0021581044420599937, 0.0022226902656257153]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 4.0, 4.0, 12.0, 7.0, 7.0, 16.0, 15.0, 12.0, 16.0, 22.0, 22.0, 22.0, 19.0, 22.0, 25.0, 27.0, 37.0, 36.0, 28.0, 39.0, 38.0, 34.0, 40.0, 26.0, 31.0, 33.0, 26.0, 26.0, 30.0, 34.0, 24.0, 24.0, 22.0, 20.0, 30.0, 16.0, 23.0, 20.0, 12.0, 13.0, 8.0, 15.0, 9.0, 8.0, 9.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 6.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.0008287240052595735, -0.0008013669867068529, -0.0007740099681541324, -0.0007466529496014118, -0.0007192959310486913, -0.0006919389124959707, -0.0006645818939432502, -0.0006372248753905296, -0.0006098678568378091, -0.0005825108382850885, -0.000555153819732368, -0.0005277968011796474, -0.0005004397826269269, -0.00047308276407420635, -0.00044572571641765535, -0.0004183686978649348, -0.0003910116502083838, -0.00036365463165566325, -0.0003362976131029427, -0.00030894059455022216, -0.0002815835759975016, -0.00025422655744478106, -0.00022686950978823006, -0.00019951249123550951, -0.00017215547268278897, -0.00014479845413006842, -0.00011744142830139026, -9.00844024727121e-05, -6.272738391999155e-05, -3.5370365367271006e-05, -8.013332262635231e-06, 1.9343686290085316e-05, 4.6700763050466776e-05, 7.405778160318732e-05, 0.00010141480743186548, 0.00012877183326054364, 0.0001561288518132642, 0.00018348587036598474, 0.0002108429034706205, 0.00023819992202334106, 0.0002655569405760616, 0.00029291395912878215, 0.0003202709776815027, 0.0003476280253380537, 0.00037498504389077425, 0.0004023420624434948, 0.00042969908099621534, 0.0004570560995489359, 0.00048441311810165644, 0.000511770136654377, 0.0005391271552070975, 0.0005664841737598181, 0.0005938411923125386, 0.0006211982108652592, 0.0006485552294179797, 0.0006759122479707003, 0.0007032692665234208, 0.0007306262850761414, 0.0007579833036288619, 0.0007853403221815825, 0.000812697340734303, 0.0008400543592870235, 0.0008674113778397441, 0.0008947683963924646, 0.0009221254731528461]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 7.0, 7.0, 7.0, 9.0, 13.0, 26.0, 44.0, 52.0, 69.0, 120.0, 160.0, 185.0, 281.0, 380.0, 552.0, 764.0, 1131.0, 1532.0, 2126.0, 3072.0, 4478.0, 6371.0, 9481.0, 14370.0, 21413.0, 33555.0, 53039.0, 90346.0, 173507.0, 269276.0, 145276.0, 78708.0, 47266.0, 30052.0, 19298.0, 13100.0, 8555.0, 6072.0, 4112.0, 2858.0, 1977.0, 1402.0, 988.0, 776.0, 485.0, 364.0, 259.0, 190.0, 128.0, 108.0, 83.0, 48.0, 46.0, 17.0, 12.0, 10.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0018596649169921875, -0.0017984509468078613, -0.0017372369766235352, -0.001676023006439209, -0.0016148090362548828, -0.0015535950660705566, -0.0014923810958862305, -0.0014311671257019043, -0.0013699531555175781, -0.001308739185333252, -0.0012475252151489258, -0.0011863112449645996, -0.0011250972747802734, -0.0010638833045959473, -0.001002669334411621, -0.0009414553642272949, -0.0008802413940429688, -0.0008190274238586426, -0.0007578134536743164, -0.0006965994834899902, -0.0006353855133056641, -0.0005741715431213379, -0.0005129575729370117, -0.00045174360275268555, -0.0003905296325683594, -0.0003293156623840332, -0.00026810169219970703, -0.00020688772201538086, -0.0001456737518310547, -8.445978164672852e-05, -2.3245811462402344e-05, 3.796815872192383e-05, 9.918212890625e-05, 0.00016039609909057617, 0.00022161006927490234, 0.0002828240394592285, 0.0003440380096435547, 0.00040525197982788086, 0.00046646595001220703, 0.0005276799201965332, 0.0005888938903808594, 0.0006501078605651855, 0.0007113218307495117, 0.0007725358009338379, 0.0008337497711181641, 0.0008949637413024902, 0.0009561777114868164, 0.0010173916816711426, 0.0010786056518554688, 0.001139819622039795, 0.001201033592224121, 0.0012622475624084473, 0.0013234615325927734, 0.0013846755027770996, 0.0014458894729614258, 0.001507103443145752, 0.0015683174133300781, 0.0016295313835144043, 0.0016907453536987305, 0.0017519593238830566, 0.0018131732940673828, 0.001874387264251709, 0.0019356012344360352, 0.0019968152046203613, 0.0020580291748046875]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 3.0, 6.0, 3.0, 8.0, 7.0, 4.0, 11.0, 13.0, 19.0, 15.0, 16.0, 22.0, 28.0, 22.0, 20.0, 27.0, 27.0, 46.0, 47.0, 31.0, 45.0, 35.0, 39.0, 32.0, 32.0, 34.0, 33.0, 31.0, 30.0, 34.0, 32.0, 26.0, 27.0, 25.0, 19.0, 22.0, 24.0, 17.0, 15.0, 13.0, 11.0, 5.0, 8.0, 5.0, 5.0, 4.0, 5.0, 6.0, 4.0, 3.0, 3.0, 4.0, 4.0, 2.0], "bins": [-0.0005636215209960938, -0.0005468428134918213, -0.0005300641059875488, -0.0005132853984832764, -0.0004965066909790039, -0.00047972798347473145, -0.000462949275970459, -0.0004461705684661865, -0.00042939186096191406, -0.0004126131534576416, -0.00039583444595336914, -0.0003790557384490967, -0.0003622770309448242, -0.00034549832344055176, -0.0003287196159362793, -0.00031194090843200684, -0.0002951622009277344, -0.0002783834934234619, -0.00026160478591918945, -0.000244826078414917, -0.00022804737091064453, -0.00021126866340637207, -0.0001944899559020996, -0.00017771124839782715, -0.0001609325408935547, -0.00014415383338928223, -0.00012737512588500977, -0.0001105964183807373, -9.381771087646484e-05, -7.703900337219238e-05, -6.026029586791992e-05, -4.348158836364746e-05, -2.6702880859375e-05, -9.924173355102539e-06, 6.854534149169922e-06, 2.3633241653442383e-05, 4.0411949157714844e-05, 5.7190656661987305e-05, 7.396936416625977e-05, 9.074807167053223e-05, 0.00010752677917480469, 0.00012430548667907715, 0.0001410841941833496, 0.00015786290168762207, 0.00017464160919189453, 0.000191420316696167, 0.00020819902420043945, 0.00022497773170471191, 0.00024175643920898438, 0.00025853514671325684, 0.0002753138542175293, 0.00029209256172180176, 0.0003088712692260742, 0.0003256499767303467, 0.00034242868423461914, 0.0003592073917388916, 0.00037598609924316406, 0.0003927648067474365, 0.000409543514251709, 0.00042632222175598145, 0.0004431009292602539, 0.00045987963676452637, 0.00047665834426879883, 0.0004934370517730713, 0.0005102157592773438]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 10.0, 10.0, 9.0, 13.0, 15.0, 26.0, 45.0, 59.0, 73.0, 127.0, 196.0, 299.0, 476.0, 812.0, 1288.0, 2347.0, 4093.0, 7239.0, 13298.0, 25123.0, 49041.0, 102316.0, 273180.0, 331962.0, 118561.0, 55484.0, 28412.0, 15041.0, 8202.0, 4421.0, 2542.0, 1493.0, 883.0, 522.0, 339.0, 188.0, 138.0, 84.0, 57.0, 44.0, 31.0, 23.0, 9.0, 7.0, 6.0, 11.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.002353668212890625, -0.002280324697494507, -0.0022069811820983887, -0.0021336376667022705, -0.0020602941513061523, -0.001986950635910034, -0.001913607120513916, -0.0018402636051177979, -0.0017669200897216797, -0.0016935765743255615, -0.0016202330589294434, -0.0015468895435333252, -0.001473546028137207, -0.0014002025127410889, -0.0013268589973449707, -0.0012535154819488525, -0.0011801719665527344, -0.0011068284511566162, -0.001033484935760498, -0.0009601414203643799, -0.0008867979049682617, -0.0008134543895721436, -0.0007401108741760254, -0.0006667673587799072, -0.0005934238433837891, -0.0005200803279876709, -0.00044673681259155273, -0.00037339329719543457, -0.0003000497817993164, -0.00022670626640319824, -0.00015336275100708008, -8.001923561096191e-05, -6.67572021484375e-06, 6.666779518127441e-05, 0.00014001131057739258, 0.00021335482597351074, 0.0002866983413696289, 0.00036004185676574707, 0.00043338537216186523, 0.0005067288875579834, 0.0005800724029541016, 0.0006534159183502197, 0.0007267594337463379, 0.0008001029491424561, 0.0008734464645385742, 0.0009467899799346924, 0.0010201334953308105, 0.0010934770107269287, 0.0011668205261230469, 0.001240164041519165, 0.0013135075569152832, 0.0013868510723114014, 0.0014601945877075195, 0.0015335381031036377, 0.0016068816184997559, 0.001680225133895874, 0.0017535686492919922, 0.0018269121646881104, 0.0019002556800842285, 0.0019735991954803467, 0.002046942710876465, 0.002120286226272583, 0.002193629741668701, 0.0022669732570648193, 0.0023403167724609375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 3.0, 11.0, 9.0, 9.0, 9.0, 17.0, 22.0, 24.0, 20.0, 26.0, 33.0, 24.0, 47.0, 44.0, 32.0, 53.0, 45.0, 39.0, 45.0, 52.0, 59.0, 37.0, 30.0, 38.0, 40.0, 42.0, 36.0, 30.0, 22.0, 20.0, 14.0, 18.0, 7.0, 11.0, 10.0, 7.0, 1.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006809234619140625, -0.0006604790687561035, -0.0006400346755981445, -0.0006195902824401855, -0.0005991458892822266, -0.0005787014961242676, -0.0005582571029663086, -0.0005378127098083496, -0.0005173683166503906, -0.0004969239234924316, -0.00047647953033447266, -0.00045603513717651367, -0.0004355907440185547, -0.0004151463508605957, -0.0003947019577026367, -0.00037425756454467773, -0.00035381317138671875, -0.00033336877822875977, -0.0003129243850708008, -0.0002924799919128418, -0.0002720355987548828, -0.00025159120559692383, -0.00023114681243896484, -0.00021070241928100586, -0.00019025802612304688, -0.0001698136329650879, -0.0001493692398071289, -0.00012892484664916992, -0.00010848045349121094, -8.803606033325195e-05, -6.759166717529297e-05, -4.7147274017333984e-05, -2.6702880859375e-05, -6.258487701416016e-06, 1.4185905456542969e-05, 3.463029861450195e-05, 5.507469177246094e-05, 7.551908493041992e-05, 9.59634780883789e-05, 0.00011640787124633789, 0.00013685226440429688, 0.00015729665756225586, 0.00017774105072021484, 0.00019818544387817383, 0.0002186298370361328, 0.0002390742301940918, 0.0002595186233520508, 0.00027996301651000977, 0.00030040740966796875, 0.00032085180282592773, 0.0003412961959838867, 0.0003617405891418457, 0.0003821849822998047, 0.00040262937545776367, 0.00042307376861572266, 0.00044351816177368164, 0.0004639625549316406, 0.0004844069480895996, 0.0005048513412475586, 0.0005252957344055176, 0.0005457401275634766, 0.0005661845207214355, 0.0005866289138793945, 0.0006070733070373535, 0.0006275177001953125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 2.0, 7.0, 18.0, 16.0, 15.0, 33.0, 34.0, 33.0, 64.0, 120.0, 226.0, 313.0, 589.0, 1218.0, 2743.0, 7130.0, 24956.0, 210545.0, 734863.0, 47357.0, 10946.0, 3821.0, 1603.0, 818.0, 403.0, 245.0, 139.0, 96.0, 61.0, 43.0, 34.0, 14.0, 12.0, 7.0, 4.0, 7.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00014412403106689453, -0.00013950280845165253, -0.00013488158583641052, -0.00013026036322116852, -0.00012563914060592651, -0.00012101791799068451, -0.0001163966953754425, -0.0001117754727602005, -0.0001071542501449585, -0.00010253302752971649, -9.791180491447449e-05, -9.329058229923248e-05, -8.866935968399048e-05, -8.404813706874847e-05, -7.942691445350647e-05, -7.480569183826447e-05, -7.018446922302246e-05, -6.556324660778046e-05, -6.094202399253845e-05, -5.632080137729645e-05, -5.169957876205444e-05, -4.707835614681244e-05, -4.2457133531570435e-05, -3.783591091632843e-05, -3.3214688301086426e-05, -2.859346568584442e-05, -2.3972243070602417e-05, -1.9351020455360413e-05, -1.4729797840118408e-05, -1.0108575224876404e-05, -5.487352609634399e-06, -8.66129994392395e-07, 3.7550926208496094e-06, 8.376315236091614e-06, 1.2997537851333618e-05, 1.7618760466575623e-05, 2.2239983081817627e-05, 2.686120569705963e-05, 3.1482428312301636e-05, 3.610365092754364e-05, 4.0724873542785645e-05, 4.534609615802765e-05, 4.996731877326965e-05, 5.458854138851166e-05, 5.920976400375366e-05, 6.383098661899567e-05, 6.845220923423767e-05, 7.307343184947968e-05, 7.769465446472168e-05, 8.231587707996368e-05, 8.693709969520569e-05, 9.155832231044769e-05, 9.61795449256897e-05, 0.0001008007675409317, 0.0001054219901561737, 0.00011004321277141571, 0.00011466443538665771, 0.00011928565800189972, 0.00012390688061714172, 0.00012852810323238373, 0.00013314932584762573, 0.00013777054846286774, 0.00014239177107810974, 0.00014701299369335175, 0.00015163421630859375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 7.0, 0.0, 6.0, 6.0, 6.0, 14.0, 10.0, 24.0, 46.0, 25.0, 78.0, 142.0, 80.0, 174.0, 66.0, 106.0, 73.0, 16.0, 43.0, 25.0, 10.0, 12.0, 11.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1457672119140625e-06, -2.0489096641540527e-06, -1.952052116394043e-06, -1.8551945686340332e-06, -1.7583370208740234e-06, -1.6614794731140137e-06, -1.564621925354004e-06, -1.4677643775939941e-06, -1.3709068298339844e-06, -1.2740492820739746e-06, -1.1771917343139648e-06, -1.080334186553955e-06, -9.834766387939453e-07, -8.866190910339355e-07, -7.897615432739258e-07, -6.92903995513916e-07, -5.960464477539062e-07, -4.991888999938965e-07, -4.023313522338867e-07, -3.0547380447387695e-07, -2.086162567138672e-07, -1.1175870895385742e-07, -1.4901161193847656e-08, 8.195638656616211e-08, 1.7881393432617188e-07, 2.7567148208618164e-07, 3.725290298461914e-07, 4.6938657760620117e-07, 5.662441253662109e-07, 6.631016731262207e-07, 7.599592208862305e-07, 8.568167686462402e-07, 9.5367431640625e-07, 1.0505318641662598e-06, 1.1473894119262695e-06, 1.2442469596862793e-06, 1.341104507446289e-06, 1.4379620552062988e-06, 1.5348196029663086e-06, 1.6316771507263184e-06, 1.7285346984863281e-06, 1.8253922462463379e-06, 1.9222497940063477e-06, 2.0191073417663574e-06, 2.115964889526367e-06, 2.212822437286377e-06, 2.3096799850463867e-06, 2.4065375328063965e-06, 2.5033950805664062e-06, 2.600252628326416e-06, 2.6971101760864258e-06, 2.7939677238464355e-06, 2.8908252716064453e-06, 2.987682819366455e-06, 3.084540367126465e-06, 3.1813979148864746e-06, 3.2782554626464844e-06, 3.375113010406494e-06, 3.471970558166504e-06, 3.5688281059265137e-06, 3.6656856536865234e-06, 3.762543201446533e-06, 3.859400749206543e-06, 3.956258296966553e-06, 4.0531158447265625e-06]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 8.0, 10.0, 15.0, 23.0, 17.0, 40.0, 73.0, 94.0, 164.0, 265.0, 442.0, 750.0, 1395.0, 2532.0, 5622.0, 13549.0, 39578.0, 207344.0, 646298.0, 89627.0, 23261.0, 9007.0, 3921.0, 1965.0, 1061.0, 555.0, 345.0, 217.0, 127.0, 73.0, 64.0, 40.0, 20.0, 18.0, 12.0, 4.0, 6.0, 7.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.092952728271484e-05, -6.891880184412003e-05, -6.690807640552521e-05, -6.489735096693039e-05, -6.288662552833557e-05, -6.087590008974075e-05, -5.8865174651145935e-05, -5.685444921255112e-05, -5.48437237739563e-05, -5.283299833536148e-05, -5.082227289676666e-05, -4.8811547458171844e-05, -4.6800822019577026e-05, -4.479009658098221e-05, -4.277937114238739e-05, -4.076864570379257e-05, -3.8757920265197754e-05, -3.6747194826602936e-05, -3.473646938800812e-05, -3.27257439494133e-05, -3.071501851081848e-05, -2.8704293072223663e-05, -2.6693567633628845e-05, -2.4682842195034027e-05, -2.267211675643921e-05, -2.066139131784439e-05, -1.8650665879249573e-05, -1.6639940440654755e-05, -1.4629215002059937e-05, -1.2618489563465118e-05, -1.06077641248703e-05, -8.597038686275482e-06, -6.586313247680664e-06, -4.575587809085846e-06, -2.564862370491028e-06, -5.541369318962097e-07, 1.4565885066986084e-06, 3.4673139452934265e-06, 5.478039383888245e-06, 7.488764822483063e-06, 9.499490261077881e-06, 1.1510215699672699e-05, 1.3520941138267517e-05, 1.5531666576862335e-05, 1.7542392015457153e-05, 1.955311745405197e-05, 2.156384289264679e-05, 2.3574568331241608e-05, 2.5585293769836426e-05, 2.7596019208431244e-05, 2.9606744647026062e-05, 3.161747008562088e-05, 3.36281955242157e-05, 3.5638920962810516e-05, 3.7649646401405334e-05, 3.966037184000015e-05, 4.167109727859497e-05, 4.368182271718979e-05, 4.569254815578461e-05, 4.7703273594379425e-05, 4.971399903297424e-05, 5.172472447156906e-05, 5.373544991016388e-05, 5.57461753487587e-05, 5.7756900787353516e-05]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 2.0, 6.0, 10.0, 10.0, 11.0, 10.0, 26.0, 32.0, 42.0, 57.0, 63.0, 112.0, 92.0, 110.0, 106.0, 80.0, 57.0, 41.0, 39.0, 21.0, 15.0, 16.0, 7.0, 5.0, 8.0, 4.0, 4.0, 1.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.341104507446289e-05, -1.2932345271110535e-05, -1.2453645467758179e-05, -1.1974945664405823e-05, -1.1496245861053467e-05, -1.101754605770111e-05, -1.0538846254348755e-05, -1.0060146450996399e-05, -9.581446647644043e-06, -9.102746844291687e-06, -8.624047040939331e-06, -8.145347237586975e-06, -7.666647434234619e-06, -7.187947630882263e-06, -6.709247827529907e-06, -6.230548024177551e-06, -5.751848220825195e-06, -5.273148417472839e-06, -4.794448614120483e-06, -4.3157488107681274e-06, -3.8370490074157715e-06, -3.3583492040634155e-06, -2.8796494007110596e-06, -2.4009495973587036e-06, -1.9222497940063477e-06, -1.4435499906539917e-06, -9.648501873016357e-07, -4.861503839492798e-07, -7.450580596923828e-09, 4.7124922275543213e-07, 9.499490261077881e-07, 1.428648829460144e-06, 1.9073486328125e-06, 2.386048436164856e-06, 2.864748239517212e-06, 3.343448042869568e-06, 3.822147846221924e-06, 4.30084764957428e-06, 4.779547452926636e-06, 5.258247256278992e-06, 5.736947059631348e-06, 6.215646862983704e-06, 6.6943466663360596e-06, 7.1730464696884155e-06, 7.651746273040771e-06, 8.130446076393127e-06, 8.609145879745483e-06, 9.08784568309784e-06, 9.566545486450195e-06, 1.0045245289802551e-05, 1.0523945093154907e-05, 1.1002644896507263e-05, 1.1481344699859619e-05, 1.1960044503211975e-05, 1.2438744306564331e-05, 1.2917444109916687e-05, 1.3396143913269043e-05, 1.3874843716621399e-05, 1.4353543519973755e-05, 1.483224332332611e-05, 1.5310943126678467e-05, 1.5789642930030823e-05, 1.626834273338318e-05, 1.6747042536735535e-05, 1.722574234008789e-05]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 11.0, 15.0, 16.0, 25.0, 33.0, 17.0, 53.0, 52.0, 74.0, 80.0, 130.0, 104.0, 82.0, 64.0, 42.0, 33.0, 23.0, 24.0, 24.0, 10.0, 5.0, 11.0, 10.0, 7.0, 8.0, 4.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0011053293710574508, -0.0010705984896048903, -0.0010358677245676517, -0.0010011368431150913, -0.0009664060198701918, -0.0009316751966252923, -0.0008969443151727319, -0.0008622134919278324, -0.0008274826686829329, -0.0007927518454380333, -0.0007580210221931338, -0.0007232901407405734, -0.0006885593174956739, -0.0006538284942507744, -0.000619097612798214, -0.0005843667895533144, -0.0005496359663084149, -0.0005149051430635154, -0.00048017429071478546, -0.0004454434383660555, -0.000410712615121156, -0.00037598179187625647, -0.0003412509395275265, -0.00030652008717879653, -0.000271789263933897, -0.00023705842613708228, -0.00020232758834026754, -0.0001675967505434528, -0.00013286591274663806, -9.813507494982332e-05, -6.340423715300858e-05, -2.867339935619384e-05, 6.057554855942726e-06, 4.0788392652757466e-05, 7.55192304495722e-05, 0.00011025006824638695, 0.00014498090604320168, 0.00017971174384001642, 0.00021444258163683116, 0.00024917343398556113, 0.00028390425723046064, 0.00031863508047536016, 0.0003533659328240901, 0.0003880967851728201, 0.0004228276084177196, 0.0004575584316626191, 0.0004922893131151795, 0.000527020136360079, 0.0005617509596049786, 0.0005964817828498781, 0.0006312126060947776, 0.000665943487547338, 0.0007006743107922375, 0.000735405134037137, 0.0007701360154896975, 0.000804866838734597, 0.0008395976619794965, 0.000874328485224396, 0.0009090593084692955, 0.0009437901899218559, 0.0009785210713744164, 0.001013251836411655, 0.0010479827178642154, 0.001082713482901454, 0.0011174443643540144]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 13.0, 11.0, 11.0, 12.0, 10.0, 14.0, 18.0, 24.0, 22.0, 35.0, 25.0, 36.0, 28.0, 38.0, 27.0, 32.0, 39.0, 36.0, 41.0, 44.0, 39.0, 39.0, 36.0, 30.0, 25.0, 38.0, 38.0, 28.0, 23.0, 28.0, 29.0, 19.0, 12.0, 20.0, 13.0, 13.0, 9.0, 9.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.000621070503257215, -0.0005998349515721202, -0.0005785993998870254, -0.0005573638482019305, -0.0005361282965168357, -0.0005148928030394018, -0.0004936572513543069, -0.0004724216996692121, -0.00045118614798411727, -0.00042995059629902244, -0.0004087150446139276, -0.0003874795220326632, -0.0003662439703475684, -0.00034500841866247356, -0.0003237728960812092, -0.00030253734439611435, -0.0002813017927110195, -0.0002600662410259247, -0.00023883070389274508, -0.00021759516675956547, -0.00019635961507447064, -0.0001751240633893758, -0.0001538885262561962, -0.0001326529891230166, -0.00011141743743792176, -9.018189302878454e-05, -6.894634861964732e-05, -4.7710804210510105e-05, -2.6475259801372886e-05, -5.2397153922356665e-06, 1.5995829016901553e-05, 3.723136615008116e-05, 5.8466976042836905e-05, 7.970252045197412e-05, 0.00010093806486111134, 0.00012217360199429095, 0.00014340915367938578, 0.00016464470536448061, 0.00018588024249766022, 0.00020711577963083982, 0.00022835133131593466, 0.0002495868830010295, 0.0002708224346861243, 0.0002920579572673887, 0.00031329350895248353, 0.00033452906063757837, 0.00035576458321884274, 0.0003770001349039376, 0.0003982356865890324, 0.00041947123827412724, 0.0004407067899592221, 0.00046194231254048645, 0.0004831778642255813, 0.0005044133868068457, 0.0005256489384919405, 0.0005468844901770353, 0.0005681200418621302, 0.000589355593547225, 0.0006105911452323198, 0.0006318266969174147, 0.0006530622486025095, 0.0006742977420799434, 0.0006955332937650383, 0.0007167688454501331, 0.0007380043971352279]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 4.0, 5.0, 9.0, 8.0, 18.0, 20.0, 22.0, 43.0, 62.0, 97.0, 135.0, 192.0, 282.0, 457.0, 674.0, 1057.0, 1476.0, 2323.0, 3914.0, 6917.0, 14654.0, 56126.0, 3863161.0, 201767.0, 20020.0, 8469.0, 4629.0, 2697.0, 1720.0, 1117.0, 748.0, 500.0, 315.0, 203.0, 149.0, 77.0, 79.0, 47.0, 27.0, 19.0, 21.0, 5.0, 6.0, 3.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0029754638671875, -0.002892017364501953, -0.0028085708618164062, -0.0027251243591308594, -0.0026416778564453125, -0.0025582313537597656, -0.0024747848510742188, -0.002391338348388672, -0.002307891845703125, -0.002224445343017578, -0.0021409988403320312, -0.0020575523376464844, -0.0019741058349609375, -0.0018906593322753906, -0.0018072128295898438, -0.0017237663269042969, -0.00164031982421875, -0.0015568733215332031, -0.0014734268188476562, -0.0013899803161621094, -0.0013065338134765625, -0.0012230873107910156, -0.0011396408081054688, -0.0010561943054199219, -0.000972747802734375, -0.0008893013000488281, -0.0008058547973632812, -0.0007224082946777344, -0.0006389617919921875, -0.0005555152893066406, -0.00047206878662109375, -0.0003886222839355469, -0.00030517578125, -0.00022172927856445312, -0.00013828277587890625, -5.4836273193359375e-05, 2.86102294921875e-05, 0.00011205673217773438, 0.00019550323486328125, 0.0002789497375488281, 0.000362396240234375, 0.0004458427429199219, 0.0005292892456054688, 0.0006127357482910156, 0.0006961822509765625, 0.0007796287536621094, 0.0008630752563476562, 0.0009465217590332031, 0.00102996826171875, 0.0011134147644042969, 0.0011968612670898438, 0.0012803077697753906, 0.0013637542724609375, 0.0014472007751464844, 0.0015306472778320312, 0.0016140937805175781, 0.001697540283203125, 0.0017809867858886719, 0.0018644332885742188, 0.0019478797912597656, 0.0020313262939453125, 0.0021147727966308594, 0.0021982192993164062, 0.002281665802001953, 0.0023651123046875]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 4.0, 8.0, 11.0, 18.0, 15.0, 20.0, 24.0, 23.0, 32.0, 37.0, 39.0, 42.0, 40.0, 42.0, 52.0, 51.0, 60.0, 48.0, 53.0, 42.0, 49.0, 41.0, 42.0, 37.0, 34.0, 27.0, 25.0, 13.0, 14.0, 20.0, 8.0, 11.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006189346313476562, -0.0006014779210090637, -0.0005840212106704712, -0.0005665645003318787, -0.0005491077899932861, -0.0005316510796546936, -0.0005141943693161011, -0.0004967376589775085, -0.000479280948638916, -0.0004618242383003235, -0.00044436752796173096, -0.00042691081762313843, -0.0004094541072845459, -0.00039199739694595337, -0.00037454068660736084, -0.0003570839762687683, -0.0003396272659301758, -0.00032217055559158325, -0.0003047138452529907, -0.0002872571349143982, -0.00026980042457580566, -0.00025234371423721313, -0.0002348870038986206, -0.00021743029356002808, -0.00019997358322143555, -0.00018251687288284302, -0.0001650601625442505, -0.00014760345220565796, -0.00013014674186706543, -0.0001126900315284729, -9.523332118988037e-05, -7.777661085128784e-05, -6.031990051269531e-05, -4.286319017410278e-05, -2.5406479835510254e-05, -7.949769496917725e-06, 9.506940841674805e-06, 2.6963651180267334e-05, 4.442036151885986e-05, 6.187707185745239e-05, 7.933378219604492e-05, 9.679049253463745e-05, 0.00011424720287322998, 0.0001317039132118225, 0.00014916062355041504, 0.00016661733388900757, 0.0001840740442276001, 0.00020153075456619263, 0.00021898746490478516, 0.00023644417524337769, 0.0002539008855819702, 0.00027135759592056274, 0.0002888143062591553, 0.0003062710165977478, 0.00032372772693634033, 0.00034118443727493286, 0.0003586411476135254, 0.0003760978579521179, 0.00039355456829071045, 0.000411011278629303, 0.0004284679889678955, 0.00044592469930648804, 0.00046338140964508057, 0.0004808381199836731, 0.0004982948303222656]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 6.0, 8.0, 17.0, 31.0, 50.0, 52.0, 113.0, 185.0, 298.0, 486.0, 939.0, 1672.0, 3396.0, 7580.0, 19866.0, 82980.0, 3629961.0, 382060.0, 40855.0, 12951.0, 5403.0, 2430.0, 1290.0, 670.0, 350.0, 249.0, 149.0, 74.0, 53.0, 36.0, 22.0, 8.0, 11.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.0035648345947265625, -0.0034679174423217773, -0.003371000289916992, -0.003274083137512207, -0.003177165985107422, -0.0030802488327026367, -0.0029833316802978516, -0.0028864145278930664, -0.0027894973754882812, -0.002692580223083496, -0.002595663070678711, -0.0024987459182739258, -0.0024018287658691406, -0.0023049116134643555, -0.0022079944610595703, -0.002111077308654785, -0.00201416015625, -0.0019172430038452148, -0.0018203258514404297, -0.0017234086990356445, -0.0016264915466308594, -0.0015295743942260742, -0.001432657241821289, -0.001335740089416504, -0.0012388229370117188, -0.0011419057846069336, -0.0010449886322021484, -0.0009480714797973633, -0.0008511543273925781, -0.000754237174987793, -0.0006573200225830078, -0.0005604028701782227, -0.0004634857177734375, -0.00036656856536865234, -0.0002696514129638672, -0.00017273426055908203, -7.581710815429688e-05, 2.110004425048828e-05, 0.00011801719665527344, 0.0002149343490600586, 0.00031185150146484375, 0.0004087686538696289, 0.0005056858062744141, 0.0006026029586791992, 0.0006995201110839844, 0.0007964372634887695, 0.0008933544158935547, 0.0009902715682983398, 0.001087188720703125, 0.0011841058731079102, 0.0012810230255126953, 0.0013779401779174805, 0.0014748573303222656, 0.0015717744827270508, 0.001668691635131836, 0.001765608787536621, 0.0018625259399414062, 0.0019594430923461914, 0.0020563602447509766, 0.0021532773971557617, 0.002250194549560547, 0.002347111701965332, 0.002444028854370117, 0.0025409460067749023, 0.0026378631591796875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 3.0, 3.0, 12.0, 6.0, 9.0, 11.0, 11.0, 9.0, 28.0, 31.0, 70.0, 120.0, 328.0, 913.0, 1763.0, 340.0, 132.0, 84.0, 49.0, 44.0, 22.0, 10.0, 14.0, 12.0, 12.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044083595275878906, -0.0004246048629283905, -0.00040837377309799194, -0.0003921426832675934, -0.0003759115934371948, -0.00035968050360679626, -0.0003434494137763977, -0.00032721832394599915, -0.0003109872341156006, -0.000294756144285202, -0.00027852505445480347, -0.0002622939646244049, -0.00024606287479400635, -0.0002298317849636078, -0.00021360069513320923, -0.00019736960530281067, -0.0001811385154724121, -0.00016490742564201355, -0.000148676335811615, -0.00013244524598121643, -0.00011621415615081787, -9.998306632041931e-05, -8.375197649002075e-05, -6.752088665962219e-05, -5.128979682922363e-05, -3.505870699882507e-05, -1.8827617168426514e-05, -2.596527338027954e-06, 1.3634562492370605e-05, 2.9865652322769165e-05, 4.6096742153167725e-05, 6.232783198356628e-05, 7.855892181396484e-05, 9.47900116443634e-05, 0.00011102110147476196, 0.00012725219130516052, 0.00014348328113555908, 0.00015971437096595764, 0.0001759454607963562, 0.00019217655062675476, 0.00020840764045715332, 0.00022463873028755188, 0.00024086982011795044, 0.000257100909948349, 0.00027333199977874756, 0.0002895630896091461, 0.0003057941794395447, 0.00032202526926994324, 0.0003382563591003418, 0.00035448744893074036, 0.0003707185387611389, 0.0003869496285915375, 0.00040318071842193604, 0.0004194118082523346, 0.00043564289808273315, 0.0004518739879131317, 0.0004681050777435303, 0.00048433616757392883, 0.0005005672574043274, 0.000516798347234726, 0.0005330294370651245, 0.0005492605268955231, 0.0005654916167259216, 0.0005817227065563202, 0.0005979537963867188]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 12.0, 14.0, 18.0, 36.0, 33.0, 43.0, 75.0, 106.0, 182.0, 126.0, 88.0, 53.0, 61.0, 23.0, 21.0, 21.0, 18.0, 7.0, 11.0, 4.0, 9.0, 4.0, 3.0, 6.0, 2.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.0010057721519842744, -0.0009769252501428127, -0.0009480783483013511, -0.0009192314464598894, -0.0008903844864107668, -0.0008615375845693052, -0.0008326906827278435, -0.0008038437808863819, -0.0007749968208372593, -0.0007461499189957976, -0.000717303017154336, -0.0006884561153128743, -0.0006596091552637517, -0.0006307622534222901, -0.0006019153515808284, -0.0005730684497393668, -0.0005442215478979051, -0.0005153746460564435, -0.00048652771511115134, -0.0004576808132696897, -0.00042883388232439756, -0.0003999869804829359, -0.00037114007864147425, -0.0003422931768000126, -0.0003134462458547205, -0.0002845993440132588, -0.0002557524130679667, -0.00022690551122650504, -0.00019805859483312815, -0.00016921167843975127, -0.0001403647765982896, -0.00011151786020491272, -8.267088560387492e-05, -5.382397284847684e-05, -2.4977060093078762e-05, 3.86984902434051e-06, 3.27167654177174e-05, 6.156368181109428e-05, 9.041058365255594e-05, 0.00011925750004593283, 0.00014810441643930972, 0.0001769513328326866, 0.0002057982492260635, 0.00023464515106752515, 0.0002634920529089868, 0.0002923389838542789, 0.0003211858856957406, 0.0003500328166410327, 0.00037887971848249435, 0.000407726620323956, 0.00043657355126924813, 0.0004654204531107098, 0.0004942673840560019, 0.0005231142858974636, 0.0005519611877389252, 0.0005808080895803869, 0.0006096550496295094, 0.0006385019514709711, 0.0006673488533124328, 0.0006961957551538944, 0.000725042715203017, 0.0007538896170444787, 0.0007827365188859403, 0.000811583420727402, 0.0008404303225688636]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 3.0, 4.0, 5.0, 7.0, 12.0, 15.0, 13.0, 16.0, 13.0, 14.0, 21.0, 23.0, 36.0, 29.0, 32.0, 39.0, 35.0, 44.0, 40.0, 32.0, 38.0, 43.0, 50.0, 41.0, 34.0, 32.0, 36.0, 38.0, 37.0, 32.0, 27.0, 17.0, 21.0, 14.0, 15.0, 10.0, 15.0, 12.0, 5.0, 7.0, 10.0, 7.0, 5.0, 8.0, 3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00044068077113479376, -0.0004252153157722205, -0.0004097498895134777, -0.0003942844341509044, -0.00037881897878833115, -0.0003633535234257579, -0.0003478880971670151, -0.0003324226418044418, -0.00031695718644186854, -0.0003014917310792953, -0.00028602630482055247, -0.0002705608494579792, -0.00025509539409540594, -0.0002396299532847479, -0.00022416451247408986, -0.0002086990571115166, -0.00019323363085277379, -0.00017776819004211575, -0.00016230273467954248, -0.00014683729386888444, -0.00013137183850631118, -0.00011590639769565314, -0.0001004409568849951, -8.497550879837945e-05, -6.95100607117638e-05, -5.404461262514815e-05, -3.85791681765113e-05, -2.3113723727874458e-05, -7.648275641258806e-06, 7.817172445356846e-06, 2.3282613256014884e-05, 3.8748061342630535e-05, 5.421350942924619e-05, 6.967895751586184e-05, 8.514440560247749e-05, 0.00010060984641313553, 0.00011607529449975118, 0.00013154074258636683, 0.00014700618339702487, 0.00016247163875959814, 0.00017793707957025617, 0.0001934025203809142, 0.00020886797574348748, 0.00022433341655414551, 0.00023979885736480355, 0.0002552643127273768, 0.0002707297680899501, 0.0002861951943486929, 0.00030166064971126616, 0.0003171261050738394, 0.00033259153133258224, 0.0003480569866951555, 0.00036352244205772877, 0.0003789878683164716, 0.00039445332367904484, 0.0004099187790416181, 0.0004253842053003609, 0.0004408496606629342, 0.000456315086921677, 0.00047178054228425026, 0.0004872459976468235, 0.0005027114530093968, 0.0005181768792681396, 0.0005336423055268824, 0.0005491077899932861]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 6.0, 15.0, 15.0, 11.0, 28.0, 27.0, 60.0, 61.0, 86.0, 146.0, 203.0, 258.0, 419.0, 628.0, 780.0, 1243.0, 1878.0, 2721.0, 4195.0, 6475.0, 9936.0, 15948.0, 25678.0, 43345.0, 76529.0, 154826.0, 337218.0, 165664.0, 81023.0, 45740.0, 26743.0, 16524.0, 10319.0, 6498.0, 4394.0, 2888.0, 1885.0, 1271.0, 898.0, 604.0, 435.0, 279.0, 199.0, 143.0, 99.0, 74.0, 41.0, 35.0, 15.0, 20.0, 12.0, 9.0, 6.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0006322860717773438, -0.0006128549575805664, -0.0005934238433837891, -0.0005739927291870117, -0.0005545616149902344, -0.000535130500793457, -0.0005156993865966797, -0.0004962682723999023, -0.000476837158203125, -0.00045740604400634766, -0.0004379749298095703, -0.00041854381561279297, -0.0003991127014160156, -0.0003796815872192383, -0.00036025047302246094, -0.0003408193588256836, -0.00032138824462890625, -0.0003019571304321289, -0.00028252601623535156, -0.0002630949020385742, -0.00024366378784179688, -0.00022423267364501953, -0.0002048015594482422, -0.00018537044525146484, -0.0001659393310546875, -0.00014650821685791016, -0.0001270771026611328, -0.00010764598846435547, -8.821487426757812e-05, -6.878376007080078e-05, -4.935264587402344e-05, -2.9921531677246094e-05, -1.049041748046875e-05, 8.940696716308594e-06, 2.8371810913085938e-05, 4.780292510986328e-05, 6.723403930664062e-05, 8.666515350341797e-05, 0.00010609626770019531, 0.00012552738189697266, 0.00014495849609375, 0.00016438961029052734, 0.0001838207244873047, 0.00020325183868408203, 0.00022268295288085938, 0.00024211406707763672, 0.00026154518127441406, 0.0002809762954711914, 0.00030040740966796875, 0.0003198385238647461, 0.00033926963806152344, 0.0003587007522583008, 0.0003781318664550781, 0.00039756298065185547, 0.0004169940948486328, 0.00043642520904541016, 0.0004558563232421875, 0.00047528743743896484, 0.0004947185516357422, 0.0005141496658325195, 0.0005335807800292969, 0.0005530118942260742, 0.0005724430084228516, 0.0005918741226196289, 0.0006113052368164062]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 7.0, 7.0, 4.0, 4.0, 13.0, 12.0, 12.0, 16.0, 21.0, 26.0, 22.0, 26.0, 33.0, 39.0, 36.0, 38.0, 37.0, 42.0, 48.0, 39.0, 56.0, 57.0, 44.0, 43.0, 35.0, 39.0, 34.0, 37.0, 22.0, 24.0, 22.0, 18.0, 16.0, 13.0, 16.0, 9.0, 7.0, 5.0, 8.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0005502700805664062, -0.0005327016115188599, -0.0005151331424713135, -0.0004975646734237671, -0.0004799962043762207, -0.0004624277353286743, -0.00044485926628112793, -0.00042729079723358154, -0.00040972232818603516, -0.00039215385913848877, -0.0003745853900909424, -0.000357016921043396, -0.0003394484519958496, -0.0003218799829483032, -0.00030431151390075684, -0.00028674304485321045, -0.00026917457580566406, -0.0002516061067581177, -0.0002340376377105713, -0.0002164691686630249, -0.00019890069961547852, -0.00018133223056793213, -0.00016376376152038574, -0.00014619529247283936, -0.00012862682342529297, -0.00011105835437774658, -9.34898853302002e-05, -7.592141628265381e-05, -5.835294723510742e-05, -4.0784478187561035e-05, -2.321600914001465e-05, -5.647540092468262e-06, 1.1920928955078125e-05, 2.9489398002624512e-05, 4.70578670501709e-05, 6.462633609771729e-05, 8.219480514526367e-05, 9.976327419281006e-05, 0.00011733174324035645, 0.00013490021228790283, 0.00015246868133544922, 0.0001700371503829956, 0.000187605619430542, 0.00020517408847808838, 0.00022274255752563477, 0.00024031102657318115, 0.00025787949562072754, 0.0002754479646682739, 0.0002930164337158203, 0.0003105849027633667, 0.0003281533718109131, 0.00034572184085845947, 0.00036329030990600586, 0.00038085877895355225, 0.00039842724800109863, 0.000415995717048645, 0.0004335641860961914, 0.0004511326551437378, 0.0004687011241912842, 0.00048626959323883057, 0.000503838062286377, 0.0005214065313339233, 0.0005389750003814697, 0.0005565434694290161, 0.0005741119384765625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 5.0, 5.0, 7.0, 10.0, 15.0, 16.0, 34.0, 36.0, 42.0, 88.0, 104.0, 180.0, 233.0, 297.0, 474.0, 688.0, 996.0, 1353.0, 2157.0, 3109.0, 4642.0, 7390.0, 11472.0, 19181.0, 33373.0, 68082.0, 190481.0, 455814.0, 124739.0, 51703.0, 27248.0, 15945.0, 9743.0, 6127.0, 4107.0, 2710.0, 1860.0, 1291.0, 833.0, 591.0, 411.0, 291.0, 201.0, 142.0, 93.0, 73.0, 53.0, 43.0, 24.0, 17.0, 16.0, 7.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0006084442138671875, -0.0005890205502510071, -0.0005695968866348267, -0.0005501732230186462, -0.0005307495594024658, -0.0005113258957862854, -0.000491902232170105, -0.00047247856855392456, -0.00045305490493774414, -0.0004336312413215637, -0.0004142075777053833, -0.0003947839140892029, -0.00037536025047302246, -0.00035593658685684204, -0.0003365129232406616, -0.0003170892596244812, -0.0002976655960083008, -0.00027824193239212036, -0.00025881826877593994, -0.00023939460515975952, -0.0002199709415435791, -0.00020054727792739868, -0.00018112361431121826, -0.00016169995069503784, -0.00014227628707885742, -0.000122852623462677, -0.00010342895984649658, -8.400529623031616e-05, -6.458163261413574e-05, -4.515796899795532e-05, -2.5734305381774902e-05, -6.310641765594482e-06, 1.3113021850585938e-05, 3.253668546676636e-05, 5.196034908294678e-05, 7.13840126991272e-05, 9.080767631530762e-05, 0.00011023133993148804, 0.00012965500354766846, 0.00014907866716384888, 0.0001685023307800293, 0.00018792599439620972, 0.00020734965801239014, 0.00022677332162857056, 0.000246196985244751, 0.0002656206488609314, 0.0002850443124771118, 0.00030446797609329224, 0.00032389163970947266, 0.0003433153033256531, 0.0003627389669418335, 0.0003821626305580139, 0.00040158629417419434, 0.00042100995779037476, 0.0004404336214065552, 0.0004598572850227356, 0.000479280948638916, 0.0004987046122550964, 0.0005181282758712769, 0.0005375519394874573, 0.0005569756031036377, 0.0005763992667198181, 0.0005958229303359985, 0.000615246593952179, 0.0006346702575683594]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 8.0, 12.0, 13.0, 12.0, 13.0, 19.0, 28.0, 29.0, 19.0, 28.0, 32.0, 34.0, 31.0, 36.0, 45.0, 45.0, 44.0, 45.0, 41.0, 38.0, 49.0, 36.0, 35.0, 33.0, 36.0, 36.0, 37.0, 23.0, 21.0, 17.0, 19.0, 10.0, 15.0, 8.0, 13.0, 5.0, 11.0, 8.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003466606140136719, -0.00033549964427948, -0.0003243386745452881, -0.0003131777048110962, -0.0003020167350769043, -0.0002908557653427124, -0.0002796947956085205, -0.0002685338258743286, -0.0002573728561401367, -0.0002462118864059448, -0.00023505091667175293, -0.00022388994693756104, -0.00021272897720336914, -0.00020156800746917725, -0.00019040703773498535, -0.00017924606800079346, -0.00016808509826660156, -0.00015692412853240967, -0.00014576315879821777, -0.00013460218906402588, -0.00012344121932983398, -0.00011228024959564209, -0.0001011192798614502, -8.99583101272583e-05, -7.87973403930664e-05, -6.763637065887451e-05, -5.647540092468262e-05, -4.531443119049072e-05, -3.415346145629883e-05, -2.2992491722106934e-05, -1.1831521987915039e-05, -6.705522537231445e-07, 1.049041748046875e-05, 2.1651387214660645e-05, 3.281235694885254e-05, 4.3973326683044434e-05, 5.513429641723633e-05, 6.629526615142822e-05, 7.745623588562012e-05, 8.861720561981201e-05, 9.97781753540039e-05, 0.0001109391450881958, 0.0001221001148223877, 0.0001332610845565796, 0.00014442205429077148, 0.00015558302402496338, 0.00016674399375915527, 0.00017790496349334717, 0.00018906593322753906, 0.00020022690296173096, 0.00021138787269592285, 0.00022254884243011475, 0.00023370981216430664, 0.00024487078189849854, 0.00025603175163269043, 0.0002671927213668823, 0.0002783536911010742, 0.0002895146608352661, 0.000300675630569458, 0.0003118366003036499, 0.0003229975700378418, 0.0003341585397720337, 0.0003453195095062256, 0.0003564804792404175, 0.0003676414489746094]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 6.0, 12.0, 15.0, 12.0, 17.0, 20.0, 38.0, 47.0, 62.0, 77.0, 125.0, 157.0, 198.0, 278.0, 415.0, 534.0, 809.0, 1238.0, 1846.0, 2955.0, 5007.0, 9526.0, 20580.0, 63670.0, 659106.0, 209346.0, 38661.0, 14852.0, 7397.0, 4040.0, 2480.0, 1512.0, 1045.0, 677.0, 482.0, 371.0, 256.0, 171.0, 135.0, 85.0, 82.0, 59.0, 39.0, 31.0, 21.0, 11.0, 11.0, 11.0, 7.0, 8.0, 4.0, 7.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.00015723705291748047, -0.0001522935926914215, -0.00014735013246536255, -0.0001424066722393036, -0.00013746321201324463, -0.00013251975178718567, -0.0001275762915611267, -0.00012263283133506775, -0.00011768937110900879, -0.00011274591088294983, -0.00010780245065689087, -0.00010285899043083191, -9.791553020477295e-05, -9.297206997871399e-05, -8.802860975265503e-05, -8.308514952659607e-05, -7.814168930053711e-05, -7.319822907447815e-05, -6.825476884841919e-05, -6.331130862236023e-05, -5.836784839630127e-05, -5.342438817024231e-05, -4.848092794418335e-05, -4.353746771812439e-05, -3.859400749206543e-05, -3.365054726600647e-05, -2.870708703994751e-05, -2.376362681388855e-05, -1.882016658782959e-05, -1.387670636177063e-05, -8.93324613571167e-06, -3.98978590965271e-06, 9.5367431640625e-07, 5.89713454246521e-06, 1.084059476852417e-05, 1.578405499458313e-05, 2.072751522064209e-05, 2.567097544670105e-05, 3.061443567276001e-05, 3.555789589881897e-05, 4.050135612487793e-05, 4.544481635093689e-05, 5.038827657699585e-05, 5.533173680305481e-05, 6.027519702911377e-05, 6.521865725517273e-05, 7.016211748123169e-05, 7.510557770729065e-05, 8.004903793334961e-05, 8.499249815940857e-05, 8.993595838546753e-05, 9.487941861152649e-05, 9.982287883758545e-05, 0.00010476633906364441, 0.00010970979928970337, 0.00011465325951576233, 0.00011959671974182129, 0.00012454017996788025, 0.0001294836401939392, 0.00013442710041999817, 0.00013937056064605713, 0.0001443140208721161, 0.00014925748109817505, 0.000154200941324234, 0.00015914440155029297]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 0.0, 7.0, 8.0, 15.0, 20.0, 11.0, 28.0, 32.0, 50.0, 30.0, 68.0, 70.0, 93.0, 95.0, 50.0, 92.0, 50.0, 55.0, 48.0, 15.0, 34.0, 22.0, 20.0, 10.0, 15.0, 11.0, 4.0, 8.0, 2.0, 1.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.7550926208496094e-06, -3.648921847343445e-06, -3.5427510738372803e-06, -3.4365803003311157e-06, -3.330409526824951e-06, -3.2242387533187866e-06, -3.118067979812622e-06, -3.0118972063064575e-06, -2.905726432800293e-06, -2.7995556592941284e-06, -2.693384885787964e-06, -2.5872141122817993e-06, -2.4810433387756348e-06, -2.3748725652694702e-06, -2.2687017917633057e-06, -2.162531018257141e-06, -2.0563602447509766e-06, -1.950189471244812e-06, -1.8440186977386475e-06, -1.737847924232483e-06, -1.6316771507263184e-06, -1.5255063772201538e-06, -1.4193356037139893e-06, -1.3131648302078247e-06, -1.2069940567016602e-06, -1.1008232831954956e-06, -9.94652509689331e-07, -8.884817361831665e-07, -7.82310962677002e-07, -6.761401891708374e-07, -5.699694156646729e-07, -4.637986421585083e-07, -3.5762786865234375e-07, -2.514570951461792e-07, -1.4528632164001465e-07, -3.91155481338501e-08, 6.705522537231445e-08, 1.73225998878479e-07, 2.7939677238464355e-07, 3.855675458908081e-07, 4.917383193969727e-07, 5.979090929031372e-07, 7.040798664093018e-07, 8.102506399154663e-07, 9.164214134216309e-07, 1.0225921869277954e-06, 1.12876296043396e-06, 1.2349337339401245e-06, 1.341104507446289e-06, 1.4472752809524536e-06, 1.5534460544586182e-06, 1.6596168279647827e-06, 1.7657876014709473e-06, 1.8719583749771118e-06, 1.9781291484832764e-06, 2.084299921989441e-06, 2.1904706954956055e-06, 2.29664146900177e-06, 2.4028122425079346e-06, 2.508983016014099e-06, 2.6151537895202637e-06, 2.7213245630264282e-06, 2.8274953365325928e-06, 2.9336661100387573e-06, 3.039836883544922e-06]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 10.0, 11.0, 8.0, 26.0, 21.0, 53.0, 83.0, 139.0, 290.0, 595.0, 1324.0, 3107.0, 8455.0, 28255.0, 245549.0, 698545.0, 43384.0, 11405.0, 4063.0, 1676.0, 773.0, 360.0, 187.0, 102.0, 55.0, 17.0, 20.0, 17.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003502368927001953, -0.00033966824412345886, -0.0003290995955467224, -0.00031853094696998596, -0.0003079622983932495, -0.00029739364981651306, -0.0002868250012397766, -0.00027625635266304016, -0.0002656877040863037, -0.00025511905550956726, -0.0002445504069328308, -0.00023398175835609436, -0.0002234131097793579, -0.00021284446120262146, -0.000202275812625885, -0.00019170716404914856, -0.0001811385154724121, -0.00017056986689567566, -0.0001600012183189392, -0.00014943256974220276, -0.0001388639211654663, -0.00012829527258872986, -0.00011772662401199341, -0.00010715797543525696, -9.658932685852051e-05, -8.602067828178406e-05, -7.545202970504761e-05, -6.488338112831116e-05, -5.431473255157471e-05, -4.374608397483826e-05, -3.317743539810181e-05, -2.2608786821365356e-05, -1.2040138244628906e-05, -1.471489667892456e-06, 9.097158908843994e-06, 1.9665807485580444e-05, 3.0234456062316895e-05, 4.0803104639053345e-05, 5.1371753215789795e-05, 6.194040179252625e-05, 7.25090503692627e-05, 8.307769894599915e-05, 9.36463475227356e-05, 0.00010421499609947205, 0.0001147836446762085, 0.00012535229325294495, 0.0001359209418296814, 0.00014648959040641785, 0.0001570582389831543, 0.00016762688755989075, 0.0001781955361366272, 0.00018876418471336365, 0.0001993328332901001, 0.00020990148186683655, 0.000220470130443573, 0.00023103877902030945, 0.0002416074275970459, 0.00025217607617378235, 0.0002627447247505188, 0.00027331337332725525, 0.0002838820219039917, 0.00029445067048072815, 0.0003050193190574646, 0.00031558796763420105, 0.0003261566162109375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 5.0, 4.0, 5.0, 3.0, 4.0, 6.0, 10.0, 10.0, 15.0, 15.0, 30.0, 35.0, 55.0, 94.0, 147.0, 191.0, 138.0, 66.0, 36.0, 25.0, 24.0, 16.0, 11.0, 7.0, 8.0, 11.0, 6.0, 6.0, 6.0, 6.0, 5.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.976987838745117e-05, -4.817545413970947e-05, -4.6581029891967773e-05, -4.4986605644226074e-05, -4.3392181396484375e-05, -4.1797757148742676e-05, -4.0203332901000977e-05, -3.860890865325928e-05, -3.701448440551758e-05, -3.542006015777588e-05, -3.382563591003418e-05, -3.223121166229248e-05, -3.063678741455078e-05, -2.9042363166809082e-05, -2.7447938919067383e-05, -2.5853514671325684e-05, -2.4259090423583984e-05, -2.2664666175842285e-05, -2.1070241928100586e-05, -1.9475817680358887e-05, -1.7881393432617188e-05, -1.6286969184875488e-05, -1.4692544937133789e-05, -1.309812068939209e-05, -1.150369644165039e-05, -9.909272193908691e-06, -8.314847946166992e-06, -6.720423698425293e-06, -5.125999450683594e-06, -3.5315752029418945e-06, -1.9371509552001953e-06, -3.427267074584961e-07, 1.2516975402832031e-06, 2.8461217880249023e-06, 4.4405460357666016e-06, 6.034970283508301e-06, 7.62939453125e-06, 9.2238187789917e-06, 1.0818243026733398e-05, 1.2412667274475098e-05, 1.4007091522216797e-05, 1.5601515769958496e-05, 1.7195940017700195e-05, 1.8790364265441895e-05, 2.0384788513183594e-05, 2.1979212760925293e-05, 2.3573637008666992e-05, 2.516806125640869e-05, 2.676248550415039e-05, 2.835690975189209e-05, 2.995133399963379e-05, 3.154575824737549e-05, 3.314018249511719e-05, 3.473460674285889e-05, 3.6329030990600586e-05, 3.7923455238342285e-05, 3.9517879486083984e-05, 4.1112303733825684e-05, 4.270672798156738e-05, 4.430115222930908e-05, 4.589557647705078e-05, 4.749000072479248e-05, 4.908442497253418e-05, 5.067884922027588e-05, 5.227327346801758e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 4.0, 8.0, 7.0, 12.0, 8.0, 22.0, 23.0, 33.0, 37.0, 57.0, 69.0, 126.0, 161.0, 108.0, 85.0, 67.0, 39.0, 29.0, 22.0, 21.0, 8.0, 10.0, 9.0, 7.0, 7.0, 10.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0009279638179577887, -0.0009019734570756555, -0.0008759830961935222, -0.000849992735311389, -0.0008240023744292557, -0.0007980120135471225, -0.0007720216526649892, -0.000746031291782856, -0.0007200409309007227, -0.0006940505700185895, -0.0006680602091364563, -0.000642069848254323, -0.0006160794873721898, -0.0005900891264900565, -0.0005640987656079233, -0.00053810840472579, -0.0005121180438436568, -0.00048612768296152353, -0.0004601373220793903, -0.00043414696119725704, -0.0004081566003151238, -0.00038216623943299055, -0.0003561758785508573, -0.00033018551766872406, -0.0003041951567865908, -0.00027820479590445757, -0.0002522144350223243, -0.00022622407414019108, -0.00020023371325805783, -0.0001742433523759246, -0.00014825299149379134, -0.0001222626306116581, -9.627221152186394e-05, -7.028185063973069e-05, -4.4291489757597446e-05, -1.83011288754642e-05, 7.689232006669044e-06, 3.367959288880229e-05, 5.9669953770935535e-05, 8.566031465306878e-05, 0.00011165067553520203, 0.00013764103641733527, 0.00016363139729946852, 0.00018962175818160176, 0.000215612119063735, 0.00024160247994586825, 0.0002675928408280015, 0.00029358320171013474, 0.000319573562592268, 0.00034556392347440124, 0.0003715542843565345, 0.0003975446452386677, 0.00042353500612080097, 0.0004495253670029342, 0.00047551572788506746, 0.0005015060887672007, 0.000527496449649334, 0.0005534868105314672, 0.0005794771714136004, 0.0006054675322957337, 0.0006314578931778669, 0.0006574482540600002, 0.0006834386149421334, 0.0007094289758242667, 0.0007354193367063999]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 3.0, 3.0, 8.0, 10.0, 11.0, 18.0, 13.0, 9.0, 18.0, 25.0, 16.0, 29.0, 29.0, 39.0, 33.0, 42.0, 38.0, 47.0, 34.0, 37.0, 36.0, 51.0, 41.0, 39.0, 27.0, 40.0, 40.0, 34.0, 38.0, 23.0, 21.0, 22.0, 17.0, 13.0, 9.0, 17.0, 8.0, 8.0, 11.0, 8.0, 6.0, 6.0, 8.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00041409741970710456, -0.0003997076128143817, -0.00038531783502548933, -0.0003709280281327665, -0.00035653822124004364, -0.00034214844345115125, -0.0003277586365584284, -0.000313368858769536, -0.0002989790518768132, -0.00028458924498409033, -0.00027019946719519794, -0.0002558096603024751, -0.00024141986796166748, -0.00022703007562085986, -0.00021264026872813702, -0.0001982504763873294, -0.00018386068404652178, -0.00016947089170571417, -0.00015508109936490655, -0.0001406912924721837, -0.0001263015001313761, -0.00011191170779056847, -9.752190817380324e-05, -8.313210855703801e-05, -6.874231621623039e-05, -5.435252023744397e-05, -3.9962724258657545e-05, -2.557292827987112e-05, -1.1183132301084697e-05, 3.2066600397229195e-06, 1.759645965648815e-05, 3.198625927325338e-05, 4.637602251023054e-05, 6.0765818489016965e-05, 7.515561446780339e-05, 8.954541408456862e-05, 0.00010393520642537624, 0.00011832499876618385, 0.0001327148056589067, 0.00014710459799971431, 0.00016149439034052193, 0.00017588418268132955, 0.00019027397502213717, 0.00020466378191486, 0.00021905357425566763, 0.00023344336659647524, 0.0002478331734891981, 0.0002622229512780905, 0.0002766127581708133, 0.00029100256506353617, 0.00030539234285242856, 0.0003197821497451514, 0.0003341719275340438, 0.00034856173442676663, 0.0003629515413194895, 0.0003773413482122123, 0.0003917311260011047, 0.00040612093289382756, 0.00042051071068271995, 0.0004349005175754428, 0.00044929032446816564, 0.000463680102257058, 0.00047806990914978087, 0.0004924596869386733, 0.0005068494938313961]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 4.0, 4.0, 6.0, 24.0, 25.0, 39.0, 47.0, 78.0, 130.0, 165.0, 271.0, 372.0, 622.0, 893.0, 1322.0, 2035.0, 3068.0, 4726.0, 7318.0, 12140.0, 20251.0, 36327.0, 67646.0, 137922.0, 339275.0, 208491.0, 90454.0, 47392.0, 26390.0, 15216.0, 9391.0, 5734.0, 3588.0, 2417.0, 1570.0, 1057.0, 668.0, 494.0, 314.0, 197.0, 154.0, 94.0, 71.0, 52.0, 35.0, 17.0, 19.0, 11.0, 9.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0010433197021484375, -0.0010093599557876587, -0.0009754002094268799, -0.0009414404630661011, -0.0009074807167053223, -0.0008735209703445435, -0.0008395612239837646, -0.0008056014776229858, -0.000771641731262207, -0.0007376819849014282, -0.0007037222385406494, -0.0006697624921798706, -0.0006358027458190918, -0.000601842999458313, -0.0005678832530975342, -0.0005339235067367554, -0.0004999637603759766, -0.00046600401401519775, -0.00043204426765441895, -0.00039808452129364014, -0.00036412477493286133, -0.0003301650285720825, -0.0002962052822113037, -0.0002622455358505249, -0.0002282857894897461, -0.00019432604312896729, -0.00016036629676818848, -0.00012640655040740967, -9.244680404663086e-05, -5.848705768585205e-05, -2.4527311325073242e-05, 9.432435035705566e-06, 4.3392181396484375e-05, 7.735192775726318e-05, 0.00011131167411804199, 0.0001452714204788208, 0.0001792311668395996, 0.00021319091320037842, 0.0002471506595611572, 0.00028111040592193604, 0.00031507015228271484, 0.00034902989864349365, 0.00038298964500427246, 0.00041694939136505127, 0.0004509091377258301, 0.0004848688840866089, 0.0005188286304473877, 0.0005527883768081665, 0.0005867481231689453, 0.0006207078695297241, 0.0006546676158905029, 0.0006886273622512817, 0.0007225871086120605, 0.0007565468549728394, 0.0007905066013336182, 0.000824466347694397, 0.0008584260940551758, 0.0008923858404159546, 0.0009263455867767334, 0.0009603053331375122, 0.000994265079498291, 0.0010282248258590698, 0.0010621845722198486, 0.0010961443185806274, 0.0011301040649414062]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 7.0, 11.0, 11.0, 10.0, 11.0, 19.0, 20.0, 18.0, 31.0, 26.0, 26.0, 51.0, 43.0, 49.0, 40.0, 46.0, 50.0, 45.0, 50.0, 53.0, 34.0, 34.0, 48.0, 45.0, 51.0, 25.0, 28.0, 13.0, 18.0, 18.0, 9.0, 12.0, 5.0, 9.0, 9.0, 1.0, 5.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002663135528564453, -0.00025705620646476746, -0.0002477988600730896, -0.00023854151368141174, -0.0002292841672897339, -0.00022002682089805603, -0.00021076947450637817, -0.00020151212811470032, -0.00019225478172302246, -0.0001829974353313446, -0.00017374008893966675, -0.0001644827425479889, -0.00015522539615631104, -0.00014596804976463318, -0.00013671070337295532, -0.00012745335698127747, -0.00011819601058959961, -0.00010893866419792175, -9.96813178062439e-05, -9.042397141456604e-05, -8.116662502288818e-05, -7.190927863121033e-05, -6.265193223953247e-05, -5.3394585847854614e-05, -4.413723945617676e-05, -3.48798930644989e-05, -2.5622546672821045e-05, -1.636520028114319e-05, -7.107853889465332e-06, 2.1494925022125244e-06, 1.1406838893890381e-05, 2.0664185285568237e-05, 2.9921531677246094e-05, 3.917887806892395e-05, 4.843622446060181e-05, 5.769357085227966e-05, 6.695091724395752e-05, 7.620826363563538e-05, 8.546561002731323e-05, 9.472295641899109e-05, 0.00010398030281066895, 0.0001132376492023468, 0.00012249499559402466, 0.00013175234198570251, 0.00014100968837738037, 0.00015026703476905823, 0.00015952438116073608, 0.00016878172755241394, 0.0001780390739440918, 0.00018729642033576965, 0.0001965537667274475, 0.00020581111311912537, 0.00021506845951080322, 0.00022432580590248108, 0.00023358315229415894, 0.0002428404986858368, 0.00025209784507751465, 0.0002613551914691925, 0.00027061253786087036, 0.0002798698842525482, 0.0002891272306442261, 0.00029838457703590393, 0.0003076419234275818, 0.00031689926981925964, 0.0003261566162109375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 6.0, 7.0, 11.0, 9.0, 19.0, 21.0, 35.0, 58.0, 103.0, 206.0, 378.0, 681.0, 1313.0, 2529.0, 4632.0, 9206.0, 18444.0, 39719.0, 93979.0, 293789.0, 379690.0, 113982.0, 46471.0, 21337.0, 10548.0, 5348.0, 2806.0, 1454.0, 770.0, 421.0, 228.0, 120.0, 72.0, 48.0, 24.0, 18.0, 16.0, 13.0, 7.0, 3.0, 8.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0011348724365234375, -0.0010983794927597046, -0.0010618865489959717, -0.0010253936052322388, -0.0009889006614685059, -0.000952407717704773, -0.00091591477394104, -0.0008794218301773071, -0.0008429288864135742, -0.0008064359426498413, -0.0007699429988861084, -0.0007334500551223755, -0.0006969571113586426, -0.0006604641675949097, -0.0006239712238311768, -0.0005874782800674438, -0.0005509853363037109, -0.000514492392539978, -0.0004779994487762451, -0.0004415065050125122, -0.0004050135612487793, -0.0003685206174850464, -0.0003320276737213135, -0.00029553472995758057, -0.00025904178619384766, -0.00022254884243011475, -0.00018605589866638184, -0.00014956295490264893, -0.00011307001113891602, -7.65770673751831e-05, -4.0084123611450195e-05, -3.591179847717285e-06, 3.2901763916015625e-05, 6.939470767974854e-05, 0.00010588765144348145, 0.00014238059520721436, 0.00017887353897094727, 0.00021536648273468018, 0.0002518594264984131, 0.000288352370262146, 0.0003248453140258789, 0.0003613382577896118, 0.0003978312015533447, 0.00043432414531707764, 0.00047081708908081055, 0.0005073100328445435, 0.0005438029766082764, 0.0005802959203720093, 0.0006167888641357422, 0.0006532818078994751, 0.000689774751663208, 0.0007262676954269409, 0.0007627606391906738, 0.0007992535829544067, 0.0008357465267181396, 0.0008722394704818726, 0.0009087324142456055, 0.0009452253580093384, 0.0009817183017730713, 0.0010182112455368042, 0.0010547041893005371, 0.00109119713306427, 0.001127690076828003, 0.0011641830205917358, 0.0012006759643554688]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 7.0, 5.0, 5.0, 6.0, 9.0, 12.0, 11.0, 13.0, 19.0, 16.0, 24.0, 15.0, 25.0, 18.0, 24.0, 29.0, 29.0, 33.0, 37.0, 52.0, 41.0, 33.0, 51.0, 37.0, 41.0, 44.0, 34.0, 43.0, 39.0, 47.0, 22.0, 35.0, 23.0, 13.0, 17.0, 18.0, 12.0, 10.0, 10.0, 6.0, 8.0, 8.0, 7.0, 8.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.00025010108947753906, -0.00024263933300971985, -0.00023517757654190063, -0.00022771582007408142, -0.0002202540636062622, -0.000212792307138443, -0.00020533055067062378, -0.00019786879420280457, -0.00019040703773498535, -0.00018294528126716614, -0.00017548352479934692, -0.0001680217683315277, -0.0001605600118637085, -0.00015309825539588928, -0.00014563649892807007, -0.00013817474246025085, -0.00013071298599243164, -0.00012325122952461243, -0.00011578947305679321, -0.000108327716588974, -0.00010086596012115479, -9.340420365333557e-05, -8.594244718551636e-05, -7.848069071769714e-05, -7.101893424987793e-05, -6.355717778205872e-05, -5.60954213142395e-05, -4.863366484642029e-05, -4.1171908378601074e-05, -3.371015191078186e-05, -2.6248395442962646e-05, -1.8786638975143433e-05, -1.1324882507324219e-05, -3.863126039505005e-06, 3.598630428314209e-06, 1.1060386896133423e-05, 1.8522143363952637e-05, 2.598389983177185e-05, 3.3445656299591064e-05, 4.090741276741028e-05, 4.836916923522949e-05, 5.5830925703048706e-05, 6.329268217086792e-05, 7.075443863868713e-05, 7.821619510650635e-05, 8.567795157432556e-05, 9.313970804214478e-05, 0.00010060146450996399, 0.0001080632209777832, 0.00011552497744560242, 0.00012298673391342163, 0.00013044849038124084, 0.00013791024684906006, 0.00014537200331687927, 0.00015283375978469849, 0.0001602955162525177, 0.00016775727272033691, 0.00017521902918815613, 0.00018268078565597534, 0.00019014254212379456, 0.00019760429859161377, 0.00020506605505943298, 0.0002125278115272522, 0.0002199895679950714, 0.00022745132446289062]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 8.0, 13.0, 10.0, 18.0, 25.0, 29.0, 49.0, 72.0, 99.0, 188.0, 265.0, 437.0, 836.0, 1538.0, 3217.0, 7835.0, 29118.0, 346026.0, 610452.0, 32196.0, 8807.0, 3515.0, 1551.0, 926.0, 481.0, 298.0, 175.0, 116.0, 74.0, 48.0, 37.0, 19.0, 26.0, 7.0, 11.0, 8.0, 7.0, 4.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.9233436584472656e-05, -4.759524017572403e-05, -4.59570437669754e-05, -4.4318847358226776e-05, -4.268065094947815e-05, -4.104245454072952e-05, -3.9404258131980896e-05, -3.776606172323227e-05, -3.612786531448364e-05, -3.4489668905735016e-05, -3.285147249698639e-05, -3.121327608823776e-05, -2.9575079679489136e-05, -2.793688327074051e-05, -2.6298686861991882e-05, -2.4660490453243256e-05, -2.302229404449463e-05, -2.1384097635746002e-05, -1.9745901226997375e-05, -1.810770481824875e-05, -1.6469508409500122e-05, -1.4831312000751495e-05, -1.3193115592002869e-05, -1.1554919183254242e-05, -9.916722774505615e-06, -8.278526365756989e-06, -6.640329957008362e-06, -5.002133548259735e-06, -3.3639371395111084e-06, -1.7257407307624817e-06, -8.754432201385498e-08, 1.5506520867347717e-06, 3.1888484954833984e-06, 4.827044904232025e-06, 6.465241312980652e-06, 8.103437721729279e-06, 9.741634130477905e-06, 1.1379830539226532e-05, 1.3018026947975159e-05, 1.4656223356723785e-05, 1.6294419765472412e-05, 1.793261617422104e-05, 1.9570812582969666e-05, 2.1209008991718292e-05, 2.284720540046692e-05, 2.4485401809215546e-05, 2.6123598217964172e-05, 2.77617946267128e-05, 2.9399991035461426e-05, 3.103818744421005e-05, 3.267638385295868e-05, 3.4314580261707306e-05, 3.595277667045593e-05, 3.759097307920456e-05, 3.9229169487953186e-05, 4.086736589670181e-05, 4.250556230545044e-05, 4.4143758714199066e-05, 4.578195512294769e-05, 4.742015153169632e-05, 4.9058347940444946e-05, 5.069654434919357e-05, 5.23347407579422e-05, 5.3972937166690826e-05, 5.561113357543945e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 7.0, 5.0, 0.0, 3.0, 8.0, 11.0, 18.0, 25.0, 0.0, 21.0, 35.0, 41.0, 51.0, 84.0, 0.0, 130.0, 154.0, 137.0, 65.0, 59.0, 35.0, 0.0, 37.0, 21.0, 12.0, 11.0, 13.0, 0.0, 6.0, 9.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6689300537109375e-06, -1.6186386346817017e-06, -1.5683472156524658e-06, -1.51805579662323e-06, -1.4677643775939941e-06, -1.4174729585647583e-06, -1.3671815395355225e-06, -1.3168901205062866e-06, -1.2665987014770508e-06, -1.216307282447815e-06, -1.166015863418579e-06, -1.1157244443893433e-06, -1.0654330253601074e-06, -1.0151416063308716e-06, -9.648501873016357e-07, -9.145587682723999e-07, -8.642673492431641e-07, -8.139759302139282e-07, -7.636845111846924e-07, -7.133930921554565e-07, -6.631016731262207e-07, -6.128102540969849e-07, -5.62518835067749e-07, -5.122274160385132e-07, -4.6193599700927734e-07, -4.116445779800415e-07, -3.6135315895080566e-07, -3.110617399215698e-07, -2.60770320892334e-07, -2.1047890186309814e-07, -1.601874828338623e-07, -1.0989606380462646e-07, -5.960464477539063e-08, -9.313225746154785e-09, 4.0978193283081055e-08, 9.12696123123169e-08, 1.4156103134155273e-07, 1.9185245037078857e-07, 2.421438694000244e-07, 2.9243528842926025e-07, 3.427267074584961e-07, 3.9301812648773193e-07, 4.4330954551696777e-07, 4.936009645462036e-07, 5.438923835754395e-07, 5.941838026046753e-07, 6.444752216339111e-07, 6.94766640663147e-07, 7.450580596923828e-07, 7.953494787216187e-07, 8.456408977508545e-07, 8.959323167800903e-07, 9.462237358093262e-07, 9.96515154838562e-07, 1.0468065738677979e-06, 1.0970979928970337e-06, 1.1473894119262695e-06, 1.1976808309555054e-06, 1.2479722499847412e-06, 1.298263669013977e-06, 1.3485550880432129e-06, 1.3988465070724487e-06, 1.4491379261016846e-06, 1.4994293451309204e-06, 1.5497207641601562e-06]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 7.0, 7.0, 17.0, 15.0, 24.0, 25.0, 54.0, 87.0, 133.0, 256.0, 440.0, 885.0, 1761.0, 3756.0, 8777.0, 19216.0, 62381.0, 484357.0, 377000.0, 56207.0, 18853.0, 7579.0, 3417.0, 1519.0, 728.0, 415.0, 235.0, 161.0, 92.0, 51.0, 38.0, 20.0, 17.0, 10.0, 9.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.300739288330078e-05, -2.223905175924301e-05, -2.1470710635185242e-05, -2.0702369511127472e-05, -1.9934028387069702e-05, -1.9165687263011932e-05, -1.8397346138954163e-05, -1.7629005014896393e-05, -1.6860663890838623e-05, -1.6092322766780853e-05, -1.5323981642723083e-05, -1.4555640518665314e-05, -1.3787299394607544e-05, -1.3018958270549774e-05, -1.2250617146492004e-05, -1.1482276022434235e-05, -1.0713934898376465e-05, -9.945593774318695e-06, -9.177252650260925e-06, -8.408911526203156e-06, -7.640570402145386e-06, -6.872229278087616e-06, -6.103888154029846e-06, -5.335547029972076e-06, -4.567205905914307e-06, -3.798864781856537e-06, -3.030523657798767e-06, -2.2621825337409973e-06, -1.4938414096832275e-06, -7.255002856254578e-07, 4.284083843231201e-08, 8.111819624900818e-07, 1.5795230865478516e-06, 2.3478642106056213e-06, 3.116205334663391e-06, 3.884546458721161e-06, 4.652887582778931e-06, 5.4212287068367004e-06, 6.18956983089447e-06, 6.95791095495224e-06, 7.72625207901001e-06, 8.49459320306778e-06, 9.26293432712555e-06, 1.0031275451183319e-05, 1.0799616575241089e-05, 1.1567957699298859e-05, 1.2336298823356628e-05, 1.3104639947414398e-05, 1.3872981071472168e-05, 1.4641322195529938e-05, 1.5409663319587708e-05, 1.6178004443645477e-05, 1.6946345567703247e-05, 1.7714686691761017e-05, 1.8483027815818787e-05, 1.9251368939876556e-05, 2.0019710063934326e-05, 2.0788051187992096e-05, 2.1556392312049866e-05, 2.2324733436107635e-05, 2.3093074560165405e-05, 2.3861415684223175e-05, 2.4629756808280945e-05, 2.5398097932338715e-05, 2.6166439056396484e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 10.0, 10.0, 12.0, 11.0, 13.0, 23.0, 15.0, 17.0, 19.0, 42.0, 32.0, 79.0, 92.0, 70.0, 124.0, 109.0, 46.0, 59.0, 56.0, 23.0, 26.0, 22.0, 14.0, 13.0, 15.0, 7.0, 8.0, 5.0, 6.0, 5.0, 0.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.424022674560547e-06, -5.2647665143013e-06, -5.105510354042053e-06, -4.946254193782806e-06, -4.7869980335235596e-06, -4.627741873264313e-06, -4.468485713005066e-06, -4.309229552745819e-06, -4.149973392486572e-06, -3.9907172322273254e-06, -3.831461071968079e-06, -3.6722049117088318e-06, -3.512948751449585e-06, -3.353692591190338e-06, -3.1944364309310913e-06, -3.0351802706718445e-06, -2.8759241104125977e-06, -2.716667950153351e-06, -2.557411789894104e-06, -2.398155629634857e-06, -2.2388994693756104e-06, -2.0796433091163635e-06, -1.9203871488571167e-06, -1.7611309885978699e-06, -1.601874828338623e-06, -1.4426186680793762e-06, -1.2833625078201294e-06, -1.1241063475608826e-06, -9.648501873016357e-07, -8.055940270423889e-07, -6.463378667831421e-07, -4.870817065238953e-07, -3.2782554626464844e-07, -1.685693860054016e-07, -9.313225746154785e-09, 1.4994293451309204e-07, 3.0919909477233887e-07, 4.684552550315857e-07, 6.277114152908325e-07, 7.869675755500793e-07, 9.462237358093262e-07, 1.105479896068573e-06, 1.2647360563278198e-06, 1.4239922165870667e-06, 1.5832483768463135e-06, 1.7425045371055603e-06, 1.9017606973648071e-06, 2.061016857624054e-06, 2.2202730178833008e-06, 2.3795291781425476e-06, 2.5387853384017944e-06, 2.6980414986610413e-06, 2.857297658920288e-06, 3.016553819179535e-06, 3.1758099794387817e-06, 3.3350661396980286e-06, 3.4943222999572754e-06, 3.6535784602165222e-06, 3.812834620475769e-06, 3.972090780735016e-06, 4.131346940994263e-06, 4.2906031012535095e-06, 4.449859261512756e-06, 4.609115421772003e-06, 4.76837158203125e-06]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 3.0, 8.0, 7.0, 6.0, 7.0, 8.0, 20.0, 21.0, 21.0, 17.0, 24.0, 39.0, 50.0, 71.0, 92.0, 123.0, 101.0, 86.0, 67.0, 47.0, 24.0, 25.0, 21.0, 13.0, 17.0, 10.0, 10.0, 7.0, 8.0, 8.0, 4.0, 8.0, 4.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004280159482732415, -0.0004136843199376017, -0.00039935269160196185, -0.00038502103416249156, -0.0003706894058268517, -0.0003563577774912119, -0.00034202614915557206, -0.0003276945208199322, -0.00031336286338046193, -0.0002990312350448221, -0.00028469960670918226, -0.00027036794926971197, -0.00025603632093407214, -0.0002417046925984323, -0.00022737306426279247, -0.0002130414213752374, -0.00019870979303959757, -0.00018437816470395774, -0.00017004652181640267, -0.00015571489348076284, -0.00014138325059320778, -0.00012705162225756794, -0.0001127199866459705, -9.838835103437304e-05, -8.40567154227756e-05, -6.972507981117815e-05, -5.53934441995807e-05, -4.106181222596206e-05, -2.673017661436461e-05, -1.2398544640745968e-05, 1.933090970851481e-06, 1.626472658244893e-05, 3.059636219404638e-05, 4.492799780564383e-05, 5.9259633417241275e-05, 7.359126175288111e-05, 8.792290464043617e-05, 0.00010225453297607601, 0.00011658616858767346, 0.0001309178041992709, 0.00014524944708682597, 0.0001595810754224658, 0.00017391271831002086, 0.0001882443466456607, 0.00020257598953321576, 0.0002169076178688556, 0.00023123924620449543, 0.0002455709036439657, 0.0002599025028757751, 0.00027423413121141493, 0.00028856575954705477, 0.00030289741698652506, 0.0003172290453221649, 0.00033156067365780473, 0.00034589230199344456, 0.0003602239303290844, 0.0003745555877685547, 0.0003888872161041945, 0.00040321884443983436, 0.00041755050187930465, 0.0004318821302149445, 0.0004462137585505843, 0.00046054538688622415, 0.000474877015221864, 0.0004892086726613343]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 7.0, 4.0, 13.0, 8.0, 8.0, 12.0, 13.0, 25.0, 16.0, 19.0, 21.0, 26.0, 40.0, 33.0, 34.0, 32.0, 48.0, 47.0, 46.0, 37.0, 36.0, 34.0, 54.0, 55.0, 42.0, 38.0, 32.0, 32.0, 20.0, 25.0, 21.0, 31.0, 13.0, 18.0, 9.0, 12.0, 15.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00033587354118935764, -0.0003245063708163798, -0.0003131392295472324, -0.00030177205917425454, -0.0002904048888012767, -0.0002790377475321293, -0.00026767057715915143, -0.0002563034067861736, -0.0002449362655170262, -0.00023356910969596356, -0.0002222019393229857, -0.00021083478350192308, -0.00019946761312894523, -0.0001881004573078826, -0.00017673330148681998, -0.00016536613111384213, -0.00015399896074086428, -0.00014263180491980165, -0.0001312646345468238, -0.00011989747872576118, -0.00010853031562874094, -9.71631525317207e-05, -8.579599671065807e-05, -7.442883361363783e-05, -6.30616705166176e-05, -5.169450741959736e-05, -4.0327347960555926e-05, -2.8960188501514494e-05, -1.7593025404494256e-05, -6.225862307474017e-06, 5.141293513588607e-06, 1.6508456610608846e-05, 2.787564881145954e-05, 3.924281190847978e-05, 5.060997136752121e-05, 6.197713082656264e-05, 7.334429392358288e-05, 8.471145702060312e-05, 9.607861284166574e-05, 0.00010744577593868598, 0.00011881293903570622, 0.00013018009485676885, 0.0001415472652297467, 0.00015291442105080932, 0.00016428157687187195, 0.0001756487472448498, 0.00018701590306591243, 0.00019838305888697505, 0.0002097502292599529, 0.00022111738508101553, 0.00023248455545399338, 0.000243851711275056, 0.00025521888164803386, 0.00026658602291718125, 0.0002779531932901591, 0.00028932036366313696, 0.00030068750493228436, 0.0003120546753052622, 0.0003234218165744096, 0.00033478898694738746, 0.0003461561573203653, 0.00035752332769334316, 0.00036889046896249056, 0.0003802576393354684, 0.00039162480970844626]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 7.0, 7.0, 14.0, 12.0, 17.0, 27.0, 41.0, 47.0, 43.0, 95.0, 131.0, 186.0, 285.0, 547.0, 895.0, 1609.0, 3236.0, 8460.0, 3048795.0, 1114302.0, 8352.0, 3273.0, 1621.0, 851.0, 485.0, 304.0, 185.0, 120.0, 85.0, 72.0, 45.0, 24.0, 24.0, 20.0, 20.0, 10.0, 10.0, 7.0, 1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00205230712890625, -0.0019789934158325195, -0.001905679702758789, -0.0018323659896850586, -0.0017590522766113281, -0.0016857385635375977, -0.0016124248504638672, -0.0015391111373901367, -0.0014657974243164062, -0.0013924837112426758, -0.0013191699981689453, -0.0012458562850952148, -0.0011725425720214844, -0.001099228858947754, -0.0010259151458740234, -0.000952601432800293, -0.0008792877197265625, -0.000805974006652832, -0.0007326602935791016, -0.0006593465805053711, -0.0005860328674316406, -0.0005127191543579102, -0.0004394054412841797, -0.0003660917282104492, -0.00029277801513671875, -0.00021946430206298828, -0.0001461505889892578, -7.283687591552734e-05, 4.76837158203125e-07, 7.37905502319336e-05, 0.00014710426330566406, 0.00022041797637939453, 0.000293731689453125, 0.00036704540252685547, 0.00044035911560058594, 0.0005136728286743164, 0.0005869865417480469, 0.0006603002548217773, 0.0007336139678955078, 0.0008069276809692383, 0.0008802413940429688, 0.0009535551071166992, 0.0010268688201904297, 0.0011001825332641602, 0.0011734962463378906, 0.001246809959411621, 0.0013201236724853516, 0.001393437385559082, 0.0014667510986328125, 0.001540064811706543, 0.0016133785247802734, 0.001686692237854004, 0.0017600059509277344, 0.0018333196640014648, 0.0019066333770751953, 0.0019799470901489258, 0.0020532608032226562, 0.0021265745162963867, 0.002199888229370117, 0.0022732019424438477, 0.002346515655517578, 0.0024198293685913086, 0.002493143081665039, 0.0025664567947387695, 0.0026397705078125]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 6.0, 3.0, 10.0, 5.0, 15.0, 19.0, 22.0, 17.0, 10.0, 21.0, 33.0, 30.0, 27.0, 35.0, 37.0, 58.0, 42.0, 49.0, 62.0, 45.0, 48.0, 53.0, 41.0, 41.0, 40.0, 33.0, 24.0, 26.0, 19.0, 29.0, 21.0, 13.0, 12.0, 13.0, 10.0, 8.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020015239715576172, -0.00019299425184726715, -0.00018583610653877258, -0.00017867796123027802, -0.00017151981592178345, -0.00016436167061328888, -0.0001572035253047943, -0.00015004537999629974, -0.00014288723468780518, -0.0001357290893793106, -0.00012857094407081604, -0.00012141279876232147, -0.0001142546534538269, -0.00010709650814533234, -9.993836283683777e-05, -9.27802175283432e-05, -8.562207221984863e-05, -7.846392691135406e-05, -7.13057816028595e-05, -6.414763629436493e-05, -5.698949098587036e-05, -4.9831345677375793e-05, -4.2673200368881226e-05, -3.551505506038666e-05, -2.835690975189209e-05, -2.1198764443397522e-05, -1.4040619134902954e-05, -6.882473826408386e-06, 2.7567148208618164e-07, 7.4338167905807495e-06, 1.4591962099075317e-05, 2.1750107407569885e-05, 2.8908252716064453e-05, 3.606639802455902e-05, 4.322454333305359e-05, 5.038268864154816e-05, 5.7540833950042725e-05, 6.469897925853729e-05, 7.185712456703186e-05, 7.901526987552643e-05, 8.6173415184021e-05, 9.333156049251556e-05, 0.00010048970580101013, 0.0001076478511095047, 0.00011480599641799927, 0.00012196414172649384, 0.0001291222870349884, 0.00013628043234348297, 0.00014343857765197754, 0.0001505967229604721, 0.00015775486826896667, 0.00016491301357746124, 0.0001720711588859558, 0.00017922930419445038, 0.00018638744950294495, 0.00019354559481143951, 0.00020070374011993408, 0.00020786188542842865, 0.00021502003073692322, 0.00022217817604541779, 0.00022933632135391235, 0.00023649446666240692, 0.0002436526119709015, 0.00025081075727939606, 0.0002579689025878906]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 5.0, 14.0, 13.0, 17.0, 33.0, 48.0, 107.0, 204.0, 532.0, 1566.0, 5017.0, 21729.0, 4032663.0, 117252.0, 10608.0, 2867.0, 937.0, 356.0, 167.0, 70.0, 33.0, 14.0, 11.0, 11.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001758575439453125, -0.0016928911209106445, -0.001627206802368164, -0.0015615224838256836, -0.0014958381652832031, -0.0014301538467407227, -0.0013644695281982422, -0.0012987852096557617, -0.0012331008911132812, -0.0011674165725708008, -0.0011017322540283203, -0.0010360479354858398, -0.0009703636169433594, -0.0009046792984008789, -0.0008389949798583984, -0.000773310661315918, -0.0007076263427734375, -0.000641942024230957, -0.0005762577056884766, -0.0005105733871459961, -0.0004448890686035156, -0.00037920475006103516, -0.0003135204315185547, -0.0002478361129760742, -0.00018215179443359375, -0.00011646747589111328, -5.078315734863281e-05, 1.4901161193847656e-05, 8.058547973632812e-05, 0.0001462697982788086, 0.00021195411682128906, 0.00027763843536376953, 0.00034332275390625, 0.00040900707244873047, 0.00047469139099121094, 0.0005403757095336914, 0.0006060600280761719, 0.0006717443466186523, 0.0007374286651611328, 0.0008031129837036133, 0.0008687973022460938, 0.0009344816207885742, 0.0010001659393310547, 0.0010658502578735352, 0.0011315345764160156, 0.001197218894958496, 0.0012629032135009766, 0.001328587532043457, 0.0013942718505859375, 0.001459956169128418, 0.0015256404876708984, 0.001591324806213379, 0.0016570091247558594, 0.0017226934432983398, 0.0017883777618408203, 0.0018540620803833008, 0.0019197463989257812, 0.0019854307174682617, 0.002051115036010742, 0.0021167993545532227, 0.002182483673095703, 0.0022481679916381836, 0.002313852310180664, 0.0023795366287231445, 0.002445220947265625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 6.0, 6.0, 4.0, 4.0, 3.0, 10.0, 12.0, 19.0, 48.0, 133.0, 588.0, 2687.0, 338.0, 102.0, 33.0, 16.0, 8.0, 9.0, 7.0, 12.0, 3.0, 5.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002684593200683594, -0.0002612695097923279, -0.0002540796995162964, -0.0002468898892402649, -0.0002397000789642334, -0.0002325102686882019, -0.0002253204584121704, -0.00021813064813613892, -0.00021094083786010742, -0.00020375102758407593, -0.00019656121730804443, -0.00018937140703201294, -0.00018218159675598145, -0.00017499178647994995, -0.00016780197620391846, -0.00016061216592788696, -0.00015342235565185547, -0.00014623254537582397, -0.00013904273509979248, -0.00013185292482376099, -0.0001246631145477295, -0.000117473304271698, -0.0001102834939956665, -0.00010309368371963501, -9.590387344360352e-05, -8.871406316757202e-05, -8.152425289154053e-05, -7.433444261550903e-05, -6.714463233947754e-05, -5.9954822063446045e-05, -5.276501178741455e-05, -4.557520151138306e-05, -3.838539123535156e-05, -3.119558095932007e-05, -2.4005770683288574e-05, -1.681596040725708e-05, -9.626150131225586e-06, -2.436339855194092e-06, 4.753470420837402e-06, 1.1943280696868896e-05, 1.913309097290039e-05, 2.6322901248931885e-05, 3.351271152496338e-05, 4.070252180099487e-05, 4.789233207702637e-05, 5.508214235305786e-05, 6.227195262908936e-05, 6.946176290512085e-05, 7.665157318115234e-05, 8.384138345718384e-05, 9.103119373321533e-05, 9.822100400924683e-05, 0.00010541081428527832, 0.00011260062456130981, 0.00011979043483734131, 0.0001269802451133728, 0.0001341700553894043, 0.0001413598656654358, 0.00014854967594146729, 0.00015573948621749878, 0.00016292929649353027, 0.00017011910676956177, 0.00017730891704559326, 0.00018449872732162476, 0.00019168853759765625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 12.0, 9.0, 17.0, 26.0, 30.0, 27.0, 56.0, 78.0, 123.0, 187.0, 116.0, 96.0, 47.0, 38.0, 32.0, 22.0, 17.0, 19.0, 7.0, 5.0, 7.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000441015261458233, -0.0004278901033103466, -0.00041476491605862975, -0.00040163975791074336, -0.00038851459976285696, -0.0003753894125111401, -0.0003622642543632537, -0.0003491390962153673, -0.00033601390896365047, -0.00032288875081576407, -0.0003097635635640472, -0.0002966384054161608, -0.0002835132472682744, -0.00027038808912038803, -0.0002572629018686712, -0.00024413774372078478, -0.0002310125855728984, -0.00021788741287309676, -0.00020476225472521037, -0.00019163708202540874, -0.00017851192387752235, -0.00016538675117772073, -0.0001522615784779191, -0.0001391364203300327, -0.00012601124763023108, -0.00011288608220638707, -9.976091678254306e-05, -8.663574408274144e-05, -7.351057865889743e-05, -6.038541323505342e-05, -4.7260240535251796e-05, -3.4135075111407787e-05, -2.100988058373332e-05, -7.884713340899907e-06, 5.240453901933506e-06, 1.8365622963756323e-05, 3.149078838760033e-05, 4.461595381144434e-05, 5.7741126511245966e-05, 7.086629193508998e-05, 8.399145735893399e-05, 9.7116622782778e-05, 0.000110241788206622, 0.00012336696090642363, 0.00013649213360622525, 0.00014961729175411165, 0.00016274246445391327, 0.0001758676371537149, 0.0001889927953016013, 0.00020211796800140291, 0.0002152431261492893, 0.00022836829884909093, 0.00024149345699697733, 0.0002546186442486942, 0.0002677438023965806, 0.00028086896054446697, 0.0002939941477961838, 0.0003071193059440702, 0.00032024449319578707, 0.00033336965134367347, 0.00034649480949155986, 0.00035961996763944626, 0.0003727451548911631, 0.0003858703130390495, 0.0003989954711869359]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 4.0, 6.0, 4.0, 5.0, 8.0, 13.0, 16.0, 13.0, 10.0, 26.0, 17.0, 23.0, 27.0, 35.0, 30.0, 42.0, 32.0, 24.0, 38.0, 47.0, 31.0, 42.0, 35.0, 40.0, 37.0, 31.0, 41.0, 29.0, 45.0, 30.0, 31.0, 19.0, 22.0, 21.0, 19.0, 18.0, 13.0, 22.0, 12.0, 10.0, 5.0, 10.0, 1.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.00021696966723538935, -0.00021043699234724045, -0.00020390431745909154, -0.00019737164257094264, -0.0001908389531308785, -0.0001843062782427296, -0.0001777736033545807, -0.0001712409284664318, -0.00016470823902636766, -0.00015817556413821876, -0.00015164288925006986, -0.00014511021436192095, -0.00013857752492185682, -0.00013204485003370792, -0.000125512175145559, -0.00011897950025741011, -0.0001124468253692612, -0.0001059141504811123, -9.938146831700578e-05, -9.284879342885688e-05, -8.631611126475036e-05, -7.978343637660146e-05, -7.325076148845255e-05, -6.671808660030365e-05, -6.018540443619713e-05, -5.365272591006942e-05, -4.712004738394171e-05, -4.0587372495792806e-05, -3.4054693969665095e-05, -2.7522015443537384e-05, -2.098934055538848e-05, -1.445666202926077e-05, -7.923998055048287e-06, -1.3913204384152777e-06, 5.141357178217731e-06, 1.1674033885356039e-05, 1.820671241148375e-05, 2.473939093761146e-05, 3.1272065825760365e-05, 3.7804744351888075e-05, 4.4337422878015786e-05, 5.08701014041435e-05, 5.740277993027121e-05, 6.393545481842011e-05, 7.046812970656902e-05, 7.700081187067553e-05, 8.353348675882444e-05, 9.006616892293096e-05, 9.659884381107986e-05, 0.00010313151869922876, 0.00010966420086333528, 0.00011619687575148419, 0.0001227295579155907, 0.0001292622328037396, 0.0001357949076918885, 0.00014232758258003742, 0.00014886027202010155, 0.00015539294690825045, 0.00016192562179639935, 0.00016845829668454826, 0.0001749909861246124, 0.0001815236610127613, 0.0001880563359009102, 0.0001945890107890591, 0.000201121685677208]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 7.0, 14.0, 12.0, 15.0, 24.0, 22.0, 38.0, 42.0, 75.0, 92.0, 168.0, 248.0, 337.0, 501.0, 709.0, 981.0, 1601.0, 2372.0, 3845.0, 5924.0, 9425.0, 15284.0, 25396.0, 41983.0, 75906.0, 151310.0, 343495.0, 170314.0, 81973.0, 45500.0, 26819.0, 15983.0, 9869.0, 6444.0, 4128.0, 2638.0, 1611.0, 1073.0, 747.0, 460.0, 365.0, 250.0, 169.0, 117.0, 81.0, 57.0, 34.0, 27.0, 16.0, 19.0, 14.0, 7.0, 4.0, 8.0, 4.0, 3.0, 1.0, 3.0], "bins": [-0.00027489662170410156, -0.00026645511388778687, -0.00025801360607147217, -0.00024957209825515747, -0.00024113059043884277, -0.00023268908262252808, -0.00022424757480621338, -0.00021580606698989868, -0.00020736455917358398, -0.0001989230513572693, -0.0001904815435409546, -0.0001820400357246399, -0.0001735985279083252, -0.0001651570200920105, -0.0001567155122756958, -0.0001482740044593811, -0.0001398324966430664, -0.0001313909888267517, -0.000122949481010437, -0.00011450797319412231, -0.00010606646537780762, -9.762495756149292e-05, -8.918344974517822e-05, -8.074194192886353e-05, -7.230043411254883e-05, -6.385892629623413e-05, -5.5417418479919434e-05, -4.6975910663604736e-05, -3.853440284729004e-05, -3.0092895030975342e-05, -2.1651387214660645e-05, -1.3209879398345947e-05, -4.76837158203125e-06, 3.6731362342834473e-06, 1.2114644050598145e-05, 2.0556151866912842e-05, 2.899765968322754e-05, 3.7439167499542236e-05, 4.5880675315856934e-05, 5.432218313217163e-05, 6.276369094848633e-05, 7.120519876480103e-05, 7.964670658111572e-05, 8.808821439743042e-05, 9.652972221374512e-05, 0.00010497123003005981, 0.00011341273784637451, 0.00012185424566268921, 0.0001302957534790039, 0.0001387372612953186, 0.0001471787691116333, 0.000155620276927948, 0.0001640617847442627, 0.0001725032925605774, 0.0001809448003768921, 0.0001893863081932068, 0.00019782781600952148, 0.00020626932382583618, 0.00021471083164215088, 0.00022315233945846558, 0.00023159384727478027, 0.00024003535509109497, 0.00024847686290740967, 0.00025691837072372437, 0.00026535987854003906]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 10.0, 7.0, 8.0, 15.0, 15.0, 20.0, 16.0, 18.0, 22.0, 35.0, 27.0, 41.0, 37.0, 35.0, 36.0, 39.0, 44.0, 43.0, 40.0, 39.0, 42.0, 46.0, 35.0, 32.0, 43.0, 27.0, 30.0, 19.0, 24.0, 19.0, 20.0, 14.0, 16.0, 11.0, 23.0, 11.0, 9.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00022220611572265625, -0.0002153683453798294, -0.00020853057503700256, -0.00020169280469417572, -0.00019485503435134888, -0.00018801726400852203, -0.0001811794936656952, -0.00017434172332286835, -0.0001675039529800415, -0.00016066618263721466, -0.00015382841229438782, -0.00014699064195156097, -0.00014015287160873413, -0.0001333151012659073, -0.00012647733092308044, -0.0001196395605802536, -0.00011280179023742676, -0.00010596401989459991, -9.912624955177307e-05, -9.228847920894623e-05, -8.545070886611938e-05, -7.861293852329254e-05, -7.17751681804657e-05, -6.493739783763885e-05, -5.809962749481201e-05, -5.126185715198517e-05, -4.4424086809158325e-05, -3.758631646633148e-05, -3.074854612350464e-05, -2.3910775780677795e-05, -1.7073005437850952e-05, -1.0235235095024109e-05, -3.3974647521972656e-06, 3.4403055906295776e-06, 1.0278075933456421e-05, 1.7115846276283264e-05, 2.3953616619110107e-05, 3.079138696193695e-05, 3.7629157304763794e-05, 4.446692764759064e-05, 5.130469799041748e-05, 5.8142468333244324e-05, 6.498023867607117e-05, 7.181800901889801e-05, 7.865577936172485e-05, 8.54935497045517e-05, 9.233132004737854e-05, 9.916909039020538e-05, 0.00010600686073303223, 0.00011284463107585907, 0.00011968240141868591, 0.00012652017176151276, 0.0001333579421043396, 0.00014019571244716644, 0.00014703348278999329, 0.00015387125313282013, 0.00016070902347564697, 0.00016754679381847382, 0.00017438456416130066, 0.0001812223345041275, 0.00018806010484695435, 0.0001948978751897812, 0.00020173564553260803, 0.00020857341587543488, 0.00021541118621826172]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 8.0, 11.0, 20.0, 20.0, 23.0, 36.0, 69.0, 81.0, 125.0, 176.0, 262.0, 413.0, 610.0, 890.0, 1282.0, 2051.0, 2973.0, 4681.0, 7472.0, 12467.0, 22345.0, 43711.0, 106204.0, 481028.0, 218355.0, 68302.0, 31096.0, 16989.0, 9830.0, 5893.0, 3764.0, 2419.0, 1662.0, 1037.0, 743.0, 493.0, 334.0, 218.0, 150.0, 98.0, 69.0, 53.0, 24.0, 19.0, 22.0, 9.0, 7.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0003082752227783203, -0.000298570841550827, -0.00028886646032333374, -0.00027916207909584045, -0.00026945769786834717, -0.0002597533166408539, -0.0002500489354133606, -0.0002403445541858673, -0.00023064017295837402, -0.00022093579173088074, -0.00021123141050338745, -0.00020152702927589417, -0.00019182264804840088, -0.0001821182668209076, -0.0001724138855934143, -0.00016270950436592102, -0.00015300512313842773, -0.00014330074191093445, -0.00013359636068344116, -0.00012389197945594788, -0.00011418759822845459, -0.0001044832170009613, -9.477883577346802e-05, -8.507445454597473e-05, -7.537007331848145e-05, -6.566569209098816e-05, -5.596131086349487e-05, -4.625692963600159e-05, -3.65525484085083e-05, -2.6848167181015015e-05, -1.714378595352173e-05, -7.439404726028442e-06, 2.2649765014648438e-06, 1.196935772895813e-05, 2.1673738956451416e-05, 3.13781201839447e-05, 4.108250141143799e-05, 5.0786882638931274e-05, 6.049126386642456e-05, 7.019564509391785e-05, 7.990002632141113e-05, 8.960440754890442e-05, 9.93087887763977e-05, 0.00010901317000389099, 0.00011871755123138428, 0.00012842193245887756, 0.00013812631368637085, 0.00014783069491386414, 0.00015753507614135742, 0.0001672394573688507, 0.000176943838596344, 0.00018664821982383728, 0.00019635260105133057, 0.00020605698227882385, 0.00021576136350631714, 0.00022546574473381042, 0.0002351701259613037, 0.000244874507188797, 0.0002545788884162903, 0.00026428326964378357, 0.00027398765087127686, 0.00028369203209877014, 0.00029339641332626343, 0.0003031007945537567, 0.00031280517578125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 5.0, 8.0, 11.0, 11.0, 14.0, 12.0, 14.0, 9.0, 23.0, 24.0, 25.0, 35.0, 41.0, 41.0, 41.0, 41.0, 35.0, 36.0, 49.0, 44.0, 44.0, 48.0, 38.0, 30.0, 28.0, 40.0, 28.0, 28.0, 30.0, 21.0, 21.0, 11.0, 22.0, 11.0, 11.0, 9.0, 15.0, 13.0, 6.0, 5.0, 6.0, 3.0, 8.0, 1.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001417398452758789, -0.00013731233775615692, -0.00013288483023643494, -0.00012845732271671295, -0.00012402981519699097, -0.00011960230767726898, -0.000115174800157547, -0.00011074729263782501, -0.00010631978511810303, -0.00010189227759838104, -9.746477007865906e-05, -9.303726255893707e-05, -8.860975503921509e-05, -8.41822475194931e-05, -7.975473999977112e-05, -7.532723248004913e-05, -7.089972496032715e-05, -6.647221744060516e-05, -6.204470992088318e-05, -5.7617202401161194e-05, -5.318969488143921e-05, -4.8762187361717224e-05, -4.433467984199524e-05, -3.9907172322273254e-05, -3.547966480255127e-05, -3.1052157282829285e-05, -2.66246497631073e-05, -2.2197142243385315e-05, -1.776963472366333e-05, -1.3342127203941345e-05, -8.91461968421936e-06, -4.4871121644973755e-06, -5.960464477539063e-08, 4.367902874946594e-06, 8.795410394668579e-06, 1.3222917914390564e-05, 1.765042543411255e-05, 2.2077932953834534e-05, 2.650544047355652e-05, 3.0932947993278503e-05, 3.536045551300049e-05, 3.978796303272247e-05, 4.421547055244446e-05, 4.864297807216644e-05, 5.307048559188843e-05, 5.749799311161041e-05, 6.19255006313324e-05, 6.635300815105438e-05, 7.078051567077637e-05, 7.520802319049835e-05, 7.963553071022034e-05, 8.406303822994232e-05, 8.84905457496643e-05, 9.291805326938629e-05, 9.734556078910828e-05, 0.00010177306830883026, 0.00010620057582855225, 0.00011062808334827423, 0.00011505559086799622, 0.0001194830983877182, 0.00012391060590744019, 0.00012833811342716217, 0.00013276562094688416, 0.00013719312846660614, 0.00014162063598632812]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 8.0, 8.0, 8.0, 15.0, 19.0, 21.0, 27.0, 51.0, 65.0, 102.0, 135.0, 168.0, 296.0, 430.0, 683.0, 1125.0, 1924.0, 3866.0, 8487.0, 28379.0, 422230.0, 533599.0, 29012.0, 8627.0, 3901.0, 2045.0, 1189.0, 742.0, 472.0, 276.0, 192.0, 125.0, 110.0, 48.0, 52.0, 38.0, 23.0, 16.0, 12.0, 11.0, 5.0, 10.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.219480514526367e-05, -7.954426109790802e-05, -7.689371705055237e-05, -7.424317300319672e-05, -7.159262895584106e-05, -6.894208490848541e-05, -6.629154086112976e-05, -6.364099681377411e-05, -6.099045276641846e-05, -5.8339908719062805e-05, -5.568936467170715e-05, -5.30388206243515e-05, -5.038827657699585e-05, -4.77377325296402e-05, -4.5087188482284546e-05, -4.2436644434928894e-05, -3.978610038757324e-05, -3.713555634021759e-05, -3.448501229286194e-05, -3.183446824550629e-05, -2.9183924198150635e-05, -2.6533380150794983e-05, -2.388283610343933e-05, -2.123229205608368e-05, -1.8581748008728027e-05, -1.5931203961372375e-05, -1.3280659914016724e-05, -1.0630115866661072e-05, -7.97957181930542e-06, -5.329027771949768e-06, -2.678483724594116e-06, -2.7939677238464355e-08, 2.6226043701171875e-06, 5.273148417472839e-06, 7.923692464828491e-06, 1.0574236512184143e-05, 1.3224780559539795e-05, 1.5875324606895447e-05, 1.85258686542511e-05, 2.117641270160675e-05, 2.3826956748962402e-05, 2.6477500796318054e-05, 2.9128044843673706e-05, 3.177858889102936e-05, 3.442913293838501e-05, 3.707967698574066e-05, 3.9730221033096313e-05, 4.2380765080451965e-05, 4.503130912780762e-05, 4.768185317516327e-05, 5.033239722251892e-05, 5.298294126987457e-05, 5.5633485317230225e-05, 5.8284029364585876e-05, 6.093457341194153e-05, 6.358511745929718e-05, 6.623566150665283e-05, 6.888620555400848e-05, 7.153674960136414e-05, 7.418729364871979e-05, 7.683783769607544e-05, 7.948838174343109e-05, 8.213892579078674e-05, 8.47894698381424e-05, 8.744001388549805e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 6.0, 6.0, 3.0, 7.0, 21.0, 15.0, 19.0, 12.0, 32.0, 20.0, 34.0, 41.0, 53.0, 51.0, 62.0, 61.0, 69.0, 69.0, 61.0, 40.0, 88.0, 36.0, 35.0, 22.0, 21.0, 28.0, 20.0, 14.0, 8.0, 9.0, 7.0, 5.0, 1.0, 8.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7881393432617188e-06, -1.7248094081878662e-06, -1.6614794731140137e-06, -1.5981495380401611e-06, -1.5348196029663086e-06, -1.471489667892456e-06, -1.4081597328186035e-06, -1.344829797744751e-06, -1.2814998626708984e-06, -1.218169927597046e-06, -1.1548399925231934e-06, -1.0915100574493408e-06, -1.0281801223754883e-06, -9.648501873016357e-07, -9.015202522277832e-07, -8.381903171539307e-07, -7.748603820800781e-07, -7.115304470062256e-07, -6.48200511932373e-07, -5.848705768585205e-07, -5.21540641784668e-07, -4.5821070671081543e-07, -3.948807716369629e-07, -3.3155083656311035e-07, -2.682209014892578e-07, -2.0489096641540527e-07, -1.4156103134155273e-07, -7.82310962677002e-08, -1.4901161193847656e-08, 4.842877388000488e-08, 1.1175870895385742e-07, 1.7508864402770996e-07, 2.384185791015625e-07, 3.0174851417541504e-07, 3.650784492492676e-07, 4.284083843231201e-07, 4.917383193969727e-07, 5.550682544708252e-07, 6.183981895446777e-07, 6.817281246185303e-07, 7.450580596923828e-07, 8.083879947662354e-07, 8.717179298400879e-07, 9.350478649139404e-07, 9.98377799987793e-07, 1.0617077350616455e-06, 1.125037670135498e-06, 1.1883676052093506e-06, 1.2516975402832031e-06, 1.3150274753570557e-06, 1.3783574104309082e-06, 1.4416873455047607e-06, 1.5050172805786133e-06, 1.5683472156524658e-06, 1.6316771507263184e-06, 1.695007085800171e-06, 1.7583370208740234e-06, 1.821666955947876e-06, 1.8849968910217285e-06, 1.948326826095581e-06, 2.0116567611694336e-06, 2.074986696243286e-06, 2.1383166313171387e-06, 2.201646566390991e-06, 2.2649765014648438e-06]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 7.0, 8.0, 9.0, 17.0, 58.0, 145.0, 355.0, 903.0, 2303.0, 6705.0, 28837.0, 906713.0, 85666.0, 11087.0, 3532.0, 1302.0, 500.0, 218.0, 86.0, 34.0, 17.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00017642974853515625, -0.00017148815095424652, -0.0001665465533733368, -0.00016160495579242706, -0.00015666335821151733, -0.0001517217606306076, -0.00014678016304969788, -0.00014183856546878815, -0.00013689696788787842, -0.0001319553703069687, -0.00012701377272605896, -0.00012207217514514923, -0.0001171305775642395, -0.00011218897998332977, -0.00010724738240242004, -0.00010230578482151031, -9.736418724060059e-05, -9.242258965969086e-05, -8.748099207878113e-05, -8.25393944978714e-05, -7.759779691696167e-05, -7.265619933605194e-05, -6.771460175514221e-05, -6.277300417423248e-05, -5.7831406593322754e-05, -5.2889809012413025e-05, -4.7948211431503296e-05, -4.300661385059357e-05, -3.806501626968384e-05, -3.312341868877411e-05, -2.818182110786438e-05, -2.324022352695465e-05, -1.8298625946044922e-05, -1.3357028365135193e-05, -8.415430784225464e-06, -3.473833203315735e-06, 1.4677643775939941e-06, 6.409361958503723e-06, 1.1350959539413452e-05, 1.629255712032318e-05, 2.123415470123291e-05, 2.617575228214264e-05, 3.111734986305237e-05, 3.60589474439621e-05, 4.1000545024871826e-05, 4.5942142605781555e-05, 5.0883740186691284e-05, 5.582533776760101e-05, 6.076693534851074e-05, 6.570853292942047e-05, 7.06501305103302e-05, 7.559172809123993e-05, 8.053332567214966e-05, 8.547492325305939e-05, 9.041652083396912e-05, 9.535811841487885e-05, 0.00010029971599578857, 0.0001052413135766983, 0.00011018291115760803, 0.00011512450873851776, 0.00012006610631942749, 0.00012500770390033722, 0.00012994930148124695, 0.00013489089906215668, 0.0001398324966430664]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 2.0, 4.0, 6.0, 4.0, 5.0, 6.0, 13.0, 15.0, 24.0, 31.0, 41.0, 92.0, 158.0, 222.0, 133.0, 84.0, 37.0, 32.0, 15.0, 12.0, 7.0, 4.0, 6.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3887882232666016e-05, -1.3399869203567505e-05, -1.2911856174468994e-05, -1.2423843145370483e-05, -1.1935830116271973e-05, -1.1447817087173462e-05, -1.0959804058074951e-05, -1.047179102897644e-05, -9.98377799987793e-06, -9.495764970779419e-06, -9.007751941680908e-06, -8.519738912582397e-06, -8.031725883483887e-06, -7.543712854385376e-06, -7.055699825286865e-06, -6.5676867961883545e-06, -6.079673767089844e-06, -5.591660737991333e-06, -5.103647708892822e-06, -4.6156346797943115e-06, -4.127621650695801e-06, -3.63960862159729e-06, -3.1515955924987793e-06, -2.6635825634002686e-06, -2.175569534301758e-06, -1.687556505203247e-06, -1.1995434761047363e-06, -7.115304470062256e-07, -2.2351741790771484e-07, 2.644956111907959e-07, 7.525086402893066e-07, 1.2405216693878174e-06, 1.7285346984863281e-06, 2.216547727584839e-06, 2.7045607566833496e-06, 3.1925737857818604e-06, 3.680586814880371e-06, 4.168599843978882e-06, 4.656612873077393e-06, 5.144625902175903e-06, 5.632638931274414e-06, 6.120651960372925e-06, 6.6086649894714355e-06, 7.096678018569946e-06, 7.584691047668457e-06, 8.072704076766968e-06, 8.560717105865479e-06, 9.04873013496399e-06, 9.5367431640625e-06, 1.002475619316101e-05, 1.0512769222259521e-05, 1.1000782251358032e-05, 1.1488795280456543e-05, 1.1976808309555054e-05, 1.2464821338653564e-05, 1.2952834367752075e-05, 1.3440847396850586e-05, 1.3928860425949097e-05, 1.4416873455047607e-05, 1.4904886484146118e-05, 1.539289951324463e-05, 1.588091254234314e-05, 1.636892557144165e-05, 1.685693860054016e-05, 1.7344951629638672e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 2.0, 8.0, 10.0, 7.0, 13.0, 30.0, 26.0, 40.0, 51.0, 71.0, 138.0, 196.0, 107.0, 86.0, 54.0, 38.0, 29.0, 20.0, 22.0, 9.0, 6.0, 9.0, 2.0, 6.0, 1.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.00049090530956164, -0.00047848952817730606, -0.0004660737467929721, -0.00045365793630480766, -0.0004412421549204737, -0.0004288263735361397, -0.00041641059215180576, -0.0004039948107674718, -0.00039157900027930737, -0.0003791632188949734, -0.00036674743751063943, -0.000354331627022475, -0.00034191584563814104, -0.00032950006425380707, -0.0003170842828694731, -0.00030466850148513913, -0.00029225272010080516, -0.0002798369387164712, -0.0002674211573321372, -0.00025500537594780326, -0.00024258956545963883, -0.00023017378407530487, -0.0002177580026909709, -0.00020534222130663693, -0.00019292642537038773, -0.00018051064398605376, -0.00016809484804980457, -0.0001556790666654706, -0.00014326328528113663, -0.00013084748934488744, -0.00011843170796055347, -0.00010601591930026188, -9.36001306399703e-05, -8.118434197967872e-05, -6.876855331938714e-05, -5.635277193505317e-05, -4.393698327476159e-05, -3.1521194614470005e-05, -1.9105413230136037e-05, -6.6896245698444545e-06, 5.726164090447128e-06, 1.8141950931749307e-05, 3.0557737773051485e-05, 4.297352279536426e-05, 5.538931145565584e-05, 6.780510011594743e-05, 8.02208815002814e-05, 9.263667016057298e-05, 0.00010505245882086456, 0.00011746824748115614, 0.00012988403614144772, 0.0001422998175257817, 0.0001547156134620309, 0.00016713139484636486, 0.00017954717623069882, 0.0001919629576150328, 0.000204378753551282, 0.00021679453493561596, 0.00022921033087186515, 0.00024162611225619912, 0.0002540418936405331, 0.00026645767502486706, 0.0002788734855130315, 0.00029128926689736545, 0.0003037050482816994]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 5.0, 5.0, 5.0, 6.0, 7.0, 14.0, 12.0, 17.0, 13.0, 20.0, 19.0, 25.0, 32.0, 31.0, 32.0, 34.0, 33.0, 29.0, 41.0, 34.0, 43.0, 41.0, 34.0, 38.0, 31.0, 40.0, 31.0, 35.0, 42.0, 30.0, 31.0, 21.0, 20.0, 26.0, 19.0, 14.0, 17.0, 17.0, 16.0, 8.0, 7.0, 8.0, 2.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0], "bins": [-0.00019996223272755742, -0.00019393362163100392, -0.0001879050105344504, -0.0001818763994378969, -0.0001758477883413434, -0.00016981916269287467, -0.00016379055159632117, -0.00015776194049976766, -0.00015173332940321416, -0.00014570471830666065, -0.00013967610721010715, -0.00013364749611355364, -0.0001276188704650849, -0.00012159026664448902, -0.0001155616482719779, -0.0001095330371754244, -0.00010350442607887089, -9.747581498231739e-05, -9.144720388576388e-05, -8.541858551325276e-05, -7.938997441669926e-05, -7.336136332014576e-05, -6.733274494763464e-05, -6.130413385108113e-05, -5.527552275452763e-05, -4.9246911657974124e-05, -4.321829692344181e-05, -3.71896821889095e-05, -3.1161071092355996e-05, -2.513245817681309e-05, -1.910384526127018e-05, -1.3075230526737869e-05, -7.046604878269136e-06, -1.017991962726228e-06, 5.01062095281668e-06, 1.1039233868359588e-05, 1.7067846783902496e-05, 2.3096459699445404e-05, 2.9125072614988312e-05, 3.5153687349520624e-05, 4.118229844607413e-05, 4.721090954262763e-05, 5.3239524277159944e-05, 5.9268139011692256e-05, 6.529675010824576e-05, 7.132536120479926e-05, 7.735397957731038e-05, 8.338259067386389e-05, 8.941120177041739e-05, 9.54398128669709e-05, 0.0001014684239635244, 0.00010749704233603552, 0.00011352565343258902, 0.00011955426452914253, 0.00012558288290165365, 0.00013161149399820715, 0.00013764010509476066, 0.00014366871619131416, 0.00014969732728786767, 0.00015572593838442117, 0.00016175454948097467, 0.0001677831751294434, 0.0001738117862259969, 0.00017984039732255042, 0.00018586900841910392]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 14.0, 19.0, 27.0, 30.0, 49.0, 73.0, 78.0, 133.0, 177.0, 250.0, 349.0, 596.0, 884.0, 1318.0, 2022.0, 3135.0, 5275.0, 8647.0, 14427.0, 25558.0, 47425.0, 95441.0, 238005.0, 338874.0, 128246.0, 60153.0, 32162.0, 18005.0, 10218.0, 6026.0, 3885.0, 2326.0, 1588.0, 1010.0, 641.0, 458.0, 316.0, 216.0, 150.0, 107.0, 77.0, 46.0, 28.0, 24.0, 23.0, 7.0, 11.0, 12.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00048661231994628906, -0.0004710070788860321, -0.00045540183782577515, -0.0004397965967655182, -0.00042419135570526123, -0.00040858611464500427, -0.0003929808735847473, -0.00037737563252449036, -0.0003617703914642334, -0.00034616515040397644, -0.0003305599093437195, -0.0003149546682834625, -0.00029934942722320557, -0.0002837441861629486, -0.00026813894510269165, -0.0002525337040424347, -0.00023692846298217773, -0.00022132322192192078, -0.00020571798086166382, -0.00019011273980140686, -0.0001745074987411499, -0.00015890225768089294, -0.00014329701662063599, -0.00012769177556037903, -0.00011208653450012207, -9.648129343986511e-05, -8.087605237960815e-05, -6.52708113193512e-05, -4.966557025909424e-05, -3.406032919883728e-05, -1.8455088138580322e-05, -2.8498470783233643e-06, 1.2755393981933594e-05, 2.8360635042190552e-05, 4.396587610244751e-05, 5.957111716270447e-05, 7.517635822296143e-05, 9.078159928321838e-05, 0.00010638684034347534, 0.0001219920814037323, 0.00013759732246398926, 0.00015320256352424622, 0.00016880780458450317, 0.00018441304564476013, 0.0002000182867050171, 0.00021562352776527405, 0.000231228768825531, 0.00024683400988578796, 0.0002624392509460449, 0.0002780444920063019, 0.00029364973306655884, 0.0003092549741268158, 0.00032486021518707275, 0.0003404654562473297, 0.00035607069730758667, 0.00037167593836784363, 0.0003872811794281006, 0.00040288642048835754, 0.0004184916615486145, 0.00043409690260887146, 0.0004497021436691284, 0.0004653073847293854, 0.00048091262578964233, 0.0004965178668498993, 0.0005121231079101562]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 5.0, 12.0, 17.0, 10.0, 19.0, 16.0, 25.0, 29.0, 23.0, 38.0, 37.0, 38.0, 35.0, 35.0, 45.0, 45.0, 48.0, 41.0, 38.0, 37.0, 41.0, 47.0, 34.0, 42.0, 34.0, 26.0, 32.0, 32.0, 14.0, 21.0, 11.0, 17.0, 10.0, 12.0, 6.0, 9.0, 2.0, 5.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00010901689529418945, -0.00010542944073677063, -0.0001018419861793518, -9.825453162193298e-05, -9.466707706451416e-05, -9.107962250709534e-05, -8.749216794967651e-05, -8.390471339225769e-05, -8.031725883483887e-05, -7.672980427742004e-05, -7.314234972000122e-05, -6.95548951625824e-05, -6.596744060516357e-05, -6.237998604774475e-05, -5.879253149032593e-05, -5.5205076932907104e-05, -5.161762237548828e-05, -4.803016781806946e-05, -4.4442713260650635e-05, -4.085525870323181e-05, -3.726780414581299e-05, -3.3680349588394165e-05, -3.0092895030975342e-05, -2.650544047355652e-05, -2.2917985916137695e-05, -1.9330531358718872e-05, -1.574307680130005e-05, -1.2155622243881226e-05, -8.568167686462402e-06, -4.980713129043579e-06, -1.3932585716247559e-06, 2.1941959857940674e-06, 5.781650543212891e-06, 9.369105100631714e-06, 1.2956559658050537e-05, 1.654401421546936e-05, 2.0131468772888184e-05, 2.3718923330307007e-05, 2.730637788772583e-05, 3.089383244514465e-05, 3.4481287002563477e-05, 3.80687415599823e-05, 4.165619611740112e-05, 4.5243650674819946e-05, 4.883110523223877e-05, 5.241855978965759e-05, 5.6006014347076416e-05, 5.959346890449524e-05, 6.318092346191406e-05, 6.676837801933289e-05, 7.035583257675171e-05, 7.394328713417053e-05, 7.753074169158936e-05, 8.111819624900818e-05, 8.4705650806427e-05, 8.829310536384583e-05, 9.188055992126465e-05, 9.546801447868347e-05, 9.90554690361023e-05, 0.00010264292359352112, 0.00010623037815093994, 0.00010981783270835876, 0.00011340528726577759, 0.00011699274182319641, 0.00012058019638061523]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 11.0, 14.0, 29.0, 31.0, 55.0, 100.0, 147.0, 210.0, 374.0, 648.0, 1097.0, 2003.0, 3454.0, 6198.0, 11521.0, 22703.0, 48701.0, 116462.0, 372391.0, 284501.0, 94816.0, 40805.0, 19594.0, 10077.0, 5414.0, 2952.0, 1769.0, 966.0, 612.0, 323.0, 206.0, 130.0, 75.0, 53.0, 35.0, 20.0, 12.0, 10.0, 7.0, 13.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00045299530029296875, -0.00043879076838493347, -0.0004245862364768982, -0.0004103817045688629, -0.00039617717266082764, -0.00038197264075279236, -0.0003677681088447571, -0.0003535635769367218, -0.0003393590450286865, -0.00032515451312065125, -0.00031094998121261597, -0.0002967454493045807, -0.0002825409173965454, -0.00026833638548851013, -0.00025413185358047485, -0.00023992732167243958, -0.0002257227897644043, -0.00021151825785636902, -0.00019731372594833374, -0.00018310919404029846, -0.00016890466213226318, -0.0001547001302242279, -0.00014049559831619263, -0.00012629106640815735, -0.00011208653450012207, -9.788200259208679e-05, -8.367747068405151e-05, -6.947293877601624e-05, -5.526840686798096e-05, -4.106387495994568e-05, -2.68593430519104e-05, -1.2654811143875122e-05, 1.5497207641601562e-06, 1.5754252672195435e-05, 2.9958784580230713e-05, 4.416331648826599e-05, 5.836784839630127e-05, 7.257238030433655e-05, 8.677691221237183e-05, 0.0001009814441204071, 0.00011518597602844238, 0.00012939050793647766, 0.00014359503984451294, 0.00015779957175254822, 0.0001720041036605835, 0.00018620863556861877, 0.00020041316747665405, 0.00021461769938468933, 0.0002288222312927246, 0.0002430267632007599, 0.00025723129510879517, 0.00027143582701683044, 0.0002856403589248657, 0.000299844890832901, 0.0003140494227409363, 0.00032825395464897156, 0.00034245848655700684, 0.0003566630184650421, 0.0003708675503730774, 0.00038507208228111267, 0.00039927661418914795, 0.00041348114609718323, 0.0004276856780052185, 0.0004418902099132538, 0.00045609474182128906]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 4.0, 6.0, 3.0, 9.0, 9.0, 16.0, 9.0, 14.0, 18.0, 21.0, 33.0, 29.0, 32.0, 39.0, 43.0, 24.0, 48.0, 50.0, 49.0, 42.0, 52.0, 42.0, 51.0, 41.0, 38.0, 47.0, 31.0, 23.0, 30.0, 15.0, 27.0, 18.0, 20.0, 17.0, 9.0, 12.0, 9.0, 5.0, 2.0, 1.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001068115234375, -0.00010345876216888428, -0.00010010600090026855, -9.675323963165283e-05, -9.340047836303711e-05, -9.004771709442139e-05, -8.669495582580566e-05, -8.334219455718994e-05, -7.998943328857422e-05, -7.66366720199585e-05, -7.328391075134277e-05, -6.993114948272705e-05, -6.657838821411133e-05, -6.32256269454956e-05, -5.987286567687988e-05, -5.652010440826416e-05, -5.316734313964844e-05, -4.9814581871032715e-05, -4.646182060241699e-05, -4.310905933380127e-05, -3.975629806518555e-05, -3.6403536796569824e-05, -3.30507755279541e-05, -2.969801425933838e-05, -2.6345252990722656e-05, -2.2992491722106934e-05, -1.963973045349121e-05, -1.6286969184875488e-05, -1.2934207916259766e-05, -9.581446647644043e-06, -6.22868537902832e-06, -2.8759241104125977e-06, 4.76837158203125e-07, 3.829598426818848e-06, 7.18235969543457e-06, 1.0535120964050293e-05, 1.3887882232666016e-05, 1.7240643501281738e-05, 2.059340476989746e-05, 2.3946166038513184e-05, 2.7298927307128906e-05, 3.065168857574463e-05, 3.400444984436035e-05, 3.7357211112976074e-05, 4.07099723815918e-05, 4.406273365020752e-05, 4.741549491882324e-05, 5.0768256187438965e-05, 5.412101745605469e-05, 5.747377872467041e-05, 6.082653999328613e-05, 6.417930126190186e-05, 6.753206253051758e-05, 7.08848237991333e-05, 7.423758506774902e-05, 7.759034633636475e-05, 8.094310760498047e-05, 8.429586887359619e-05, 8.764863014221191e-05, 9.100139141082764e-05, 9.435415267944336e-05, 9.770691394805908e-05, 0.0001010596752166748, 0.00010441243648529053, 0.00010776519775390625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 6.0, 19.0, 21.0, 32.0, 50.0, 59.0, 87.0, 147.0, 227.0, 465.0, 714.0, 1450.0, 2631.0, 7210.0, 19338.0, 126434.0, 802268.0, 61402.0, 15867.0, 4952.0, 2416.0, 1121.0, 641.0, 388.0, 184.0, 146.0, 70.0, 65.0, 47.0, 27.0, 17.0, 16.0, 8.0, 9.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8477439880371094e-05, -1.7906539142131805e-05, -1.7335638403892517e-05, -1.676473766565323e-05, -1.619383692741394e-05, -1.5622936189174652e-05, -1.5052035450935364e-05, -1.4481134712696075e-05, -1.3910233974456787e-05, -1.3339333236217499e-05, -1.276843249797821e-05, -1.2197531759738922e-05, -1.1626631021499634e-05, -1.1055730283260345e-05, -1.0484829545021057e-05, -9.913928806781769e-06, -9.34302806854248e-06, -8.772127330303192e-06, -8.201226592063904e-06, -7.630325853824615e-06, -7.059425115585327e-06, -6.488524377346039e-06, -5.9176236391067505e-06, -5.346722900867462e-06, -4.775822162628174e-06, -4.2049214243888855e-06, -3.634020686149597e-06, -3.063119947910309e-06, -2.4922192096710205e-06, -1.921318471431732e-06, -1.3504177331924438e-06, -7.795169949531555e-07, -2.086162567138672e-07, 3.6228448152542114e-07, 9.331852197647095e-07, 1.5040859580039978e-06, 2.074986696243286e-06, 2.6458874344825745e-06, 3.216788172721863e-06, 3.787688910961151e-06, 4.3585896492004395e-06, 4.929490387439728e-06, 5.500391125679016e-06, 6.0712918639183044e-06, 6.642192602157593e-06, 7.213093340396881e-06, 7.78399407863617e-06, 8.354894816875458e-06, 8.925795555114746e-06, 9.496696293354034e-06, 1.0067597031593323e-05, 1.0638497769832611e-05, 1.12093985080719e-05, 1.1780299246311188e-05, 1.2351199984550476e-05, 1.2922100722789764e-05, 1.3493001461029053e-05, 1.4063902199268341e-05, 1.463480293750763e-05, 1.5205703675746918e-05, 1.5776604413986206e-05, 1.6347505152225494e-05, 1.6918405890464783e-05, 1.748930662870407e-05, 1.806020736694336e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 7.0, 5.0, 0.0, 7.0, 0.0, 16.0, 0.0, 22.0, 37.0, 0.0, 59.0, 0.0, 140.0, 381.0, 0.0, 174.0, 0.0, 70.0, 33.0, 0.0, 20.0, 0.0, 13.0, 12.0, 0.0, 7.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.3709068298339844e-06, -1.3355165719985962e-06, -1.300126314163208e-06, -1.2647360563278198e-06, -1.2293457984924316e-06, -1.1939555406570435e-06, -1.1585652828216553e-06, -1.123175024986267e-06, -1.087784767150879e-06, -1.0523945093154907e-06, -1.0170042514801025e-06, -9.816139936447144e-07, -9.462237358093262e-07, -9.10833477973938e-07, -8.754432201385498e-07, -8.400529623031616e-07, -8.046627044677734e-07, -7.692724466323853e-07, -7.338821887969971e-07, -6.984919309616089e-07, -6.631016731262207e-07, -6.277114152908325e-07, -5.923211574554443e-07, -5.569308996200562e-07, -5.21540641784668e-07, -4.861503839492798e-07, -4.507601261138916e-07, -4.153698682785034e-07, -3.7997961044311523e-07, -3.4458935260772705e-07, -3.0919909477233887e-07, -2.738088369369507e-07, -2.384185791015625e-07, -2.0302832126617432e-07, -1.6763806343078613e-07, -1.3224780559539795e-07, -9.685754776000977e-08, -6.146728992462158e-08, -2.60770320892334e-08, 9.313225746154785e-09, 4.470348358154297e-08, 8.009374141693115e-08, 1.1548399925231934e-07, 1.5087425708770752e-07, 1.862645149230957e-07, 2.2165477275848389e-07, 2.5704503059387207e-07, 2.9243528842926025e-07, 3.2782554626464844e-07, 3.632158041000366e-07, 3.986060619354248e-07, 4.33996319770813e-07, 4.6938657760620117e-07, 5.047768354415894e-07, 5.401670932769775e-07, 5.755573511123657e-07, 6.109476089477539e-07, 6.463378667831421e-07, 6.817281246185303e-07, 7.171183824539185e-07, 7.525086402893066e-07, 7.878988981246948e-07, 8.23289155960083e-07, 8.586794137954712e-07, 8.940696716308594e-07]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 8.0, 10.0, 9.0, 20.0, 28.0, 40.0, 77.0, 79.0, 139.0, 263.0, 334.0, 837.0, 1072.0, 1770.0, 4706.0, 7099.0, 14028.0, 45238.0, 101050.0, 617422.0, 156182.0, 50991.0, 27061.0, 8941.0, 4638.0, 3205.0, 1207.0, 917.0, 409.0, 257.0, 202.0, 89.0, 71.0, 60.0, 27.0, 23.0, 12.0, 10.0, 11.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.973743438720703e-06, -6.77257776260376e-06, -6.571412086486816e-06, -6.370246410369873e-06, -6.16908073425293e-06, -5.967915058135986e-06, -5.766749382019043e-06, -5.5655837059021e-06, -5.364418029785156e-06, -5.163252353668213e-06, -4.9620866775512695e-06, -4.760921001434326e-06, -4.559755325317383e-06, -4.3585896492004395e-06, -4.157423973083496e-06, -3.956258296966553e-06, -3.7550926208496094e-06, -3.553926944732666e-06, -3.3527612686157227e-06, -3.1515955924987793e-06, -2.950429916381836e-06, -2.7492642402648926e-06, -2.5480985641479492e-06, -2.346932888031006e-06, -2.1457672119140625e-06, -1.944601535797119e-06, -1.7434358596801758e-06, -1.5422701835632324e-06, -1.341104507446289e-06, -1.1399388313293457e-06, -9.387731552124023e-07, -7.37607479095459e-07, -5.364418029785156e-07, -3.3527612686157227e-07, -1.341104507446289e-07, 6.705522537231445e-08, 2.682209014892578e-07, 4.6938657760620117e-07, 6.705522537231445e-07, 8.717179298400879e-07, 1.0728836059570312e-06, 1.2740492820739746e-06, 1.475214958190918e-06, 1.6763806343078613e-06, 1.8775463104248047e-06, 2.078711986541748e-06, 2.2798776626586914e-06, 2.4810433387756348e-06, 2.682209014892578e-06, 2.8833746910095215e-06, 3.084540367126465e-06, 3.285706043243408e-06, 3.4868717193603516e-06, 3.688037395477295e-06, 3.889203071594238e-06, 4.090368747711182e-06, 4.291534423828125e-06, 4.492700099945068e-06, 4.693865776062012e-06, 4.895031452178955e-06, 5.0961971282958984e-06, 5.297362804412842e-06, 5.498528480529785e-06, 5.6996941566467285e-06, 5.900859832763672e-06]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 8.0, 5.0, 10.0, 0.0, 15.0, 23.0, 23.0, 32.0, 27.0, 44.0, 61.0, 90.0, 0.0, 92.0, 100.0, 107.0, 84.0, 58.0, 39.0, 34.0, 37.0, 0.0, 28.0, 24.0, 18.0, 7.0, 15.0, 6.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5497207641601562e-06, -1.496635377407074e-06, -1.4435499906539917e-06, -1.3904646039009094e-06, -1.3373792171478271e-06, -1.2842938303947449e-06, -1.2312084436416626e-06, -1.1781230568885803e-06, -1.125037670135498e-06, -1.0719522833824158e-06, -1.0188668966293335e-06, -9.657815098762512e-07, -9.126961231231689e-07, -8.596107363700867e-07, -8.065253496170044e-07, -7.534399628639221e-07, -7.003545761108398e-07, -6.472691893577576e-07, -5.941838026046753e-07, -5.41098415851593e-07, -4.880130290985107e-07, -4.3492764234542847e-07, -3.818422555923462e-07, -3.287568688392639e-07, -2.7567148208618164e-07, -2.2258609533309937e-07, -1.695007085800171e-07, -1.1641532182693481e-07, -6.332993507385254e-08, -1.0244548320770264e-08, 4.284083843231201e-08, 9.592622518539429e-08, 1.4901161193847656e-07, 2.0209699869155884e-07, 2.551823854446411e-07, 3.082677721977234e-07, 3.6135315895080566e-07, 4.1443854570388794e-07, 4.675239324569702e-07, 5.206093192100525e-07, 5.736947059631348e-07, 6.26780092716217e-07, 6.798654794692993e-07, 7.329508662223816e-07, 7.860362529754639e-07, 8.391216397285461e-07, 8.922070264816284e-07, 9.452924132347107e-07, 9.98377799987793e-07, 1.0514631867408752e-06, 1.1045485734939575e-06, 1.1576339602470398e-06, 1.210719347000122e-06, 1.2638047337532043e-06, 1.3168901205062866e-06, 1.369975507259369e-06, 1.4230608940124512e-06, 1.4761462807655334e-06, 1.5292316675186157e-06, 1.582317054271698e-06, 1.6354024410247803e-06, 1.6884878277778625e-06, 1.7415732145309448e-06, 1.794658601284027e-06, 1.8477439880371094e-06]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 10.0, 13.0, 8.0, 16.0, 22.0, 18.0, 39.0, 43.0, 69.0, 93.0, 147.0, 157.0, 87.0, 63.0, 52.0, 40.0, 24.0, 20.0, 15.0, 8.0, 9.0, 10.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020626587502192706, -0.00019941026403103024, -0.00019255466759204865, -0.00018569905660115182, -0.000178843445610255, -0.00017198783461935818, -0.00016513222362846136, -0.00015827662718947977, -0.00015142101619858295, -0.00014456540520768613, -0.00013770980876870453, -0.0001308541977778077, -0.0001239985867869109, -0.00011714297579601407, -0.00011028737208107486, -0.00010343176836613566, -9.657615737523884e-05, -8.972054638434201e-05, -8.286494266940281e-05, -7.60093389544636e-05, -6.915372796356678e-05, -6.229811697266996e-05, -5.544251325773075e-05, -4.858690590481274e-05, -4.1731298551894724e-05, -3.487569119897671e-05, -2.8020083846058697e-05, -2.1164476493140683e-05, -1.4308869140222669e-05, -7.453261787304655e-06, -5.976544343866408e-07, 6.257952918531373e-06, 1.3113545719534159e-05, 1.9969153072452173e-05, 2.6824760425370187e-05, 3.36803677782882e-05, 4.0535975131206214e-05, 4.739158248412423e-05, 5.424718983704224e-05, 6.110279355198145e-05, 6.795840454287827e-05, 7.481401553377509e-05, 8.16696192487143e-05, 8.85252229636535e-05, 9.538083395455033e-05, 0.00010223644494544715, 0.00010909204866038635, 0.00011594765237532556, 0.00012280326336622238, 0.0001296588743571192, 0.00013651448534801602, 0.00014337008178699762, 0.00015022569277789444, 0.00015708130376879126, 0.00016393690020777285, 0.00017079251119866967, 0.0001776481221895665, 0.00018450373318046331, 0.00019135934417136014, 0.00019821494061034173, 0.00020507055160123855, 0.00021192616259213537, 0.00021878175903111696, 0.00022563737002201378, 0.0002324929810129106]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 11.0, 6.0, 9.0, 14.0, 15.0, 11.0, 18.0, 18.0, 17.0, 29.0, 17.0, 34.0, 41.0, 32.0, 41.0, 39.0, 39.0, 36.0, 35.0, 41.0, 37.0, 34.0, 37.0, 28.0, 33.0, 36.0, 27.0, 40.0, 37.0, 26.0, 15.0, 18.0, 16.0, 18.0, 17.0, 7.0, 13.0, 7.0, 5.0, 7.0, 7.0, 3.0, 2.0, 1.0, 6.0, 3.0, 3.0, 1.0], "bins": [-0.00012676892220042646, -0.0001231811911566183, -0.00011959346738876775, -0.00011600573634495959, -0.00011241801257710904, -0.00010883028153330088, -0.00010524255048949271, -0.00010165482672164217, -9.806710295379162e-05, -9.447937190998346e-05, -9.089164814213291e-05, -8.730391709832475e-05, -8.37161933304742e-05, -8.012846228666604e-05, -7.654073124285787e-05, -7.295300747500733e-05, -6.936527643119916e-05, -6.5777545387391e-05, -6.218982161954045e-05, -5.860209057573229e-05, -5.501436680788174e-05, -5.142663576407358e-05, -4.7838908358244225e-05, -4.425118095241487e-05, -4.0663453546585515e-05, -3.707572614075616e-05, -3.3487998734926805e-05, -2.9900269510108046e-05, -2.631254210427869e-05, -2.2724814698449336e-05, -1.9137085473630577e-05, -1.5549358067801222e-05, -1.1961630661971867e-05, -8.373903256142512e-06, -4.786174940818455e-06, -1.1984466254943982e-06, 2.389280780334957e-06, 5.977008186164312e-06, 9.56473741098307e-06, 1.3152464816812426e-05, 1.674019222264178e-05, 2.0327919628471136e-05, 2.391564703430049e-05, 2.750337625911925e-05, 3.109110548393801e-05, 3.4678829251788557e-05, 3.826656029559672e-05, 4.1854287701426074e-05, 4.544201510725543e-05, 4.9029742513084784e-05, 5.261746991891414e-05, 5.62052009627223e-05, 5.979292473057285e-05, 6.338065577438101e-05, 6.696837954223156e-05, 7.055611058603972e-05, 7.414384162984788e-05, 7.773157267365605e-05, 8.13192964415066e-05, 8.490702748531476e-05, 8.84947512531653e-05, 9.208248229697347e-05, 9.567021334078163e-05, 9.925793710863218e-05, 0.00010284566087648273]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 8.0, 3.0, 5.0, 9.0, 10.0, 13.0, 9.0, 19.0, 14.0, 15.0, 25.0, 31.0, 48.0, 70.0, 105.0, 234.0, 427.0, 1041.0, 2575.0, 7598.0, 66550.0, 4092673.0, 15224.0, 4448.0, 1646.0, 667.0, 307.0, 163.0, 87.0, 56.0, 46.0, 28.0, 19.0, 21.0, 16.0, 11.0, 16.0, 8.0, 11.0, 2.0, 5.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008492469787597656, -0.0008220598101615906, -0.0007948726415634155, -0.0007676854729652405, -0.0007404983043670654, -0.0007133111357688904, -0.0006861239671707153, -0.0006589367985725403, -0.0006317496299743652, -0.0006045624613761902, -0.0005773752927780151, -0.0005501881241798401, -0.000523000955581665, -0.00049581378698349, -0.00046862661838531494, -0.0004414394497871399, -0.00041425228118896484, -0.0003870651125907898, -0.00035987794399261475, -0.0003326907753944397, -0.00030550360679626465, -0.0002783164381980896, -0.00025112926959991455, -0.0002239421010017395, -0.00019675493240356445, -0.0001695677638053894, -0.00014238059520721436, -0.0001151934266090393, -8.800625801086426e-05, -6.081908941268921e-05, -3.363192081451416e-05, -6.444752216339111e-06, 2.0742416381835938e-05, 4.7929584980010986e-05, 7.511675357818604e-05, 0.00010230392217636108, 0.00012949109077453613, 0.00015667825937271118, 0.00018386542797088623, 0.00021105259656906128, 0.00023823976516723633, 0.0002654269337654114, 0.0002926141023635864, 0.0003198012709617615, 0.0003469884395599365, 0.00037417560815811157, 0.0004013627767562866, 0.00042854994535446167, 0.0004557371139526367, 0.00048292428255081177, 0.0005101114511489868, 0.0005372986197471619, 0.0005644857883453369, 0.000591672956943512, 0.000618860125541687, 0.0006460472941398621, 0.0006732344627380371, 0.0007004216313362122, 0.0007276087999343872, 0.0007547959685325623, 0.0007819831371307373, 0.0008091703057289124, 0.0008363574743270874, 0.0008635446429252625, 0.0008907318115234375]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 4.0, 12.0, 7.0, 7.0, 12.0, 16.0, 15.0, 14.0, 19.0, 23.0, 27.0, 28.0, 36.0, 44.0, 36.0, 48.0, 33.0, 38.0, 40.0, 45.0, 42.0, 38.0, 43.0, 37.0, 27.0, 40.0, 33.0, 40.0, 30.0, 26.0, 18.0, 19.0, 17.0, 14.0, 15.0, 9.0, 9.0, 5.0, 7.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.700920104980469e-05, -7.45728611946106e-05, -7.21365213394165e-05, -6.970018148422241e-05, -6.726384162902832e-05, -6.482750177383423e-05, -6.239116191864014e-05, -5.9954822063446045e-05, -5.751848220825195e-05, -5.508214235305786e-05, -5.264580249786377e-05, -5.020946264266968e-05, -4.7773122787475586e-05, -4.5336782932281494e-05, -4.29004430770874e-05, -4.046410322189331e-05, -3.802776336669922e-05, -3.559142351150513e-05, -3.3155083656311035e-05, -3.071874380111694e-05, -2.828240394592285e-05, -2.584606409072876e-05, -2.3409724235534668e-05, -2.0973384380340576e-05, -1.8537044525146484e-05, -1.6100704669952393e-05, -1.36643648147583e-05, -1.1228024959564209e-05, -8.791685104370117e-06, -6.355345249176025e-06, -3.919005393981934e-06, -1.4826655387878418e-06, 9.5367431640625e-07, 3.390014171600342e-06, 5.826354026794434e-06, 8.262693881988525e-06, 1.0699033737182617e-05, 1.3135373592376709e-05, 1.55717134475708e-05, 1.8008053302764893e-05, 2.0444393157958984e-05, 2.2880733013153076e-05, 2.5317072868347168e-05, 2.775341272354126e-05, 3.018975257873535e-05, 3.262609243392944e-05, 3.5062432289123535e-05, 3.749877214431763e-05, 3.993511199951172e-05, 4.237145185470581e-05, 4.48077917098999e-05, 4.7244131565093994e-05, 4.9680471420288086e-05, 5.211681127548218e-05, 5.455315113067627e-05, 5.698949098587036e-05, 5.942583084106445e-05, 6.186217069625854e-05, 6.429851055145264e-05, 6.673485040664673e-05, 6.917119026184082e-05, 7.160753011703491e-05, 7.4043869972229e-05, 7.64802098274231e-05, 7.891654968261719e-05]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 12.0, 25.0, 23.0, 63.0, 89.0, 169.0, 292.0, 549.0, 1159.0, 2712.0, 8953.0, 65202.0, 4063101.0, 40490.0, 7124.0, 2255.0, 964.0, 461.0, 260.0, 144.0, 82.0, 51.0, 29.0, 21.0, 10.0, 7.0, 7.0, 8.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007038116455078125, -0.0006806701421737671, -0.0006575286388397217, -0.0006343871355056763, -0.0006112456321716309, -0.0005881041288375854, -0.00056496262550354, -0.0005418211221694946, -0.0005186796188354492, -0.0004955381155014038, -0.0004723966121673584, -0.000449255108833313, -0.0004261136054992676, -0.00040297210216522217, -0.00037983059883117676, -0.00035668909549713135, -0.00033354759216308594, -0.00031040608882904053, -0.0002872645854949951, -0.0002641230821609497, -0.0002409815788269043, -0.0002178400754928589, -0.00019469857215881348, -0.00017155706882476807, -0.00014841556549072266, -0.00012527406215667725, -0.00010213255882263184, -7.899105548858643e-05, -5.5849552154541016e-05, -3.2708048820495605e-05, -9.566545486450195e-06, 1.3574957847595215e-05, 3.6716461181640625e-05, 5.9857964515686035e-05, 8.299946784973145e-05, 0.00010614097118377686, 0.00012928247451782227, 0.00015242397785186768, 0.00017556548118591309, 0.0001987069845199585, 0.0002218484878540039, 0.0002449899911880493, 0.0002681314945220947, 0.00029127299785614014, 0.00031441450119018555, 0.00033755600452423096, 0.00036069750785827637, 0.0003838390111923218, 0.0004069805145263672, 0.0004301220178604126, 0.000453263521194458, 0.0004764050245285034, 0.0004995465278625488, 0.0005226880311965942, 0.0005458295345306396, 0.0005689710378646851, 0.0005921125411987305, 0.0006152540445327759, 0.0006383955478668213, 0.0006615370512008667, 0.0006846785545349121, 0.0007078200578689575, 0.0007309615612030029, 0.0007541030645370483, 0.0007772445678710938]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 3.0, 9.0, 16.0, 31.0, 59.0, 180.0, 1313.0, 2142.0, 165.0, 46.0, 27.0, 18.0, 13.0, 15.0, 7.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011646747589111328, -0.00011304207146167755, -0.00010961666703224182, -0.00010619126260280609, -0.00010276585817337036, -9.934045374393463e-05, -9.59150493144989e-05, -9.248964488506317e-05, -8.906424045562744e-05, -8.563883602619171e-05, -8.221343159675598e-05, -7.878802716732025e-05, -7.536262273788452e-05, -7.193721830844879e-05, -6.851181387901306e-05, -6.508640944957733e-05, -6.16610050201416e-05, -5.823560059070587e-05, -5.481019616127014e-05, -5.138479173183441e-05, -4.795938730239868e-05, -4.453398287296295e-05, -4.110857844352722e-05, -3.768317401409149e-05, -3.425776958465576e-05, -3.083236515522003e-05, -2.7406960725784302e-05, -2.3981556296348572e-05, -2.0556151866912842e-05, -1.7130747437477112e-05, -1.3705343008041382e-05, -1.0279938578605652e-05, -6.854534149169922e-06, -3.429129719734192e-06, -3.725290298461914e-09, 3.421679139137268e-06, 6.847083568572998e-06, 1.0272487998008728e-05, 1.3697892427444458e-05, 1.7123296856880188e-05, 2.0548701286315918e-05, 2.3974105715751648e-05, 2.7399510145187378e-05, 3.082491457462311e-05, 3.425031900405884e-05, 3.767572343349457e-05, 4.11011278629303e-05, 4.452653229236603e-05, 4.795193672180176e-05, 5.137734115123749e-05, 5.480274558067322e-05, 5.822815001010895e-05, 6.165355443954468e-05, 6.507895886898041e-05, 6.850436329841614e-05, 7.192976772785187e-05, 7.53551721572876e-05, 7.878057658672333e-05, 8.220598101615906e-05, 8.563138544559479e-05, 8.905678987503052e-05, 9.248219430446625e-05, 9.590759873390198e-05, 9.933300316333771e-05, 0.00010275840759277344]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 5.0, 5.0, 8.0, 7.0, 10.0, 14.0, 9.0, 26.0, 21.0, 61.0, 86.0, 89.0, 173.0, 154.0, 94.0, 61.0, 48.0, 37.0, 26.0, 15.0, 17.0, 5.0, 8.0, 10.0, 8.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001678686385275796, -0.00016292034706566483, -0.00015797207015566528, -0.0001530237786937505, -0.00014807548723183572, -0.00014312719576992095, -0.00013817890430800617, -0.00013323062739800662, -0.00012828233593609184, -0.00012333404447417706, -0.0001183857602882199, -0.00011343747610226274, -0.00010848918464034796, -0.00010354089317843318, -9.859260899247602e-05, -9.364432480651885e-05, -8.869603334460407e-05, -8.37477418826893e-05, -7.879945769673213e-05, -7.385117351077497e-05, -6.890288204886019e-05, -6.395459058694541e-05, -5.900630640098825e-05, -5.405801857705228e-05, -4.910973075311631e-05, -4.416144292918034e-05, -3.921315510524437e-05, -3.42648672813084e-05, -2.9316579457372427e-05, -2.4368291633436456e-05, -1.9420003809500486e-05, -1.4471715985564515e-05, -9.523442713543773e-06, -4.575154889607802e-06, 3.7313293432816863e-07, 5.321420758264139e-06, 1.026970858220011e-05, 1.521799640613608e-05, 2.016628423007205e-05, 2.5114572054008022e-05, 3.0062859877943993e-05, 3.501114770187996e-05, 3.9959435525815934e-05, 4.4907723349751905e-05, 4.9856011173687875e-05, 5.4804298997623846e-05, 5.9752586821559817e-05, 6.470087100751698e-05, 6.964916246943176e-05, 7.459745393134654e-05, 7.95457381173037e-05, 8.449402230326086e-05, 8.944231376517564e-05, 9.439060522709042e-05, 9.933888941304758e-05, 0.00010428717359900475, 0.00010923546506091952, 0.0001141837565228343, 0.00011913204070879146, 0.00012408032489474863, 0.0001290286163566634, 0.00013397690781857818, 0.00013892518472857773, 0.0001438734761904925, 0.0001488217676524073]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 5.0, 2.0, 7.0, 2.0, 10.0, 13.0, 14.0, 20.0, 18.0, 22.0, 20.0, 38.0, 36.0, 29.0, 36.0, 30.0, 42.0, 34.0, 49.0, 35.0, 50.0, 48.0, 49.0, 47.0, 43.0, 38.0, 39.0, 36.0, 22.0, 26.0, 22.0, 20.0, 24.0, 12.0, 13.0, 18.0, 10.0, 10.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.710594895295799e-05, -9.435342508368194e-05, -9.16009012144059e-05, -8.884838462108746e-05, -8.609586075181141e-05, -8.334333688253537e-05, -8.059082028921694e-05, -7.783829641994089e-05, -7.508577255066484e-05, -7.23332486813888e-05, -6.958072481211275e-05, -6.682820821879432e-05, -6.407568434951827e-05, -6.132316048024222e-05, -5.857064024894498e-05, -5.581812001764774e-05, -5.3065596148371696e-05, -5.031307227909565e-05, -4.756055204779841e-05, -4.480803181650117e-05, -4.2055507947225124e-05, -3.930298407794908e-05, -3.655046384665184e-05, -3.37979436153546e-05, -3.104541974607855e-05, -2.8292897695791908e-05, -2.5540375645505264e-05, -2.278785359521862e-05, -2.0035331544931978e-05, -1.7282809494645335e-05, -1.4530287444358692e-05, -1.1777765394072048e-05, -9.025236067827791e-06, -6.272714017541148e-06, -3.5201919672545046e-06, -7.676699169678614e-07, 1.984852133318782e-06, 4.737374183605425e-06, 7.489896233892068e-06, 1.0242418284178711e-05, 1.2994940334465355e-05, 1.5747462384751998e-05, 1.849998443503864e-05, 2.1252506485325284e-05, 2.4005028535611928e-05, 2.675755058589857e-05, 2.9510072636185214e-05, 3.2262592867482454e-05, 3.50151167367585e-05, 3.776764060603455e-05, 4.052016083733179e-05, 4.3272681068629026e-05, 4.602520493790507e-05, 4.877772880718112e-05, 5.153024903847836e-05, 5.42827692697756e-05, 5.7035293139051646e-05, 5.978781700832769e-05, 6.254033360164613e-05, 6.529285747092217e-05, 6.804538134019822e-05, 7.079790520947427e-05, 7.355042907875031e-05, 7.630294567206874e-05, 7.905546954134479e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 14.0, 18.0, 22.0, 30.0, 41.0, 64.0, 116.0, 161.0, 257.0, 390.0, 602.0, 959.0, 1403.0, 2221.0, 3523.0, 5340.0, 8531.0, 13107.0, 21285.0, 36446.0, 62769.0, 115400.0, 264564.0, 244659.0, 112638.0, 61449.0, 35605.0, 20812.0, 12844.0, 8382.0, 5265.0, 3372.0, 2275.0, 1422.0, 901.0, 616.0, 358.0, 214.0, 164.0, 107.0, 67.0, 33.0, 34.0, 28.0, 16.0, 12.0, 3.0, 7.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-05, -8.056685328483582e-05, -7.768720388412476e-05, -7.48075544834137e-05, -7.192790508270264e-05, -6.904825568199158e-05, -6.616860628128052e-05, -6.328895688056946e-05, -6.04093074798584e-05, -5.752965807914734e-05, -5.465000867843628e-05, -5.177035927772522e-05, -4.889070987701416e-05, -4.60110604763031e-05, -4.313141107559204e-05, -4.025176167488098e-05, -3.737211227416992e-05, -3.449246287345886e-05, -3.16128134727478e-05, -2.8733164072036743e-05, -2.5853514671325684e-05, -2.2973865270614624e-05, -2.0094215869903564e-05, -1.7214566469192505e-05, -1.4334917068481445e-05, -1.1455267667770386e-05, -8.575618267059326e-06, -5.695968866348267e-06, -2.816319465637207e-06, 6.332993507385254e-08, 2.942979335784912e-06, 5.822628736495972e-06, 8.702278137207031e-06, 1.158192753791809e-05, 1.446157693862915e-05, 1.734122633934021e-05, 2.022087574005127e-05, 2.310052514076233e-05, 2.598017454147339e-05, 2.8859823942184448e-05, 3.173947334289551e-05, 3.461912274360657e-05, 3.749877214431763e-05, 4.0378421545028687e-05, 4.3258070945739746e-05, 4.6137720346450806e-05, 4.9017369747161865e-05, 5.1897019147872925e-05, 5.4776668548583984e-05, 5.7656317949295044e-05, 6.0535967350006104e-05, 6.341561675071716e-05, 6.629526615142822e-05, 6.917491555213928e-05, 7.205456495285034e-05, 7.49342143535614e-05, 7.781386375427246e-05, 8.069351315498352e-05, 8.357316255569458e-05, 8.645281195640564e-05, 8.93324613571167e-05, 9.221211075782776e-05, 9.509176015853882e-05, 9.797140955924988e-05, 0.00010085105895996094]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 4.0, 2.0, 9.0, 6.0, 6.0, 9.0, 15.0, 18.0, 13.0, 20.0, 27.0, 26.0, 45.0, 38.0, 34.0, 35.0, 49.0, 32.0, 40.0, 48.0, 61.0, 49.0, 36.0, 57.0, 48.0, 50.0, 40.0, 24.0, 29.0, 25.0, 13.0, 20.0, 13.0, 11.0, 16.0, 15.0, 8.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010436773300170898, -0.00010138656944036484, -9.840540587902069e-05, -9.542424231767654e-05, -9.24430787563324e-05, -8.946191519498825e-05, -8.64807516336441e-05, -8.349958807229996e-05, -8.051842451095581e-05, -7.753726094961166e-05, -7.455609738826752e-05, -7.157493382692337e-05, -6.859377026557922e-05, -6.561260670423508e-05, -6.263144314289093e-05, -5.9650279581546783e-05, -5.666911602020264e-05, -5.368795245885849e-05, -5.070678889751434e-05, -4.7725625336170197e-05, -4.474446177482605e-05, -4.17632982134819e-05, -3.8782134652137756e-05, -3.580097109079361e-05, -3.281980752944946e-05, -2.9838643968105316e-05, -2.685748040676117e-05, -2.3876316845417023e-05, -2.0895153284072876e-05, -1.791398972272873e-05, -1.4932826161384583e-05, -1.1951662600040436e-05, -8.970499038696289e-06, -5.989335477352142e-06, -3.0081719160079956e-06, -2.7008354663848877e-08, 2.954155206680298e-06, 5.935318768024445e-06, 8.916482329368591e-06, 1.1897645890712738e-05, 1.4878809452056885e-05, 1.785997301340103e-05, 2.0841136574745178e-05, 2.3822300136089325e-05, 2.680346369743347e-05, 2.978462725877762e-05, 3.2765790820121765e-05, 3.574695438146591e-05, 3.872811794281006e-05, 4.1709281504154205e-05, 4.469044506549835e-05, 4.76716086268425e-05, 5.0652772188186646e-05, 5.363393574953079e-05, 5.661509931087494e-05, 5.9596262872219086e-05, 6.257742643356323e-05, 6.555858999490738e-05, 6.853975355625153e-05, 7.152091711759567e-05, 7.450208067893982e-05, 7.748324424028397e-05, 8.046440780162811e-05, 8.344557136297226e-05, 8.64267349243164e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 6.0, 4.0, 14.0, 14.0, 22.0, 28.0, 48.0, 77.0, 104.0, 138.0, 177.0, 299.0, 401.0, 621.0, 846.0, 1313.0, 1911.0, 3052.0, 4823.0, 7940.0, 13866.0, 24062.0, 49160.0, 126385.0, 492270.0, 185634.0, 63736.0, 30004.0, 16223.0, 9451.0, 5492.0, 3593.0, 2182.0, 1488.0, 1023.0, 631.0, 473.0, 345.0, 202.0, 139.0, 120.0, 79.0, 55.0, 29.0, 16.0, 16.0, 9.0, 12.0, 5.0, 9.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001074075698852539, -0.00010390393435955048, -0.00010040029883384705, -9.689666330814362e-05, -9.339302778244019e-05, -8.988939225673676e-05, -8.638575673103333e-05, -8.28821212053299e-05, -7.937848567962646e-05, -7.587485015392303e-05, -7.23712146282196e-05, -6.886757910251617e-05, -6.536394357681274e-05, -6.186030805110931e-05, -5.8356672525405884e-05, -5.4853036999702454e-05, -5.1349401473999023e-05, -4.784576594829559e-05, -4.434213042259216e-05, -4.083849489688873e-05, -3.73348593711853e-05, -3.383122384548187e-05, -3.0327588319778442e-05, -2.6823952794075012e-05, -2.3320317268371582e-05, -1.9816681742668152e-05, -1.631304621696472e-05, -1.2809410691261292e-05, -9.305775165557861e-06, -5.802139639854431e-06, -2.298504114151001e-06, 1.2051314115524292e-06, 4.708766937255859e-06, 8.21240246295929e-06, 1.171603798866272e-05, 1.521967351436615e-05, 1.872330904006958e-05, 2.222694456577301e-05, 2.573058009147644e-05, 2.923421561717987e-05, 3.27378511428833e-05, 3.624148666858673e-05, 3.974512219429016e-05, 4.324875771999359e-05, 4.675239324569702e-05, 5.025602877140045e-05, 5.375966429710388e-05, 5.726329982280731e-05, 6.076693534851074e-05, 6.427057087421417e-05, 6.77742063999176e-05, 7.127784192562103e-05, 7.478147745132446e-05, 7.828511297702789e-05, 8.178874850273132e-05, 8.529238402843475e-05, 8.879601955413818e-05, 9.229965507984161e-05, 9.580329060554504e-05, 9.930692613124847e-05, 0.0001028105616569519, 0.00010631419718265533, 0.00010981783270835876, 0.0001133214682340622, 0.00011682510375976562]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 4.0, 6.0, 6.0, 12.0, 15.0, 9.0, 16.0, 12.0, 7.0, 22.0, 22.0, 29.0, 23.0, 31.0, 27.0, 34.0, 32.0, 38.0, 42.0, 36.0, 37.0, 33.0, 34.0, 36.0, 47.0, 29.0, 28.0, 36.0, 33.0, 29.0, 29.0, 22.0, 34.0, 22.0, 30.0, 10.0, 17.0, 11.0, 6.0, 7.0, 5.0, 9.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0], "bins": [-5.1081180572509766e-05, -4.956405609846115e-05, -4.804693162441254e-05, -4.652980715036392e-05, -4.501268267631531e-05, -4.349555820226669e-05, -4.197843372821808e-05, -4.0461309254169464e-05, -3.894418478012085e-05, -3.7427060306072235e-05, -3.590993583202362e-05, -3.4392811357975006e-05, -3.287568688392639e-05, -3.135856240987778e-05, -2.9841437935829163e-05, -2.8324313461780548e-05, -2.6807188987731934e-05, -2.529006451368332e-05, -2.3772940039634705e-05, -2.225581556558609e-05, -2.0738691091537476e-05, -1.922156661748886e-05, -1.7704442143440247e-05, -1.6187317669391632e-05, -1.4670193195343018e-05, -1.3153068721294403e-05, -1.1635944247245789e-05, -1.0118819773197174e-05, -8.60169529914856e-06, -7.084570825099945e-06, -5.5674463510513306e-06, -4.050321877002716e-06, -2.5331974029541016e-06, -1.016072928905487e-06, 5.010515451431274e-07, 2.018176019191742e-06, 3.5353004932403564e-06, 5.052424967288971e-06, 6.5695494413375854e-06, 8.0866739153862e-06, 9.603798389434814e-06, 1.1120922863483429e-05, 1.2638047337532043e-05, 1.4155171811580658e-05, 1.5672296285629272e-05, 1.7189420759677887e-05, 1.87065452337265e-05, 2.0223669707775116e-05, 2.174079418182373e-05, 2.3257918655872345e-05, 2.477504312992096e-05, 2.6292167603969574e-05, 2.780929207801819e-05, 2.9326416552066803e-05, 3.084354102611542e-05, 3.236066550016403e-05, 3.3877789974212646e-05, 3.539491444826126e-05, 3.6912038922309875e-05, 3.842916339635849e-05, 3.9946287870407104e-05, 4.146341234445572e-05, 4.2980536818504333e-05, 4.449766129255295e-05, 4.601478576660156e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 7.0, 6.0, 7.0, 14.0, 15.0, 51.0, 59.0, 64.0, 72.0, 118.0, 223.0, 291.0, 491.0, 605.0, 1037.0, 1575.0, 2599.0, 4691.0, 8332.0, 18703.0, 48203.0, 312819.0, 553130.0, 53966.0, 19424.0, 9250.0, 5365.0, 2632.0, 1578.0, 1122.0, 638.0, 462.0, 326.0, 215.0, 125.0, 82.0, 63.0, 63.0, 40.0, 30.0, 15.0, 14.0, 8.0, 8.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2470951080322266e-05, -2.174731343984604e-05, -2.1023675799369812e-05, -2.0300038158893585e-05, -1.957640051841736e-05, -1.885276287794113e-05, -1.8129125237464905e-05, -1.7405487596988678e-05, -1.668184995651245e-05, -1.5958212316036224e-05, -1.5234574675559998e-05, -1.451093703508377e-05, -1.3787299394607544e-05, -1.3063661754131317e-05, -1.234002411365509e-05, -1.1616386473178864e-05, -1.0892748832702637e-05, -1.016911119222641e-05, -9.445473551750183e-06, -8.721835911273956e-06, -7.99819827079773e-06, -7.274560630321503e-06, -6.550922989845276e-06, -5.827285349369049e-06, -5.103647708892822e-06, -4.3800100684165955e-06, -3.6563724279403687e-06, -2.932734787464142e-06, -2.209097146987915e-06, -1.4854595065116882e-06, -7.618218660354614e-07, -3.818422555923462e-08, 6.854534149169922e-07, 1.409091055393219e-06, 2.132728695869446e-06, 2.8563663363456726e-06, 3.5800039768218994e-06, 4.303641617298126e-06, 5.027279257774353e-06, 5.75091689825058e-06, 6.474554538726807e-06, 7.1981921792030334e-06, 7.92182981967926e-06, 8.645467460155487e-06, 9.369105100631714e-06, 1.009274274110794e-05, 1.0816380381584167e-05, 1.1540018022060394e-05, 1.2263655662536621e-05, 1.2987293303012848e-05, 1.3710930943489075e-05, 1.4434568583965302e-05, 1.5158206224441528e-05, 1.5881843864917755e-05, 1.6605481505393982e-05, 1.732911914587021e-05, 1.8052756786346436e-05, 1.8776394426822662e-05, 1.950003206729889e-05, 2.0223669707775116e-05, 2.0947307348251343e-05, 2.167094498872757e-05, 2.2394582629203796e-05, 2.3118220269680023e-05, 2.384185791015625e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 6.0, 7.0, 7.0, 0.0, 11.0, 11.0, 22.0, 0.0, 28.0, 22.0, 20.0, 0.0, 46.0, 52.0, 46.0, 0.0, 58.0, 76.0, 157.0, 74.0, 0.0, 61.0, 65.0, 38.0, 0.0, 51.0, 24.0, 23.0, 0.0, 23.0, 18.0, 12.0, 0.0, 12.0, 10.0, 8.0, 1.0, 0.0, 6.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4444813132286072e-06, -1.3988465070724487e-06, -1.3532117009162903e-06, -1.3075768947601318e-06, -1.2619420886039734e-06, -1.216307282447815e-06, -1.1706724762916565e-06, -1.125037670135498e-06, -1.0794028639793396e-06, -1.0337680578231812e-06, -9.881332516670227e-07, -9.424984455108643e-07, -8.968636393547058e-07, -8.512288331985474e-07, -8.055940270423889e-07, -7.599592208862305e-07, -7.14324414730072e-07, -6.686896085739136e-07, -6.230548024177551e-07, -5.774199962615967e-07, -5.317851901054382e-07, -4.861503839492798e-07, -4.4051557779312134e-07, -3.948807716369629e-07, -3.4924596548080444e-07, -3.03611159324646e-07, -2.5797635316848755e-07, -2.123415470123291e-07, -1.6670674085617065e-07, -1.210719347000122e-07, -7.543712854385376e-08, -2.9802322387695312e-08, 1.5832483768463135e-08, 6.146728992462158e-08, 1.0710209608078003e-07, 1.5273690223693848e-07, 1.9837170839309692e-07, 2.4400651454925537e-07, 2.896413207054138e-07, 3.3527612686157227e-07, 3.809109330177307e-07, 4.2654573917388916e-07, 4.721805453300476e-07, 5.178153514862061e-07, 5.634501576423645e-07, 6.09084963798523e-07, 6.547197699546814e-07, 7.003545761108398e-07, 7.459893822669983e-07, 7.916241884231567e-07, 8.372589945793152e-07, 8.828938007354736e-07, 9.285286068916321e-07, 9.741634130477905e-07, 1.019798219203949e-06, 1.0654330253601074e-06, 1.1110678315162659e-06, 1.1567026376724243e-06, 1.2023374438285828e-06, 1.2479722499847412e-06, 1.2936070561408997e-06, 1.339241862297058e-06, 1.3848766684532166e-06, 1.430511474609375e-06]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 7.0, 20.0, 28.0, 35.0, 69.0, 82.0, 188.0, 307.0, 612.0, 1291.0, 3712.0, 11071.0, 45101.0, 514086.0, 413749.0, 41677.0, 10351.0, 3388.0, 1393.0, 610.0, 322.0, 166.0, 103.0, 58.0, 37.0, 25.0, 14.0, 16.0, 8.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.641843795776367e-05, -3.516208380460739e-05, -3.390572965145111e-05, -3.264937549829483e-05, -3.139302134513855e-05, -3.013666719198227e-05, -2.888031303882599e-05, -2.7623958885669708e-05, -2.6367604732513428e-05, -2.5111250579357147e-05, -2.3854896426200867e-05, -2.2598542273044586e-05, -2.1342188119888306e-05, -2.0085833966732025e-05, -1.8829479813575745e-05, -1.7573125660419464e-05, -1.6316771507263184e-05, -1.5060417354106903e-05, -1.3804063200950623e-05, -1.2547709047794342e-05, -1.1291354894638062e-05, -1.0035000741481781e-05, -8.7786465883255e-06, -7.52229243516922e-06, -6.2659382820129395e-06, -5.009584128856659e-06, -3.7532299757003784e-06, -2.496875822544098e-06, -1.2405216693878174e-06, 1.5832483768463135e-08, 1.2721866369247437e-06, 2.528540790081024e-06, 3.7848949432373047e-06, 5.041249096393585e-06, 6.297603249549866e-06, 7.553957402706146e-06, 8.810311555862427e-06, 1.0066665709018707e-05, 1.1323019862174988e-05, 1.2579374015331268e-05, 1.3835728168487549e-05, 1.509208232164383e-05, 1.634843647480011e-05, 1.760479062795639e-05, 1.886114478111267e-05, 2.011749893426895e-05, 2.1373853087425232e-05, 2.2630207240581512e-05, 2.3886561393737793e-05, 2.5142915546894073e-05, 2.6399269700050354e-05, 2.7655623853206635e-05, 2.8911978006362915e-05, 3.0168332159519196e-05, 3.1424686312675476e-05, 3.2681040465831757e-05, 3.393739461898804e-05, 3.519374877214432e-05, 3.64501029253006e-05, 3.770645707845688e-05, 3.896281123161316e-05, 4.021916538476944e-05, 4.147551953792572e-05, 4.2731873691082e-05, 4.398822784423828e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 6.0, 20.0, 19.0, 25.0, 29.0, 32.0, 59.0, 59.0, 79.0, 106.0, 120.0, 103.0, 76.0, 55.0, 43.0, 32.0, 25.0, 20.0, 17.0, 17.0, 9.0, 8.0, 7.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.258487701416016e-06, -6.080605089664459e-06, -5.902722477912903e-06, -5.7248398661613464e-06, -5.54695725440979e-06, -5.369074642658234e-06, -5.191192030906677e-06, -5.013309419155121e-06, -4.8354268074035645e-06, -4.657544195652008e-06, -4.479661583900452e-06, -4.301778972148895e-06, -4.123896360397339e-06, -3.9460137486457825e-06, -3.768131136894226e-06, -3.5902485251426697e-06, -3.4123659133911133e-06, -3.234483301639557e-06, -3.0566006898880005e-06, -2.878718078136444e-06, -2.7008354663848877e-06, -2.5229528546333313e-06, -2.345070242881775e-06, -2.1671876311302185e-06, -1.989305019378662e-06, -1.8114224076271057e-06, -1.6335397958755493e-06, -1.455657184123993e-06, -1.2777745723724365e-06, -1.0998919606208801e-06, -9.220093488693237e-07, -7.441267371177673e-07, -5.662441253662109e-07, -3.8836151361465454e-07, -2.1047890186309814e-07, -3.259629011154175e-08, 1.4528632164001465e-07, 3.2316893339157104e-07, 5.010515451431274e-07, 6.789341568946838e-07, 8.568167686462402e-07, 1.0346993803977966e-06, 1.212581992149353e-06, 1.3904646039009094e-06, 1.5683472156524658e-06, 1.7462298274040222e-06, 1.9241124391555786e-06, 2.101995050907135e-06, 2.2798776626586914e-06, 2.457760274410248e-06, 2.635642886161804e-06, 2.8135254979133606e-06, 2.991408109664917e-06, 3.1692907214164734e-06, 3.3471733331680298e-06, 3.525055944919586e-06, 3.7029385566711426e-06, 3.880821168422699e-06, 4.058703780174255e-06, 4.236586391925812e-06, 4.414469003677368e-06, 4.5923516154289246e-06, 4.770234227180481e-06, 4.948116838932037e-06, 5.125999450683594e-06]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 4.0, 4.0, 9.0, 14.0, 12.0, 15.0, 21.0, 36.0, 43.0, 62.0, 99.0, 131.0, 152.0, 131.0, 66.0, 48.0, 38.0, 27.0, 19.0, 16.0, 10.0, 7.0, 9.0, 6.0, 6.0, 4.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013595583732239902, -0.0001314588589593768, -0.00012696189514826983, -0.00012246491678524762, -0.00011796794569818303, -0.00011347097461111844, -0.00010897400352405384, -0.00010447703243698925, -9.998005407396704e-05, -9.548308298690245e-05, -9.098611189983785e-05, -8.648913353681564e-05, -8.199216244975105e-05, -7.749519136268646e-05, -7.299822027562186e-05, -6.850124918855727e-05, -6.400427810149267e-05, -5.950730701442808e-05, -5.501033228938468e-05, -5.0513361202320084e-05, -4.601638647727668e-05, -4.151941539021209e-05, -3.7022444303147495e-05, -3.2525469578104094e-05, -2.80284984910395e-05, -2.3531525584985502e-05, -1.9034552678931504e-05, -1.453758159186691e-05, -1.0040608685812913e-05, -5.543635779758915e-06, -1.0466646926943213e-06, 3.45031003234908e-06, 7.947281119413674e-06, 1.2444254025467671e-05, 1.694122693152167e-05, 2.1438198018586263e-05, 2.593517092464026e-05, 3.0432143830694258e-05, 3.492911491775885e-05, 3.942608964280225e-05, 4.392306072986685e-05, 4.842003181693144e-05, 5.291700654197484e-05, 5.7413977629039437e-05, 6.191094871610403e-05, 6.640792707912624e-05, 7.090489089023322e-05, 7.540186925325543e-05, 7.989884034032002e-05, 8.439581142738461e-05, 8.889278251444921e-05, 9.33897536015138e-05, 9.788673196453601e-05, 0.0001023837030516006, 0.0001068806741386652, 0.00011137765250168741, 0.00011587461631279439, 0.00012037158739985898, 0.00012486855848692358, 0.00012936553684994578, 0.00013386250066105276, 0.00013835947902407497, 0.00014285644283518195, 0.00014735342119820416, 0.00015185039956122637]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 1.0, 8.0, 5.0, 7.0, 16.0, 12.0, 19.0, 18.0, 20.0, 25.0, 38.0, 35.0, 31.0, 33.0, 28.0, 48.0, 36.0, 40.0, 47.0, 46.0, 44.0, 47.0, 47.0, 43.0, 32.0, 46.0, 33.0, 31.0, 21.0, 16.0, 27.0, 23.0, 9.0, 14.0, 17.0, 11.0, 9.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.300171950599179e-05, -9.035928087541834e-05, -8.771684224484488e-05, -8.507440361427143e-05, -8.243196498369798e-05, -7.978952635312453e-05, -7.714709499850869e-05, -7.450465636793524e-05, -7.186221773736179e-05, -6.921977910678834e-05, -6.657734047621489e-05, -6.393490184564143e-05, -6.129246321506798e-05, -5.865002458449453e-05, -5.600758959189989e-05, -5.3365150961326435e-05, -5.0722708692774177e-05, -4.8080270062200725e-05, -4.5437831431627274e-05, -4.279539280105382e-05, -4.015295417048037e-05, -3.751051553990692e-05, -3.4868080547312275e-05, -3.222564191673882e-05, -2.958320328616537e-05, -2.694076465559192e-05, -2.429832602501847e-05, -2.165588921343442e-05, -1.901345058286097e-05, -1.6371011952287517e-05, -1.372857514070347e-05, -1.1086136510130018e-05, -8.443690603598952e-06, -5.801252427772852e-06, -3.158814251946751e-06, -5.163765308680013e-07, 2.1260620997054502e-06, 4.768500730278902e-06, 7.41093754186295e-06, 1.0053376172436401e-05, 1.2695814803009853e-05, 1.5338253433583304e-05, 1.7980692064156756e-05, 2.0623128875740804e-05, 2.3265567506314255e-05, 2.5908006136887707e-05, 2.8550442948471755e-05, 3.1192881579045206e-05, 3.383532020961866e-05, 3.647775884019211e-05, 3.912019747076556e-05, 4.176263610133901e-05, 4.4405074731912464e-05, 4.7047513362485915e-05, 4.968994835508056e-05, 5.233238698565401e-05, 5.497482561622746e-05, 5.7617264246800914e-05, 6.0259702877374366e-05, 6.290213786996901e-05, 6.554457650054246e-05, 6.818701513111591e-05, 7.082945376168936e-05, 7.347189239226282e-05, 7.611433102283627e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 11.0, 11.0, 19.0, 25.0, 29.0, 44.0, 61.0, 70.0, 143.0, 191.0, 306.0, 429.0, 612.0, 962.0, 1458.0, 2226.0, 3438.0, 5255.0, 7980.0, 12741.0, 20548.0, 33667.0, 57456.0, 105816.0, 243400.0, 273947.0, 118802.0, 62746.0, 35989.0, 21678.0, 13659.0, 8676.0, 5540.0, 3628.0, 2367.0, 1518.0, 999.0, 689.0, 454.0, 304.0, 194.0, 142.0, 97.0, 74.0, 44.0, 40.0, 15.0, 24.0, 11.0, 7.0, 3.0, 5.0, 3.0, 6.0, 1.0, 2.0], "bins": [-0.00017333030700683594, -0.00016808882355690002, -0.0001628473401069641, -0.0001576058566570282, -0.00015236437320709229, -0.00014712288975715637, -0.00014188140630722046, -0.00013663992285728455, -0.00013139843940734863, -0.00012615695595741272, -0.0001209154725074768, -0.0001156739890575409, -0.00011043250560760498, -0.00010519102215766907, -9.994953870773315e-05, -9.470805525779724e-05, -8.946657180786133e-05, -8.422508835792542e-05, -7.89836049079895e-05, -7.374212145805359e-05, -6.850063800811768e-05, -6.325915455818176e-05, -5.801767110824585e-05, -5.2776187658309937e-05, -4.7534704208374023e-05, -4.229322075843811e-05, -3.70517373085022e-05, -3.1810253858566284e-05, -2.656877040863037e-05, -2.1327286958694458e-05, -1.6085803508758545e-05, -1.0844320058822632e-05, -5.602836608886719e-06, -3.6135315895080566e-07, 4.880130290985107e-06, 1.012161374092102e-05, 1.5363097190856934e-05, 2.0604580640792847e-05, 2.584606409072876e-05, 3.108754754066467e-05, 3.6329030990600586e-05, 4.15705144405365e-05, 4.681199789047241e-05, 5.2053481340408325e-05, 5.729496479034424e-05, 6.253644824028015e-05, 6.777793169021606e-05, 7.301941514015198e-05, 7.826089859008789e-05, 8.35023820400238e-05, 8.874386548995972e-05, 9.398534893989563e-05, 9.922683238983154e-05, 0.00010446831583976746, 0.00010970979928970337, 0.00011495128273963928, 0.0001201927661895752, 0.0001254342496395111, 0.00013067573308944702, 0.00013591721653938293, 0.00014115869998931885, 0.00014640018343925476, 0.00015164166688919067, 0.0001568831503391266, 0.0001621246337890625]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 8.0, 6.0, 6.0, 8.0, 14.0, 13.0, 14.0, 13.0, 22.0, 22.0, 31.0, 19.0, 36.0, 38.0, 22.0, 33.0, 37.0, 31.0, 41.0, 37.0, 31.0, 49.0, 45.0, 37.0, 37.0, 36.0, 35.0, 39.0, 28.0, 29.0, 23.0, 26.0, 15.0, 18.0, 18.0, 12.0, 7.0, 11.0, 12.0, 7.0, 10.0, 5.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-4.5299530029296875e-05, -4.3925829231739044e-05, -4.255212843418121e-05, -4.117842763662338e-05, -3.980472683906555e-05, -3.843102604150772e-05, -3.705732524394989e-05, -3.568362444639206e-05, -3.430992364883423e-05, -3.29362228512764e-05, -3.156252205371857e-05, -3.0188821256160736e-05, -2.8815120458602905e-05, -2.7441419661045074e-05, -2.6067718863487244e-05, -2.4694018065929413e-05, -2.3320317268371582e-05, -2.194661647081375e-05, -2.057291567325592e-05, -1.919921487569809e-05, -1.782551407814026e-05, -1.6451813280582428e-05, -1.5078112483024597e-05, -1.3704411685466766e-05, -1.2330710887908936e-05, -1.0957010090351105e-05, -9.583309292793274e-06, -8.209608495235443e-06, -6.835907697677612e-06, -5.4622069001197815e-06, -4.088506102561951e-06, -2.71480530500412e-06, -1.341104507446289e-06, 3.259629011154175e-08, 1.4062970876693726e-06, 2.7799978852272034e-06, 4.153698682785034e-06, 5.527399480342865e-06, 6.901100277900696e-06, 8.274801075458527e-06, 9.648501873016357e-06, 1.1022202670574188e-05, 1.2395903468132019e-05, 1.376960426568985e-05, 1.514330506324768e-05, 1.651700586080551e-05, 1.7890706658363342e-05, 1.9264407455921173e-05, 2.0638108253479004e-05, 2.2011809051036835e-05, 2.3385509848594666e-05, 2.4759210646152496e-05, 2.6132911443710327e-05, 2.7506612241268158e-05, 2.888031303882599e-05, 3.025401383638382e-05, 3.162771463394165e-05, 3.300141543149948e-05, 3.437511622905731e-05, 3.574881702661514e-05, 3.7122517824172974e-05, 3.8496218621730804e-05, 3.9869919419288635e-05, 4.1243620216846466e-05, 4.26173210144043e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 6.0, 5.0, 20.0, 15.0, 18.0, 35.0, 43.0, 65.0, 77.0, 121.0, 212.0, 338.0, 631.0, 1274.0, 2912.0, 7074.0, 17797.0, 49007.0, 156867.0, 537493.0, 185179.0, 55160.0, 19934.0, 7851.0, 3240.0, 1429.0, 754.0, 360.0, 205.0, 146.0, 89.0, 55.0, 41.0, 23.0, 19.0, 16.0, 9.0, 10.0, 8.0, 3.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003120899200439453, -0.00030355341732501984, -0.00029501691460609436, -0.0002864804118871689, -0.0002779439091682434, -0.00026940740644931793, -0.00026087090373039246, -0.000252334401011467, -0.0002437978982925415, -0.00023526139557361603, -0.00022672489285469055, -0.00021818839013576508, -0.0002096518874168396, -0.00020111538469791412, -0.00019257888197898865, -0.00018404237926006317, -0.0001755058765411377, -0.00016696937382221222, -0.00015843287110328674, -0.00014989636838436127, -0.0001413598656654358, -0.00013282336294651031, -0.00012428686022758484, -0.00011575035750865936, -0.00010721385478973389, -9.867735207080841e-05, -9.014084935188293e-05, -8.160434663295746e-05, -7.306784391403198e-05, -6.45313411951065e-05, -5.599483847618103e-05, -4.7458335757255554e-05, -3.892183303833008e-05, -3.0385330319404602e-05, -2.1848827600479126e-05, -1.331232488155365e-05, -4.775822162628174e-06, 3.7606805562973022e-06, 1.2297183275222778e-05, 2.0833685994148254e-05, 2.937018871307373e-05, 3.7906691431999207e-05, 4.644319415092468e-05, 5.497969686985016e-05, 6.351619958877563e-05, 7.205270230770111e-05, 8.058920502662659e-05, 8.912570774555206e-05, 9.766221046447754e-05, 0.00010619871318340302, 0.00011473521590232849, 0.00012327171862125397, 0.00013180822134017944, 0.00014034472405910492, 0.0001488812267780304, 0.00015741772949695587, 0.00016595423221588135, 0.00017449073493480682, 0.0001830272376537323, 0.00019156374037265778, 0.00020010024309158325, 0.00020863674581050873, 0.0002171732485294342, 0.00022570975124835968, 0.00023424625396728516]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 4.0, 4.0, 4.0, 2.0, 11.0, 9.0, 11.0, 14.0, 26.0, 20.0, 32.0, 23.0, 46.0, 42.0, 30.0, 26.0, 29.0, 40.0, 39.0, 49.0, 52.0, 51.0, 40.0, 43.0, 46.0, 42.0, 34.0, 27.0, 34.0, 29.0, 30.0, 20.0, 21.0, 14.0, 16.0, 8.0, 7.0, 15.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9696693420410156e-05, -3.825780004262924e-05, -3.681890666484833e-05, -3.538001328706741e-05, -3.39411199092865e-05, -3.2502226531505585e-05, -3.106333315372467e-05, -2.9624439775943756e-05, -2.8185546398162842e-05, -2.6746653020381927e-05, -2.5307759642601013e-05, -2.38688662648201e-05, -2.2429972887039185e-05, -2.099107950925827e-05, -1.9552186131477356e-05, -1.811329275369644e-05, -1.6674399375915527e-05, -1.5235505998134613e-05, -1.3796612620353699e-05, -1.2357719242572784e-05, -1.091882586479187e-05, -9.479932487010956e-06, -8.041039109230042e-06, -6.602145731449127e-06, -5.163252353668213e-06, -3.7243589758872986e-06, -2.2854655981063843e-06, -8.4657222032547e-07, 5.923211574554443e-07, 2.0312145352363586e-06, 3.470107913017273e-06, 4.909001290798187e-06, 6.3478946685791016e-06, 7.786788046360016e-06, 9.22568142414093e-06, 1.0664574801921844e-05, 1.2103468179702759e-05, 1.3542361557483673e-05, 1.4981254935264587e-05, 1.6420148313045502e-05, 1.7859041690826416e-05, 1.929793506860733e-05, 2.0736828446388245e-05, 2.217572182416916e-05, 2.3614615201950073e-05, 2.5053508579730988e-05, 2.6492401957511902e-05, 2.7931295335292816e-05, 2.937018871307373e-05, 3.0809082090854645e-05, 3.224797546863556e-05, 3.3686868846416473e-05, 3.512576222419739e-05, 3.65646556019783e-05, 3.8003548979759216e-05, 3.944244235754013e-05, 4.0881335735321045e-05, 4.232022911310196e-05, 4.3759122490882874e-05, 4.519801586866379e-05, 4.66369092464447e-05, 4.8075802624225616e-05, 4.951469600200653e-05, 5.0953589379787445e-05, 5.239248275756836e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 4.0, 8.0, 15.0, 10.0, 24.0, 35.0, 18.0, 77.0, 60.0, 155.0, 243.0, 249.0, 663.0, 700.0, 2081.0, 2818.0, 9475.0, 32303.0, 89156.0, 772305.0, 89203.0, 32226.0, 7308.0, 4910.0, 2123.0, 759.0, 652.0, 288.0, 225.0, 181.0, 68.0, 73.0, 31.0, 25.0, 18.0, 20.0, 13.0, 10.0, 6.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.304813385009766e-06, -5.151145160198212e-06, -4.997476935386658e-06, -4.843808710575104e-06, -4.69014048576355e-06, -4.536472260951996e-06, -4.382804036140442e-06, -4.229135811328888e-06, -4.075467586517334e-06, -3.92179936170578e-06, -3.768131136894226e-06, -3.614462912082672e-06, -3.460794687271118e-06, -3.307126462459564e-06, -3.1534582376480103e-06, -2.9997900128364563e-06, -2.8461217880249023e-06, -2.6924535632133484e-06, -2.5387853384017944e-06, -2.3851171135902405e-06, -2.2314488887786865e-06, -2.0777806639671326e-06, -1.9241124391555786e-06, -1.7704442143440247e-06, -1.6167759895324707e-06, -1.4631077647209167e-06, -1.3094395399093628e-06, -1.1557713150978088e-06, -1.0021030902862549e-06, -8.484348654747009e-07, -6.94766640663147e-07, -5.41098415851593e-07, -3.8743019104003906e-07, -2.337619662284851e-07, -8.009374141693115e-08, 7.35744833946228e-08, 2.2724270820617676e-07, 3.809109330177307e-07, 5.345791578292847e-07, 6.882473826408386e-07, 8.419156074523926e-07, 9.955838322639465e-07, 1.1492520570755005e-06, 1.3029202818870544e-06, 1.4565885066986084e-06, 1.6102567315101624e-06, 1.7639249563217163e-06, 1.9175931811332703e-06, 2.0712614059448242e-06, 2.224929630756378e-06, 2.378597855567932e-06, 2.532266080379486e-06, 2.68593430519104e-06, 2.839602530002594e-06, 2.993270754814148e-06, 3.146938979625702e-06, 3.300607204437256e-06, 3.45427542924881e-06, 3.6079436540603638e-06, 3.7616118788719177e-06, 3.915280103683472e-06, 4.068948328495026e-06, 4.22261655330658e-06, 4.3762847781181335e-06, 4.5299530029296875e-06]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 121.0, 0.0, 0.0, 0.0, 0.0, 0.0, 751.0, 0.0, 0.0, 0.0, 0.0, 103.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.46451997756958e-07, -3.3527612686157227e-07, -3.241002559661865e-07, -3.129243850708008e-07, -3.0174851417541504e-07, -2.905726432800293e-07, -2.7939677238464355e-07, -2.682209014892578e-07, -2.5704503059387207e-07, -2.4586915969848633e-07, -2.3469328880310059e-07, -2.2351741790771484e-07, -2.123415470123291e-07, -2.0116567611694336e-07, -1.8998980522155762e-07, -1.7881393432617188e-07, -1.6763806343078613e-07, -1.564621925354004e-07, -1.4528632164001465e-07, -1.341104507446289e-07, -1.2293457984924316e-07, -1.1175870895385742e-07, -1.0058283805847168e-07, -8.940696716308594e-08, -7.82310962677002e-08, -6.705522537231445e-08, -5.587935447692871e-08, -4.470348358154297e-08, -3.3527612686157227e-08, -2.2351741790771484e-08, -1.1175870895385742e-08, 0.0, 1.1175870895385742e-08, 2.2351741790771484e-08, 3.3527612686157227e-08, 4.470348358154297e-08, 5.587935447692871e-08, 6.705522537231445e-08, 7.82310962677002e-08, 8.940696716308594e-08, 1.0058283805847168e-07, 1.1175870895385742e-07, 1.2293457984924316e-07, 1.341104507446289e-07, 1.4528632164001465e-07, 1.564621925354004e-07, 1.6763806343078613e-07, 1.7881393432617188e-07, 1.8998980522155762e-07, 2.0116567611694336e-07, 2.123415470123291e-07, 2.2351741790771484e-07, 2.3469328880310059e-07, 2.4586915969848633e-07, 2.5704503059387207e-07, 2.682209014892578e-07, 2.7939677238464355e-07, 2.905726432800293e-07, 3.0174851417541504e-07, 3.129243850708008e-07, 3.241002559661865e-07, 3.3527612686157227e-07, 3.46451997756958e-07, 3.5762786865234375e-07]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 6.0, 4.0, 0.0, 1.0, 12.0, 0.0, 6.0, 4.0, 34.0, 1.0, 22.0, 28.0, 72.0, 27.0, 142.0, 101.0, 478.0, 398.0, 1643.0, 1599.0, 8818.0, 11080.0, 73471.0, 157056.0, 695052.0, 52450.0, 32749.0, 5380.0, 5040.0, 1063.0, 946.0, 265.0, 267.0, 108.0, 69.0, 30.0, 64.0, 25.0, 5.0, 8.0, 30.0, 1.0, 1.0, 1.0, 8.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.2186508178710938e-06, -3.129243850708008e-06, -3.039836883544922e-06, -2.950429916381836e-06, -2.86102294921875e-06, -2.771615982055664e-06, -2.682209014892578e-06, -2.592802047729492e-06, -2.5033950805664062e-06, -2.4139881134033203e-06, -2.3245811462402344e-06, -2.2351741790771484e-06, -2.1457672119140625e-06, -2.0563602447509766e-06, -1.9669532775878906e-06, -1.8775463104248047e-06, -1.7881393432617188e-06, -1.6987323760986328e-06, -1.6093254089355469e-06, -1.519918441772461e-06, -1.430511474609375e-06, -1.341104507446289e-06, -1.2516975402832031e-06, -1.1622905731201172e-06, -1.0728836059570312e-06, -9.834766387939453e-07, -8.940696716308594e-07, -8.046627044677734e-07, -7.152557373046875e-07, -6.258487701416016e-07, -5.364418029785156e-07, -4.470348358154297e-07, -3.5762786865234375e-07, -2.682209014892578e-07, -1.7881393432617188e-07, -8.940696716308594e-08, 0.0, 8.940696716308594e-08, 1.7881393432617188e-07, 2.682209014892578e-07, 3.5762786865234375e-07, 4.470348358154297e-07, 5.364418029785156e-07, 6.258487701416016e-07, 7.152557373046875e-07, 8.046627044677734e-07, 8.940696716308594e-07, 9.834766387939453e-07, 1.0728836059570312e-06, 1.1622905731201172e-06, 1.2516975402832031e-06, 1.341104507446289e-06, 1.430511474609375e-06, 1.519918441772461e-06, 1.6093254089355469e-06, 1.6987323760986328e-06, 1.7881393432617188e-06, 1.8775463104248047e-06, 1.9669532775878906e-06, 2.0563602447509766e-06, 2.1457672119140625e-06, 2.2351741790771484e-06, 2.3245811462402344e-06, 2.4139881134033203e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 28.0, 0.0, 0.0, 0.0, 41.0, 0.0, 0.0, 0.0, 74.0, 0.0, 0.0, 0.0, 195.0, 0.0, 0.0, 0.0, 296.0, 0.0, 0.0, 0.0, 189.0, 0.0, 0.0, 0.0, 108.0, 0.0, 0.0, 0.0, 41.0, 0.0, 0.0, 0.0, 25.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.023313522338867e-07, -3.8743019104003906e-07, -3.725290298461914e-07, -3.5762786865234375e-07, -3.427267074584961e-07, -3.2782554626464844e-07, -3.129243850708008e-07, -2.980232238769531e-07, -2.8312206268310547e-07, -2.682209014892578e-07, -2.5331974029541016e-07, -2.384185791015625e-07, -2.2351741790771484e-07, -2.086162567138672e-07, -1.9371509552001953e-07, -1.7881393432617188e-07, -1.6391277313232422e-07, -1.4901161193847656e-07, -1.341104507446289e-07, -1.1920928955078125e-07, -1.043081283569336e-07, -8.940696716308594e-08, -7.450580596923828e-08, -5.960464477539063e-08, -4.470348358154297e-08, -2.9802322387695312e-08, -1.4901161193847656e-08, 0.0, 1.4901161193847656e-08, 2.9802322387695312e-08, 4.470348358154297e-08, 5.960464477539063e-08, 7.450580596923828e-08, 8.940696716308594e-08, 1.043081283569336e-07, 1.1920928955078125e-07, 1.341104507446289e-07, 1.4901161193847656e-07, 1.6391277313232422e-07, 1.7881393432617188e-07, 1.9371509552001953e-07, 2.086162567138672e-07, 2.2351741790771484e-07, 2.384185791015625e-07, 2.5331974029541016e-07, 2.682209014892578e-07, 2.8312206268310547e-07, 2.980232238769531e-07, 3.129243850708008e-07, 3.2782554626464844e-07, 3.427267074584961e-07, 3.5762786865234375e-07, 3.725290298461914e-07, 3.8743019104003906e-07, 4.023313522338867e-07, 4.172325134277344e-07, 4.3213367462158203e-07, 4.470348358154297e-07, 4.6193599700927734e-07, 4.76837158203125e-07, 4.917383193969727e-07, 5.066394805908203e-07, 5.21540641784668e-07, 5.364418029785156e-07]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 8.0, 3.0, 15.0, 15.0, 26.0, 30.0, 60.0, 109.0, 181.0, 227.0, 124.0, 61.0, 42.0, 30.0, 26.0, 13.0, 11.0, 8.0, 1.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013294802920427173, -0.00012893248640466481, -0.0001249169436050579, -0.00012090140808140859, -0.00011688586528180167, -0.00011287032975815237, -0.00010885478695854545, -0.00010483924415893853, -0.00010082370135933161, -9.680815855972469e-05, -9.279262303607538e-05, -8.877708023646846e-05, -8.476153743686154e-05, -8.074600191321224e-05, -7.673045911360532e-05, -7.27149163139984e-05, -6.86993807903491e-05, -6.468383799074218e-05, -6.0668298829114065e-05, -5.665275966748595e-05, -5.263721686787903e-05, -4.862167770625092e-05, -4.460613854462281e-05, -4.059059574501589e-05, -3.657505658338778e-05, -3.2559517421759665e-05, -2.8543974622152746e-05, -2.4528435460524634e-05, -2.0512894479907118e-05, -1.6497353499289602e-05, -1.248181433766149e-05, -8.466273357043974e-06, -4.450732376426458e-06, -4.351918505562935e-07, 3.5803486753138714e-06, 7.595888746436685e-06, 1.1611429727054201e-05, 1.5626970707671717e-05, 1.964250986929983e-05, 2.3658050849917345e-05, 2.767359183053486e-05, 3.168913099216297e-05, 3.570467379176989e-05, 3.9720212953398004e-05, 4.3735752115026116e-05, 4.7751294914633036e-05, 5.176683407626115e-05, 5.578237323788926e-05, 5.979791603749618e-05, 6.38134588371031e-05, 6.78289943607524e-05, 7.184453716035932e-05, 7.586007995996624e-05, 7.987562275957316e-05, 8.389115828322247e-05, 8.790670108282939e-05, 9.192223660647869e-05, 9.593777940608561e-05, 9.995331492973492e-05, 0.00010396885772934183, 0.00010798440052894875, 0.00011199993605259806, 0.00011601547885220498, 0.0001200310216518119, 0.00012404656445141882]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 4.0, 11.0, 7.0, 9.0, 7.0, 15.0, 11.0, 18.0, 20.0, 25.0, 27.0, 33.0, 34.0, 28.0, 28.0, 48.0, 46.0, 33.0, 51.0, 46.0, 49.0, 58.0, 31.0, 35.0, 43.0, 44.0, 35.0, 29.0, 27.0, 18.0, 17.0, 17.0, 14.0, 13.0, 15.0, 9.0, 5.0, 7.0, 3.0, 7.0, 8.0, 3.0, 2.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.312470966600813e-05, -5.145422255736776e-05, -4.978373908670619e-05, -4.811325197806582e-05, -4.6442764869425446e-05, -4.477228139876388e-05, -4.310179429012351e-05, -4.143131081946194e-05, -3.976082371082157e-05, -3.8090336602181196e-05, -3.641985313151963e-05, -3.474936602287926e-05, -3.307888255221769e-05, -3.140839544357732e-05, -2.9737908334936947e-05, -2.8067423045285977e-05, -2.6396937755635008e-05, -2.472645246598404e-05, -2.305596717633307e-05, -2.1385480067692697e-05, -1.9714994778041728e-05, -1.804450948839076e-05, -1.6374022379750386e-05, -1.4703537090099417e-05, -1.3033051800448447e-05, -1.1362566510797478e-05, -9.692080311651807e-06, -8.021594112506136e-06, -6.351108822855167e-06, -4.680623533204198e-06, -3.010137334058527e-06, -1.339651134912856e-06, 3.308341547381133e-07, 2.0013198991364334e-06, 3.6718056435347535e-06, 5.3422913879330736e-06, 7.012777132331394e-06, 8.683262421982363e-06, 1.0353748621128034e-05, 1.2024234820273705e-05, 1.3694720109924674e-05, 1.5365205399575643e-05, 1.7035690689226612e-05, 1.8706177797866985e-05, 2.0376663087517954e-05, 2.2047148377168924e-05, 2.3717635485809296e-05, 2.5388120775460266e-05, 2.7058606065111235e-05, 2.8729091354762204e-05, 3.0399576644413173e-05, 3.2070063753053546e-05, 3.374055086169392e-05, 3.5411034332355484e-05, 3.708152144099586e-05, 3.875200491165742e-05, 4.0422492020297796e-05, 4.209297912893817e-05, 4.3763462599599734e-05, 4.543394970824011e-05, 4.710443317890167e-05, 4.8774920287542045e-05, 5.044540739618242e-05, 5.211589450482279e-05, 5.3786377975484356e-05]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 8.0, 6.0, 5.0, 8.0, 18.0, 12.0, 23.0, 32.0, 46.0, 56.0, 78.0, 93.0, 145.0, 205.0, 281.0, 409.0, 586.0, 850.0, 1320.0, 2037.0, 3282.0, 6316.0, 25756.0, 3559799.0, 564599.0, 14020.0, 5459.0, 2979.0, 1830.0, 1090.0, 848.0, 573.0, 389.0, 295.0, 204.0, 170.0, 128.0, 89.0, 64.0, 41.0, 34.0, 20.0, 18.0, 18.0, 15.0, 12.0, 5.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0001697540283203125, -0.00016443058848381042, -0.00015910714864730835, -0.00015378370881080627, -0.0001484602689743042, -0.00014313682913780212, -0.00013781338930130005, -0.00013248994946479797, -0.0001271665096282959, -0.00012184306979179382, -0.00011651962995529175, -0.00011119619011878967, -0.0001058727502822876, -0.00010054931044578552, -9.522587060928345e-05, -8.990243077278137e-05, -8.45789909362793e-05, -7.925555109977722e-05, -7.393211126327515e-05, -6.860867142677307e-05, -6.3285231590271e-05, -5.796179175376892e-05, -5.2638351917266846e-05, -4.731491208076477e-05, -4.1991472244262695e-05, -3.666803240776062e-05, -3.1344592571258545e-05, -2.602115273475647e-05, -2.0697712898254395e-05, -1.537427306175232e-05, -1.0050833225250244e-05, -4.727393388748169e-06, 5.960464477539062e-07, 5.9194862842559814e-06, 1.1242926120758057e-05, 1.6566365957260132e-05, 2.1889805793762207e-05, 2.7213245630264282e-05, 3.253668546676636e-05, 3.786012530326843e-05, 4.318356513977051e-05, 4.850700497627258e-05, 5.383044481277466e-05, 5.9153884649276733e-05, 6.447732448577881e-05, 6.980076432228088e-05, 7.512420415878296e-05, 8.044764399528503e-05, 8.577108383178711e-05, 9.109452366828918e-05, 9.641796350479126e-05, 0.00010174140334129333, 0.00010706484317779541, 0.00011238828301429749, 0.00011771172285079956, 0.00012303516268730164, 0.0001283586025238037, 0.00013368204236030579, 0.00013900548219680786, 0.00014432892203330994, 0.000149652361869812, 0.0001549758017063141, 0.00016029924154281616, 0.00016562268137931824, 0.0001709461212158203]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 0.0, 3.0, 5.0, 6.0, 3.0, 11.0, 6.0, 12.0, 13.0, 12.0, 22.0, 29.0, 26.0, 37.0, 30.0, 26.0, 35.0, 47.0, 46.0, 39.0, 52.0, 59.0, 51.0, 58.0, 34.0, 43.0, 42.0, 35.0, 35.0, 23.0, 31.0, 11.0, 18.0, 16.0, 15.0, 14.0, 13.0, 9.0, 8.0, 3.0, 6.0, 2.0, 7.0, 6.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.6133995056152344e-05, -4.467647522687912e-05, -4.3218955397605896e-05, -4.176143556833267e-05, -4.030391573905945e-05, -3.8846395909786224e-05, -3.7388876080513e-05, -3.5931356251239777e-05, -3.447383642196655e-05, -3.301631659269333e-05, -3.1558796763420105e-05, -3.010127693414688e-05, -2.8643757104873657e-05, -2.7186237275600433e-05, -2.572871744632721e-05, -2.4271197617053986e-05, -2.2813677787780762e-05, -2.1356157958507538e-05, -1.9898638129234314e-05, -1.844111829996109e-05, -1.6983598470687866e-05, -1.5526078641414642e-05, -1.4068558812141418e-05, -1.2611038982868195e-05, -1.115351915359497e-05, -9.695999324321747e-06, -8.238479495048523e-06, -6.780959665775299e-06, -5.323439836502075e-06, -3.865920007228851e-06, -2.4084001779556274e-06, -9.508803486824036e-07, 5.066394805908203e-07, 1.964159309864044e-06, 3.421679139137268e-06, 4.879198968410492e-06, 6.336718797683716e-06, 7.79423862695694e-06, 9.251758456230164e-06, 1.0709278285503387e-05, 1.2166798114776611e-05, 1.3624317944049835e-05, 1.5081837773323059e-05, 1.6539357602596283e-05, 1.7996877431869507e-05, 1.945439726114273e-05, 2.0911917090415955e-05, 2.236943691968918e-05, 2.3826956748962402e-05, 2.5284476578235626e-05, 2.674199640750885e-05, 2.8199516236782074e-05, 2.9657036066055298e-05, 3.111455589532852e-05, 3.2572075724601746e-05, 3.402959555387497e-05, 3.548711538314819e-05, 3.694463521242142e-05, 3.840215504169464e-05, 3.9859674870967865e-05, 4.131719470024109e-05, 4.277471452951431e-05, 4.423223435878754e-05, 4.568975418806076e-05, 4.7147274017333984e-05]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 6.0, 8.0, 12.0, 8.0, 13.0, 28.0, 48.0, 86.0, 121.0, 326.0, 655.0, 1590.0, 4196.0, 13076.0, 116270.0, 4012237.0, 32958.0, 7867.0, 2711.0, 1076.0, 488.0, 213.0, 111.0, 55.0, 23.0, 24.0, 19.0, 14.0, 10.0, 6.0, 3.0, 3.0, 2.0, 6.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00030732154846191406, -0.00029780343174934387, -0.0002882853150367737, -0.0002787671983242035, -0.0002692490816116333, -0.0002597309648990631, -0.0002502128481864929, -0.00024069473147392273, -0.00023117661476135254, -0.00022165849804878235, -0.00021214038133621216, -0.00020262226462364197, -0.00019310414791107178, -0.0001835860311985016, -0.0001740679144859314, -0.0001645497977733612, -0.00015503168106079102, -0.00014551356434822083, -0.00013599544763565063, -0.00012647733092308044, -0.00011695921421051025, -0.00010744109749794006, -9.792298078536987e-05, -8.840486407279968e-05, -7.888674736022949e-05, -6.93686306476593e-05, -5.985051393508911e-05, -5.033239722251892e-05, -4.081428050994873e-05, -3.129616379737854e-05, -2.177804708480835e-05, -1.225993037223816e-05, -2.7418136596679688e-06, 6.776303052902222e-06, 1.6294419765472412e-05, 2.5812536478042603e-05, 3.533065319061279e-05, 4.4848769903182983e-05, 5.4366886615753174e-05, 6.388500332832336e-05, 7.340312004089355e-05, 8.292123675346375e-05, 9.243935346603394e-05, 0.00010195747017860413, 0.00011147558689117432, 0.00012099370360374451, 0.0001305118203163147, 0.0001400299370288849, 0.00014954805374145508, 0.00015906617045402527, 0.00016858428716659546, 0.00017810240387916565, 0.00018762052059173584, 0.00019713863730430603, 0.00020665675401687622, 0.0002161748707294464, 0.0002256929874420166, 0.0002352111041545868, 0.000244729220867157, 0.00025424733757972717, 0.00026376545429229736, 0.00027328357100486755, 0.00028280168771743774, 0.00029231980443000793, 0.0003018379211425781]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 8.0, 2.0, 5.0, 3.0, 8.0, 19.0, 19.0, 18.0, 66.0, 175.0, 483.0, 2423.0, 470.0, 178.0, 68.0, 33.0, 22.0, 11.0, 5.0, 5.0, 5.0, 6.0, 4.0, 1.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2007694244384766e-05, -3.0957162380218506e-05, -2.9906630516052246e-05, -2.8856098651885986e-05, -2.7805566787719727e-05, -2.6755034923553467e-05, -2.5704503059387207e-05, -2.4653971195220947e-05, -2.3603439331054688e-05, -2.2552907466888428e-05, -2.1502375602722168e-05, -2.0451843738555908e-05, -1.940131187438965e-05, -1.835078001022339e-05, -1.730024814605713e-05, -1.624971628189087e-05, -1.519918441772461e-05, -1.414865255355835e-05, -1.309812068939209e-05, -1.204758882522583e-05, -1.099705696105957e-05, -9.94652509689331e-06, -8.89599323272705e-06, -7.845461368560791e-06, -6.794929504394531e-06, -5.7443976402282715e-06, -4.693865776062012e-06, -3.643333911895752e-06, -2.592802047729492e-06, -1.5422701835632324e-06, -4.917383193969727e-07, 5.587935447692871e-07, 1.6093254089355469e-06, 2.6598572731018066e-06, 3.7103891372680664e-06, 4.760921001434326e-06, 5.811452865600586e-06, 6.861984729766846e-06, 7.912516593933105e-06, 8.963048458099365e-06, 1.0013580322265625e-05, 1.1064112186431885e-05, 1.2114644050598145e-05, 1.3165175914764404e-05, 1.4215707778930664e-05, 1.5266239643096924e-05, 1.6316771507263184e-05, 1.7367303371429443e-05, 1.8417835235595703e-05, 1.9468367099761963e-05, 2.0518898963928223e-05, 2.1569430828094482e-05, 2.2619962692260742e-05, 2.3670494556427002e-05, 2.4721026420593262e-05, 2.577155828475952e-05, 2.682209014892578e-05, 2.787262201309204e-05, 2.89231538772583e-05, 2.997368574142456e-05, 3.102421760559082e-05, 3.207474946975708e-05, 3.312528133392334e-05, 3.41758131980896e-05, 3.522634506225586e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 6.0, 6.0, 3.0, 12.0, 17.0, 14.0, 23.0, 34.0, 46.0, 56.0, 71.0, 100.0, 147.0, 136.0, 89.0, 65.0, 47.0, 28.0, 18.0, 17.0, 12.0, 15.0, 8.0, 4.0, 3.0, 1.0, 4.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.912751996424049e-05, -6.693925388390198e-05, -6.475098052760586e-05, -6.256271444726735e-05, -6.0374448366928846e-05, -5.818617864861153e-05, -5.5997908930294216e-05, -5.380964284995571e-05, -5.162137313163839e-05, -4.943310341332108e-05, -4.724483733298257e-05, -4.5056567614665255e-05, -4.286829789634794e-05, -4.068003181600943e-05, -3.849176209769212e-05, -3.63034923793748e-05, -3.4115226299036294e-05, -3.192695658071898e-05, -2.973869050038047e-05, -2.7550420782063156e-05, -2.5362152882735245e-05, -2.3173884983407333e-05, -2.098561526509002e-05, -1.8797347365762107e-05, -1.6609079466434196e-05, -1.4420811567106284e-05, -1.2232542758283671e-05, -1.0044273949461058e-05, -7.856006050133146e-06, -5.667738150805235e-06, -3.4794693419826217e-06, -1.2912005331600085e-06, 8.970673661679029e-07, 3.0853357202431653e-06, 5.273604074318428e-06, 7.46187242839369e-06, 9.650140782468952e-06, 1.1838408681796864e-05, 1.4026677490619477e-05, 1.621494629944209e-05, 1.840321419877e-05, 2.0591482098097913e-05, 2.2779749997425824e-05, 2.496801971574314e-05, 2.715628761507105e-05, 2.9344555514398962e-05, 3.153282523271628e-05, 3.372109495103359e-05, 3.59093610313721e-05, 3.8097630749689415e-05, 4.028589683002792e-05, 4.247416654834524e-05, 4.4662432628683746e-05, 4.685070234700106e-05, 4.9038972065318376e-05, 5.1227238145656884e-05, 5.34155078639742e-05, 5.5603777582291514e-05, 5.779204366263002e-05, 5.9980313380947337e-05, 6.216858309926465e-05, 6.435684917960316e-05, 6.654511525994167e-05, 6.873338861623779e-05, 7.09216546965763e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 12.0, 7.0, 12.0, 16.0, 12.0, 16.0, 20.0, 19.0, 29.0, 36.0, 33.0, 38.0, 47.0, 40.0, 40.0, 38.0, 49.0, 50.0, 41.0, 45.0, 50.0, 54.0, 50.0, 26.0, 26.0, 28.0, 18.0, 27.0, 20.0, 18.0, 11.0, 14.0, 9.0, 9.0, 7.0, 11.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.849924152949825e-05, -4.704817183665e-05, -4.559710214380175e-05, -4.4146036088932306e-05, -4.2694966396084055e-05, -4.1243896703235805e-05, -3.9792827010387555e-05, -3.8341757317539304e-05, -3.6890687624691054e-05, -3.5439617931842804e-05, -3.3988548238994554e-05, -3.2537478546146303e-05, -3.108641249127686e-05, -2.963534279842861e-05, -2.818427310558036e-05, -2.673320341273211e-05, -2.5282135538873263e-05, -2.3831065846025012e-05, -2.2379997972166166e-05, -2.0928928279317915e-05, -1.9477858586469665e-05, -1.8026788893621415e-05, -1.6575721019762568e-05, -1.5124651326914318e-05, -1.367358254356077e-05, -1.2222513760207221e-05, -1.077144406735897e-05, -9.320375284005422e-06, -7.869306500651874e-06, -6.418236807803623e-06, -4.967168024450075e-06, -3.5160983316018246e-06, -2.065029548248276e-06, -6.139604238342145e-07, 8.371087005798472e-07, 2.288177711307071e-06, 3.7392469494079705e-06, 5.19031618750887e-06, 6.641384970862418e-06, 8.092454663710669e-06, 9.543523447064217e-06, 1.0994592230417766e-05, 1.2445661923266016e-05, 1.3896730706619564e-05, 1.5347799489973113e-05, 1.6798869182821363e-05, 1.8249938875669613e-05, 1.9701008568517864e-05, 2.115207644237671e-05, 2.260314613522496e-05, 2.4054214009083807e-05, 2.5505283701932058e-05, 2.6956353394780308e-05, 2.8407423087628558e-05, 2.9858490961487405e-05, 3.130955883534625e-05, 3.27606285281945e-05, 3.421169822104275e-05, 3.5662767913891e-05, 3.711383760673925e-05, 3.8564903661608696e-05, 4.0015973354456946e-05, 4.1467043047305197e-05, 4.291811274015345e-05, 4.43691824330017e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 8.0, 9.0, 13.0, 28.0, 40.0, 55.0, 91.0, 132.0, 173.0, 289.0, 431.0, 643.0, 1057.0, 1625.0, 2592.0, 4302.0, 6703.0, 11510.0, 18748.0, 32698.0, 62888.0, 119751.0, 285899.0, 261204.0, 107173.0, 56583.0, 29425.0, 17284.0, 10489.0, 6093.0, 3801.0, 2526.0, 1488.0, 985.0, 631.0, 366.0, 276.0, 175.0, 122.0, 84.0, 61.0, 38.0, 24.0, 12.0, 9.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-4.6372413635253906e-05, -4.491955041885376e-05, -4.346668720245361e-05, -4.201382398605347e-05, -4.056096076965332e-05, -3.9108097553253174e-05, -3.765523433685303e-05, -3.620237112045288e-05, -3.4749507904052734e-05, -3.329664468765259e-05, -3.184378147125244e-05, -3.0390918254852295e-05, -2.893805503845215e-05, -2.7485191822052002e-05, -2.6032328605651855e-05, -2.457946538925171e-05, -2.3126602172851562e-05, -2.1673738956451416e-05, -2.022087574005127e-05, -1.8768012523651123e-05, -1.7315149307250977e-05, -1.586228609085083e-05, -1.4409422874450684e-05, -1.2956559658050537e-05, -1.150369644165039e-05, -1.0050833225250244e-05, -8.597970008850098e-06, -7.145106792449951e-06, -5.692243576049805e-06, -4.239380359649658e-06, -2.7865171432495117e-06, -1.3336539268493652e-06, 1.1920928955078125e-07, 1.5720725059509277e-06, 3.0249357223510742e-06, 4.477798938751221e-06, 5.930662155151367e-06, 7.383525371551514e-06, 8.83638858795166e-06, 1.0289251804351807e-05, 1.1742115020751953e-05, 1.31949782371521e-05, 1.4647841453552246e-05, 1.6100704669952393e-05, 1.755356788635254e-05, 1.9006431102752686e-05, 2.0459294319152832e-05, 2.191215753555298e-05, 2.3365020751953125e-05, 2.481788396835327e-05, 2.6270747184753418e-05, 2.7723610401153564e-05, 2.917647361755371e-05, 3.062933683395386e-05, 3.2082200050354004e-05, 3.353506326675415e-05, 3.49879264831543e-05, 3.644078969955444e-05, 3.789365291595459e-05, 3.9346516132354736e-05, 4.079937934875488e-05, 4.225224256515503e-05, 4.3705105781555176e-05, 4.515796899795532e-05, 4.661083221435547e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 8.0, 6.0, 16.0, 18.0, 10.0, 10.0, 22.0, 21.0, 29.0, 15.0, 32.0, 42.0, 38.0, 50.0, 41.0, 40.0, 43.0, 61.0, 42.0, 44.0, 42.0, 50.0, 49.0, 35.0, 33.0, 26.0, 35.0, 14.0, 21.0, 16.0, 15.0, 10.0, 12.0, 10.0, 5.0, 7.0, 10.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.696846008300781e-05, -4.549045115709305e-05, -4.4012442231178284e-05, -4.253443330526352e-05, -4.1056424379348755e-05, -3.957841545343399e-05, -3.8100406527519226e-05, -3.662239760160446e-05, -3.51443886756897e-05, -3.366637974977493e-05, -3.218837082386017e-05, -3.0710361897945404e-05, -2.923235297203064e-05, -2.7754344046115875e-05, -2.627633512020111e-05, -2.4798326194286346e-05, -2.3320317268371582e-05, -2.1842308342456818e-05, -2.0364299416542053e-05, -1.888629049062729e-05, -1.7408281564712524e-05, -1.593027263879776e-05, -1.4452263712882996e-05, -1.2974254786968231e-05, -1.1496245861053467e-05, -1.0018236935138702e-05, -8.540228009223938e-06, -7.062219083309174e-06, -5.584210157394409e-06, -4.106201231479645e-06, -2.6281923055648804e-06, -1.150183379650116e-06, 3.2782554626464844e-07, 1.8058344721794128e-06, 3.2838433980941772e-06, 4.761852324008942e-06, 6.239861249923706e-06, 7.71787017583847e-06, 9.195879101753235e-06, 1.0673888027668e-05, 1.2151896953582764e-05, 1.3629905879497528e-05, 1.5107914805412292e-05, 1.6585923731327057e-05, 1.806393265724182e-05, 1.9541941583156586e-05, 2.101995050907135e-05, 2.2497959434986115e-05, 2.397596836090088e-05, 2.5453977286815643e-05, 2.6931986212730408e-05, 2.8409995138645172e-05, 2.9888004064559937e-05, 3.13660129904747e-05, 3.2844021916389465e-05, 3.432203084230423e-05, 3.5800039768218994e-05, 3.727804869413376e-05, 3.875605762004852e-05, 4.023406654596329e-05, 4.171207547187805e-05, 4.3190084397792816e-05, 4.466809332370758e-05, 4.6146102249622345e-05, 4.762411117553711e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 7.0, 12.0, 18.0, 16.0, 22.0, 42.0, 58.0, 95.0, 137.0, 173.0, 233.0, 328.0, 511.0, 714.0, 970.0, 1437.0, 2188.0, 3207.0, 4738.0, 7456.0, 11458.0, 18667.0, 32897.0, 64733.0, 169046.0, 443434.0, 146491.0, 59270.0, 30640.0, 17764.0, 10820.0, 6806.0, 4613.0, 3115.0, 1941.0, 1418.0, 906.0, 634.0, 403.0, 345.0, 240.0, 166.0, 115.0, 69.0, 63.0, 34.0, 38.0, 20.0, 10.0, 15.0, 6.0, 6.0, 1.0, 3.0, 2.0, 3.0], "bins": [-4.780292510986328e-05, -4.6372413635253906e-05, -4.494190216064453e-05, -4.3511390686035156e-05, -4.208087921142578e-05, -4.0650367736816406e-05, -3.921985626220703e-05, -3.7789344787597656e-05, -3.635883331298828e-05, -3.4928321838378906e-05, -3.349781036376953e-05, -3.2067298889160156e-05, -3.063678741455078e-05, -2.9206275939941406e-05, -2.777576446533203e-05, -2.6345252990722656e-05, -2.491474151611328e-05, -2.3484230041503906e-05, -2.205371856689453e-05, -2.0623207092285156e-05, -1.919269561767578e-05, -1.7762184143066406e-05, -1.633167266845703e-05, -1.4901161193847656e-05, -1.3470649719238281e-05, -1.2040138244628906e-05, -1.0609626770019531e-05, -9.179115295410156e-06, -7.748603820800781e-06, -6.318092346191406e-06, -4.887580871582031e-06, -3.4570693969726562e-06, -2.0265579223632812e-06, -5.960464477539062e-07, 8.344650268554688e-07, 2.2649765014648438e-06, 3.6954879760742188e-06, 5.125999450683594e-06, 6.556510925292969e-06, 7.987022399902344e-06, 9.417533874511719e-06, 1.0848045349121094e-05, 1.2278556823730469e-05, 1.3709068298339844e-05, 1.5139579772949219e-05, 1.6570091247558594e-05, 1.800060272216797e-05, 1.9431114196777344e-05, 2.086162567138672e-05, 2.2292137145996094e-05, 2.372264862060547e-05, 2.5153160095214844e-05, 2.658367156982422e-05, 2.8014183044433594e-05, 2.944469451904297e-05, 3.0875205993652344e-05, 3.230571746826172e-05, 3.3736228942871094e-05, 3.516674041748047e-05, 3.6597251892089844e-05, 3.802776336669922e-05, 3.9458274841308594e-05, 4.088878631591797e-05, 4.2319297790527344e-05, 4.374980926513672e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 6.0, 6.0, 10.0, 6.0, 8.0, 15.0, 20.0, 14.0, 26.0, 24.0, 25.0, 16.0, 26.0, 35.0, 35.0, 46.0, 36.0, 40.0, 37.0, 42.0, 39.0, 47.0, 38.0, 28.0, 38.0, 39.0, 32.0, 33.0, 27.0, 27.0, 21.0, 30.0, 24.0, 17.0, 9.0, 14.0, 12.0, 14.0, 11.0, 4.0, 1.0, 6.0, 1.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.6047229766845703e-05, -2.5214627385139465e-05, -2.4382025003433228e-05, -2.354942262172699e-05, -2.2716820240020752e-05, -2.1884217858314514e-05, -2.1051615476608276e-05, -2.021901309490204e-05, -1.93864107131958e-05, -1.8553808331489563e-05, -1.7721205949783325e-05, -1.6888603568077087e-05, -1.605600118637085e-05, -1.5223398804664612e-05, -1.4390796422958374e-05, -1.3558194041252136e-05, -1.2725591659545898e-05, -1.189298927783966e-05, -1.1060386896133423e-05, -1.0227784514427185e-05, -9.395182132720947e-06, -8.56257975101471e-06, -7.729977369308472e-06, -6.897374987602234e-06, -6.064772605895996e-06, -5.232170224189758e-06, -4.3995678424835205e-06, -3.5669654607772827e-06, -2.734363079071045e-06, -1.9017606973648071e-06, -1.0691583156585693e-06, -2.3655593395233154e-07, 5.960464477539062e-07, 1.428648829460144e-06, 2.261251211166382e-06, 3.0938535928726196e-06, 3.926455974578857e-06, 4.759058356285095e-06, 5.591660737991333e-06, 6.424263119697571e-06, 7.256865501403809e-06, 8.089467883110046e-06, 8.922070264816284e-06, 9.754672646522522e-06, 1.058727502822876e-05, 1.1419877409934998e-05, 1.2252479791641235e-05, 1.3085082173347473e-05, 1.3917684555053711e-05, 1.4750286936759949e-05, 1.5582889318466187e-05, 1.6415491700172424e-05, 1.7248094081878662e-05, 1.80806964635849e-05, 1.8913298845291138e-05, 1.9745901226997375e-05, 2.0578503608703613e-05, 2.141110599040985e-05, 2.224370837211609e-05, 2.3076310753822327e-05, 2.3908913135528564e-05, 2.4741515517234802e-05, 2.557411789894104e-05, 2.6406720280647278e-05, 2.7239322662353516e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 11.0, 23.0, 19.0, 33.0, 43.0, 46.0, 79.0, 132.0, 205.0, 301.0, 376.0, 683.0, 1037.0, 1579.0, 2713.0, 5406.0, 9310.0, 21358.0, 79784.0, 819199.0, 65801.0, 19419.0, 9620.0, 4450.0, 2481.0, 1565.0, 1070.0, 545.0, 383.0, 268.0, 212.0, 121.0, 88.0, 47.0, 57.0, 24.0, 16.0, 22.0, 6.0, 10.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6808509826660156e-05, -1.6256235539913177e-05, -1.57039612531662e-05, -1.515168696641922e-05, -1.4599412679672241e-05, -1.4047138392925262e-05, -1.3494864106178284e-05, -1.2942589819431305e-05, -1.2390315532684326e-05, -1.1838041245937347e-05, -1.1285766959190369e-05, -1.073349267244339e-05, -1.0181218385696411e-05, -9.628944098949432e-06, -9.076669812202454e-06, -8.524395525455475e-06, -7.972121238708496e-06, -7.419846951961517e-06, -6.8675726652145386e-06, -6.31529837846756e-06, -5.763024091720581e-06, -5.210749804973602e-06, -4.6584755182266235e-06, -4.106201231479645e-06, -3.553926944732666e-06, -3.0016526579856873e-06, -2.4493783712387085e-06, -1.8971040844917297e-06, -1.344829797744751e-06, -7.925555109977722e-07, -2.4028122425079346e-07, 3.119930624961853e-07, 8.642673492431641e-07, 1.4165416359901428e-06, 1.9688159227371216e-06, 2.5210902094841003e-06, 3.073364496231079e-06, 3.625638782978058e-06, 4.177913069725037e-06, 4.730187356472015e-06, 5.282461643218994e-06, 5.834735929965973e-06, 6.387010216712952e-06, 6.93928450345993e-06, 7.491558790206909e-06, 8.043833076953888e-06, 8.596107363700867e-06, 9.148381650447845e-06, 9.700655937194824e-06, 1.0252930223941803e-05, 1.0805204510688782e-05, 1.135747879743576e-05, 1.190975308418274e-05, 1.2462027370929718e-05, 1.3014301657676697e-05, 1.3566575944423676e-05, 1.4118850231170654e-05, 1.4671124517917633e-05, 1.5223398804664612e-05, 1.577567309141159e-05, 1.632794737815857e-05, 1.6880221664905548e-05, 1.7432495951652527e-05, 1.7984770238399506e-05, 1.8537044525146484e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 0.0, 6.0, 2.0, 13.0, 0.0, 11.0, 11.0, 4.0, 0.0, 12.0, 9.0, 16.0, 0.0, 50.0, 43.0, 59.0, 0.0, 18.0, 97.0, 309.0, 0.0, 96.0, 23.0, 41.0, 0.0, 53.0, 37.0, 21.0, 0.0, 10.0, 12.0, 7.0, 0.0, 13.0, 2.0, 16.0, 0.0, 5.0, 9.0, 8.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7285346984863281e-06, -1.6838312149047852e-06, -1.6391277313232422e-06, -1.5944242477416992e-06, -1.5497207641601562e-06, -1.5050172805786133e-06, -1.4603137969970703e-06, -1.4156103134155273e-06, -1.3709068298339844e-06, -1.3262033462524414e-06, -1.2814998626708984e-06, -1.2367963790893555e-06, -1.1920928955078125e-06, -1.1473894119262695e-06, -1.1026859283447266e-06, -1.0579824447631836e-06, -1.0132789611816406e-06, -9.685754776000977e-07, -9.238719940185547e-07, -8.791685104370117e-07, -8.344650268554688e-07, -7.897615432739258e-07, -7.450580596923828e-07, -7.003545761108398e-07, -6.556510925292969e-07, -6.109476089477539e-07, -5.662441253662109e-07, -5.21540641784668e-07, -4.76837158203125e-07, -4.3213367462158203e-07, -3.8743019104003906e-07, -3.427267074584961e-07, -2.980232238769531e-07, -2.5331974029541016e-07, -2.086162567138672e-07, -1.6391277313232422e-07, -1.1920928955078125e-07, -7.450580596923828e-08, -2.9802322387695312e-08, 1.4901161193847656e-08, 5.960464477539063e-08, 1.043081283569336e-07, 1.4901161193847656e-07, 1.9371509552001953e-07, 2.384185791015625e-07, 2.8312206268310547e-07, 3.2782554626464844e-07, 3.725290298461914e-07, 4.172325134277344e-07, 4.6193599700927734e-07, 5.066394805908203e-07, 5.513429641723633e-07, 5.960464477539062e-07, 6.407499313354492e-07, 6.854534149169922e-07, 7.301568984985352e-07, 7.748603820800781e-07, 8.195638656616211e-07, 8.642673492431641e-07, 9.08970832824707e-07, 9.5367431640625e-07, 9.98377799987793e-07, 1.043081283569336e-06, 1.087784767150879e-06, 1.1324882507324219e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 8.0, 4.0, 11.0, 16.0, 28.0, 42.0, 42.0, 79.0, 137.0, 257.0, 549.0, 1298.0, 3542.0, 12138.0, 56126.0, 782974.0, 157823.0, 23561.0, 6138.0, 2105.0, 785.0, 372.0, 189.0, 113.0, 62.0, 34.0, 26.0, 19.0, 16.0, 14.0, 8.0, 9.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9146671295166016e-05, -2.813246101140976e-05, -2.7118250727653503e-05, -2.6104040443897247e-05, -2.508983016014099e-05, -2.4075619876384735e-05, -2.306140959262848e-05, -2.2047199308872223e-05, -2.1032989025115967e-05, -2.001877874135971e-05, -1.9004568457603455e-05, -1.79903581738472e-05, -1.6976147890090942e-05, -1.5961937606334686e-05, -1.494772732257843e-05, -1.3933517038822174e-05, -1.2919306755065918e-05, -1.1905096471309662e-05, -1.0890886187553406e-05, -9.87667590379715e-06, -8.862465620040894e-06, -7.848255336284637e-06, -6.834045052528381e-06, -5.819834768772125e-06, -4.805624485015869e-06, -3.791414201259613e-06, -2.777203917503357e-06, -1.7629936337471008e-06, -7.487833499908447e-07, 2.654269337654114e-07, 1.2796372175216675e-06, 2.2938475012779236e-06, 3.3080577850341797e-06, 4.322268068790436e-06, 5.336478352546692e-06, 6.350688636302948e-06, 7.364898920059204e-06, 8.37910920381546e-06, 9.393319487571716e-06, 1.0407529771327972e-05, 1.1421740055084229e-05, 1.2435950338840485e-05, 1.345016062259674e-05, 1.4464370906352997e-05, 1.5478581190109253e-05, 1.649279147386551e-05, 1.7507001757621765e-05, 1.852121204137802e-05, 1.9535422325134277e-05, 2.0549632608890533e-05, 2.156384289264679e-05, 2.2578053176403046e-05, 2.3592263460159302e-05, 2.4606473743915558e-05, 2.5620684027671814e-05, 2.663489431142807e-05, 2.7649104595184326e-05, 2.8663314878940582e-05, 2.967752516269684e-05, 3.0691735446453094e-05, 3.170594573020935e-05, 3.272015601396561e-05, 3.373436629772186e-05, 3.474857658147812e-05, 3.5762786865234375e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 1.0, 8.0, 12.0, 9.0, 10.0, 16.0, 10.0, 24.0, 21.0, 13.0, 44.0, 44.0, 51.0, 79.0, 116.0, 160.0, 97.0, 58.0, 22.0, 37.0, 34.0, 21.0, 15.0, 16.0, 16.0, 16.0, 12.0, 4.0, 9.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7550926208496094e-06, -3.6424025893211365e-06, -3.5297125577926636e-06, -3.4170225262641907e-06, -3.3043324947357178e-06, -3.191642463207245e-06, -3.078952431678772e-06, -2.966262400150299e-06, -2.853572368621826e-06, -2.7408823370933533e-06, -2.6281923055648804e-06, -2.5155022740364075e-06, -2.4028122425079346e-06, -2.2901222109794617e-06, -2.1774321794509888e-06, -2.064742147922516e-06, -1.952052116394043e-06, -1.83936208486557e-06, -1.7266720533370972e-06, -1.6139820218086243e-06, -1.5012919902801514e-06, -1.3886019587516785e-06, -1.2759119272232056e-06, -1.1632218956947327e-06, -1.0505318641662598e-06, -9.378418326377869e-07, -8.25151801109314e-07, -7.124617695808411e-07, -5.997717380523682e-07, -4.870817065238953e-07, -3.7439167499542236e-07, -2.6170164346694946e-07, -1.4901161193847656e-07, -3.632158041000366e-08, 7.636845111846924e-08, 1.8905848264694214e-07, 3.0174851417541504e-07, 4.1443854570388794e-07, 5.271285772323608e-07, 6.398186087608337e-07, 7.525086402893066e-07, 8.651986718177795e-07, 9.778887033462524e-07, 1.0905787348747253e-06, 1.2032687664031982e-06, 1.3159587979316711e-06, 1.428648829460144e-06, 1.541338860988617e-06, 1.6540288925170898e-06, 1.7667189240455627e-06, 1.8794089555740356e-06, 1.9920989871025085e-06, 2.1047890186309814e-06, 2.2174790501594543e-06, 2.3301690816879272e-06, 2.4428591132164e-06, 2.555549144744873e-06, 2.668239176273346e-06, 2.780929207801819e-06, 2.8936192393302917e-06, 3.0063092708587646e-06, 3.1189993023872375e-06, 3.2316893339157104e-06, 3.3443793654441833e-06, 3.4570693969726562e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 6.0, 13.0, 11.0, 22.0, 22.0, 32.0, 48.0, 53.0, 58.0, 112.0, 155.0, 123.0, 91.0, 58.0, 46.0, 32.0, 17.0, 18.0, 17.0, 11.0, 6.0, 5.0, 6.0, 4.0, 2.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.10133244865574e-05, -6.889286305522546e-05, -6.677240162389353e-05, -6.46519401925616e-05, -6.253147876122966e-05, -6.041101732989773e-05, -5.82905558985658e-05, -5.6170094467233866e-05, -5.4049633035901934e-05, -5.192917160457e-05, -4.980871017323807e-05, -4.7688248741906136e-05, -4.5567787310574204e-05, -4.344732587924227e-05, -4.132686444791034e-05, -3.9206403016578406e-05, -3.7085941585246474e-05, -3.496548015391454e-05, -3.284501872258261e-05, -3.0724557291250676e-05, -2.8604095859918743e-05, -2.648363442858681e-05, -2.4363172997254878e-05, -2.2242711565922946e-05, -2.0122250134591013e-05, -1.800178870325908e-05, -1.5881327271927148e-05, -1.3760865840595216e-05, -1.1640404409263283e-05, -9.51994297793135e-06, -7.399481546599418e-06, -5.279020115267485e-06, -3.158565959893167e-06, -1.0381045285612345e-06, 1.082356902770698e-06, 3.2028183341026306e-06, 5.323279765434563e-06, 7.443741196766496e-06, 9.564202628098428e-06, 1.168466405943036e-05, 1.3805125490762293e-05, 1.5925586922094226e-05, 1.804604835342616e-05, 2.016650978475809e-05, 2.2286971216090024e-05, 2.4407432647421956e-05, 2.652789407875389e-05, 2.864835551008582e-05, 3.0768816941417754e-05, 3.2889278372749686e-05, 3.500973980408162e-05, 3.713020123541355e-05, 3.9250662666745484e-05, 4.1371124098077416e-05, 4.349158552940935e-05, 4.561204696074128e-05, 4.7732508392073214e-05, 4.9852969823405147e-05, 5.197343125473708e-05, 5.409389268606901e-05, 5.6214354117400944e-05, 5.833481554873288e-05, 6.045527698006481e-05, 6.257573841139674e-05, 6.469619984272867e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 10.0, 10.0, 13.0, 13.0, 12.0, 16.0, 20.0, 17.0, 30.0, 30.0, 41.0, 36.0, 45.0, 41.0, 41.0, 35.0, 53.0, 44.0, 43.0, 41.0, 56.0, 56.0, 48.0, 26.0, 31.0, 19.0, 26.0, 21.0, 23.0, 12.0, 15.0, 12.0, 9.0, 8.0, 14.0, 8.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.606642323778942e-05, -4.4688000343739986e-05, -4.330957744969055e-05, -4.1931154555641115e-05, -4.055273166159168e-05, -3.917430876754224e-05, -3.779588587349281e-05, -3.641746297944337e-05, -3.5039040085393935e-05, -3.36606171913445e-05, -3.2282194297295064e-05, -3.090377140324563e-05, -2.9525348509196192e-05, -2.8146925615146756e-05, -2.6768504540086724e-05, -2.5390081646037288e-05, -2.4011660570977256e-05, -2.263323767692782e-05, -2.1254814782878384e-05, -1.9876391888828948e-05, -1.8497968994779512e-05, -1.7119546100730076e-05, -1.5741125025670044e-05, -1.4362702131620608e-05, -1.2984279237571172e-05, -1.1605856343521737e-05, -1.02274334494723e-05, -8.849011464917567e-06, -7.470588570868131e-06, -6.092165676818695e-06, -4.713743692263961e-06, -3.335320798214525e-06, -1.9569015421438962e-06, -5.784788754681358e-07, 7.999437912076246e-07, 2.1783662305097096e-06, 3.5567891245591454e-06, 4.935212018608581e-06, 6.313634003163315e-06, 7.692056897212751e-06, 9.070479791262187e-06, 1.0448902685311623e-05, 1.1827325579361059e-05, 1.3205747563915793e-05, 1.4584170457965229e-05, 1.5962592442519963e-05, 1.73410153365694e-05, 1.8719438230618834e-05, 2.009786112466827e-05, 2.1476284018717706e-05, 2.2854706912767142e-05, 2.4233129806816578e-05, 2.5611552700866014e-05, 2.698997559491545e-05, 2.8368396669975482e-05, 2.9746819564024918e-05, 3.112524427706376e-05, 3.250366717111319e-05, 3.388209006516263e-05, 3.5260512959212065e-05, 3.66389358532615e-05, 3.8017358747310936e-05, 3.939578164136037e-05, 4.077420453540981e-05, 4.215262379148044e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 10.0, 7.0, 18.0, 29.0, 28.0, 57.0, 83.0, 86.0, 151.0, 215.0, 311.0, 433.0, 606.0, 881.0, 1225.0, 1928.0, 2650.0, 3962.0, 5821.0, 9271.0, 14460.0, 24183.0, 40913.0, 77600.0, 154433.0, 312638.0, 185990.0, 88816.0, 47929.0, 26955.0, 16316.0, 10117.0, 6721.0, 4279.0, 2846.0, 2026.0, 1415.0, 918.0, 686.0, 457.0, 315.0, 239.0, 151.0, 122.0, 76.0, 62.0, 44.0, 26.0, 18.0, 13.0, 8.0, 10.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.08970832824707e-05, -8.802209049463272e-05, -8.514709770679474e-05, -8.227210491895676e-05, -7.939711213111877e-05, -7.652211934328079e-05, -7.364712655544281e-05, -7.077213376760483e-05, -6.789714097976685e-05, -6.502214819192886e-05, -6.214715540409088e-05, -5.92721626162529e-05, -5.639716982841492e-05, -5.3522177040576935e-05, -5.064718425273895e-05, -4.777219146490097e-05, -4.489719867706299e-05, -4.2022205889225006e-05, -3.9147213101387024e-05, -3.627222031354904e-05, -3.339722752571106e-05, -3.052223473787308e-05, -2.7647241950035095e-05, -2.4772249162197113e-05, -2.189725637435913e-05, -1.902226358652115e-05, -1.6147270798683167e-05, -1.3272278010845184e-05, -1.0397285223007202e-05, -7.52229243516922e-06, -4.647299647331238e-06, -1.7723068594932556e-06, 1.1026859283447266e-06, 3.977678716182709e-06, 6.852671504020691e-06, 9.727664291858673e-06, 1.2602657079696655e-05, 1.5477649867534637e-05, 1.835264265537262e-05, 2.1227635443210602e-05, 2.4102628231048584e-05, 2.6977621018886566e-05, 2.985261380672455e-05, 3.272760659456253e-05, 3.560259938240051e-05, 3.8477592170238495e-05, 4.135258495807648e-05, 4.422757774591446e-05, 4.710257053375244e-05, 4.9977563321590424e-05, 5.2852556109428406e-05, 5.572754889726639e-05, 5.860254168510437e-05, 6.147753447294235e-05, 6.435252726078033e-05, 6.722752004861832e-05, 7.01025128364563e-05, 7.297750562429428e-05, 7.585249841213226e-05, 7.872749119997025e-05, 8.160248398780823e-05, 8.447747677564621e-05, 8.735246956348419e-05, 9.022746235132217e-05, 9.310245513916016e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 2.0, 7.0, 6.0, 14.0, 13.0, 11.0, 12.0, 15.0, 18.0, 20.0, 32.0, 32.0, 33.0, 46.0, 44.0, 50.0, 36.0, 46.0, 52.0, 44.0, 38.0, 49.0, 55.0, 44.0, 41.0, 35.0, 27.0, 27.0, 20.0, 18.0, 22.0, 14.0, 9.0, 13.0, 10.0, 9.0, 5.0, 7.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.3020973205566406e-05, -3.198999911546707e-05, -3.095902502536774e-05, -2.9928050935268402e-05, -2.8897076845169067e-05, -2.7866102755069733e-05, -2.6835128664970398e-05, -2.5804154574871063e-05, -2.477318048477173e-05, -2.3742206394672394e-05, -2.271123230457306e-05, -2.1680258214473724e-05, -2.064928412437439e-05, -1.9618310034275055e-05, -1.858733594417572e-05, -1.7556361854076385e-05, -1.652538776397705e-05, -1.5494413673877716e-05, -1.4463439583778381e-05, -1.3432465493679047e-05, -1.2401491403579712e-05, -1.1370517313480377e-05, -1.0339543223381042e-05, -9.308569133281708e-06, -8.277595043182373e-06, -7.246620953083038e-06, -6.215646862983704e-06, -5.184672772884369e-06, -4.153698682785034e-06, -3.1227245926856995e-06, -2.0917505025863647e-06, -1.06077641248703e-06, -2.9802322387695312e-08, 1.0011717677116394e-06, 2.032145857810974e-06, 3.063119947910309e-06, 4.0940940380096436e-06, 5.125068128108978e-06, 6.156042218208313e-06, 7.187016308307648e-06, 8.217990398406982e-06, 9.248964488506317e-06, 1.0279938578605652e-05, 1.1310912668704987e-05, 1.2341886758804321e-05, 1.3372860848903656e-05, 1.440383493900299e-05, 1.5434809029102325e-05, 1.646578311920166e-05, 1.7496757209300995e-05, 1.852773129940033e-05, 1.9558705389499664e-05, 2.0589679479599e-05, 2.1620653569698334e-05, 2.265162765979767e-05, 2.3682601749897003e-05, 2.4713575839996338e-05, 2.5744549930095673e-05, 2.6775524020195007e-05, 2.7806498110294342e-05, 2.8837472200393677e-05, 2.986844629049301e-05, 3.0899420380592346e-05, 3.193039447069168e-05, 3.2961368560791016e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 11.0, 11.0, 18.0, 24.0, 25.0, 48.0, 75.0, 79.0, 153.0, 200.0, 330.0, 619.0, 1016.0, 1781.0, 3457.0, 6470.0, 13307.0, 27734.0, 63982.0, 168947.0, 438837.0, 191129.0, 69801.0, 30849.0, 14084.0, 7180.0, 3602.0, 1984.0, 1128.0, 625.0, 380.0, 214.0, 126.0, 94.0, 64.0, 43.0, 40.0, 29.0, 17.0, 11.0, 10.0, 6.0, 8.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0001264810562133789, -0.00012259557843208313, -0.00011871010065078735, -0.00011482462286949158, -0.0001109391450881958, -0.00010705366730690002, -0.00010316818952560425, -9.928271174430847e-05, -9.53972339630127e-05, -9.151175618171692e-05, -8.762627840042114e-05, -8.374080061912537e-05, -7.985532283782959e-05, -7.596984505653381e-05, -7.208436727523804e-05, -6.819888949394226e-05, -6.431341171264648e-05, -6.042793393135071e-05, -5.654245615005493e-05, -5.2656978368759155e-05, -4.877150058746338e-05, -4.48860228061676e-05, -4.1000545024871826e-05, -3.711506724357605e-05, -3.3229589462280273e-05, -2.9344111680984497e-05, -2.545863389968872e-05, -2.1573156118392944e-05, -1.7687678337097168e-05, -1.3802200555801392e-05, -9.916722774505615e-06, -6.031244993209839e-06, -2.1457672119140625e-06, 1.7397105693817139e-06, 5.62518835067749e-06, 9.510666131973267e-06, 1.3396143913269043e-05, 1.728162169456482e-05, 2.1167099475860596e-05, 2.5052577257156372e-05, 2.893805503845215e-05, 3.2823532819747925e-05, 3.67090106010437e-05, 4.059448838233948e-05, 4.4479966163635254e-05, 4.836544394493103e-05, 5.225092172622681e-05, 5.613639950752258e-05, 6.002187728881836e-05, 6.390735507011414e-05, 6.779283285140991e-05, 7.167831063270569e-05, 7.556378841400146e-05, 7.944926619529724e-05, 8.333474397659302e-05, 8.72202217578888e-05, 9.110569953918457e-05, 9.499117732048035e-05, 9.887665510177612e-05, 0.0001027621328830719, 0.00010664761066436768, 0.00011053308844566345, 0.00011441856622695923, 0.000118304044008255, 0.00012218952178955078]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 3.0, 6.0, 6.0, 5.0, 9.0, 7.0, 14.0, 13.0, 22.0, 22.0, 29.0, 33.0, 40.0, 32.0, 38.0, 41.0, 39.0, 51.0, 46.0, 51.0, 47.0, 45.0, 54.0, 34.0, 40.0, 46.0, 40.0, 29.0, 23.0, 24.0, 20.0, 22.0, 16.0, 7.0, 8.0, 11.0, 11.0, 3.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.658367156982422e-05, -2.5698915123939514e-05, -2.481415867805481e-05, -2.3929402232170105e-05, -2.30446457862854e-05, -2.2159889340400696e-05, -2.127513289451599e-05, -2.0390376448631287e-05, -1.9505620002746582e-05, -1.8620863556861877e-05, -1.7736107110977173e-05, -1.6851350665092468e-05, -1.5966594219207764e-05, -1.5081837773323059e-05, -1.4197081327438354e-05, -1.331232488155365e-05, -1.2427568435668945e-05, -1.154281198978424e-05, -1.0658055543899536e-05, -9.773299098014832e-06, -8.888542652130127e-06, -8.003786206245422e-06, -7.119029760360718e-06, -6.234273314476013e-06, -5.349516868591309e-06, -4.464760422706604e-06, -3.5800039768218994e-06, -2.695247530937195e-06, -1.8104910850524902e-06, -9.257346391677856e-07, -4.0978193283081055e-08, 8.437782526016235e-07, 1.7285346984863281e-06, 2.6132911443710327e-06, 3.4980475902557373e-06, 4.382804036140442e-06, 5.2675604820251465e-06, 6.152316927909851e-06, 7.037073373794556e-06, 7.92182981967926e-06, 8.806586265563965e-06, 9.69134271144867e-06, 1.0576099157333374e-05, 1.1460855603218079e-05, 1.2345612049102783e-05, 1.3230368494987488e-05, 1.4115124940872192e-05, 1.4999881386756897e-05, 1.58846378326416e-05, 1.6769394278526306e-05, 1.765415072441101e-05, 1.8538907170295715e-05, 1.942366361618042e-05, 2.0308420062065125e-05, 2.119317650794983e-05, 2.2077932953834534e-05, 2.2962689399719238e-05, 2.3847445845603943e-05, 2.4732202291488647e-05, 2.5616958737373352e-05, 2.6501715183258057e-05, 2.738647162914276e-05, 2.8271228075027466e-05, 2.915598452091217e-05, 3.0040740966796875e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 6.0, 9.0, 13.0, 15.0, 28.0, 25.0, 54.0, 69.0, 104.0, 240.0, 276.0, 886.0, 1334.0, 5208.0, 25177.0, 144351.0, 837323.0, 21032.0, 8186.0, 1945.0, 1168.0, 496.0, 181.0, 174.0, 63.0, 65.0, 34.0, 18.0, 18.0, 19.0, 8.0, 5.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.245208740234375e-06, -5.091540515422821e-06, -4.937872290611267e-06, -4.784204065799713e-06, -4.630535840988159e-06, -4.476867616176605e-06, -4.323199391365051e-06, -4.169531166553497e-06, -4.015862941741943e-06, -3.862194716930389e-06, -3.7085264921188354e-06, -3.5548582673072815e-06, -3.4011900424957275e-06, -3.2475218176841736e-06, -3.0938535928726196e-06, -2.9401853680610657e-06, -2.7865171432495117e-06, -2.6328489184379578e-06, -2.479180693626404e-06, -2.32551246881485e-06, -2.171844244003296e-06, -2.018176019191742e-06, -1.864507794380188e-06, -1.710839569568634e-06, -1.55717134475708e-06, -1.4035031199455261e-06, -1.2498348951339722e-06, -1.0961666703224182e-06, -9.424984455108643e-07, -7.888302206993103e-07, -6.351619958877563e-07, -4.814937710762024e-07, -3.2782554626464844e-07, -1.7415732145309448e-07, -2.0489096641540527e-08, 1.3317912817001343e-07, 2.868473529815674e-07, 4.4051557779312134e-07, 5.941838026046753e-07, 7.478520274162292e-07, 9.015202522277832e-07, 1.0551884770393372e-06, 1.2088567018508911e-06, 1.362524926662445e-06, 1.516193151473999e-06, 1.669861376285553e-06, 1.823529601097107e-06, 1.977197825908661e-06, 2.130866050720215e-06, 2.284534275531769e-06, 2.4382025003433228e-06, 2.5918707251548767e-06, 2.7455389499664307e-06, 2.8992071747779846e-06, 3.0528753995895386e-06, 3.2065436244010925e-06, 3.3602118492126465e-06, 3.5138800740242004e-06, 3.6675482988357544e-06, 3.821216523647308e-06, 3.974884748458862e-06, 4.128552973270416e-06, 4.28222119808197e-06, 4.435889422893524e-06, 4.589557647705078e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 0.0, 56.0, 0.0, 0.0, 0.0, 0.0, 854.0, 0.0, 0.0, 0.0, 0.0, 50.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.4552067518234253e-07, -3.334134817123413e-07, -3.213062882423401e-07, -3.0919909477233887e-07, -2.9709190130233765e-07, -2.849847078323364e-07, -2.728775143623352e-07, -2.60770320892334e-07, -2.4866312742233276e-07, -2.3655593395233154e-07, -2.2444874048233032e-07, -2.123415470123291e-07, -2.0023435354232788e-07, -1.8812716007232666e-07, -1.7601996660232544e-07, -1.6391277313232422e-07, -1.51805579662323e-07, -1.3969838619232178e-07, -1.2759119272232056e-07, -1.1548399925231934e-07, -1.0337680578231812e-07, -9.12696123123169e-08, -7.916241884231567e-08, -6.705522537231445e-08, -5.494803190231323e-08, -4.284083843231201e-08, -3.073364496231079e-08, -1.862645149230957e-08, -6.51925802230835e-09, 5.587935447692871e-09, 1.7695128917694092e-08, 2.9802322387695312e-08, 4.190951585769653e-08, 5.4016709327697754e-08, 6.612390279769897e-08, 7.82310962677002e-08, 9.033828973770142e-08, 1.0244548320770264e-07, 1.1455267667770386e-07, 1.2665987014770508e-07, 1.387670636177063e-07, 1.5087425708770752e-07, 1.6298145055770874e-07, 1.7508864402770996e-07, 1.8719583749771118e-07, 1.993030309677124e-07, 2.1141022443771362e-07, 2.2351741790771484e-07, 2.3562461137771606e-07, 2.477318048477173e-07, 2.598389983177185e-07, 2.7194619178771973e-07, 2.8405338525772095e-07, 2.9616057872772217e-07, 3.082677721977234e-07, 3.203749656677246e-07, 3.3248215913772583e-07, 3.4458935260772705e-07, 3.5669654607772827e-07, 3.688037395477295e-07, 3.809109330177307e-07, 3.9301812648773193e-07, 4.0512531995773315e-07, 4.172325134277344e-07]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 1.0, 11.0, 6.0, 7.0, 18.0, 20.0, 31.0, 71.0, 90.0, 140.0, 156.0, 202.0, 365.0, 1539.0, 1511.0, 2657.0, 5544.0, 10517.0, 27970.0, 855242.0, 91975.0, 27671.0, 10470.0, 5539.0, 4165.0, 849.0, 631.0, 372.0, 225.0, 148.0, 234.0, 45.0, 15.0, 34.0, 19.0, 13.0, 16.0, 8.0, 8.0, 3.0, 1.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.086162567138672e-06, -2.016313374042511e-06, -1.94646418094635e-06, -1.8766149878501892e-06, -1.8067657947540283e-06, -1.7369166016578674e-06, -1.6670674085617065e-06, -1.5972182154655457e-06, -1.5273690223693848e-06, -1.4575198292732239e-06, -1.387670636177063e-06, -1.317821443080902e-06, -1.2479722499847412e-06, -1.1781230568885803e-06, -1.1082738637924194e-06, -1.0384246706962585e-06, -9.685754776000977e-07, -8.987262845039368e-07, -8.288770914077759e-07, -7.59027898311615e-07, -6.891787052154541e-07, -6.193295121192932e-07, -5.494803190231323e-07, -4.796311259269714e-07, -4.0978193283081055e-07, -3.3993273973464966e-07, -2.7008354663848877e-07, -2.0023435354232788e-07, -1.30385160446167e-07, -6.05359673500061e-08, 9.313225746154785e-09, 7.916241884231567e-08, 1.4901161193847656e-07, 2.1886080503463745e-07, 2.8870999813079834e-07, 3.5855919122695923e-07, 4.284083843231201e-07, 4.98257577419281e-07, 5.681067705154419e-07, 6.379559636116028e-07, 7.078051567077637e-07, 7.776543498039246e-07, 8.475035429000854e-07, 9.173527359962463e-07, 9.872019290924072e-07, 1.0570511221885681e-06, 1.126900315284729e-06, 1.1967495083808899e-06, 1.2665987014770508e-06, 1.3364478945732117e-06, 1.4062970876693726e-06, 1.4761462807655334e-06, 1.5459954738616943e-06, 1.6158446669578552e-06, 1.6856938600540161e-06, 1.755543053150177e-06, 1.8253922462463379e-06, 1.8952414393424988e-06, 1.9650906324386597e-06, 2.0349398255348206e-06, 2.1047890186309814e-06, 2.1746382117271423e-06, 2.2444874048233032e-06, 2.314336597919464e-06, 2.384185791015625e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 37.0, 0.0, 0.0, 0.0, 116.0, 0.0, 0.0, 596.0, 0.0, 0.0, 0.0, 149.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.364418029785156e-07, -5.206093192100525e-07, -5.047768354415894e-07, -4.889443516731262e-07, -4.731118679046631e-07, -4.5727938413619995e-07, -4.414469003677368e-07, -4.256144165992737e-07, -4.0978193283081055e-07, -3.939494490623474e-07, -3.781169652938843e-07, -3.6228448152542114e-07, -3.46451997756958e-07, -3.3061951398849487e-07, -3.1478703022003174e-07, -2.989545464515686e-07, -2.8312206268310547e-07, -2.6728957891464233e-07, -2.514570951461792e-07, -2.3562461137771606e-07, -2.1979212760925293e-07, -2.039596438407898e-07, -1.8812716007232666e-07, -1.7229467630386353e-07, -1.564621925354004e-07, -1.4062970876693726e-07, -1.2479722499847412e-07, -1.0896474123001099e-07, -9.313225746154785e-08, -7.729977369308472e-08, -6.146728992462158e-08, -4.563480615615845e-08, -2.9802322387695312e-08, -1.3969838619232178e-08, 1.862645149230957e-09, 1.7695128917694092e-08, 3.3527612686157227e-08, 4.936009645462036e-08, 6.51925802230835e-08, 8.102506399154663e-08, 9.685754776000977e-08, 1.126900315284729e-07, 1.2852251529693604e-07, 1.4435499906539917e-07, 1.601874828338623e-07, 1.7601996660232544e-07, 1.9185245037078857e-07, 2.076849341392517e-07, 2.2351741790771484e-07, 2.39349901676178e-07, 2.551823854446411e-07, 2.7101486921310425e-07, 2.868473529815674e-07, 3.026798367500305e-07, 3.1851232051849365e-07, 3.343448042869568e-07, 3.501772880554199e-07, 3.6600977182388306e-07, 3.818422555923462e-07, 3.976747393608093e-07, 4.1350722312927246e-07, 4.293397068977356e-07, 4.4517219066619873e-07, 4.6100467443466187e-07, 4.76837158203125e-07]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 5.0, 3.0, 12.0, 15.0, 23.0, 41.0, 45.0, 89.0, 164.0, 217.0, 158.0, 92.0, 44.0, 43.0, 18.0, 11.0, 10.0, 10.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.601846689591184e-05, -6.332686461973935e-05, -6.063525870558806e-05, -5.794365279143676e-05, -5.525205051526427e-05, -5.256044460111298e-05, -4.986883868696168e-05, -4.717723641078919e-05, -4.4485630496637896e-05, -4.17940245824866e-05, -3.910242230631411e-05, -3.6410816392162815e-05, -3.371921047801152e-05, -3.102760820183903e-05, -2.8336002287687734e-05, -2.564439819252584e-05, -2.295279409736395e-05, -2.0261190002202056e-05, -1.7569585907040164e-05, -1.4877979992888868e-05, -1.2186375897726975e-05, -9.494771802565083e-06, -6.803165888413787e-06, -4.111561793251894e-06, -1.419957698090002e-06, 1.2716468518192414e-06, 3.963251401728485e-06, 6.654856406385079e-06, 9.346460501546971e-06, 1.2038064596708864e-05, 1.472967051086016e-05, 1.7421274606022052e-05, 2.011287142522633e-05, 2.2804475520388223e-05, 2.5496079615550116e-05, 2.8187685529701412e-05, 3.08792878058739e-05, 3.35708937200252e-05, 3.626249963417649e-05, 3.895410191034898e-05, 4.164570782450028e-05, 4.4337313738651574e-05, 4.702891601482406e-05, 4.972052192897536e-05, 5.2412127843126655e-05, 5.5103730119299144e-05, 5.779533603345044e-05, 6.0486941947601736e-05, 6.317854422377422e-05, 6.587014649994671e-05, 6.856175605207682e-05, 7.12533583282493e-05, 7.39449606044218e-05, 7.66365701565519e-05, 7.932817243272439e-05, 8.201977470889688e-05, 8.471138426102698e-05, 8.740298653719947e-05, 9.009459608932957e-05, 9.278619836550206e-05, 9.547780064167455e-05, 9.816940291784704e-05, 0.00010086101246997714, 0.00010355261474614963, 0.00010624421702232212]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 5.0, 2.0, 9.0, 1.0, 8.0, 2.0, 8.0, 8.0, 10.0, 6.0, 19.0, 18.0, 18.0, 23.0, 21.0, 25.0, 30.0, 31.0, 34.0, 35.0, 42.0, 33.0, 42.0, 31.0, 45.0, 46.0, 46.0, 39.0, 39.0, 36.0, 39.0, 32.0, 16.0, 16.0, 29.0, 28.0, 25.0, 13.0, 18.0, 21.0, 14.0, 9.0, 9.0, 5.0, 7.0, 9.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.9518478186219e-05, -2.8572161681950092e-05, -2.7625845177681185e-05, -2.6679528673412278e-05, -2.573321216914337e-05, -2.4786895664874464e-05, -2.3840579160605557e-05, -2.289426265633665e-05, -2.1947946152067743e-05, -2.1001629647798836e-05, -2.005531314352993e-05, -1.9108996639261022e-05, -1.8162680134992115e-05, -1.7216363630723208e-05, -1.62700471264543e-05, -1.5323730622185394e-05, -1.4377414117916487e-05, -1.343109761364758e-05, -1.2484781109378673e-05, -1.1538464605109766e-05, -1.0592148100840859e-05, -9.645831596571952e-06, -8.699515092303045e-06, -7.753198588034138e-06, -6.806882083765231e-06, -5.860565579496324e-06, -4.914249075227417e-06, -3.96793257095851e-06, -3.021616066689603e-06, -2.075299562420696e-06, -1.128983058151789e-06, -1.82666553882882e-07, 7.636517693754286e-07, 1.7099682736443356e-06, 2.6562847779132426e-06, 3.6026012821821496e-06, 4.548917786451057e-06, 5.495234290719964e-06, 6.441550794988871e-06, 7.387867299257778e-06, 8.334183803526685e-06, 9.280500307795592e-06, 1.0226816812064499e-05, 1.1173133316333406e-05, 1.2119449820602313e-05, 1.306576632487122e-05, 1.4012082829140127e-05, 1.4958399333409034e-05, 1.590471583767794e-05, 1.6851032341946848e-05, 1.7797348846215755e-05, 1.8743665350484662e-05, 1.968998185475357e-05, 2.0636298359022476e-05, 2.1582614863291383e-05, 2.252893136756029e-05, 2.3475247871829197e-05, 2.4421564376098104e-05, 2.536788088036701e-05, 2.6314197384635918e-05, 2.7260513888904825e-05, 2.8206830393173732e-05, 2.915314689744264e-05, 3.0099463401711546e-05, 3.104577990598045e-05]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 0.0, 3.0, 6.0, 11.0, 7.0, 15.0, 5.0, 14.0, 15.0, 26.0, 26.0, 31.0, 44.0, 67.0, 85.0, 106.0, 160.0, 228.0, 311.0, 471.0, 701.0, 1158.0, 1972.0, 3669.0, 9029.0, 356468.0, 3783365.0, 24193.0, 5052.0, 2569.0, 1549.0, 930.0, 570.0, 422.0, 237.0, 183.0, 146.0, 94.0, 84.0, 66.0, 45.0, 22.0, 33.0, 27.0, 17.0, 8.0, 6.0, 12.0, 12.0, 6.0, 3.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00010126829147338867, -9.80207696557045e-05, -9.477324783802032e-05, -9.152572602033615e-05, -8.827820420265198e-05, -8.50306823849678e-05, -8.178316056728363e-05, -7.853563874959946e-05, -7.528811693191528e-05, -7.204059511423111e-05, -6.879307329654694e-05, -6.554555147886276e-05, -6.229802966117859e-05, -5.9050507843494415e-05, -5.580298602581024e-05, -5.255546420812607e-05, -4.9307942390441895e-05, -4.606042057275772e-05, -4.281289875507355e-05, -3.9565376937389374e-05, -3.63178551197052e-05, -3.3070333302021027e-05, -2.9822811484336853e-05, -2.657528966665268e-05, -2.3327767848968506e-05, -2.0080246031284332e-05, -1.683272421360016e-05, -1.3585202395915985e-05, -1.0337680578231812e-05, -7.090158760547638e-06, -3.842636942863464e-06, -5.951151251792908e-07, 2.652406692504883e-06, 5.899928510189056e-06, 9.14745032787323e-06, 1.2394972145557404e-05, 1.5642493963241577e-05, 1.889001578092575e-05, 2.2137537598609924e-05, 2.5385059416294098e-05, 2.863258123397827e-05, 3.1880103051662445e-05, 3.512762486934662e-05, 3.837514668703079e-05, 4.1622668504714966e-05, 4.487019032239914e-05, 4.811771214008331e-05, 5.1365233957767487e-05, 5.461275577545166e-05, 5.7860277593135834e-05, 6.110779941082001e-05, 6.435532122850418e-05, 6.760284304618835e-05, 7.085036486387253e-05, 7.40978866815567e-05, 7.734540849924088e-05, 8.059293031692505e-05, 8.384045213460922e-05, 8.70879739522934e-05, 9.033549576997757e-05, 9.358301758766174e-05, 9.683053940534592e-05, 0.00010007806122303009, 0.00010332558304071426, 0.00010657310485839844]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 8.0, 3.0, 2.0, 6.0, 6.0, 6.0, 9.0, 8.0, 13.0, 18.0, 14.0, 20.0, 24.0, 30.0, 26.0, 39.0, 33.0, 41.0, 23.0, 40.0, 55.0, 41.0, 41.0, 63.0, 43.0, 47.0, 44.0, 42.0, 24.0, 34.0, 19.0, 22.0, 27.0, 19.0, 20.0, 19.0, 15.0, 9.0, 11.0, 9.0, 8.0, 5.0, 3.0, 3.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.676248550415039e-05, -2.590753138065338e-05, -2.5052577257156372e-05, -2.4197623133659363e-05, -2.3342669010162354e-05, -2.2487714886665344e-05, -2.1632760763168335e-05, -2.0777806639671326e-05, -1.9922852516174316e-05, -1.9067898392677307e-05, -1.8212944269180298e-05, -1.735799014568329e-05, -1.650303602218628e-05, -1.564808189868927e-05, -1.479312777519226e-05, -1.3938173651695251e-05, -1.3083219528198242e-05, -1.2228265404701233e-05, -1.1373311281204224e-05, -1.0518357157707214e-05, -9.663403034210205e-06, -8.808448910713196e-06, -7.953494787216187e-06, -7.098540663719177e-06, -6.243586540222168e-06, -5.388632416725159e-06, -4.533678293228149e-06, -3.67872416973114e-06, -2.823770046234131e-06, -1.9688159227371216e-06, -1.1138617992401123e-06, -2.5890767574310303e-07, 5.960464477539062e-07, 1.4510005712509155e-06, 2.305954694747925e-06, 3.160908818244934e-06, 4.015862941741943e-06, 4.870817065238953e-06, 5.725771188735962e-06, 6.580725312232971e-06, 7.4356794357299805e-06, 8.29063355922699e-06, 9.145587682723999e-06, 1.0000541806221008e-05, 1.0855495929718018e-05, 1.1710450053215027e-05, 1.2565404176712036e-05, 1.3420358300209045e-05, 1.4275312423706055e-05, 1.5130266547203064e-05, 1.5985220670700073e-05, 1.6840174794197083e-05, 1.7695128917694092e-05, 1.85500830411911e-05, 1.940503716468811e-05, 2.025999128818512e-05, 2.111494541168213e-05, 2.1969899535179138e-05, 2.2824853658676147e-05, 2.3679807782173157e-05, 2.4534761905670166e-05, 2.5389716029167175e-05, 2.6244670152664185e-05, 2.7099624276161194e-05, 2.7954578399658203e-05]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 12.0, 15.0, 21.0, 36.0, 65.0, 112.0, 166.0, 365.0, 761.0, 1642.0, 4013.0, 12897.0, 183473.0, 3953621.0, 26324.0, 6352.0, 2328.0, 1017.0, 511.0, 242.0, 119.0, 68.0, 39.0, 19.0, 18.0, 16.0, 11.0, 3.0, 3.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015842914581298828, -0.0001531839370727539, -0.00014793872833251953, -0.00014269351959228516, -0.00013744831085205078, -0.0001322031021118164, -0.00012695789337158203, -0.00012171268463134766, -0.00011646747589111328, -0.0001112222671508789, -0.00010597705841064453, -0.00010073184967041016, -9.548664093017578e-05, -9.02414321899414e-05, -8.499622344970703e-05, -7.975101470947266e-05, -7.450580596923828e-05, -6.92605972290039e-05, -6.401538848876953e-05, -5.8770179748535156e-05, -5.352497100830078e-05, -4.8279762268066406e-05, -4.303455352783203e-05, -3.7789344787597656e-05, -3.254413604736328e-05, -2.7298927307128906e-05, -2.205371856689453e-05, -1.6808509826660156e-05, -1.1563301086425781e-05, -6.318092346191406e-06, -1.0728836059570312e-06, 4.172325134277344e-06, 9.417533874511719e-06, 1.4662742614746094e-05, 1.990795135498047e-05, 2.5153160095214844e-05, 3.039836883544922e-05, 3.5643577575683594e-05, 4.088878631591797e-05, 4.6133995056152344e-05, 5.137920379638672e-05, 5.6624412536621094e-05, 6.186962127685547e-05, 6.711483001708984e-05, 7.236003875732422e-05, 7.76052474975586e-05, 8.285045623779297e-05, 8.809566497802734e-05, 9.334087371826172e-05, 9.85860824584961e-05, 0.00010383129119873047, 0.00010907649993896484, 0.00011432170867919922, 0.0001195669174194336, 0.00012481212615966797, 0.00013005733489990234, 0.00013530254364013672, 0.0001405477523803711, 0.00014579296112060547, 0.00015103816986083984, 0.00015628337860107422, 0.0001615285873413086, 0.00016677379608154297, 0.00017201900482177734, 0.00017726421356201172]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 9.0, 7.0, 5.0, 16.0, 31.0, 61.0, 182.0, 571.0, 2614.0, 334.0, 122.0, 43.0, 16.0, 8.0, 11.0, 8.0, 7.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.187490463256836e-05, -2.1152198314666748e-05, -2.0429491996765137e-05, -1.9706785678863525e-05, -1.8984079360961914e-05, -1.8261373043060303e-05, -1.753866672515869e-05, -1.681596040725708e-05, -1.609325408935547e-05, -1.5370547771453857e-05, -1.4647841453552246e-05, -1.3925135135650635e-05, -1.3202428817749023e-05, -1.2479722499847412e-05, -1.17570161819458e-05, -1.103430986404419e-05, -1.0311603546142578e-05, -9.588897228240967e-06, -8.866190910339355e-06, -8.143484592437744e-06, -7.420778274536133e-06, -6.6980719566345215e-06, -5.97536563873291e-06, -5.252659320831299e-06, -4.5299530029296875e-06, -3.807246685028076e-06, -3.084540367126465e-06, -2.3618340492248535e-06, -1.6391277313232422e-06, -9.164214134216309e-07, -1.9371509552001953e-07, 5.289912223815918e-07, 1.2516975402832031e-06, 1.9744038581848145e-06, 2.6971101760864258e-06, 3.419816493988037e-06, 4.1425228118896484e-06, 4.86522912979126e-06, 5.587935447692871e-06, 6.310641765594482e-06, 7.033348083496094e-06, 7.756054401397705e-06, 8.478760719299316e-06, 9.201467037200928e-06, 9.924173355102539e-06, 1.064687967300415e-05, 1.1369585990905762e-05, 1.2092292308807373e-05, 1.2814998626708984e-05, 1.3537704944610596e-05, 1.4260411262512207e-05, 1.4983117580413818e-05, 1.570582389831543e-05, 1.642853021621704e-05, 1.7151236534118652e-05, 1.7873942852020264e-05, 1.8596649169921875e-05, 1.9319355487823486e-05, 2.0042061805725098e-05, 2.076476812362671e-05, 2.148747444152832e-05, 2.221018075942993e-05, 2.2932887077331543e-05, 2.3655593395233154e-05, 2.4378299713134766e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 7.0, 4.0, 9.0, 21.0, 21.0, 28.0, 40.0, 36.0, 90.0, 125.0, 183.0, 142.0, 97.0, 53.0, 38.0, 37.0, 23.0, 12.0, 11.0, 8.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.924494012608193e-05, -3.751970507437363e-05, -3.579446638468653e-05, -3.4069227694999427e-05, -3.234399264329113e-05, -3.0618757591582835e-05, -2.889351890189573e-05, -2.7168282031198032e-05, -2.5443045160500333e-05, -2.3717808289802633e-05, -2.1992571419104934e-05, -2.0267334548407234e-05, -1.8542097677709535e-05, -1.6816860807011835e-05, -1.5091623936314136e-05, -1.3366387065616436e-05, -1.1641150194918737e-05, -9.915913324221037e-06, -8.190676453523338e-06, -6.465439582825638e-06, -4.740202712127939e-06, -3.0149658414302394e-06, -1.2897289707325399e-06, 4.355078999651596e-07, 2.160744770662859e-06, 3.8859816413605586e-06, 5.611218512058258e-06, 7.3364553827559575e-06, 9.061692253453657e-06, 1.0786929124151357e-05, 1.2512165994849056e-05, 1.4237402865546755e-05, 1.5962636098265648e-05, 1.7687872968963347e-05, 1.9413109839661047e-05, 2.1138346710358746e-05, 2.2863583581056446e-05, 2.4588820451754145e-05, 2.6314057322451845e-05, 2.8039294193149544e-05, 2.9764531063847244e-05, 3.148976975353435e-05, 3.321500480524264e-05, 3.494023985695094e-05, 3.666547854663804e-05, 3.8390717236325145e-05, 4.011595228803344e-05, 4.184118733974174e-05, 4.356642602942884e-05, 4.529166471911594e-05, 4.701689977082424e-05, 4.8742134822532535e-05, 5.046737351221964e-05, 5.219261220190674e-05, 5.3917847253615037e-05, 5.564308230532333e-05, 5.7368320995010436e-05, 5.909355968469754e-05, 6.0818794736405835e-05, 6.254402978811413e-05, 6.426926847780123e-05, 6.599450716748834e-05, 6.771973858121783e-05, 6.944497727090493e-05, 7.117021596059203e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 5.0, 4.0, 8.0, 3.0, 20.0, 12.0, 22.0, 16.0, 20.0, 33.0, 37.0, 38.0, 49.0, 41.0, 38.0, 36.0, 41.0, 46.0, 61.0, 44.0, 49.0, 51.0, 43.0, 38.0, 33.0, 39.0, 25.0, 16.0, 19.0, 23.0, 20.0, 13.0, 7.0, 8.0, 12.0, 6.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8470991310314275e-05, -2.7579229936236516e-05, -2.6687468562158756e-05, -2.5795705369091593e-05, -2.4903943995013833e-05, -2.4012182620936073e-05, -2.3120421246858314e-05, -2.222865805379115e-05, -2.133689667971339e-05, -2.044513530563563e-05, -1.955337393155787e-05, -1.8661610738490708e-05, -1.776984936441295e-05, -1.687808799033519e-05, -1.598632661625743e-05, -1.5094564332684968e-05, -1.4202802958607208e-05, -1.3311041584529448e-05, -1.2419279300956987e-05, -1.1527517926879227e-05, -1.0635755643306766e-05, -9.743994269229006e-06, -8.852231985656545e-06, -7.960470611578785e-06, -7.068708782753674e-06, -6.176946953928564e-06, -5.285185125103453e-06, -4.393423296278343e-06, -3.5016616948269075e-06, -2.6099000933754724e-06, -1.7181382645503618e-06, -8.263764357252512e-07, 6.538539309985936e-08, 9.5714722192497e-07, 1.8489089370632428e-06, 2.7406706522015156e-06, 3.632432481026626e-06, 4.524194082478061e-06, 5.415955911303172e-06, 6.3077177401282825e-06, 7.199479568953393e-06, 8.091241397778504e-06, 8.983002771856263e-06, 9.874765055428725e-06, 1.0766526429506484e-05, 1.1658288713078946e-05, 1.2550050087156706e-05, 1.3441811461234465e-05, 1.4333573744806927e-05, 1.5225335118884686e-05, 1.6117097402457148e-05, 1.7008858776534908e-05, 1.7900620150612667e-05, 1.879238334367983e-05, 1.968414471775759e-05, 2.057590609183535e-05, 2.146766746591311e-05, 2.235942883999087e-05, 2.325119021406863e-05, 2.4142953407135792e-05, 2.5034714781213552e-05, 2.592647615529131e-05, 2.681823752936907e-05, 2.7710000722436234e-05, 2.8601762096513994e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 5.0, 9.0, 11.0, 20.0, 36.0, 39.0, 66.0, 94.0, 130.0, 203.0, 259.0, 378.0, 660.0, 896.0, 1313.0, 2216.0, 3156.0, 4938.0, 8676.0, 13232.0, 24159.0, 40201.0, 76068.0, 178637.0, 337389.0, 171635.0, 83562.0, 40100.0, 22894.0, 14374.0, 8235.0, 5422.0, 3176.0, 2085.0, 1434.0, 918.0, 600.0, 411.0, 269.0, 183.0, 153.0, 93.0, 64.0, 51.0, 29.0, 23.0, 15.0, 12.0, 6.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-2.8848648071289062e-05, -2.7933157980442047e-05, -2.7017667889595032e-05, -2.6102177798748016e-05, -2.5186687707901e-05, -2.4271197617053986e-05, -2.335570752620697e-05, -2.2440217435359955e-05, -2.152472734451294e-05, -2.0609237253665924e-05, -1.969374716281891e-05, -1.8778257071971893e-05, -1.7862766981124878e-05, -1.6947276890277863e-05, -1.6031786799430847e-05, -1.5116296708583832e-05, -1.4200806617736816e-05, -1.3285316526889801e-05, -1.2369826436042786e-05, -1.145433634519577e-05, -1.0538846254348755e-05, -9.62335616350174e-06, -8.707866072654724e-06, -7.792375981807709e-06, -6.876885890960693e-06, -5.961395800113678e-06, -5.045905709266663e-06, -4.130415618419647e-06, -3.214925527572632e-06, -2.2994354367256165e-06, -1.383945345878601e-06, -4.684552550315857e-07, 4.470348358154297e-07, 1.362524926662445e-06, 2.2780150175094604e-06, 3.193505108356476e-06, 4.108995199203491e-06, 5.024485290050507e-06, 5.939975380897522e-06, 6.855465471744537e-06, 7.770955562591553e-06, 8.686445653438568e-06, 9.601935744285583e-06, 1.0517425835132599e-05, 1.1432915925979614e-05, 1.234840601682663e-05, 1.3263896107673645e-05, 1.417938619852066e-05, 1.5094876289367676e-05, 1.601036638021469e-05, 1.6925856471061707e-05, 1.7841346561908722e-05, 1.8756836652755737e-05, 1.9672326743602753e-05, 2.0587816834449768e-05, 2.1503306925296783e-05, 2.24187970161438e-05, 2.3334287106990814e-05, 2.424977719783783e-05, 2.5165267288684845e-05, 2.608075737953186e-05, 2.6996247470378876e-05, 2.791173756122589e-05, 2.8827227652072906e-05, 2.9742717742919922e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 6.0, 6.0, 3.0, 5.0, 7.0, 8.0, 15.0, 15.0, 22.0, 20.0, 27.0, 30.0, 38.0, 41.0, 36.0, 42.0, 50.0, 50.0, 54.0, 51.0, 54.0, 52.0, 43.0, 59.0, 42.0, 35.0, 24.0, 27.0, 21.0, 24.0, 19.0, 19.0, 8.0, 11.0, 10.0, 5.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.147125244140625e-05, -3.0499882996082306e-05, -2.9528513550758362e-05, -2.8557144105434418e-05, -2.7585774660110474e-05, -2.661440521478653e-05, -2.5643035769462585e-05, -2.467166632413864e-05, -2.3700296878814697e-05, -2.2728927433490753e-05, -2.175755798816681e-05, -2.0786188542842865e-05, -1.981481909751892e-05, -1.8843449652194977e-05, -1.7872080206871033e-05, -1.690071076154709e-05, -1.5929341316223145e-05, -1.49579718708992e-05, -1.3986602425575256e-05, -1.3015232980251312e-05, -1.2043863534927368e-05, -1.1072494089603424e-05, -1.010112464427948e-05, -9.129755198955536e-06, -8.158385753631592e-06, -7.187016308307648e-06, -6.215646862983704e-06, -5.2442774176597595e-06, -4.2729079723358154e-06, -3.3015385270118713e-06, -2.3301690816879272e-06, -1.3587996363639832e-06, -3.8743019104003906e-07, 5.83939254283905e-07, 1.5553086996078491e-06, 2.5266781449317932e-06, 3.4980475902557373e-06, 4.469417035579681e-06, 5.4407864809036255e-06, 6.41215592622757e-06, 7.383525371551514e-06, 8.354894816875458e-06, 9.326264262199402e-06, 1.0297633707523346e-05, 1.126900315284729e-05, 1.2240372598171234e-05, 1.3211742043495178e-05, 1.4183111488819122e-05, 1.5154480934143066e-05, 1.612585037946701e-05, 1.7097219824790955e-05, 1.80685892701149e-05, 1.9039958715438843e-05, 2.0011328160762787e-05, 2.098269760608673e-05, 2.1954067051410675e-05, 2.292543649673462e-05, 2.3896805942058563e-05, 2.4868175387382507e-05, 2.583954483270645e-05, 2.6810914278030396e-05, 2.778228372335434e-05, 2.8753653168678284e-05, 2.9725022614002228e-05, 3.069639205932617e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 14.0, 7.0, 12.0, 16.0, 32.0, 44.0, 50.0, 75.0, 122.0, 198.0, 274.0, 477.0, 660.0, 1026.0, 1682.0, 2633.0, 4332.0, 7165.0, 13356.0, 26609.0, 59599.0, 185674.0, 526140.0, 124547.0, 45523.0, 21203.0, 11094.0, 6248.0, 3477.0, 2244.0, 1358.0, 876.0, 619.0, 369.0, 278.0, 174.0, 91.0, 88.0, 55.0, 37.0, 28.0, 19.0, 11.0, 5.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0], "bins": [-4.5299530029296875e-05, -4.4053420424461365e-05, -4.2807310819625854e-05, -4.1561201214790344e-05, -4.0315091609954834e-05, -3.9068982005119324e-05, -3.7822872400283813e-05, -3.65767627954483e-05, -3.533065319061279e-05, -3.408454358577728e-05, -3.283843398094177e-05, -3.159232437610626e-05, -3.0346214771270752e-05, -2.9100105166435242e-05, -2.785399556159973e-05, -2.660788595676422e-05, -2.536177635192871e-05, -2.41156667470932e-05, -2.286955714225769e-05, -2.162344753742218e-05, -2.037733793258667e-05, -1.913122832775116e-05, -1.788511872291565e-05, -1.663900911808014e-05, -1.539289951324463e-05, -1.4146789908409119e-05, -1.2900680303573608e-05, -1.1654570698738098e-05, -1.0408461093902588e-05, -9.162351489067078e-06, -7.916241884231567e-06, -6.670132279396057e-06, -5.424022674560547e-06, -4.177913069725037e-06, -2.9318034648895264e-06, -1.6856938600540161e-06, -4.3958425521850586e-07, 8.065253496170044e-07, 2.0526349544525146e-06, 3.298744559288025e-06, 4.544854164123535e-06, 5.790963768959045e-06, 7.037073373794556e-06, 8.283182978630066e-06, 9.529292583465576e-06, 1.0775402188301086e-05, 1.2021511793136597e-05, 1.3267621397972107e-05, 1.4513731002807617e-05, 1.5759840607643127e-05, 1.7005950212478638e-05, 1.8252059817314148e-05, 1.9498169422149658e-05, 2.074427902698517e-05, 2.199038863182068e-05, 2.323649823665619e-05, 2.44826078414917e-05, 2.572871744632721e-05, 2.697482705116272e-05, 2.822093665599823e-05, 2.946704626083374e-05, 3.071315586566925e-05, 3.195926547050476e-05, 3.320537507534027e-05, 3.445148468017578e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 4.0, 4.0, 8.0, 9.0, 13.0, 7.0, 13.0, 11.0, 23.0, 10.0, 23.0, 23.0, 27.0, 25.0, 32.0, 33.0, 34.0, 38.0, 43.0, 27.0, 42.0, 64.0, 38.0, 32.0, 47.0, 34.0, 27.0, 41.0, 31.0, 39.0, 32.0, 25.0, 23.0, 22.0, 19.0, 11.0, 14.0, 13.0, 8.0, 6.0, 4.0, 3.0, 4.0, 7.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.436471939086914e-05, -1.3857148587703705e-05, -1.3349577784538269e-05, -1.2842006981372833e-05, -1.2334436178207397e-05, -1.1826865375041962e-05, -1.1319294571876526e-05, -1.081172376871109e-05, -1.0304152965545654e-05, -9.796582162380219e-06, -9.289011359214783e-06, -8.781440556049347e-06, -8.273869752883911e-06, -7.766298949718475e-06, -7.2587281465530396e-06, -6.751157343387604e-06, -6.243586540222168e-06, -5.736015737056732e-06, -5.228444933891296e-06, -4.720874130725861e-06, -4.213303327560425e-06, -3.705732524394989e-06, -3.1981617212295532e-06, -2.6905909180641174e-06, -2.1830201148986816e-06, -1.6754493117332458e-06, -1.16787850856781e-06, -6.603077054023743e-07, -1.5273690223693848e-07, 3.548339009284973e-07, 8.624047040939331e-07, 1.369975507259369e-06, 1.8775463104248047e-06, 2.3851171135902405e-06, 2.8926879167556763e-06, 3.400258719921112e-06, 3.907829523086548e-06, 4.415400326251984e-06, 4.9229711294174194e-06, 5.430541932582855e-06, 5.938112735748291e-06, 6.445683538913727e-06, 6.953254342079163e-06, 7.460825145244598e-06, 7.968395948410034e-06, 8.47596675157547e-06, 8.983537554740906e-06, 9.491108357906342e-06, 9.998679161071777e-06, 1.0506249964237213e-05, 1.1013820767402649e-05, 1.1521391570568085e-05, 1.202896237373352e-05, 1.2536533176898956e-05, 1.3044103980064392e-05, 1.3551674783229828e-05, 1.4059245586395264e-05, 1.45668163895607e-05, 1.5074387192726135e-05, 1.558195799589157e-05, 1.6089528799057007e-05, 1.6597099602222443e-05, 1.710467040538788e-05, 1.7612241208553314e-05, 1.811981201171875e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 13.0, 32.0, 34.0, 35.0, 62.0, 104.0, 133.0, 159.0, 348.0, 411.0, 725.0, 1159.0, 2068.0, 2813.0, 4882.0, 8266.0, 21803.0, 58379.0, 772870.0, 124633.0, 23529.0, 10333.0, 5994.0, 3876.0, 2014.0, 1354.0, 945.0, 558.0, 305.0, 233.0, 150.0, 92.0, 61.0, 73.0, 27.0, 26.0, 14.0, 14.0, 5.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0907649993896484e-05, -1.0592862963676453e-05, -1.0278075933456421e-05, -9.96328890323639e-06, -9.648501873016357e-06, -9.333714842796326e-06, -9.018927812576294e-06, -8.704140782356262e-06, -8.38935375213623e-06, -8.074566721916199e-06, -7.759779691696167e-06, -7.444992661476135e-06, -7.1302056312561035e-06, -6.815418601036072e-06, -6.50063157081604e-06, -6.185844540596008e-06, -5.8710575103759766e-06, -5.556270480155945e-06, -5.241483449935913e-06, -4.926696419715881e-06, -4.61190938949585e-06, -4.297122359275818e-06, -3.982335329055786e-06, -3.6675482988357544e-06, -3.3527612686157227e-06, -3.037974238395691e-06, -2.723187208175659e-06, -2.4084001779556274e-06, -2.0936131477355957e-06, -1.778826117515564e-06, -1.4640390872955322e-06, -1.1492520570755005e-06, -8.344650268554688e-07, -5.19677996635437e-07, -2.0489096641540527e-07, 1.0989606380462646e-07, 4.246830940246582e-07, 7.394701242446899e-07, 1.0542571544647217e-06, 1.3690441846847534e-06, 1.6838312149047852e-06, 1.998618245124817e-06, 2.3134052753448486e-06, 2.6281923055648804e-06, 2.942979335784912e-06, 3.257766366004944e-06, 3.5725533962249756e-06, 3.887340426445007e-06, 4.202127456665039e-06, 4.516914486885071e-06, 4.8317015171051025e-06, 5.146488547325134e-06, 5.461275577545166e-06, 5.776062607765198e-06, 6.0908496379852295e-06, 6.405636668205261e-06, 6.720423698425293e-06, 7.035210728645325e-06, 7.3499977588653564e-06, 7.664784789085388e-06, 7.97957181930542e-06, 8.294358849525452e-06, 8.609145879745483e-06, 8.923932909965515e-06, 9.238719940185547e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 18.0, 0.0, 10.0, 0.0, 21.0, 0.0, 0.0, 20.0, 0.0, 38.0, 0.0, 40.0, 0.0, 64.0, 0.0, 131.0, 0.0, 0.0, 358.0, 0.0, 106.0, 0.0, 55.0, 0.0, 58.0, 0.0, 42.0, 0.0, 0.0, 17.0, 0.0, 12.0, 0.0, 7.0, 0.0, 10.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.940696716308594e-07, -8.670613169670105e-07, -8.400529623031616e-07, -8.130446076393127e-07, -7.860362529754639e-07, -7.59027898311615e-07, -7.320195436477661e-07, -7.050111889839172e-07, -6.780028343200684e-07, -6.509944796562195e-07, -6.239861249923706e-07, -5.969777703285217e-07, -5.699694156646729e-07, -5.42961061000824e-07, -5.159527063369751e-07, -4.889443516731262e-07, -4.6193599700927734e-07, -4.3492764234542847e-07, -4.079192876815796e-07, -3.809109330177307e-07, -3.5390257835388184e-07, -3.2689422369003296e-07, -2.998858690261841e-07, -2.728775143623352e-07, -2.4586915969848633e-07, -2.1886080503463745e-07, -1.9185245037078857e-07, -1.648440957069397e-07, -1.3783574104309082e-07, -1.1082738637924194e-07, -8.381903171539307e-08, -5.681067705154419e-08, -2.9802322387695312e-08, -2.7939677238464355e-09, 2.421438694000244e-08, 5.122274160385132e-08, 7.82310962677002e-08, 1.0523945093154907e-07, 1.3224780559539795e-07, 1.5925616025924683e-07, 1.862645149230957e-07, 2.1327286958694458e-07, 2.4028122425079346e-07, 2.6728957891464233e-07, 2.942979335784912e-07, 3.213062882423401e-07, 3.4831464290618896e-07, 3.7532299757003784e-07, 4.023313522338867e-07, 4.293397068977356e-07, 4.5634806156158447e-07, 4.833564162254333e-07, 5.103647708892822e-07, 5.373731255531311e-07, 5.6438148021698e-07, 5.913898348808289e-07, 6.183981895446777e-07, 6.454065442085266e-07, 6.724148988723755e-07, 6.994232535362244e-07, 7.264316082000732e-07, 7.534399628639221e-07, 7.80448317527771e-07, 8.074566721916199e-07, 8.344650268554688e-07]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 2.0, 6.0, 9.0, 14.0, 25.0, 23.0, 29.0, 78.0, 122.0, 233.0, 444.0, 882.0, 2295.0, 5196.0, 19100.0, 73088.0, 751432.0, 157963.0, 24451.0, 8081.0, 2663.0, 1145.0, 613.0, 270.0, 153.0, 84.0, 40.0, 32.0, 22.0, 8.0, 12.0, 8.0, 9.0, 3.0, 6.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.633167266845703e-05, -1.583155244588852e-05, -1.5331432223320007e-05, -1.4831312000751495e-05, -1.4331191778182983e-05, -1.3831071555614471e-05, -1.333095133304596e-05, -1.2830831110477448e-05, -1.2330710887908936e-05, -1.1830590665340424e-05, -1.1330470442771912e-05, -1.08303502202034e-05, -1.0330229997634888e-05, -9.830109775066376e-06, -9.329989552497864e-06, -8.829869329929352e-06, -8.32974910736084e-06, -7.829628884792328e-06, -7.329508662223816e-06, -6.829388439655304e-06, -6.329268217086792e-06, -5.82914799451828e-06, -5.329027771949768e-06, -4.828907549381256e-06, -4.328787326812744e-06, -3.828667104244232e-06, -3.3285468816757202e-06, -2.8284266591072083e-06, -2.3283064365386963e-06, -1.8281862139701843e-06, -1.3280659914016724e-06, -8.279457688331604e-07, -3.2782554626464844e-07, 1.7229467630386353e-07, 6.724148988723755e-07, 1.1725351214408875e-06, 1.6726553440093994e-06, 2.1727755665779114e-06, 2.6728957891464233e-06, 3.1730160117149353e-06, 3.6731362342834473e-06, 4.173256456851959e-06, 4.673376679420471e-06, 5.173496901988983e-06, 5.673617124557495e-06, 6.173737347126007e-06, 6.673857569694519e-06, 7.173977792263031e-06, 7.674098014831543e-06, 8.174218237400055e-06, 8.674338459968567e-06, 9.174458682537079e-06, 9.67457890510559e-06, 1.0174699127674103e-05, 1.0674819350242615e-05, 1.1174939572811127e-05, 1.1675059795379639e-05, 1.217518001794815e-05, 1.2675300240516663e-05, 1.3175420463085175e-05, 1.3675540685653687e-05, 1.4175660908222198e-05, 1.467578113079071e-05, 1.5175901353359222e-05, 1.5676021575927734e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 5.0, 11.0, 11.0, 6.0, 5.0, 14.0, 15.0, 22.0, 17.0, 21.0, 24.0, 35.0, 38.0, 69.0, 265.0, 103.0, 71.0, 40.0, 38.0, 38.0, 23.0, 27.0, 20.0, 17.0, 14.0, 8.0, 5.0, 8.0, 4.0, 4.0, 9.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.086162567138672e-06, -2.0228326320648193e-06, -1.959502696990967e-06, -1.8961727619171143e-06, -1.8328428268432617e-06, -1.7695128917694092e-06, -1.7061829566955566e-06, -1.642853021621704e-06, -1.5795230865478516e-06, -1.516193151473999e-06, -1.4528632164001465e-06, -1.389533281326294e-06, -1.3262033462524414e-06, -1.2628734111785889e-06, -1.1995434761047363e-06, -1.1362135410308838e-06, -1.0728836059570312e-06, -1.0095536708831787e-06, -9.462237358093262e-07, -8.828938007354736e-07, -8.195638656616211e-07, -7.562339305877686e-07, -6.92903995513916e-07, -6.295740604400635e-07, -5.662441253662109e-07, -5.029141902923584e-07, -4.3958425521850586e-07, -3.762543201446533e-07, -3.129243850708008e-07, -2.4959444999694824e-07, -1.862645149230957e-07, -1.2293457984924316e-07, -5.960464477539063e-08, 3.725290298461914e-09, 6.705522537231445e-08, 1.30385160446167e-07, 1.9371509552001953e-07, 2.5704503059387207e-07, 3.203749656677246e-07, 3.8370490074157715e-07, 4.470348358154297e-07, 5.103647708892822e-07, 5.736947059631348e-07, 6.370246410369873e-07, 7.003545761108398e-07, 7.636845111846924e-07, 8.270144462585449e-07, 8.903443813323975e-07, 9.5367431640625e-07, 1.0170042514801025e-06, 1.080334186553955e-06, 1.1436641216278076e-06, 1.2069940567016602e-06, 1.2703239917755127e-06, 1.3336539268493652e-06, 1.3969838619232178e-06, 1.4603137969970703e-06, 1.5236437320709229e-06, 1.5869736671447754e-06, 1.650303602218628e-06, 1.7136335372924805e-06, 1.776963472366333e-06, 1.8402934074401855e-06, 1.903623342514038e-06, 1.9669532775878906e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 3.0, 8.0, 10.0, 11.0, 16.0, 26.0, 20.0, 36.0, 31.0, 59.0, 113.0, 140.0, 157.0, 97.0, 67.0, 53.0, 36.0, 19.0, 25.0, 24.0, 11.0, 3.0, 6.0, 4.0, 9.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0152670660754666e-05, -2.8730075428029522e-05, -2.7307482014293782e-05, -2.588488678156864e-05, -2.4462291548843496e-05, -2.3039698135107756e-05, -2.1617102902382612e-05, -2.019450766965747e-05, -1.8771912436932325e-05, -1.7349317204207182e-05, -1.5926723790471442e-05, -1.4504128557746299e-05, -1.3081533325021155e-05, -1.1658939001790714e-05, -1.0236344678560272e-05, -8.813749445835128e-06, -7.3911560320993885e-06, -5.968561254121596e-06, -4.5459664761438034e-06, -3.1233721529133618e-06, -1.7007773749355692e-06, -2.781825969577767e-07, 1.144411726272665e-06, 2.5670069589978084e-06, 3.98960128222825e-06, 5.412196060206043e-06, 6.834790838183835e-06, 8.257385161414277e-06, 9.679979484644718e-06, 1.1102574717369862e-05, 1.2525169040600304e-05, 1.3947764273325447e-05, 1.537035859655589e-05, 1.6792953829281032e-05, 1.8215547243016772e-05, 1.9638142475741915e-05, 2.106073770846706e-05, 2.24833311222028e-05, 2.3905926354927942e-05, 2.5328521587653086e-05, 2.675111682037823e-05, 2.8173712053103372e-05, 2.9596305466839112e-05, 3.101889888057485e-05, 3.2441494113299996e-05, 3.386408934602514e-05, 3.528668457875028e-05, 3.6709279811475426e-05, 3.813187504420057e-05, 3.955447027692571e-05, 4.0977065509650856e-05, 4.2399660742376e-05, 4.3822252337122336e-05, 4.524484756984748e-05, 4.666744280257262e-05, 4.8090038035297766e-05, 4.95126296300441e-05, 5.0935224862769246e-05, 5.235782009549439e-05, 5.378041532821953e-05, 5.520300692296587e-05, 5.662560215569101e-05, 5.8048197388416156e-05, 5.94707926211413e-05, 6.089338785386644e-05]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 2.0, 8.0, 7.0, 11.0, 19.0, 14.0, 21.0, 21.0, 30.0, 34.0, 39.0, 48.0, 40.0, 42.0, 34.0, 45.0, 44.0, 58.0, 42.0, 48.0, 56.0, 46.0, 28.0, 38.0, 34.0, 33.0, 19.0, 22.0, 14.0, 23.0, 16.0, 8.0, 7.0, 8.0, 10.0, 9.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7751219022320583e-05, -2.6888899810728617e-05, -2.602658059913665e-05, -2.5164261387544684e-05, -2.4301942175952718e-05, -2.343962296436075e-05, -2.2577303752768785e-05, -2.1714986360166222e-05, -2.0852665329584852e-05, -1.9990346117992885e-05, -1.912802690640092e-05, -1.8265707694808953e-05, -1.7403388483216986e-05, -1.654106927162502e-05, -1.5678750060033053e-05, -1.4816431757935788e-05, -1.3954113455838524e-05, -1.3091794244246557e-05, -1.2229475032654591e-05, -1.1367155821062624e-05, -1.0504836609470658e-05, -9.642517397878692e-06, -8.780199095781427e-06, -7.91787988418946e-06, -7.055560672597494e-06, -6.1932414610055275e-06, -5.330922249413561e-06, -4.4686034925689455e-06, -3.606284280976979e-06, -2.7439650693850126e-06, -1.881646312540397e-06, -1.0193271009484306e-06, -1.570097083458677e-07, 7.05309389559261e-07, 1.5676284874643898e-06, 2.4299474716826808e-06, 3.2922666832746472e-06, 4.154585894866614e-06, 5.016904651711229e-06, 5.879223863303196e-06, 6.741543074895162e-06, 7.603862286487129e-06, 8.466181498079095e-06, 9.32849980017636e-06, 1.0190819011768326e-05, 1.1053138223360293e-05, 1.1915457434952259e-05, 1.2777776646544226e-05, 1.3640095858136192e-05, 1.4502415069728158e-05, 1.5364734281320125e-05, 1.622705349291209e-05, 1.7089372704504058e-05, 1.7951691916096024e-05, 1.881401112768799e-05, 1.9676328520290554e-05, 2.0538649550871924e-05, 2.140096876246389e-05, 2.2263287974055856e-05, 2.3125607185647823e-05, 2.398792639723979e-05, 2.4850245608831756e-05, 2.5712564820423722e-05, 2.6574882213026285e-05, 2.743720142461825e-05]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 8.0, 7.0, 9.0, 10.0, 26.0, 32.0, 46.0, 75.0, 103.0, 148.0, 191.0, 299.0, 449.0, 576.0, 889.0, 1290.0, 1920.0, 2839.0, 4485.0, 6566.0, 10347.0, 16184.0, 28483.0, 48258.0, 94473.0, 202697.0, 314941.0, 141959.0, 71316.0, 39141.0, 22191.0, 13617.0, 8452.0, 5509.0, 3509.0, 2382.0, 1562.0, 1077.0, 709.0, 515.0, 387.0, 263.0, 203.0, 118.0, 96.0, 62.0, 39.0, 32.0, 22.0, 14.0, 13.0, 11.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.692243576049805e-05, -5.504302680492401e-05, -5.3163617849349976e-05, -5.128420889377594e-05, -4.9404799938201904e-05, -4.752539098262787e-05, -4.564598202705383e-05, -4.37665730714798e-05, -4.188716411590576e-05, -4.0007755160331726e-05, -3.812834620475769e-05, -3.6248937249183655e-05, -3.436952829360962e-05, -3.2490119338035583e-05, -3.061071038246155e-05, -2.8731301426887512e-05, -2.6851892471313477e-05, -2.497248351573944e-05, -2.3093074560165405e-05, -2.121366560459137e-05, -1.9334256649017334e-05, -1.74548476934433e-05, -1.5575438737869263e-05, -1.3696029782295227e-05, -1.1816620826721191e-05, -9.937211871147156e-06, -8.05780291557312e-06, -6.1783939599990845e-06, -4.298985004425049e-06, -2.419576048851013e-06, -5.401670932769775e-07, 1.339241862297058e-06, 3.2186508178710938e-06, 5.098059773445129e-06, 6.977468729019165e-06, 8.8568776845932e-06, 1.0736286640167236e-05, 1.2615695595741272e-05, 1.4495104551315308e-05, 1.6374513506889343e-05, 1.825392246246338e-05, 2.0133331418037415e-05, 2.201274037361145e-05, 2.3892149329185486e-05, 2.577155828475952e-05, 2.7650967240333557e-05, 2.9530376195907593e-05, 3.140978515148163e-05, 3.3289194107055664e-05, 3.51686030626297e-05, 3.7048012018203735e-05, 3.892742097377777e-05, 4.080682992935181e-05, 4.268623888492584e-05, 4.456564784049988e-05, 4.6445056796073914e-05, 4.832446575164795e-05, 5.0203874707221985e-05, 5.208328366279602e-05, 5.3962692618370056e-05, 5.584210157394409e-05, 5.772151052951813e-05, 5.960091948509216e-05, 6.14803284406662e-05, 6.335973739624023e-05]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 1.0, 7.0, 2.0, 7.0, 6.0, 5.0, 10.0, 16.0, 9.0, 11.0, 24.0, 26.0, 35.0, 35.0, 34.0, 49.0, 44.0, 40.0, 42.0, 55.0, 52.0, 52.0, 44.0, 48.0, 47.0, 42.0, 33.0, 38.0, 33.0, 30.0, 21.0, 12.0, 16.0, 12.0, 16.0, 11.0, 4.0, 9.0, 6.0, 6.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4020671844482422e-05, -2.3305416107177734e-05, -2.2590160369873047e-05, -2.187490463256836e-05, -2.1159648895263672e-05, -2.0444393157958984e-05, -1.9729137420654297e-05, -1.901388168334961e-05, -1.8298625946044922e-05, -1.7583370208740234e-05, -1.6868114471435547e-05, -1.615285873413086e-05, -1.5437602996826172e-05, -1.4722347259521484e-05, -1.4007091522216797e-05, -1.329183578491211e-05, -1.2576580047607422e-05, -1.1861324310302734e-05, -1.1146068572998047e-05, -1.043081283569336e-05, -9.715557098388672e-06, -9.000301361083984e-06, -8.285045623779297e-06, -7.569789886474609e-06, -6.854534149169922e-06, -6.139278411865234e-06, -5.424022674560547e-06, -4.708766937255859e-06, -3.993511199951172e-06, -3.2782554626464844e-06, -2.562999725341797e-06, -1.8477439880371094e-06, -1.1324882507324219e-06, -4.172325134277344e-07, 2.980232238769531e-07, 1.0132789611816406e-06, 1.7285346984863281e-06, 2.4437904357910156e-06, 3.159046173095703e-06, 3.874301910400391e-06, 4.589557647705078e-06, 5.304813385009766e-06, 6.020069122314453e-06, 6.735324859619141e-06, 7.450580596923828e-06, 8.165836334228516e-06, 8.881092071533203e-06, 9.59634780883789e-06, 1.0311603546142578e-05, 1.1026859283447266e-05, 1.1742115020751953e-05, 1.245737075805664e-05, 1.3172626495361328e-05, 1.3887882232666016e-05, 1.4603137969970703e-05, 1.531839370727539e-05, 1.6033649444580078e-05, 1.6748905181884766e-05, 1.7464160919189453e-05, 1.817941665649414e-05, 1.8894672393798828e-05, 1.9609928131103516e-05, 2.0325183868408203e-05, 2.104043960571289e-05, 2.1755695343017578e-05]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 5.0, 5.0, 1.0, 10.0, 5.0, 11.0, 15.0, 11.0, 26.0, 39.0, 55.0, 65.0, 114.0, 129.0, 235.0, 374.0, 549.0, 787.0, 1297.0, 2093.0, 3338.0, 5459.0, 8773.0, 15310.0, 27336.0, 51661.0, 109946.0, 277910.0, 299167.0, 119504.0, 55106.0, 29263.0, 15740.0, 9260.0, 5508.0, 3404.0, 2209.0, 1346.0, 868.0, 546.0, 376.0, 214.0, 158.0, 99.0, 69.0, 49.0, 35.0, 25.0, 15.0, 9.0, 8.0, 11.0, 4.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.549192428588867e-05, -5.358085036277771e-05, -5.166977643966675e-05, -4.9758702516555786e-05, -4.7847628593444824e-05, -4.593655467033386e-05, -4.40254807472229e-05, -4.211440682411194e-05, -4.0203332901000977e-05, -3.8292258977890015e-05, -3.638118505477905e-05, -3.447011113166809e-05, -3.255903720855713e-05, -3.064796328544617e-05, -2.8736889362335205e-05, -2.6825815439224243e-05, -2.491474151611328e-05, -2.300366759300232e-05, -2.1092593669891357e-05, -1.9181519746780396e-05, -1.7270445823669434e-05, -1.535937190055847e-05, -1.344829797744751e-05, -1.1537224054336548e-05, -9.626150131225586e-06, -7.715076208114624e-06, -5.804002285003662e-06, -3.8929283618927e-06, -1.9818544387817383e-06, -7.078051567077637e-08, 1.8402934074401855e-06, 3.7513673305511475e-06, 5.662441253662109e-06, 7.573515176773071e-06, 9.484589099884033e-06, 1.1395663022994995e-05, 1.3306736946105957e-05, 1.5217810869216919e-05, 1.712888479232788e-05, 1.9039958715438843e-05, 2.0951032638549805e-05, 2.2862106561660767e-05, 2.477318048477173e-05, 2.668425440788269e-05, 2.8595328330993652e-05, 3.0506402254104614e-05, 3.2417476177215576e-05, 3.432855010032654e-05, 3.62396240234375e-05, 3.815069794654846e-05, 4.0061771869659424e-05, 4.1972845792770386e-05, 4.388391971588135e-05, 4.579499363899231e-05, 4.770606756210327e-05, 4.9617141485214233e-05, 5.1528215408325195e-05, 5.343928933143616e-05, 5.535036325454712e-05, 5.726143717765808e-05, 5.917251110076904e-05, 6.108358502388e-05, 6.299465894699097e-05, 6.490573287010193e-05, 6.681680679321289e-05]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 10.0, 7.0, 9.0, 9.0, 18.0, 6.0, 18.0, 16.0, 29.0, 38.0, 21.0, 40.0, 34.0, 40.0, 46.0, 40.0, 49.0, 45.0, 47.0, 37.0, 38.0, 36.0, 46.0, 42.0, 34.0, 26.0, 29.0, 31.0, 21.0, 15.0, 18.0, 16.0, 15.0, 8.0, 14.0, 7.0, 11.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 4.0], "bins": [-1.7642974853515625e-05, -1.7142854630947113e-05, -1.66427344083786e-05, -1.614261418581009e-05, -1.5642493963241577e-05, -1.5142373740673065e-05, -1.4642253518104553e-05, -1.4142133295536041e-05, -1.364201307296753e-05, -1.3141892850399017e-05, -1.2641772627830505e-05, -1.2141652405261993e-05, -1.1641532182693481e-05, -1.114141196012497e-05, -1.0641291737556458e-05, -1.0141171514987946e-05, -9.641051292419434e-06, -9.140931069850922e-06, -8.64081084728241e-06, -8.140690624713898e-06, -7.640570402145386e-06, -7.140450179576874e-06, -6.640329957008362e-06, -6.14020973443985e-06, -5.640089511871338e-06, -5.139969289302826e-06, -4.639849066734314e-06, -4.139728844165802e-06, -3.63960862159729e-06, -3.139488399028778e-06, -2.639368176460266e-06, -2.139247953891754e-06, -1.6391277313232422e-06, -1.1390075087547302e-06, -6.388872861862183e-07, -1.387670636177063e-07, 3.6135315895080566e-07, 8.614733815193176e-07, 1.3615936040878296e-06, 1.8617138266563416e-06, 2.3618340492248535e-06, 2.8619542717933655e-06, 3.3620744943618774e-06, 3.862194716930389e-06, 4.362314939498901e-06, 4.862435162067413e-06, 5.362555384635925e-06, 5.862675607204437e-06, 6.362795829772949e-06, 6.862916052341461e-06, 7.363036274909973e-06, 7.863156497478485e-06, 8.363276720046997e-06, 8.863396942615509e-06, 9.363517165184021e-06, 9.863637387752533e-06, 1.0363757610321045e-05, 1.0863877832889557e-05, 1.1363998055458069e-05, 1.186411827802658e-05, 1.2364238500595093e-05, 1.2864358723163605e-05, 1.3364478945732117e-05, 1.3864599168300629e-05, 1.436471939086914e-05]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 7.0, 0.0, 8.0, 24.0, 17.0, 38.0, 48.0, 0.0, 82.0, 116.0, 155.0, 272.0, 469.0, 0.0, 711.0, 1396.0, 2895.0, 6565.0, 18294.0, 0.0, 82149.0, 821868.0, 82303.0, 18403.0, 0.0, 6479.0, 2872.0, 1349.0, 772.0, 474.0, 0.0, 274.0, 180.0, 119.0, 67.0, 37.0, 0.0, 33.0, 23.0, 19.0, 12.0, 7.0, 0.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5497207641601562e-06, -1.5003606677055359e-06, -1.4510005712509155e-06, -1.4016404747962952e-06, -1.3522803783416748e-06, -1.3029202818870544e-06, -1.253560185432434e-06, -1.2042000889778137e-06, -1.1548399925231934e-06, -1.105479896068573e-06, -1.0561197996139526e-06, -1.0067597031593323e-06, -9.57399606704712e-07, -9.080395102500916e-07, -8.586794137954712e-07, -8.093193173408508e-07, -7.599592208862305e-07, -7.105991244316101e-07, -6.612390279769897e-07, -6.118789315223694e-07, -5.62518835067749e-07, -5.131587386131287e-07, -4.637986421585083e-07, -4.1443854570388794e-07, -3.650784492492676e-07, -3.157183527946472e-07, -2.6635825634002686e-07, -2.169981598854065e-07, -1.6763806343078613e-07, -1.1827796697616577e-07, -6.891787052154541e-08, -1.955777406692505e-08, 2.9802322387695312e-08, 7.916241884231567e-08, 1.2852251529693604e-07, 1.778826117515564e-07, 2.2724270820617676e-07, 2.766028046607971e-07, 3.259629011154175e-07, 3.7532299757003784e-07, 4.246830940246582e-07, 4.7404319047927856e-07, 5.234032869338989e-07, 5.727633833885193e-07, 6.221234798431396e-07, 6.7148357629776e-07, 7.208436727523804e-07, 7.702037692070007e-07, 8.195638656616211e-07, 8.689239621162415e-07, 9.182840585708618e-07, 9.676441550254822e-07, 1.0170042514801025e-06, 1.066364347934723e-06, 1.1157244443893433e-06, 1.1650845408439636e-06, 1.214444637298584e-06, 1.2638047337532043e-06, 1.3131648302078247e-06, 1.362524926662445e-06, 1.4118850231170654e-06, 1.4612451195716858e-06, 1.5106052160263062e-06, 1.5599653124809265e-06, 1.6093254089355469e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 976.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.069879651069641e-07, -3.9674341678619385e-07, -3.864988684654236e-07, -3.762543201446533e-07, -3.6600977182388306e-07, -3.557652235031128e-07, -3.4552067518234253e-07, -3.3527612686157227e-07, -3.25031578540802e-07, -3.1478703022003174e-07, -3.045424818992615e-07, -2.942979335784912e-07, -2.8405338525772095e-07, -2.738088369369507e-07, -2.635642886161804e-07, -2.5331974029541016e-07, -2.430751919746399e-07, -2.3283064365386963e-07, -2.2258609533309937e-07, -2.123415470123291e-07, -2.0209699869155884e-07, -1.9185245037078857e-07, -1.816079020500183e-07, -1.7136335372924805e-07, -1.6111880540847778e-07, -1.5087425708770752e-07, -1.4062970876693726e-07, -1.30385160446167e-07, -1.2014061212539673e-07, -1.0989606380462646e-07, -9.96515154838562e-08, -8.940696716308594e-08, -7.916241884231567e-08, -6.891787052154541e-08, -5.8673322200775146e-08, -4.842877388000488e-08, -3.818422555923462e-08, -2.7939677238464355e-08, -1.7695128917694092e-08, -7.450580596923828e-09, 2.7939677238464355e-09, 1.30385160446167e-08, 2.3283064365386963e-08, 3.3527612686157227e-08, 4.377216100692749e-08, 5.4016709327697754e-08, 6.426125764846802e-08, 7.450580596923828e-08, 8.475035429000854e-08, 9.499490261077881e-08, 1.0523945093154907e-07, 1.1548399925231934e-07, 1.257285475730896e-07, 1.3597309589385986e-07, 1.4621764421463013e-07, 1.564621925354004e-07, 1.6670674085617065e-07, 1.7695128917694092e-07, 1.8719583749771118e-07, 1.9744038581848145e-07, 2.076849341392517e-07, 2.1792948246002197e-07, 2.2817403078079224e-07, 2.384185791015625e-07]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 13.0, 0.0, 14.0, 0.0, 16.0, 0.0, 24.0, 87.0, 0.0, 118.0, 0.0, 216.0, 0.0, 443.0, 1568.0, 0.0, 3903.0, 0.0, 13515.0, 58859.0, 0.0, 890759.0, 0.0, 59486.0, 0.0, 13229.0, 3749.0, 0.0, 1587.0, 0.0, 473.0, 0.0, 237.0, 135.0, 0.0, 80.0, 0.0, 19.0, 22.0, 0.0, 4.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-07, -9.192153811454773e-07, -8.847564458847046e-07, -8.502975106239319e-07, -8.158385753631592e-07, -7.813796401023865e-07, -7.469207048416138e-07, -7.124617695808411e-07, -6.780028343200684e-07, -6.435438990592957e-07, -6.09084963798523e-07, -5.746260285377502e-07, -5.401670932769775e-07, -5.057081580162048e-07, -4.7124922275543213e-07, -4.367902874946594e-07, -4.023313522338867e-07, -3.67872416973114e-07, -3.334134817123413e-07, -2.989545464515686e-07, -2.644956111907959e-07, -2.300366759300232e-07, -1.955777406692505e-07, -1.6111880540847778e-07, -1.2665987014770508e-07, -9.220093488693237e-08, -5.774199962615967e-08, -2.3283064365386963e-08, 1.1175870895385742e-08, 4.563480615615845e-08, 8.009374141693115e-08, 1.1455267667770386e-07, 1.4901161193847656e-07, 1.8347054719924927e-07, 2.1792948246002197e-07, 2.523884177207947e-07, 2.868473529815674e-07, 3.213062882423401e-07, 3.557652235031128e-07, 3.902241587638855e-07, 4.246830940246582e-07, 4.591420292854309e-07, 4.936009645462036e-07, 5.280598998069763e-07, 5.62518835067749e-07, 5.969777703285217e-07, 6.314367055892944e-07, 6.658956408500671e-07, 7.003545761108398e-07, 7.348135113716125e-07, 7.692724466323853e-07, 8.03731381893158e-07, 8.381903171539307e-07, 8.726492524147034e-07, 9.071081876754761e-07, 9.415671229362488e-07, 9.760260581970215e-07, 1.0104849934577942e-06, 1.044943928718567e-06, 1.0794028639793396e-06, 1.1138617992401123e-06, 1.148320734500885e-06, 1.1827796697616577e-06, 1.2172386050224304e-06, 1.2516975402832031e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 114.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 762.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.980232238769531e-07, -2.896413207054138e-07, -2.812594175338745e-07, -2.728775143623352e-07, -2.644956111907959e-07, -2.561137080192566e-07, -2.477318048477173e-07, -2.39349901676178e-07, -2.3096799850463867e-07, -2.2258609533309937e-07, -2.1420419216156006e-07, -2.0582228899002075e-07, -1.9744038581848145e-07, -1.8905848264694214e-07, -1.8067657947540283e-07, -1.7229467630386353e-07, -1.6391277313232422e-07, -1.555308699607849e-07, -1.471489667892456e-07, -1.387670636177063e-07, -1.30385160446167e-07, -1.2200325727462769e-07, -1.1362135410308838e-07, -1.0523945093154907e-07, -9.685754776000977e-08, -8.847564458847046e-08, -8.009374141693115e-08, -7.171183824539185e-08, -6.332993507385254e-08, -5.494803190231323e-08, -4.6566128730773926e-08, -3.818422555923462e-08, -2.9802322387695312e-08, -2.1420419216156006e-08, -1.30385160446167e-08, -4.6566128730773926e-09, 3.725290298461914e-09, 1.210719347000122e-08, 2.0489096641540527e-08, 2.8870999813079834e-08, 3.725290298461914e-08, 4.563480615615845e-08, 5.4016709327697754e-08, 6.239861249923706e-08, 7.078051567077637e-08, 7.916241884231567e-08, 8.754432201385498e-08, 9.592622518539429e-08, 1.043081283569336e-07, 1.126900315284729e-07, 1.210719347000122e-07, 1.2945383787155151e-07, 1.3783574104309082e-07, 1.4621764421463013e-07, 1.5459954738616943e-07, 1.6298145055770874e-07, 1.7136335372924805e-07, 1.7974525690078735e-07, 1.8812716007232666e-07, 1.9650906324386597e-07, 2.0489096641540527e-07, 2.1327286958694458e-07, 2.2165477275848389e-07, 2.300366759300232e-07, 2.384185791015625e-07]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 0.0, 7.0, 8.0, 15.0, 11.0, 25.0, 33.0, 48.0, 83.0, 123.0, 193.0, 180.0, 108.0, 52.0, 44.0, 28.0, 16.0, 9.0, 6.0, 9.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.160085568903014e-05, -2.014249548665248e-05, -1.868413710326422e-05, -1.722577871987596e-05, -1.57674185174983e-05, -1.430905922461534e-05, -1.2850699931732379e-05, -1.1392340638849419e-05, -9.933981345966458e-06, -8.475622053083498e-06, -7.017262760200538e-06, -5.5589034673175775e-06, -4.100544174434617e-06, -2.642184881551657e-06, -1.1838255886686966e-06, 2.745337042142637e-07, 1.732892997097224e-06, 3.1912522899801843e-06, 4.649611582863145e-06, 6.107970875746105e-06, 7.566330168629065e-06, 9.024689461512025e-06, 1.0483048754394986e-05, 1.1941408047277946e-05, 1.3399767340160906e-05, 1.4858126633043867e-05, 1.6316485925926827e-05, 1.7774844309315085e-05, 1.9233204511692747e-05, 2.069156471407041e-05, 2.2149923097458668e-05, 2.3608281480846927e-05, 2.506664168322459e-05, 2.652500188560225e-05, 2.798336026899051e-05, 2.9441718652378768e-05, 3.090007885475643e-05, 3.235843905713409e-05, 3.381679562153295e-05, 3.527515582391061e-05, 3.673351602628827e-05, 3.819187622866593e-05, 3.9650236431043595e-05, 4.110859299544245e-05, 4.256695319782011e-05, 4.4025313400197774e-05, 4.548366996459663e-05, 4.694203016697429e-05, 4.840039036935195e-05, 4.9858750571729615e-05, 5.131711077410728e-05, 5.277546733850613e-05, 5.4233827540883794e-05, 5.5692187743261456e-05, 5.715054430766031e-05, 5.8608904510037974e-05, 6.0067264712415636e-05, 6.152562127681449e-05, 6.298398511717096e-05, 6.444234168156981e-05, 6.590070552192628e-05, 6.735906208632514e-05, 6.8817418650724e-05, 7.027578249108046e-05, 7.173413905547932e-05]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 8.0, 7.0, 12.0, 8.0, 5.0, 14.0, 19.0, 21.0, 33.0, 23.0, 30.0, 38.0, 31.0, 52.0, 40.0, 38.0, 48.0, 51.0, 47.0, 40.0, 49.0, 42.0, 41.0, 47.0, 37.0, 35.0, 28.0, 35.0, 21.0, 19.0, 19.0, 11.0, 10.0, 13.0, 6.0, 8.0, 1.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.268833850394003e-05, -2.2040394469513558e-05, -2.139244861609768e-05, -2.0744504581671208e-05, -2.009655872825533e-05, -1.944861469382886e-05, -1.8800670659402385e-05, -1.815272480598651e-05, -1.7504778952570632e-05, -1.685683491814416e-05, -1.6208889064728282e-05, -1.556094503030181e-05, -1.4912999176885933e-05, -1.426505514245946e-05, -1.3617110198538285e-05, -1.296916525461711e-05, -1.2321221220190637e-05, -1.1673276276269462e-05, -1.1025331332348287e-05, -1.0377387297921814e-05, -9.729441444505937e-06, -9.081497410079464e-06, -8.43355246615829e-06, -7.785607522237115e-06, -7.13766257831594e-06, -6.489717634394765e-06, -5.84177269047359e-06, -5.193828201299766e-06, -4.545883257378591e-06, -3.897938313457416e-06, -3.2499938242835924e-06, -2.6020488803624175e-06, -1.954102117451839e-06, -1.306157287217502e-06, -6.582124569831649e-07, -1.0267740435665473e-08, 6.376772034855094e-07, 1.2856221474066842e-06, 1.933566636580508e-06, 2.581511580501683e-06, 3.229456524422858e-06, 3.877401468344033e-06, 4.525346412265208e-06, 5.173290901439032e-06, 5.8212358453602064e-06, 6.469180789281381e-06, 7.117125278455205e-06, 7.76507022237638e-06, 8.413015166297555e-06, 9.06096011021873e-06, 9.708905054139905e-06, 1.0356849088566378e-05, 1.1004794941982254e-05, 1.1652738976408727e-05, 1.2300683920329902e-05, 1.2948628864251077e-05, 1.3596573808172252e-05, 1.4244518752093427e-05, 1.4892463696014602e-05, 1.5540408639935777e-05, 1.618835267436225e-05, 1.6836298527778126e-05, 1.74842425622046e-05, 1.8132188415620476e-05, 1.878013245004695e-05]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 3.0, 9.0, 18.0, 8.0, 20.0, 31.0, 33.0, 45.0, 48.0, 80.0, 92.0, 150.0, 166.0, 261.0, 359.0, 529.0, 812.0, 1241.0, 1884.0, 4758.0, 66659.0, 3962064.0, 140574.0, 7839.0, 2397.0, 1391.0, 855.0, 622.0, 381.0, 242.0, 213.0, 125.0, 89.0, 57.0, 49.0, 48.0, 20.0, 25.0, 18.0, 11.0, 12.0, 7.0, 7.0, 3.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.0187110900878906e-05, -4.864763468503952e-05, -4.7108158469200134e-05, -4.556868225336075e-05, -4.402920603752136e-05, -4.2489729821681976e-05, -4.095025360584259e-05, -3.9410777390003204e-05, -3.787130117416382e-05, -3.633182495832443e-05, -3.4792348742485046e-05, -3.325287252664566e-05, -3.1713396310806274e-05, -3.017392009496689e-05, -2.8634443879127502e-05, -2.7094967663288116e-05, -2.555549144744873e-05, -2.4016015231609344e-05, -2.247653901576996e-05, -2.0937062799930573e-05, -1.9397586584091187e-05, -1.78581103682518e-05, -1.6318634152412415e-05, -1.4779157936573029e-05, -1.3239681720733643e-05, -1.1700205504894257e-05, -1.016072928905487e-05, -8.621253073215485e-06, -7.081776857376099e-06, -5.542300641536713e-06, -4.002824425697327e-06, -2.4633482098579407e-06, -9.238719940185547e-07, 6.156042218208313e-07, 2.1550804376602173e-06, 3.6945566534996033e-06, 5.234032869338989e-06, 6.773509085178375e-06, 8.312985301017761e-06, 9.852461516857147e-06, 1.1391937732696533e-05, 1.293141394853592e-05, 1.4470890164375305e-05, 1.601036638021469e-05, 1.7549842596054077e-05, 1.9089318811893463e-05, 2.062879502773285e-05, 2.2168271243572235e-05, 2.370774745941162e-05, 2.5247223675251007e-05, 2.6786699891090393e-05, 2.832617610692978e-05, 2.9865652322769165e-05, 3.140512853860855e-05, 3.294460475444794e-05, 3.448408097028732e-05, 3.602355718612671e-05, 3.7563033401966095e-05, 3.910250961780548e-05, 4.064198583364487e-05, 4.218146204948425e-05, 4.372093826532364e-05, 4.5260414481163025e-05, 4.679989069700241e-05, 4.83393669128418e-05]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 14.0, 6.0, 11.0, 13.0, 5.0, 26.0, 18.0, 27.0, 24.0, 28.0, 31.0, 54.0, 43.0, 32.0, 40.0, 53.0, 57.0, 43.0, 36.0, 58.0, 47.0, 41.0, 46.0, 34.0, 32.0, 31.0, 34.0, 27.0, 14.0, 10.0, 12.0, 5.0, 10.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9848346710205078e-05, -1.9244849681854248e-05, -1.8641352653503418e-05, -1.8037855625152588e-05, -1.7434358596801758e-05, -1.6830861568450928e-05, -1.6227364540100098e-05, -1.5623867511749268e-05, -1.5020370483398438e-05, -1.4416873455047607e-05, -1.3813376426696777e-05, -1.3209879398345947e-05, -1.2606382369995117e-05, -1.2002885341644287e-05, -1.1399388313293457e-05, -1.0795891284942627e-05, -1.0192394256591797e-05, -9.588897228240967e-06, -8.985400199890137e-06, -8.381903171539307e-06, -7.778406143188477e-06, -7.1749091148376465e-06, -6.571412086486816e-06, -5.967915058135986e-06, -5.364418029785156e-06, -4.760921001434326e-06, -4.157423973083496e-06, -3.553926944732666e-06, -2.950429916381836e-06, -2.346932888031006e-06, -1.7434358596801758e-06, -1.1399388313293457e-06, -5.364418029785156e-07, 6.705522537231445e-08, 6.705522537231445e-07, 1.2740492820739746e-06, 1.8775463104248047e-06, 2.4810433387756348e-06, 3.084540367126465e-06, 3.688037395477295e-06, 4.291534423828125e-06, 4.895031452178955e-06, 5.498528480529785e-06, 6.102025508880615e-06, 6.705522537231445e-06, 7.309019565582275e-06, 7.912516593933105e-06, 8.516013622283936e-06, 9.119510650634766e-06, 9.723007678985596e-06, 1.0326504707336426e-05, 1.0930001735687256e-05, 1.1533498764038086e-05, 1.2136995792388916e-05, 1.2740492820739746e-05, 1.3343989849090576e-05, 1.3947486877441406e-05, 1.4550983905792236e-05, 1.5154480934143066e-05, 1.5757977962493896e-05, 1.6361474990844727e-05, 1.6964972019195557e-05, 1.7568469047546387e-05, 1.8171966075897217e-05, 1.8775463104248047e-05]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 15.0, 28.0, 44.0, 53.0, 101.0, 175.0, 322.0, 596.0, 1209.0, 2706.0, 8153.0, 121232.0, 4028339.0, 22783.0, 4687.0, 1917.0, 858.0, 466.0, 218.0, 135.0, 74.0, 50.0, 36.0, 16.0, 12.0, 12.0, 9.0, 4.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.34600830078125e-05, -9.073317050933838e-05, -8.800625801086426e-05, -8.527934551239014e-05, -8.255243301391602e-05, -7.98255205154419e-05, -7.709860801696777e-05, -7.437169551849365e-05, -7.164478302001953e-05, -6.891787052154541e-05, -6.619095802307129e-05, -6.346404552459717e-05, -6.073713302612305e-05, -5.8010220527648926e-05, -5.5283308029174805e-05, -5.2556395530700684e-05, -4.982948303222656e-05, -4.710257053375244e-05, -4.437565803527832e-05, -4.16487455368042e-05, -3.892183303833008e-05, -3.619492053985596e-05, -3.3468008041381836e-05, -3.0741095542907715e-05, -2.8014183044433594e-05, -2.5287270545959473e-05, -2.256035804748535e-05, -1.983344554901123e-05, -1.710653305053711e-05, -1.4379620552062988e-05, -1.1652708053588867e-05, -8.925795555114746e-06, -6.198883056640625e-06, -3.471970558166504e-06, -7.450580596923828e-07, 1.9818544387817383e-06, 4.708766937255859e-06, 7.4356794357299805e-06, 1.0162591934204102e-05, 1.2889504432678223e-05, 1.5616416931152344e-05, 1.8343329429626465e-05, 2.1070241928100586e-05, 2.3797154426574707e-05, 2.6524066925048828e-05, 2.925097942352295e-05, 3.197789192199707e-05, 3.470480442047119e-05, 3.743171691894531e-05, 4.0158629417419434e-05, 4.2885541915893555e-05, 4.5612454414367676e-05, 4.83393669128418e-05, 5.106627941131592e-05, 5.379319190979004e-05, 5.652010440826416e-05, 5.924701690673828e-05, 6.19739294052124e-05, 6.470084190368652e-05, 6.742775440216064e-05, 7.015466690063477e-05, 7.288157939910889e-05, 7.560849189758301e-05, 7.833540439605713e-05, 8.106231689453125e-05]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 6.0, 8.0, 4.0, 13.0, 23.0, 66.0, 246.0, 867.0, 2451.0, 237.0, 85.0, 29.0, 15.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6391277313232422e-05, -1.599173992872238e-05, -1.559220254421234e-05, -1.5192665159702301e-05, -1.479312777519226e-05, -1.439359039068222e-05, -1.399405300617218e-05, -1.359451562166214e-05, -1.31949782371521e-05, -1.279544085264206e-05, -1.2395903468132019e-05, -1.1996366083621979e-05, -1.1596828699111938e-05, -1.1197291314601898e-05, -1.0797753930091858e-05, -1.0398216545581818e-05, -9.998679161071777e-06, -9.599141776561737e-06, -9.199604392051697e-06, -8.800067007541656e-06, -8.400529623031616e-06, -8.000992238521576e-06, -7.601454854011536e-06, -7.201917469501495e-06, -6.802380084991455e-06, -6.402842700481415e-06, -6.0033053159713745e-06, -5.603767931461334e-06, -5.204230546951294e-06, -4.804693162441254e-06, -4.405155777931213e-06, -4.005618393421173e-06, -3.606081008911133e-06, -3.2065436244010925e-06, -2.8070062398910522e-06, -2.407468855381012e-06, -2.0079314708709717e-06, -1.6083940863609314e-06, -1.2088567018508911e-06, -8.093193173408508e-07, -4.0978193283081055e-07, -1.0244548320770264e-08, 3.8929283618927e-07, 7.888302206993103e-07, 1.1883676052093506e-06, 1.5879049897193909e-06, 1.987442374229431e-06, 2.3869797587394714e-06, 2.7865171432495117e-06, 3.186054527759552e-06, 3.5855919122695923e-06, 3.9851292967796326e-06, 4.384666681289673e-06, 4.784204065799713e-06, 5.183741450309753e-06, 5.583278834819794e-06, 5.982816219329834e-06, 6.382353603839874e-06, 6.7818909883499146e-06, 7.181428372859955e-06, 7.580965757369995e-06, 7.980503141880035e-06, 8.380040526390076e-06, 8.779577910900116e-06, 9.179115295410156e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 7.0, 9.0, 17.0, 23.0, 24.0, 25.0, 40.0, 63.0, 86.0, 150.0, 163.0, 133.0, 74.0, 58.0, 45.0, 20.0, 14.0, 18.0, 3.0, 7.0, 4.0, 7.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5133835151791573e-05, -2.4011516870814376e-05, -2.2889196770847775e-05, -2.1766878489870578e-05, -2.0644558389903978e-05, -1.952224010892678e-05, -1.8399921827949584e-05, -1.7277601727982983e-05, -1.6155283447005786e-05, -1.5032964256533887e-05, -1.3910645066061988e-05, -1.2788326785084791e-05, -1.1666007594612893e-05, -1.0543688404140994e-05, -9.421370123163797e-06, -8.299050932691898e-06, -7.1767317422199994e-06, -6.054412551748101e-06, -4.932093816023553e-06, -3.8097748529253295e-06, -2.687455889827106e-06, -1.5651366993552074e-06, -4.428179636306595e-07, 6.795007720938884e-07, 1.8018199625657871e-06, 2.9241389256640105e-06, 4.046457888762234e-06, 5.168776624486782e-06, 6.29109581495868e-06, 7.413415005430579e-06, 8.535733286407776e-06, 9.658052476879675e-06, 1.0780368029372767e-05, 1.1902687219844665e-05, 1.3025006410316564e-05, 1.4147324691293761e-05, 1.526964479126036e-05, 1.639196307223756e-05, 1.7514281353214756e-05, 1.8636601453181356e-05, 1.9758919734158553e-05, 2.088123801513575e-05, 2.200355811510235e-05, 2.3125876396079548e-05, 2.4248194677056745e-05, 2.5370514777023345e-05, 2.6492833058000542e-05, 2.761515133897774e-05, 2.873747143894434e-05, 2.9859789719921537e-05, 3.0982108000898734e-05, 3.2104428100865334e-05, 3.3226748200831935e-05, 3.4349068300798535e-05, 3.547138476278633e-05, 3.659370486275293e-05, 3.771602496271953e-05, 3.883834506268613e-05, 3.9960661524673924e-05, 4.1082981624640524e-05, 4.2205301724607125e-05, 4.3327621824573725e-05, 4.444993828656152e-05, 4.557225838652812e-05, 4.669457484851591e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 7.0, 6.0, 7.0, 11.0, 8.0, 10.0, 19.0, 16.0, 15.0, 28.0, 31.0, 24.0, 30.0, 33.0, 28.0, 36.0, 38.0, 41.0, 44.0, 38.0, 54.0, 37.0, 49.0, 36.0, 35.0, 45.0, 31.0, 40.0, 32.0, 32.0, 28.0, 17.0, 13.0, 13.0, 16.0, 10.0, 9.0, 13.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8686945622903295e-05, -1.81367158802459e-05, -1.758648613758851e-05, -1.7036256394931115e-05, -1.648602483328432e-05, -1.5935795090626925e-05, -1.5385565347969532e-05, -1.4835335605312139e-05, -1.4285105862654746e-05, -1.3734876119997352e-05, -1.3184646377339959e-05, -1.2634415725187864e-05, -1.2084185982530471e-05, -1.1533956239873078e-05, -1.0983725587720983e-05, -1.043349584506359e-05, -9.883266102406196e-06, -9.333036359748803e-06, -8.78280661709141e-06, -8.232575964939315e-06, -7.682346222281922e-06, -7.1321164796245284e-06, -6.581886282219784e-06, -6.03165608481504e-06, -5.481426342157647e-06, -4.931196599500254e-06, -4.38096640209551e-06, -3.830736204690766e-06, -3.2805064620333724e-06, -2.7302764920023037e-06, -2.180046521971235e-06, -1.629816324566491e-06, -1.0795847629196942e-06, -5.293547928886255e-07, 2.0875177142443135e-08, 5.711051471735118e-07, 1.1213351172045805e-06, 1.6715650872356491e-06, 2.2217950572667178e-06, 2.772025254671462e-06, 3.322254997328855e-06, 3.872484739986248e-06, 4.422714937390992e-06, 4.9729451347957365e-06, 5.52317487745313e-06, 6.073404620110523e-06, 6.623634817515267e-06, 7.173865014920011e-06, 7.724094757577404e-06, 8.274324500234798e-06, 8.82455424289219e-06, 9.374784895044286e-06, 9.925014637701679e-06, 1.0475244380359072e-05, 1.1025475032511167e-05, 1.157570477516856e-05, 1.2125934517825954e-05, 1.2676164260483347e-05, 1.322639400314074e-05, 1.3776624655292835e-05, 1.4326854397950228e-05, 1.4877084140607622e-05, 1.5427314792759717e-05, 1.597754453541711e-05, 1.6527774278074503e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 7.0, 12.0, 9.0, 19.0, 29.0, 39.0, 60.0, 81.0, 102.0, 131.0, 158.0, 304.0, 443.0, 557.0, 942.0, 1334.0, 1763.0, 3007.0, 4747.0, 6906.0, 12359.0, 21258.0, 33860.0, 69948.0, 153780.0, 356152.0, 184967.0, 89328.0, 44593.0, 23029.0, 14662.0, 8635.0, 5003.0, 3438.0, 2223.0, 1395.0, 1045.0, 711.0, 424.0, 309.0, 231.0, 167.0, 119.0, 69.0, 70.0, 39.0, 26.0, 16.0, 11.0, 20.0, 10.0, 4.0, 4.0, 5.0, 3.0], "bins": [-2.4139881134033203e-05, -2.3443251848220825e-05, -2.2746622562408447e-05, -2.204999327659607e-05, -2.135336399078369e-05, -2.0656734704971313e-05, -1.9960105419158936e-05, -1.9263476133346558e-05, -1.856684684753418e-05, -1.7870217561721802e-05, -1.7173588275909424e-05, -1.6476958990097046e-05, -1.5780329704284668e-05, -1.508370041847229e-05, -1.4387071132659912e-05, -1.3690441846847534e-05, -1.2993812561035156e-05, -1.2297183275222778e-05, -1.16005539894104e-05, -1.0903924703598022e-05, -1.0207295417785645e-05, -9.510666131973267e-06, -8.814036846160889e-06, -8.11740756034851e-06, -7.420778274536133e-06, -6.724148988723755e-06, -6.027519702911377e-06, -5.330890417098999e-06, -4.634261131286621e-06, -3.937631845474243e-06, -3.2410025596618652e-06, -2.5443732738494873e-06, -1.8477439880371094e-06, -1.1511147022247314e-06, -4.544854164123535e-07, 2.421438694000244e-07, 9.387731552124023e-07, 1.6354024410247803e-06, 2.332031726837158e-06, 3.028661012649536e-06, 3.725290298461914e-06, 4.421919584274292e-06, 5.11854887008667e-06, 5.815178155899048e-06, 6.511807441711426e-06, 7.208436727523804e-06, 7.905066013336182e-06, 8.60169529914856e-06, 9.298324584960938e-06, 9.994953870773315e-06, 1.0691583156585693e-05, 1.1388212442398071e-05, 1.208484172821045e-05, 1.2781471014022827e-05, 1.3478100299835205e-05, 1.4174729585647583e-05, 1.4871358871459961e-05, 1.556798815727234e-05, 1.6264617443084717e-05, 1.6961246728897095e-05, 1.7657876014709473e-05, 1.835450530052185e-05, 1.905113458633423e-05, 1.9747763872146606e-05, 2.0444393157958984e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 9.0, 2.0, 8.0, 13.0, 18.0, 15.0, 17.0, 23.0, 21.0, 27.0, 29.0, 28.0, 27.0, 43.0, 39.0, 42.0, 54.0, 46.0, 49.0, 48.0, 48.0, 37.0, 37.0, 49.0, 30.0, 43.0, 25.0, 34.0, 23.0, 24.0, 12.0, 14.0, 9.0, 12.0, 9.0, 8.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.0742416381835938e-05, -2.0153820514678955e-05, -1.9565224647521973e-05, -1.897662878036499e-05, -1.8388032913208008e-05, -1.7799437046051025e-05, -1.7210841178894043e-05, -1.662224531173706e-05, -1.6033649444580078e-05, -1.5445053577423096e-05, -1.4856457710266113e-05, -1.4267861843109131e-05, -1.3679265975952148e-05, -1.3090670108795166e-05, -1.2502074241638184e-05, -1.1913478374481201e-05, -1.1324882507324219e-05, -1.0736286640167236e-05, -1.0147690773010254e-05, -9.559094905853271e-06, -8.970499038696289e-06, -8.381903171539307e-06, -7.793307304382324e-06, -7.204711437225342e-06, -6.616115570068359e-06, -6.027519702911377e-06, -5.4389238357543945e-06, -4.850327968597412e-06, -4.26173210144043e-06, -3.6731362342834473e-06, -3.084540367126465e-06, -2.4959444999694824e-06, -1.9073486328125e-06, -1.3187527656555176e-06, -7.301568984985352e-07, -1.4156103134155273e-07, 4.470348358154297e-07, 1.0356307029724121e-06, 1.6242265701293945e-06, 2.212822437286377e-06, 2.8014183044433594e-06, 3.390014171600342e-06, 3.978610038757324e-06, 4.567205905914307e-06, 5.155801773071289e-06, 5.7443976402282715e-06, 6.332993507385254e-06, 6.921589374542236e-06, 7.510185241699219e-06, 8.098781108856201e-06, 8.687376976013184e-06, 9.275972843170166e-06, 9.864568710327148e-06, 1.0453164577484131e-05, 1.1041760444641113e-05, 1.1630356311798096e-05, 1.2218952178955078e-05, 1.280754804611206e-05, 1.3396143913269043e-05, 1.3984739780426025e-05, 1.4573335647583008e-05, 1.516193151473999e-05, 1.5750527381896973e-05, 1.6339123249053955e-05, 1.6927719116210938e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 5.0, 16.0, 15.0, 19.0, 32.0, 54.0, 49.0, 89.0, 122.0, 191.0, 279.0, 371.0, 628.0, 871.0, 1419.0, 2458.0, 4324.0, 8119.0, 16172.0, 36697.0, 103035.0, 562982.0, 204908.0, 56941.0, 23421.0, 11018.0, 5786.0, 3251.0, 1820.0, 1146.0, 726.0, 488.0, 323.0, 241.0, 154.0, 93.0, 82.0, 57.0, 39.0, 30.0, 21.0, 14.0, 12.0, 10.0, 11.0, 2.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9087066650390625e-05, -2.80747190117836e-05, -2.7062371373176575e-05, -2.605002373456955e-05, -2.5037676095962524e-05, -2.40253284573555e-05, -2.3012980818748474e-05, -2.200063318014145e-05, -2.0988285541534424e-05, -1.99759379029274e-05, -1.8963590264320374e-05, -1.795124262571335e-05, -1.6938894987106323e-05, -1.5926547348499298e-05, -1.4914199709892273e-05, -1.3901852071285248e-05, -1.2889504432678223e-05, -1.1877156794071198e-05, -1.0864809155464172e-05, -9.852461516857147e-06, -8.840113878250122e-06, -7.827766239643097e-06, -6.815418601036072e-06, -5.803070962429047e-06, -4.7907233238220215e-06, -3.7783756852149963e-06, -2.766028046607971e-06, -1.753680408000946e-06, -7.413327693939209e-07, 2.7101486921310425e-07, 1.2833625078201294e-06, 2.2957101464271545e-06, 3.3080577850341797e-06, 4.320405423641205e-06, 5.33275306224823e-06, 6.345100700855255e-06, 7.35744833946228e-06, 8.369795978069305e-06, 9.38214361667633e-06, 1.0394491255283356e-05, 1.1406838893890381e-05, 1.2419186532497406e-05, 1.3431534171104431e-05, 1.4443881809711456e-05, 1.545622944831848e-05, 1.6468577086925507e-05, 1.7480924725532532e-05, 1.8493272364139557e-05, 1.9505620002746582e-05, 2.0517967641353607e-05, 2.1530315279960632e-05, 2.2542662918567657e-05, 2.3555010557174683e-05, 2.4567358195781708e-05, 2.5579705834388733e-05, 2.6592053472995758e-05, 2.7604401111602783e-05, 2.861674875020981e-05, 2.9629096388816833e-05, 3.064144402742386e-05, 3.1653791666030884e-05, 3.266613930463791e-05, 3.3678486943244934e-05, 3.469083458185196e-05, 3.5703182220458984e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 1.0, 4.0, 5.0, 8.0, 8.0, 10.0, 19.0, 15.0, 21.0, 34.0, 37.0, 31.0, 25.0, 37.0, 37.0, 38.0, 46.0, 43.0, 74.0, 70.0, 54.0, 41.0, 40.0, 36.0, 39.0, 29.0, 48.0, 40.0, 23.0, 22.0, 19.0, 12.0, 13.0, 3.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2278556823730469e-05, -1.1881813406944275e-05, -1.1485069990158081e-05, -1.1088326573371887e-05, -1.0691583156585693e-05, -1.02948397397995e-05, -9.898096323013306e-06, -9.501352906227112e-06, -9.104609489440918e-06, -8.707866072654724e-06, -8.31112265586853e-06, -7.914379239082336e-06, -7.517635822296143e-06, -7.120892405509949e-06, -6.724148988723755e-06, -6.327405571937561e-06, -5.930662155151367e-06, -5.533918738365173e-06, -5.1371753215789795e-06, -4.740431904792786e-06, -4.343688488006592e-06, -3.946945071220398e-06, -3.550201654434204e-06, -3.1534582376480103e-06, -2.7567148208618164e-06, -2.3599714040756226e-06, -1.9632279872894287e-06, -1.5664845705032349e-06, -1.169741153717041e-06, -7.729977369308472e-07, -3.762543201446533e-07, 2.0489096641540527e-08, 4.172325134277344e-07, 8.139759302139282e-07, 1.210719347000122e-06, 1.607462763786316e-06, 2.0042061805725098e-06, 2.4009495973587036e-06, 2.7976930141448975e-06, 3.1944364309310913e-06, 3.591179847717285e-06, 3.987923264503479e-06, 4.384666681289673e-06, 4.781410098075867e-06, 5.1781535148620605e-06, 5.574896931648254e-06, 5.971640348434448e-06, 6.368383765220642e-06, 6.765127182006836e-06, 7.16187059879303e-06, 7.558614015579224e-06, 7.955357432365417e-06, 8.352100849151611e-06, 8.748844265937805e-06, 9.145587682723999e-06, 9.542331099510193e-06, 9.939074516296387e-06, 1.033581793308258e-05, 1.0732561349868774e-05, 1.1129304766654968e-05, 1.1526048183441162e-05, 1.1922791600227356e-05, 1.231953501701355e-05, 1.2716278433799744e-05, 1.3113021850585938e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 11.0, 7.0, 11.0, 12.0, 15.0, 20.0, 34.0, 57.0, 65.0, 80.0, 90.0, 118.0, 210.0, 285.0, 420.0, 597.0, 1007.0, 1644.0, 2732.0, 5689.0, 15289.0, 60873.0, 870459.0, 60512.0, 15272.0, 5527.0, 2785.0, 1707.0, 952.0, 601.0, 459.0, 267.0, 214.0, 148.0, 104.0, 69.0, 34.0, 48.0, 26.0, 22.0, 21.0, 9.0, 11.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0], "bins": [-1.6868114471435547e-05, -1.6314908862113953e-05, -1.576170325279236e-05, -1.5208497643470764e-05, -1.465529203414917e-05, -1.4102086424827576e-05, -1.3548880815505981e-05, -1.2995675206184387e-05, -1.2442469596862793e-05, -1.1889263987541199e-05, -1.1336058378219604e-05, -1.078285276889801e-05, -1.0229647159576416e-05, -9.676441550254822e-06, -9.123235940933228e-06, -8.570030331611633e-06, -8.016824722290039e-06, -7.463619112968445e-06, -6.910413503646851e-06, -6.357207894325256e-06, -5.804002285003662e-06, -5.250796675682068e-06, -4.697591066360474e-06, -4.144385457038879e-06, -3.591179847717285e-06, -3.037974238395691e-06, -2.4847686290740967e-06, -1.9315630197525024e-06, -1.3783574104309082e-06, -8.25151801109314e-07, -2.7194619178771973e-07, 2.812594175338745e-07, 8.344650268554688e-07, 1.387670636177063e-06, 1.9408762454986572e-06, 2.4940818548202515e-06, 3.0472874641418457e-06, 3.60049307346344e-06, 4.153698682785034e-06, 4.706904292106628e-06, 5.260109901428223e-06, 5.813315510749817e-06, 6.366521120071411e-06, 6.919726729393005e-06, 7.4729323387146e-06, 8.026137948036194e-06, 8.579343557357788e-06, 9.132549166679382e-06, 9.685754776000977e-06, 1.023896038532257e-05, 1.0792165994644165e-05, 1.134537160396576e-05, 1.1898577213287354e-05, 1.2451782822608948e-05, 1.3004988431930542e-05, 1.3558194041252136e-05, 1.411139965057373e-05, 1.4664605259895325e-05, 1.5217810869216919e-05, 1.5771016478538513e-05, 1.6324222087860107e-05, 1.68774276971817e-05, 1.7430633306503296e-05, 1.798383891582489e-05, 1.8537044525146484e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 7.0, 0.0, 5.0, 13.0, 0.0, 12.0, 0.0, 18.0, 0.0, 30.0, 0.0, 20.0, 0.0, 39.0, 67.0, 0.0, 84.0, 0.0, 107.0, 0.0, 238.0, 0.0, 90.0, 0.0, 74.0, 58.0, 0.0, 32.0, 0.0, 25.0, 0.0, 24.0, 0.0, 16.0, 0.0, 18.0, 7.0, 0.0, 12.0, 0.0, 6.0, 0.0, 8.0, 0.0, 2.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2191012501716614e-06, -1.1865049600601196e-06, -1.1539086699485779e-06, -1.1213123798370361e-06, -1.0887160897254944e-06, -1.0561197996139526e-06, -1.0235235095024109e-06, -9.909272193908691e-07, -9.583309292793274e-07, -9.257346391677856e-07, -8.931383490562439e-07, -8.605420589447021e-07, -8.279457688331604e-07, -7.953494787216187e-07, -7.627531886100769e-07, -7.301568984985352e-07, -6.975606083869934e-07, -6.649643182754517e-07, -6.323680281639099e-07, -5.997717380523682e-07, -5.671754479408264e-07, -5.345791578292847e-07, -5.019828677177429e-07, -4.6938657760620117e-07, -4.367902874946594e-07, -4.041939973831177e-07, -3.7159770727157593e-07, -3.390014171600342e-07, -3.0640512704849243e-07, -2.738088369369507e-07, -2.4121254682540894e-07, -2.086162567138672e-07, -1.7601996660232544e-07, -1.434236764907837e-07, -1.1082738637924194e-07, -7.82310962677002e-08, -4.563480615615845e-08, -1.30385160446167e-08, 1.955777406692505e-08, 5.21540641784668e-08, 8.475035429000854e-08, 1.1734664440155029e-07, 1.4994293451309204e-07, 1.825392246246338e-07, 2.1513551473617554e-07, 2.477318048477173e-07, 2.8032809495925903e-07, 3.129243850708008e-07, 3.4552067518234253e-07, 3.781169652938843e-07, 4.10713255405426e-07, 4.4330954551696777e-07, 4.759058356285095e-07, 5.085021257400513e-07, 5.41098415851593e-07, 5.736947059631348e-07, 6.062909960746765e-07, 6.388872861862183e-07, 6.7148357629776e-07, 7.040798664093018e-07, 7.366761565208435e-07, 7.692724466323853e-07, 8.01868736743927e-07, 8.344650268554688e-07]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 4.0, 8.0, 8.0, 9.0, 16.0, 23.0, 34.0, 55.0, 82.0, 131.0, 177.0, 330.0, 648.0, 1253.0, 2131.0, 4575.0, 9672.0, 30253.0, 220742.0, 711299.0, 43500.0, 12221.0, 5472.0, 2631.0, 1448.0, 768.0, 415.0, 242.0, 135.0, 95.0, 57.0, 45.0, 24.0, 15.0, 7.0, 5.0, 7.0, 2.0, 7.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.294778823852539e-05, -2.2275373339653015e-05, -2.160295844078064e-05, -2.0930543541908264e-05, -2.025812864303589e-05, -1.9585713744163513e-05, -1.8913298845291138e-05, -1.8240883946418762e-05, -1.7568469047546387e-05, -1.689605414867401e-05, -1.6223639249801636e-05, -1.555122435092926e-05, -1.4878809452056885e-05, -1.420639455318451e-05, -1.3533979654312134e-05, -1.2861564755439758e-05, -1.2189149856567383e-05, -1.1516734957695007e-05, -1.0844320058822632e-05, -1.0171905159950256e-05, -9.499490261077881e-06, -8.827075362205505e-06, -8.15466046333313e-06, -7.482245564460754e-06, -6.809830665588379e-06, -6.137415766716003e-06, -5.465000867843628e-06, -4.7925859689712524e-06, -4.120171070098877e-06, -3.4477561712265015e-06, -2.775341272354126e-06, -2.1029263734817505e-06, -1.430511474609375e-06, -7.580965757369995e-07, -8.568167686462402e-08, 5.867332220077515e-07, 1.259148120880127e-06, 1.9315630197525024e-06, 2.603977918624878e-06, 3.2763928174972534e-06, 3.948807716369629e-06, 4.621222615242004e-06, 5.29363751411438e-06, 5.966052412986755e-06, 6.638467311859131e-06, 7.310882210731506e-06, 7.983297109603882e-06, 8.655712008476257e-06, 9.328126907348633e-06, 1.0000541806221008e-05, 1.0672956705093384e-05, 1.134537160396576e-05, 1.2017786502838135e-05, 1.269020140171051e-05, 1.3362616300582886e-05, 1.4035031199455261e-05, 1.4707446098327637e-05, 1.5379860997200012e-05, 1.6052275896072388e-05, 1.6724690794944763e-05, 1.739710569381714e-05, 1.8069520592689514e-05, 1.874193549156189e-05, 1.9414350390434265e-05, 2.008676528930664e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 10.0, 5.0, 6.0, 8.0, 5.0, 12.0, 14.0, 17.0, 22.0, 44.0, 56.0, 56.0, 172.0, 267.0, 123.0, 44.0, 32.0, 18.0, 11.0, 17.0, 6.0, 6.0, 10.0, 6.0, 4.0, 3.0, 10.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0], "bins": [-4.112720489501953e-06, -4.001893103122711e-06, -3.891065716743469e-06, -3.7802383303642273e-06, -3.6694109439849854e-06, -3.5585835576057434e-06, -3.4477561712265015e-06, -3.3369287848472595e-06, -3.2261013984680176e-06, -3.1152740120887756e-06, -3.0044466257095337e-06, -2.8936192393302917e-06, -2.78279185295105e-06, -2.671964466571808e-06, -2.561137080192566e-06, -2.450309693813324e-06, -2.339482307434082e-06, -2.22865492105484e-06, -2.117827534675598e-06, -2.007000148296356e-06, -1.8961727619171143e-06, -1.7853453755378723e-06, -1.6745179891586304e-06, -1.5636906027793884e-06, -1.4528632164001465e-06, -1.3420358300209045e-06, -1.2312084436416626e-06, -1.1203810572624207e-06, -1.0095536708831787e-06, -8.987262845039368e-07, -7.878988981246948e-07, -6.770715117454529e-07, -5.662441253662109e-07, -4.55416738986969e-07, -3.4458935260772705e-07, -2.337619662284851e-07, -1.2293457984924316e-07, -1.210719347000122e-08, 9.872019290924072e-08, 2.0954757928848267e-07, 3.203749656677246e-07, 4.3120235204696655e-07, 5.420297384262085e-07, 6.528571248054504e-07, 7.636845111846924e-07, 8.745118975639343e-07, 9.853392839431763e-07, 1.0961666703224182e-06, 1.2069940567016602e-06, 1.317821443080902e-06, 1.428648829460144e-06, 1.539476215839386e-06, 1.650303602218628e-06, 1.7611309885978699e-06, 1.8719583749771118e-06, 1.9827857613563538e-06, 2.0936131477355957e-06, 2.2044405341148376e-06, 2.3152679204940796e-06, 2.4260953068733215e-06, 2.5369226932525635e-06, 2.6477500796318054e-06, 2.7585774660110474e-06, 2.8694048523902893e-06, 2.9802322387695312e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 10.0, 12.0, 11.0, 14.0, 17.0, 23.0, 34.0, 40.0, 51.0, 64.0, 103.0, 157.0, 137.0, 87.0, 61.0, 51.0, 30.0, 27.0, 17.0, 10.0, 10.0, 8.0, 5.0, 4.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2808990252087824e-05, -2.18875447899336e-05, -2.096610114676878e-05, -2.0044655684614554e-05, -1.912321022246033e-05, -1.820176657929551e-05, -1.7280321117141284e-05, -1.6358877473976463e-05, -1.543743201182224e-05, -1.4515987459162716e-05, -1.3594542906503193e-05, -1.2673097444348969e-05, -1.1751652891689446e-05, -1.0830208339029923e-05, -9.908762876875699e-06, -8.987318324216176e-06, -8.065873771556653e-06, -7.14442921889713e-06, -6.222984211490257e-06, -5.301539204083383e-06, -4.38009465142386e-06, -3.4586500987643376e-06, -2.537205091357464e-06, -1.6157600839505903e-06, -6.943155312910676e-07, 2.2712924874213059e-07, 1.1485740287753288e-06, 2.070018808808527e-06, 2.991463588841725e-06, 3.912908141501248e-06, 4.8343531489081215e-06, 5.755798156314995e-06, 6.6772445279639214e-06, 7.598689080623444e-06, 8.520133633282967e-06, 9.441579095437191e-06, 1.0363023648096714e-05, 1.1284468200756237e-05, 1.2205913662910461e-05, 1.3127358215569984e-05, 1.4048802768229507e-05, 1.497024732088903e-05, 1.5891691873548552e-05, 1.6813137335702777e-05, 1.7734582797857e-05, 1.8656026441021822e-05, 1.9577471903176047e-05, 2.0498915546340868e-05, 2.1420361008495092e-05, 2.2341806470649317e-05, 2.3263250113814138e-05, 2.4184695575968362e-05, 2.5106139219133183e-05, 2.6027584681287408e-05, 2.6949030143441632e-05, 2.7870475605595857e-05, 2.8791919248760678e-05, 2.9713364710914902e-05, 3.063480835407972e-05, 3.155625381623395e-05, 3.247769927838817e-05, 3.339914110256359e-05, 3.4320586564717814e-05, 3.524203202687204e-05, 3.616347748902626e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 4.0, 7.0, 5.0, 10.0, 7.0, 8.0, 8.0, 20.0, 14.0, 19.0, 23.0, 29.0, 28.0, 25.0, 30.0, 34.0, 34.0, 27.0, 50.0, 44.0, 40.0, 43.0, 49.0, 39.0, 43.0, 43.0, 40.0, 25.0, 34.0, 41.0, 32.0, 27.0, 23.0, 12.0, 14.0, 13.0, 15.0, 8.0, 13.0, 7.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7914922864292748e-05, -1.7392103472957388e-05, -1.6869282262632623e-05, -1.6346462871297263e-05, -1.58236416609725e-05, -1.5300822269637138e-05, -1.4778001968807075e-05, -1.4255181667977013e-05, -1.373236136714695e-05, -1.3209541066316888e-05, -1.2686720765486825e-05, -1.2163900464656763e-05, -1.1641081073321402e-05, -1.1118259862996638e-05, -1.0595440471661277e-05, -1.0072620170831215e-05, -9.549799870001152e-06, -9.02697956917109e-06, -8.504159268341027e-06, -7.981338967510965e-06, -7.458519121428253e-06, -6.935698820598191e-06, -6.412878974515479e-06, -5.890058673685417e-06, -5.367238372855354e-06, -4.844418072025292e-06, -4.321597771195229e-06, -3.7987779251125176e-06, -3.275957624282455e-06, -2.7531373234523926e-06, -2.2303172499960056e-06, -1.7074971765396185e-06, -1.1846750567201525e-06, -6.618548695769277e-07, -1.3903468243370298e-07, 3.837855047095218e-07, 9.066056918527465e-07, 1.429425992682809e-06, 1.952246066139196e-06, 2.475066139595583e-06, 2.9978864404256456e-06, 3.520706741255708e-06, 4.0435270420857705e-06, 4.566346888168482e-06, 5.089167188998545e-06, 5.611987489828607e-06, 6.134807335911319e-06, 6.657627636741381e-06, 7.180447937571444e-06, 7.703268238401506e-06, 8.226088539231569e-06, 8.748908840061631e-06, 9.271729140891694e-06, 9.794548532227054e-06, 1.0317368833057117e-05, 1.084018913388718e-05, 1.1363009434717242e-05, 1.1885829735547304e-05, 1.2408650036377367e-05, 1.2931470337207429e-05, 1.345428972854279e-05, 1.3977110938867554e-05, 1.4499930330202915e-05, 1.5022750631032977e-05, 1.554557093186304e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 10.0, 21.0, 33.0, 47.0, 82.0, 119.0, 164.0, 198.0, 312.0, 408.0, 685.0, 915.0, 1375.0, 1861.0, 2619.0, 3887.0, 5529.0, 8390.0, 11553.0, 18661.0, 29029.0, 46153.0, 76995.0, 140958.0, 253782.0, 187273.0, 98494.0, 54174.0, 35878.0, 22840.0, 14778.0, 9843.0, 6656.0, 4439.0, 3127.0, 2158.0, 1464.0, 1047.0, 776.0, 565.0, 394.0, 293.0, 159.0, 141.0, 84.0, 52.0, 44.0, 27.0, 21.0, 19.0, 12.0, 4.0, 1.0, 1.0, 3.0], "bins": [-3.796815872192383e-05, -3.6842189729213715e-05, -3.57162207365036e-05, -3.459025174379349e-05, -3.3464282751083374e-05, -3.233831375837326e-05, -3.121234476566315e-05, -3.0086375772953033e-05, -2.896040678024292e-05, -2.7834437787532806e-05, -2.6708468794822693e-05, -2.558249980211258e-05, -2.4456530809402466e-05, -2.3330561816692352e-05, -2.220459282398224e-05, -2.1078623831272125e-05, -1.9952654838562012e-05, -1.8826685845851898e-05, -1.7700716853141785e-05, -1.657474786043167e-05, -1.5448778867721558e-05, -1.4322809875011444e-05, -1.319684088230133e-05, -1.2070871889591217e-05, -1.0944902896881104e-05, -9.81893390417099e-06, -8.692964911460876e-06, -7.566995918750763e-06, -6.441026926040649e-06, -5.315057933330536e-06, -4.189088940620422e-06, -3.063119947910309e-06, -1.9371509552001953e-06, -8.111819624900818e-07, 3.1478703022003174e-07, 1.4407560229301453e-06, 2.566725015640259e-06, 3.6926940083503723e-06, 4.818663001060486e-06, 5.944631993770599e-06, 7.070600986480713e-06, 8.196569979190826e-06, 9.32253897190094e-06, 1.0448507964611053e-05, 1.1574476957321167e-05, 1.270044595003128e-05, 1.3826414942741394e-05, 1.4952383935451508e-05, 1.607835292816162e-05, 1.7204321920871735e-05, 1.8330290913581848e-05, 1.945625990629196e-05, 2.0582228899002075e-05, 2.170819789171219e-05, 2.2834166884422302e-05, 2.3960135877132416e-05, 2.508610486984253e-05, 2.6212073862552643e-05, 2.7338042855262756e-05, 2.846401184797287e-05, 2.9589980840682983e-05, 3.07159498333931e-05, 3.184191882610321e-05, 3.2967887818813324e-05, 3.409385681152344e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 6.0, 9.0, 5.0, 5.0, 6.0, 9.0, 9.0, 17.0, 8.0, 23.0, 20.0, 28.0, 22.0, 38.0, 29.0, 30.0, 37.0, 28.0, 44.0, 44.0, 50.0, 39.0, 35.0, 44.0, 32.0, 46.0, 36.0, 32.0, 32.0, 39.0, 30.0, 29.0, 17.0, 26.0, 11.0, 19.0, 10.0, 7.0, 9.0, 8.0, 8.0, 4.0, 9.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0], "bins": [-1.6391277313232422e-05, -1.5933066606521606e-05, -1.547485589981079e-05, -1.5016645193099976e-05, -1.455843448638916e-05, -1.4100223779678345e-05, -1.364201307296753e-05, -1.3183802366256714e-05, -1.2725591659545898e-05, -1.2267380952835083e-05, -1.1809170246124268e-05, -1.1350959539413452e-05, -1.0892748832702637e-05, -1.0434538125991821e-05, -9.976327419281006e-06, -9.51811671257019e-06, -9.059906005859375e-06, -8.60169529914856e-06, -8.143484592437744e-06, -7.685273885726929e-06, -7.227063179016113e-06, -6.768852472305298e-06, -6.310641765594482e-06, -5.852431058883667e-06, -5.3942203521728516e-06, -4.936009645462036e-06, -4.477798938751221e-06, -4.019588232040405e-06, -3.56137752532959e-06, -3.1031668186187744e-06, -2.644956111907959e-06, -2.1867454051971436e-06, -1.7285346984863281e-06, -1.2703239917755127e-06, -8.121132850646973e-07, -3.5390257835388184e-07, 1.043081283569336e-07, 5.62518835067749e-07, 1.0207295417785645e-06, 1.4789402484893799e-06, 1.9371509552001953e-06, 2.3953616619110107e-06, 2.853572368621826e-06, 3.3117830753326416e-06, 3.769993782043457e-06, 4.2282044887542725e-06, 4.686415195465088e-06, 5.144625902175903e-06, 5.602836608886719e-06, 6.061047315597534e-06, 6.51925802230835e-06, 6.977468729019165e-06, 7.4356794357299805e-06, 7.893890142440796e-06, 8.352100849151611e-06, 8.810311555862427e-06, 9.268522262573242e-06, 9.726732969284058e-06, 1.0184943675994873e-05, 1.0643154382705688e-05, 1.1101365089416504e-05, 1.155957579612732e-05, 1.2017786502838135e-05, 1.247599720954895e-05, 1.2934207916259766e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 15.0, 12.0, 17.0, 28.0, 42.0, 71.0, 95.0, 139.0, 254.0, 370.0, 544.0, 869.0, 1551.0, 2650.0, 4719.0, 8552.0, 15336.0, 31831.0, 70416.0, 187003.0, 399675.0, 182221.0, 73151.0, 32970.0, 16031.0, 8559.0, 4539.0, 2801.0, 1536.0, 938.0, 575.0, 344.0, 219.0, 149.0, 97.0, 65.0, 45.0, 32.0, 33.0, 19.0, 13.0, 9.0, 9.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.352497100830078e-05, -5.1927752792835236e-05, -5.033053457736969e-05, -4.8733316361904144e-05, -4.71360981464386e-05, -4.553887993097305e-05, -4.394166171550751e-05, -4.234444350004196e-05, -4.0747225284576416e-05, -3.915000706911087e-05, -3.7552788853645325e-05, -3.595557063817978e-05, -3.4358352422714233e-05, -3.276113420724869e-05, -3.116391599178314e-05, -2.9566697776317596e-05, -2.796947956085205e-05, -2.6372261345386505e-05, -2.477504312992096e-05, -2.3177824914455414e-05, -2.1580606698989868e-05, -1.9983388483524323e-05, -1.8386170268058777e-05, -1.678895205259323e-05, -1.5191733837127686e-05, -1.359451562166214e-05, -1.1997297406196594e-05, -1.0400079190731049e-05, -8.802860975265503e-06, -7.205642759799957e-06, -5.608424544334412e-06, -4.011206328868866e-06, -2.4139881134033203e-06, -8.167698979377747e-07, 7.80448317527771e-07, 2.3776665329933167e-06, 3.974884748458862e-06, 5.572102963924408e-06, 7.169321179389954e-06, 8.7665393948555e-06, 1.0363757610321045e-05, 1.196097582578659e-05, 1.3558194041252136e-05, 1.5155412256717682e-05, 1.6752630472183228e-05, 1.8349848687648773e-05, 1.994706690311432e-05, 2.1544285118579865e-05, 2.314150333404541e-05, 2.4738721549510956e-05, 2.63359397649765e-05, 2.7933157980442047e-05, 2.9530376195907593e-05, 3.112759441137314e-05, 3.2724812626838684e-05, 3.432203084230423e-05, 3.5919249057769775e-05, 3.751646727323532e-05, 3.911368548870087e-05, 4.071090370416641e-05, 4.230812191963196e-05, 4.3905340135097504e-05, 4.550255835056305e-05, 4.7099776566028595e-05, 4.869699478149414e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 5.0, 4.0, 9.0, 10.0, 13.0, 16.0, 13.0, 10.0, 18.0, 29.0, 35.0, 40.0, 42.0, 34.0, 36.0, 43.0, 42.0, 46.0, 47.0, 47.0, 40.0, 55.0, 47.0, 41.0, 40.0, 44.0, 29.0, 19.0, 29.0, 23.0, 15.0, 13.0, 13.0, 12.0, 6.0, 10.0, 9.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.239776611328125e-05, -1.1987052857875824e-05, -1.1576339602470398e-05, -1.1165626347064972e-05, -1.0754913091659546e-05, -1.034419983625412e-05, -9.933486580848694e-06, -9.522773325443268e-06, -9.112060070037842e-06, -8.701346814632416e-06, -8.29063355922699e-06, -7.879920303821564e-06, -7.469207048416138e-06, -7.058493793010712e-06, -6.647780537605286e-06, -6.23706728219986e-06, -5.826354026794434e-06, -5.4156407713890076e-06, -5.0049275159835815e-06, -4.5942142605781555e-06, -4.1835010051727295e-06, -3.7727877497673035e-06, -3.3620744943618774e-06, -2.9513612389564514e-06, -2.5406479835510254e-06, -2.1299347281455994e-06, -1.7192214727401733e-06, -1.3085082173347473e-06, -8.977949619293213e-07, -4.870817065238953e-07, -7.636845111846924e-08, 3.343448042869568e-07, 7.450580596923828e-07, 1.1557713150978088e-06, 1.5664845705032349e-06, 1.977197825908661e-06, 2.387911081314087e-06, 2.798624336719513e-06, 3.209337592124939e-06, 3.620050847530365e-06, 4.030764102935791e-06, 4.441477358341217e-06, 4.852190613746643e-06, 5.262903869152069e-06, 5.673617124557495e-06, 6.084330379962921e-06, 6.495043635368347e-06, 6.905756890773773e-06, 7.316470146179199e-06, 7.727183401584625e-06, 8.137896656990051e-06, 8.548609912395477e-06, 8.959323167800903e-06, 9.37003642320633e-06, 9.780749678611755e-06, 1.0191462934017181e-05, 1.0602176189422607e-05, 1.1012889444828033e-05, 1.142360270023346e-05, 1.1834315955638885e-05, 1.2245029211044312e-05, 1.2655742466449738e-05, 1.3066455721855164e-05, 1.347716897726059e-05, 1.3887882232666016e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 8.0, 3.0, 8.0, 12.0, 14.0, 23.0, 27.0, 54.0, 100.0, 148.0, 190.0, 0.0, 363.0, 552.0, 1112.0, 2000.0, 4172.0, 9577.0, 26912.0, 106808.0, 744039.0, 107313.0, 26991.0, 9466.0, 0.0, 4070.0, 1987.0, 1119.0, 546.0, 366.0, 168.0, 157.0, 86.0, 59.0, 33.0, 20.0, 17.0, 0.0, 15.0, 9.0, 8.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.9073486328125e-06, -1.8524006009101868e-06, -1.7974525690078735e-06, -1.7425045371055603e-06, -1.687556505203247e-06, -1.6326084733009338e-06, -1.5776604413986206e-06, -1.5227124094963074e-06, -1.4677643775939941e-06, -1.412816345691681e-06, -1.3578683137893677e-06, -1.3029202818870544e-06, -1.2479722499847412e-06, -1.193024218082428e-06, -1.1380761861801147e-06, -1.0831281542778015e-06, -1.0281801223754883e-06, -9.73232090473175e-07, -9.182840585708618e-07, -8.633360266685486e-07, -8.083879947662354e-07, -7.534399628639221e-07, -6.984919309616089e-07, -6.435438990592957e-07, -5.885958671569824e-07, -5.336478352546692e-07, -4.78699803352356e-07, -4.237517714500427e-07, -3.688037395477295e-07, -3.1385570764541626e-07, -2.5890767574310303e-07, -2.039596438407898e-07, -1.4901161193847656e-07, -9.406358003616333e-08, -3.91155481338501e-08, 1.5832483768463135e-08, 7.078051567077637e-08, 1.257285475730896e-07, 1.8067657947540283e-07, 2.3562461137771606e-07, 2.905726432800293e-07, 3.4552067518234253e-07, 4.0046870708465576e-07, 4.55416738986969e-07, 5.103647708892822e-07, 5.653128027915955e-07, 6.202608346939087e-07, 6.752088665962219e-07, 7.301568984985352e-07, 7.851049304008484e-07, 8.400529623031616e-07, 8.950009942054749e-07, 9.499490261077881e-07, 1.0048970580101013e-06, 1.0598450899124146e-06, 1.1147931218147278e-06, 1.169741153717041e-06, 1.2246891856193542e-06, 1.2796372175216675e-06, 1.3345852494239807e-06, 1.389533281326294e-06, 1.4444813132286072e-06, 1.4994293451309204e-06, 1.5543773770332336e-06, 1.6093254089355469e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 26.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 0.0, 0.0, 0.0, 0.0, 0.0, 802.0, 0.0, 0.0, 0.0, 0.0, 78.0, 0.0, 0.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.980232238769531e-07, -2.8777867555618286e-07, -2.775341272354126e-07, -2.6728957891464233e-07, -2.5704503059387207e-07, -2.468004822731018e-07, -2.3655593395233154e-07, -2.2631138563156128e-07, -2.1606683731079102e-07, -2.0582228899002075e-07, -1.955777406692505e-07, -1.8533319234848022e-07, -1.7508864402770996e-07, -1.648440957069397e-07, -1.5459954738616943e-07, -1.4435499906539917e-07, -1.341104507446289e-07, -1.2386590242385864e-07, -1.1362135410308838e-07, -1.0337680578231812e-07, -9.313225746154785e-08, -8.288770914077759e-08, -7.264316082000732e-08, -6.239861249923706e-08, -5.21540641784668e-08, -4.190951585769653e-08, -3.166496753692627e-08, -2.1420419216156006e-08, -1.1175870895385742e-08, -9.313225746154785e-10, 9.313225746154785e-09, 1.955777406692505e-08, 2.9802322387695312e-08, 4.0046870708465576e-08, 5.029141902923584e-08, 6.05359673500061e-08, 7.078051567077637e-08, 8.102506399154663e-08, 9.12696123123169e-08, 1.0151416063308716e-07, 1.1175870895385742e-07, 1.2200325727462769e-07, 1.3224780559539795e-07, 1.424923539161682e-07, 1.5273690223693848e-07, 1.6298145055770874e-07, 1.73225998878479e-07, 1.8347054719924927e-07, 1.9371509552001953e-07, 2.039596438407898e-07, 2.1420419216156006e-07, 2.2444874048233032e-07, 2.3469328880310059e-07, 2.4493783712387085e-07, 2.551823854446411e-07, 2.654269337654114e-07, 2.7567148208618164e-07, 2.859160304069519e-07, 2.9616057872772217e-07, 3.0640512704849243e-07, 3.166496753692627e-07, 3.2689422369003296e-07, 3.371387720108032e-07, 3.473833203315735e-07, 3.5762786865234375e-07]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 7.0, 0.0, 12.0, 19.0, 3.0, 0.0, 25.0, 40.0, 58.0, 0.0, 143.0, 168.0, 285.0, 522.0, 0.0, 836.0, 1547.0, 3381.0, 0.0, 8283.0, 26021.0, 103281.0, 0.0, 759825.0, 102629.0, 26174.0, 0.0, 8290.0, 3377.0, 1509.0, 860.0, 0.0, 492.0, 291.0, 172.0, 0.0, 140.0, 47.0, 44.0, 0.0, 47.0, 2.0, 9.0, 0.0, 7.0, 1.0, 5.0, 4.0, 0.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-06, -1.146458089351654e-06, -1.1008232831954956e-06, -1.0551884770393372e-06, -1.0095536708831787e-06, -9.639188647270203e-07, -9.182840585708618e-07, -8.726492524147034e-07, -8.270144462585449e-07, -7.813796401023865e-07, -7.35744833946228e-07, -6.901100277900696e-07, -6.444752216339111e-07, -5.988404154777527e-07, -5.532056093215942e-07, -5.075708031654358e-07, -4.6193599700927734e-07, -4.163011908531189e-07, -3.7066638469696045e-07, -3.25031578540802e-07, -2.7939677238464355e-07, -2.337619662284851e-07, -1.8812716007232666e-07, -1.424923539161682e-07, -9.685754776000977e-08, -5.122274160385132e-08, -5.587935447692871e-09, 4.0046870708465576e-08, 8.568167686462402e-08, 1.3131648302078247e-07, 1.7695128917694092e-07, 2.2258609533309937e-07, 2.682209014892578e-07, 3.1385570764541626e-07, 3.594905138015747e-07, 4.0512531995773315e-07, 4.507601261138916e-07, 4.9639493227005e-07, 5.420297384262085e-07, 5.876645445823669e-07, 6.332993507385254e-07, 6.789341568946838e-07, 7.245689630508423e-07, 7.702037692070007e-07, 8.158385753631592e-07, 8.614733815193176e-07, 9.071081876754761e-07, 9.527429938316345e-07, 9.98377799987793e-07, 1.0440126061439514e-06, 1.0896474123001099e-06, 1.1352822184562683e-06, 1.1809170246124268e-06, 1.2265518307685852e-06, 1.2721866369247437e-06, 1.317821443080902e-06, 1.3634562492370605e-06, 1.409091055393219e-06, 1.4547258615493774e-06, 1.5003606677055359e-06, 1.5459954738616943e-06, 1.5916302800178528e-06, 1.6372650861740112e-06, 1.6828998923301697e-06, 1.7285346984863281e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 43.0, 0.0, 0.0, 0.0, 0.0, 0.0, 167.0, 0.0, 0.0, 0.0, 0.0, 537.0, 0.0, 0.0, 0.0, 0.0, 184.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0], "bins": [-4.172325134277344e-07, -4.0605664253234863e-07, -3.948807716369629e-07, -3.8370490074157715e-07, -3.725290298461914e-07, -3.6135315895080566e-07, -3.501772880554199e-07, -3.390014171600342e-07, -3.2782554626464844e-07, -3.166496753692627e-07, -3.0547380447387695e-07, -2.942979335784912e-07, -2.8312206268310547e-07, -2.7194619178771973e-07, -2.60770320892334e-07, -2.4959444999694824e-07, -2.384185791015625e-07, -2.2724270820617676e-07, -2.1606683731079102e-07, -2.0489096641540527e-07, -1.9371509552001953e-07, -1.825392246246338e-07, -1.7136335372924805e-07, -1.601874828338623e-07, -1.4901161193847656e-07, -1.3783574104309082e-07, -1.2665987014770508e-07, -1.1548399925231934e-07, -1.043081283569336e-07, -9.313225746154785e-08, -8.195638656616211e-08, -7.078051567077637e-08, -5.960464477539063e-08, -4.842877388000488e-08, -3.725290298461914e-08, -2.60770320892334e-08, -1.4901161193847656e-08, -3.725290298461914e-09, 7.450580596923828e-09, 1.862645149230957e-08, 2.9802322387695312e-08, 4.0978193283081055e-08, 5.21540641784668e-08, 6.332993507385254e-08, 7.450580596923828e-08, 8.568167686462402e-08, 9.685754776000977e-08, 1.0803341865539551e-07, 1.1920928955078125e-07, 1.30385160446167e-07, 1.4156103134155273e-07, 1.5273690223693848e-07, 1.6391277313232422e-07, 1.7508864402770996e-07, 1.862645149230957e-07, 1.9744038581848145e-07, 2.086162567138672e-07, 2.1979212760925293e-07, 2.3096799850463867e-07, 2.421438694000244e-07, 2.5331974029541016e-07, 2.644956111907959e-07, 2.7567148208618164e-07, 2.868473529815674e-07, 2.980232238769531e-07]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 5.0, 3.0, 11.0, 9.0, 19.0, 21.0, 33.0, 31.0, 84.0, 129.0, 194.0, 169.0, 96.0, 72.0, 35.0, 35.0, 17.0, 15.0, 7.0, 4.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.979523767658975e-05, -1.874690133263357e-05, -1.7698566807666793e-05, -1.6650230463710614e-05, -1.5601894119754434e-05, -1.4553559594787657e-05, -1.3505223250831477e-05, -1.245688781637e-05, -1.1408552381908521e-05, -1.0360216947447043e-05, -9.311881512985565e-06, -8.263545169029385e-06, -7.215209734567907e-06, -6.1668743001064286e-06, -5.1185384108975995e-06, -4.0702025216887705e-06, -3.0218670872272924e-06, -1.9735314253921388e-06, -9.251957635569852e-07, 1.231398982781684e-07, 1.171475560113322e-06, 2.2198109945748e-06, 3.268146883783629e-06, 4.316482772992458e-06, 5.364818207453936e-06, 6.4131536419154145e-06, 7.4614895311242435e-06, 8.509825420333073e-06, 9.55816085479455e-06, 1.0606496289256029e-05, 1.1654832633212209e-05, 1.2703168067673687e-05, 1.3751501683145761e-05, 1.479983711760724e-05, 1.5848172552068718e-05, 1.6896508896024898e-05, 1.7944843420991674e-05, 1.8993179764947854e-05, 2.0041516108904034e-05, 2.108985063387081e-05, 2.213818697782699e-05, 2.318652332178317e-05, 2.4234857846749946e-05, 2.5283194190706126e-05, 2.6331530534662306e-05, 2.7379865059629083e-05, 2.8428201403585263e-05, 2.9476537747541443e-05, 3.052487227250822e-05, 3.1573206797474995e-05, 3.262154496042058e-05, 3.3669879485387355e-05, 3.471821401035413e-05, 3.576654853532091e-05, 3.681488669826649e-05, 3.786322122323327e-05, 3.891155938617885e-05, 3.995989391114563e-05, 4.100823207409121e-05, 4.205656659905799e-05, 4.3104901124024764e-05, 4.415323928697035e-05, 4.5201573811937124e-05, 4.62499083369039e-05, 4.7298242861870676e-05]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 3.0, 8.0, 5.0, 2.0, 5.0, 9.0, 10.0, 10.0, 18.0, 11.0, 15.0, 16.0, 17.0, 23.0, 34.0, 34.0, 34.0, 41.0, 39.0, 47.0, 24.0, 37.0, 37.0, 45.0, 42.0, 35.0, 51.0, 47.0, 38.0, 37.0, 32.0, 30.0, 24.0, 19.0, 14.0, 18.0, 12.0, 21.0, 14.0, 10.0, 9.0, 7.0, 10.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4939198081265204e-05, -1.4489710338239092e-05, -1.4040222595212981e-05, -1.359073485218687e-05, -1.3141247109160759e-05, -1.2691760275629349e-05, -1.2242272532603238e-05, -1.1792784789577127e-05, -1.1343297046551015e-05, -1.0893809303524904e-05, -1.0444321560498793e-05, -9.994833817472681e-06, -9.545346983941272e-06, -9.095858331420459e-06, -8.64637149788905e-06, -8.196883754862938e-06, -7.747396011836827e-06, -7.2979082688107155e-06, -6.848420525784604e-06, -6.398933237505844e-06, -5.949445494479733e-06, -5.499957751453621e-06, -5.050470463174861e-06, -4.60098272014875e-06, -4.151494977122638e-06, -3.702007234096527e-06, -3.2525197184440913e-06, -2.8030322027916554e-06, -2.353544459765544e-06, -1.9040567167394329e-06, -1.454569201086997e-06, -1.0050816854345612e-06, -5.555930329137482e-07, -1.0610540357447462e-07, 3.4338222576479893e-07, 7.928698551040725e-07, 1.242357484443346e-06, 1.6918452274694573e-06, 2.141332743121893e-06, 2.590820258774329e-06, 3.0403080018004403e-06, 3.4897957448265515e-06, 3.939283487852663e-06, 4.388770776131423e-06, 4.8382585191575345e-06, 5.287746262183646e-06, 5.737233550462406e-06, 6.186721293488517e-06, 6.636209036514629e-06, 7.08569677954074e-06, 7.535184522566851e-06, 7.984672265592963e-06, 8.434159099124372e-06, 8.883647751645185e-06, 9.333134585176595e-06, 9.782622328202706e-06, 1.0232110071228817e-05, 1.0681597814254928e-05, 1.113108555728104e-05, 1.1580573300307151e-05, 1.2030061043333262e-05, 1.2479547876864672e-05, 1.2929035619890783e-05, 1.3378523362916894e-05, 1.3828011105943006e-05]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 4.0, 6.0, 11.0, 7.0, 16.0, 12.0, 25.0, 34.0, 40.0, 46.0, 76.0, 70.0, 114.0, 120.0, 178.0, 229.0, 345.0, 567.0, 838.0, 2396.0, 56929.0, 3967418.0, 156278.0, 5265.0, 1131.0, 638.0, 350.0, 262.0, 164.0, 170.0, 133.0, 100.0, 59.0, 65.0, 52.0, 32.0, 27.0, 26.0, 16.0, 10.0, 7.0, 6.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.00543212890625e-05, -3.889854997396469e-05, -3.774277865886688e-05, -3.6587007343769073e-05, -3.5431236028671265e-05, -3.4275464713573456e-05, -3.311969339847565e-05, -3.196392208337784e-05, -3.080815076828003e-05, -2.965237945318222e-05, -2.849660813808441e-05, -2.7340836822986603e-05, -2.6185065507888794e-05, -2.5029294192790985e-05, -2.3873522877693176e-05, -2.2717751562595367e-05, -2.156198024749756e-05, -2.040620893239975e-05, -1.925043761730194e-05, -1.8094666302204132e-05, -1.6938894987106323e-05, -1.5783123672008514e-05, -1.4627352356910706e-05, -1.3471581041812897e-05, -1.2315809726715088e-05, -1.1160038411617279e-05, -1.000426709651947e-05, -8.848495781421661e-06, -7.692724466323853e-06, -6.536953151226044e-06, -5.381181836128235e-06, -4.225410521030426e-06, -3.069639205932617e-06, -1.9138678908348083e-06, -7.580965757369995e-07, 3.976747393608093e-07, 1.5534460544586182e-06, 2.709217369556427e-06, 3.864988684654236e-06, 5.020759999752045e-06, 6.1765313148498535e-06, 7.332302629947662e-06, 8.488073945045471e-06, 9.64384526014328e-06, 1.0799616575241089e-05, 1.1955387890338898e-05, 1.3111159205436707e-05, 1.4266930520534515e-05, 1.5422701835632324e-05, 1.6578473150730133e-05, 1.7734244465827942e-05, 1.889001578092575e-05, 2.004578709602356e-05, 2.120155841112137e-05, 2.2357329726219177e-05, 2.3513101041316986e-05, 2.4668872356414795e-05, 2.5824643671512604e-05, 2.6980414986610413e-05, 2.813618630170822e-05, 2.929195761680603e-05, 3.044772893190384e-05, 3.160350024700165e-05, 3.275927156209946e-05, 3.3915042877197266e-05]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 8.0, 1.0, 7.0, 5.0, 9.0, 10.0, 10.0, 16.0, 15.0, 11.0, 18.0, 20.0, 32.0, 33.0, 35.0, 41.0, 43.0, 59.0, 35.0, 35.0, 52.0, 53.0, 41.0, 42.0, 40.0, 54.0, 25.0, 33.0, 42.0, 25.0, 25.0, 19.0, 16.0, 16.0, 16.0, 13.0, 14.0, 10.0, 10.0, 4.0, 2.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.5914440155029297e-05, -1.546088606119156e-05, -1.500733196735382e-05, -1.4553777873516083e-05, -1.4100223779678345e-05, -1.3646669685840607e-05, -1.3193115592002869e-05, -1.273956149816513e-05, -1.2286007404327393e-05, -1.1832453310489655e-05, -1.1378899216651917e-05, -1.0925345122814178e-05, -1.047179102897644e-05, -1.0018236935138702e-05, -9.564682841300964e-06, -9.111128747463226e-06, -8.657574653625488e-06, -8.20402055978775e-06, -7.750466465950012e-06, -7.296912372112274e-06, -6.843358278274536e-06, -6.389804184436798e-06, -5.93625009059906e-06, -5.482695996761322e-06, -5.029141902923584e-06, -4.575587809085846e-06, -4.122033715248108e-06, -3.66847962141037e-06, -3.214925527572632e-06, -2.761371433734894e-06, -2.3078173398971558e-06, -1.8542632460594177e-06, -1.4007091522216797e-06, -9.471550583839417e-07, -4.936009645462036e-07, -4.0046870708465576e-08, 4.1350722312927246e-07, 8.670613169670105e-07, 1.3206154108047485e-06, 1.7741695046424866e-06, 2.2277235984802246e-06, 2.6812776923179626e-06, 3.1348317861557007e-06, 3.5883858799934387e-06, 4.041939973831177e-06, 4.495494067668915e-06, 4.949048161506653e-06, 5.402602255344391e-06, 5.856156349182129e-06, 6.309710443019867e-06, 6.763264536857605e-06, 7.216818630695343e-06, 7.670372724533081e-06, 8.123926818370819e-06, 8.577480912208557e-06, 9.031035006046295e-06, 9.484589099884033e-06, 9.938143193721771e-06, 1.039169728755951e-05, 1.0845251381397247e-05, 1.1298805475234985e-05, 1.1752359569072723e-05, 1.2205913662910461e-05, 1.26594677567482e-05, 1.3113021850585938e-05]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 10.0, 7.0, 12.0, 28.0, 41.0, 82.0, 140.0, 412.0, 1490.0, 13061.0, 4157219.0, 19261.0, 1772.0, 406.0, 156.0, 72.0, 40.0, 31.0, 17.0, 8.0, 9.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.31348991394043e-05, -6.957631558179855e-05, -6.601773202419281e-05, -6.245914846658707e-05, -5.890056490898132e-05, -5.534198135137558e-05, -5.1783397793769836e-05, -4.822481423616409e-05, -4.466623067855835e-05, -4.1107647120952606e-05, -3.754906356334686e-05, -3.399048000574112e-05, -3.0431896448135376e-05, -2.6873312890529633e-05, -2.331472933292389e-05, -1.9756145775318146e-05, -1.6197562217712402e-05, -1.2638978660106659e-05, -9.080395102500916e-06, -5.521811544895172e-06, -1.9632279872894287e-06, 1.5953555703163147e-06, 5.153939127922058e-06, 8.712522685527802e-06, 1.2271106243133545e-05, 1.582968980073929e-05, 1.9388273358345032e-05, 2.2946856915950775e-05, 2.650544047355652e-05, 3.0064024031162262e-05, 3.3622607588768005e-05, 3.718119114637375e-05, 4.073977470397949e-05, 4.4298358261585236e-05, 4.785694181919098e-05, 5.141552537679672e-05, 5.4974108934402466e-05, 5.853269249200821e-05, 6.209127604961395e-05, 6.56498596072197e-05, 6.920844316482544e-05, 7.276702672243118e-05, 7.632561028003693e-05, 7.988419383764267e-05, 8.344277739524841e-05, 8.700136095285416e-05, 9.05599445104599e-05, 9.411852806806564e-05, 9.767711162567139e-05, 0.00010123569518327713, 0.00010479427874088287, 0.00010835286229848862, 0.00011191144585609436, 0.0001154700294137001, 0.00011902861297130585, 0.0001225871965289116, 0.00012614578008651733, 0.00012970436364412308, 0.00013326294720172882, 0.00013682153075933456, 0.0001403801143169403, 0.00014393869787454605, 0.0001474972814321518, 0.00015105586498975754, 0.00015461444854736328]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 11.0, 19.0, 66.0, 241.0, 2946.0, 547.0, 160.0, 42.0, 17.0, 4.0, 8.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5676021575927734e-05, -1.5325844287872314e-05, -1.4975666999816895e-05, -1.4625489711761475e-05, -1.4275312423706055e-05, -1.3925135135650635e-05, -1.3574957847595215e-05, -1.3224780559539795e-05, -1.2874603271484375e-05, -1.2524425983428955e-05, -1.2174248695373535e-05, -1.1824071407318115e-05, -1.1473894119262695e-05, -1.1123716831207275e-05, -1.0773539543151855e-05, -1.0423362255096436e-05, -1.0073184967041016e-05, -9.723007678985596e-06, -9.372830390930176e-06, -9.022653102874756e-06, -8.672475814819336e-06, -8.322298526763916e-06, -7.972121238708496e-06, -7.621943950653076e-06, -7.271766662597656e-06, -6.921589374542236e-06, -6.571412086486816e-06, -6.2212347984313965e-06, -5.8710575103759766e-06, -5.520880222320557e-06, -5.170702934265137e-06, -4.820525646209717e-06, -4.470348358154297e-06, -4.120171070098877e-06, -3.769993782043457e-06, -3.419816493988037e-06, -3.069639205932617e-06, -2.7194619178771973e-06, -2.3692846298217773e-06, -2.0191073417663574e-06, -1.6689300537109375e-06, -1.3187527656555176e-06, -9.685754776000977e-07, -6.183981895446777e-07, -2.682209014892578e-07, 8.195638656616211e-08, 4.3213367462158203e-07, 7.82310962677002e-07, 1.1324882507324219e-06, 1.4826655387878418e-06, 1.8328428268432617e-06, 2.1830201148986816e-06, 2.5331974029541016e-06, 2.8833746910095215e-06, 3.2335519790649414e-06, 3.5837292671203613e-06, 3.933906555175781e-06, 4.284083843231201e-06, 4.634261131286621e-06, 4.984438419342041e-06, 5.334615707397461e-06, 5.684792995452881e-06, 6.034970283508301e-06, 6.385147571563721e-06, 6.735324859619141e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 6.0, 7.0, 7.0, 9.0, 19.0, 15.0, 38.0, 55.0, 59.0, 134.0, 156.0, 173.0, 110.0, 56.0, 45.0, 34.0, 17.0, 20.0, 8.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4528842914151028e-05, -2.3681644961470738e-05, -2.2834448827779852e-05, -2.1987252694088966e-05, -2.1140054741408676e-05, -2.0292856788728386e-05, -1.94456606550375e-05, -1.8598464521346614e-05, -1.7751266568666324e-05, -1.6904068615986034e-05, -1.6056872482295148e-05, -1.520967543910956e-05, -1.4362478395923972e-05, -1.3515281352738384e-05, -1.2668084309552796e-05, -1.1820887266367208e-05, -1.097369022318162e-05, -1.0126493179996032e-05, -9.279296136810444e-06, -8.432099093624856e-06, -7.584902050439268e-06, -6.73770500725368e-06, -5.890507964068092e-06, -5.0433109208825044e-06, -4.1961138776969165e-06, -3.3489168345113285e-06, -2.5017197913257405e-06, -1.6545227481401525e-06, -8.073257049545646e-07, 3.98713382310234e-08, 8.870683814166114e-07, 1.7342654246021993e-06, 2.5814624677877873e-06, 3.4286595109733753e-06, 4.275856554158963e-06, 5.123053597344551e-06, 5.970250640530139e-06, 6.817447683715727e-06, 7.664644726901315e-06, 8.511841770086903e-06, 9.359038813272491e-06, 1.0206235856458079e-05, 1.1053432899643667e-05, 1.1900629942829255e-05, 1.2747826986014843e-05, 1.3595024029200431e-05, 1.4442221072386019e-05, 1.5289417206076905e-05, 1.6136615158757195e-05, 1.6983813111437485e-05, 1.783100924512837e-05, 1.8678205378819257e-05, 1.9525403331499547e-05, 2.0372601284179837e-05, 2.1219797417870723e-05, 2.206699355156161e-05, 2.29141915042419e-05, 2.376138945692219e-05, 2.4608585590613075e-05, 2.545578172430396e-05, 2.630297967698425e-05, 2.715017762966454e-05, 2.7997373763355426e-05, 2.8844569897046313e-05, 2.9691767849726602e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 3.0, 4.0, 4.0, 3.0, 7.0, 8.0, 8.0, 13.0, 12.0, 23.0, 16.0, 25.0, 25.0, 29.0, 34.0, 27.0, 38.0, 53.0, 46.0, 42.0, 43.0, 29.0, 35.0, 40.0, 44.0, 44.0, 34.0, 44.0, 31.0, 32.0, 42.0, 28.0, 23.0, 15.0, 22.0, 12.0, 15.0, 10.0, 4.0, 6.0, 10.0, 7.0, 1.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4665742128272541e-05, -1.424709535058355e-05, -1.3828448572894558e-05, -1.3409801795205567e-05, -1.2991155017516576e-05, -1.2572509149322286e-05, -1.2153862371633295e-05, -1.1735215593944304e-05, -1.1316568816255312e-05, -1.0897922038566321e-05, -1.047927526087733e-05, -1.0060628483188339e-05, -9.641982614994049e-06, -9.223334927810356e-06, -8.804689059616067e-06, -8.386042281927075e-06, -7.967395504238084e-06, -7.548748726549093e-06, -7.130101948860101e-06, -6.711455625918461e-06, -6.29280884822947e-06, -5.8741620705404785e-06, -5.455515747598838e-06, -5.036868969909847e-06, -4.6182221922208555e-06, -4.199575414531864e-06, -3.7809288642165484e-06, -3.3622823139012326e-06, -2.9436355362122413e-06, -2.52498875852325e-06, -2.106342208207934e-06, -1.6876956578926183e-06, -1.2690479707089253e-06, -8.504013067067717e-07, -4.3175464270461816e-07, -1.3107978702464607e-08, 4.0553868529968895e-07, 8.241854629886802e-07, 1.242832013303996e-06, 1.661478563619312e-06, 2.080125341308303e-06, 2.4987721189972945e-06, 2.9174186693126103e-06, 3.336065219627926e-06, 3.7547119973169174e-06, 4.173358775005909e-06, 4.592005097947549e-06, 5.01065187563654e-06, 5.429298653325532e-06, 5.847945431014523e-06, 6.266592208703514e-06, 6.685238531645155e-06, 7.103885309334146e-06, 7.522532087023137e-06, 7.941178409964778e-06, 8.359825187653769e-06, 8.77847196534276e-06, 9.197118743031751e-06, 9.615765520720743e-06, 1.0034412298409734e-05, 1.0453059076098725e-05, 1.0871704944293015e-05, 1.1290351721982006e-05, 1.1708998499670997e-05, 1.2127645277359989e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 6.0, 12.0, 9.0, 15.0, 26.0, 27.0, 58.0, 74.0, 125.0, 191.0, 245.0, 408.0, 708.0, 868.0, 1497.0, 1965.0, 3357.0, 5317.0, 7482.0, 13151.0, 22026.0, 31600.0, 65284.0, 109991.0, 285479.0, 255062.0, 99550.0, 59797.0, 33328.0, 17208.0, 12490.0, 6955.0, 5100.0, 3190.0, 1915.0, 1397.0, 941.0, 539.0, 398.0, 238.0, 181.0, 137.0, 47.0, 55.0, 31.0, 29.0, 13.0, 12.0, 9.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4960765838623047e-05, -1.4506280422210693e-05, -1.405179500579834e-05, -1.3597309589385986e-05, -1.3142824172973633e-05, -1.268833875656128e-05, -1.2233853340148926e-05, -1.1779367923736572e-05, -1.1324882507324219e-05, -1.0870397090911865e-05, -1.0415911674499512e-05, -9.961426258087158e-06, -9.506940841674805e-06, -9.052455425262451e-06, -8.597970008850098e-06, -8.143484592437744e-06, -7.68899917602539e-06, -7.234513759613037e-06, -6.780028343200684e-06, -6.32554292678833e-06, -5.8710575103759766e-06, -5.416572093963623e-06, -4.9620866775512695e-06, -4.507601261138916e-06, -4.0531158447265625e-06, -3.598630428314209e-06, -3.1441450119018555e-06, -2.689659595489502e-06, -2.2351741790771484e-06, -1.780688762664795e-06, -1.3262033462524414e-06, -8.717179298400879e-07, -4.172325134277344e-07, 3.725290298461914e-08, 4.917383193969727e-07, 9.462237358093262e-07, 1.4007091522216797e-06, 1.8551945686340332e-06, 2.3096799850463867e-06, 2.7641654014587402e-06, 3.2186508178710938e-06, 3.6731362342834473e-06, 4.127621650695801e-06, 4.582107067108154e-06, 5.036592483520508e-06, 5.491077899932861e-06, 5.945563316345215e-06, 6.400048732757568e-06, 6.854534149169922e-06, 7.309019565582275e-06, 7.763504981994629e-06, 8.217990398406982e-06, 8.672475814819336e-06, 9.12696123123169e-06, 9.581446647644043e-06, 1.0035932064056396e-05, 1.049041748046875e-05, 1.0944902896881104e-05, 1.1399388313293457e-05, 1.185387372970581e-05, 1.2308359146118164e-05, 1.2762844562530518e-05, 1.3217329978942871e-05, 1.3671815395355225e-05, 1.4126300811767578e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 3.0, 1.0, 4.0, 6.0, 4.0, 7.0, 12.0, 15.0, 17.0, 15.0, 18.0, 29.0, 23.0, 35.0, 24.0, 22.0, 32.0, 56.0, 53.0, 45.0, 37.0, 33.0, 49.0, 43.0, 38.0, 37.0, 37.0, 47.0, 39.0, 39.0, 26.0, 19.0, 24.0, 16.0, 15.0, 14.0, 12.0, 12.0, 14.0, 1.0, 9.0, 4.0, 3.0, 4.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3649463653564453e-05, -1.3237819075584412e-05, -1.282617449760437e-05, -1.2414529919624329e-05, -1.2002885341644287e-05, -1.1591240763664246e-05, -1.1179596185684204e-05, -1.0767951607704163e-05, -1.0356307029724121e-05, -9.94466245174408e-06, -9.533017873764038e-06, -9.121373295783997e-06, -8.709728717803955e-06, -8.298084139823914e-06, -7.886439561843872e-06, -7.4747949838638306e-06, -7.063150405883789e-06, -6.6515058279037476e-06, -6.239861249923706e-06, -5.8282166719436646e-06, -5.416572093963623e-06, -5.0049275159835815e-06, -4.59328293800354e-06, -4.1816383600234985e-06, -3.769993782043457e-06, -3.3583492040634155e-06, -2.946704626083374e-06, -2.5350600481033325e-06, -2.123415470123291e-06, -1.7117708921432495e-06, -1.300126314163208e-06, -8.884817361831665e-07, -4.76837158203125e-07, -6.51925802230835e-08, 3.46451997756958e-07, 7.580965757369995e-07, 1.169741153717041e-06, 1.5813857316970825e-06, 1.993030309677124e-06, 2.4046748876571655e-06, 2.816319465637207e-06, 3.2279640436172485e-06, 3.63960862159729e-06, 4.0512531995773315e-06, 4.462897777557373e-06, 4.8745423555374146e-06, 5.286186933517456e-06, 5.6978315114974976e-06, 6.109476089477539e-06, 6.5211206674575806e-06, 6.932765245437622e-06, 7.3444098234176636e-06, 7.756054401397705e-06, 8.167698979377747e-06, 8.579343557357788e-06, 8.99098813533783e-06, 9.402632713317871e-06, 9.814277291297913e-06, 1.0225921869277954e-05, 1.0637566447257996e-05, 1.1049211025238037e-05, 1.1460855603218079e-05, 1.187250018119812e-05, 1.2284144759178162e-05, 1.2695789337158203e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 8.0, 6.0, 10.0, 12.0, 26.0, 26.0, 45.0, 53.0, 61.0, 110.0, 171.0, 214.0, 374.0, 502.0, 727.0, 1113.0, 1717.0, 2696.0, 4143.0, 7058.0, 13529.0, 22936.0, 44266.0, 108155.0, 501132.0, 197649.0, 67743.0, 31534.0, 17951.0, 9204.0, 5473.0, 3378.0, 2164.0, 1425.0, 929.0, 639.0, 441.0, 300.0, 176.0, 156.0, 93.0, 65.0, 46.0, 36.0, 17.0, 17.0, 9.0, 10.0, 8.0, 0.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7344951629638672e-05, -1.6741454601287842e-05, -1.6137957572937012e-05, -1.553446054458618e-05, -1.4930963516235352e-05, -1.4327466487884521e-05, -1.3723969459533691e-05, -1.3120472431182861e-05, -1.2516975402832031e-05, -1.1913478374481201e-05, -1.1309981346130371e-05, -1.0706484317779541e-05, -1.0102987289428711e-05, -9.499490261077881e-06, -8.89599323272705e-06, -8.29249620437622e-06, -7.68899917602539e-06, -7.0855021476745605e-06, -6.4820051193237305e-06, -5.8785080909729e-06, -5.27501106262207e-06, -4.67151403427124e-06, -4.06801700592041e-06, -3.46451997756958e-06, -2.86102294921875e-06, -2.25752592086792e-06, -1.6540288925170898e-06, -1.0505318641662598e-06, -4.470348358154297e-07, 1.564621925354004e-07, 7.599592208862305e-07, 1.3634562492370605e-06, 1.9669532775878906e-06, 2.5704503059387207e-06, 3.1739473342895508e-06, 3.777444362640381e-06, 4.380941390991211e-06, 4.984438419342041e-06, 5.587935447692871e-06, 6.191432476043701e-06, 6.794929504394531e-06, 7.398426532745361e-06, 8.001923561096191e-06, 8.605420589447021e-06, 9.208917617797852e-06, 9.812414646148682e-06, 1.0415911674499512e-05, 1.1019408702850342e-05, 1.1622905731201172e-05, 1.2226402759552002e-05, 1.2829899787902832e-05, 1.3433396816253662e-05, 1.4036893844604492e-05, 1.4640390872955322e-05, 1.5243887901306152e-05, 1.5847384929656982e-05, 1.6450881958007812e-05, 1.7054378986358643e-05, 1.7657876014709473e-05, 1.8261373043060303e-05, 1.8864870071411133e-05, 1.9468367099761963e-05, 2.0071864128112793e-05, 2.0675361156463623e-05, 2.1278858184814453e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 6.0, 8.0, 6.0, 8.0, 8.0, 15.0, 22.0, 18.0, 27.0, 16.0, 15.0, 28.0, 20.0, 42.0, 30.0, 27.0, 31.0, 28.0, 27.0, 25.0, 34.0, 116.0, 28.0, 30.0, 25.0, 40.0, 18.0, 27.0, 49.0, 26.0, 19.0, 28.0, 23.0, 12.0, 17.0, 24.0, 9.0, 8.0, 7.0, 9.0, 7.0, 4.0, 3.0, 9.0, 8.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.212162017822266e-06, -6.991438567638397e-06, -6.770715117454529e-06, -6.54999166727066e-06, -6.329268217086792e-06, -6.108544766902924e-06, -5.887821316719055e-06, -5.667097866535187e-06, -5.446374416351318e-06, -5.22565096616745e-06, -5.0049275159835815e-06, -4.784204065799713e-06, -4.563480615615845e-06, -4.342757165431976e-06, -4.122033715248108e-06, -3.9013102650642395e-06, -3.680586814880371e-06, -3.4598633646965027e-06, -3.2391399145126343e-06, -3.018416464328766e-06, -2.7976930141448975e-06, -2.576969563961029e-06, -2.3562461137771606e-06, -2.1355226635932922e-06, -1.914799213409424e-06, -1.6940757632255554e-06, -1.473352313041687e-06, -1.2526288628578186e-06, -1.0319054126739502e-06, -8.111819624900818e-07, -5.904585123062134e-07, -3.6973506212234497e-07, -1.4901161193847656e-07, 7.171183824539185e-08, 2.9243528842926025e-07, 5.131587386131287e-07, 7.338821887969971e-07, 9.546056389808655e-07, 1.1753290891647339e-06, 1.3960525393486023e-06, 1.6167759895324707e-06, 1.8374994397163391e-06, 2.0582228899002075e-06, 2.278946340084076e-06, 2.4996697902679443e-06, 2.7203932404518127e-06, 2.941116690635681e-06, 3.1618401408195496e-06, 3.382563591003418e-06, 3.6032870411872864e-06, 3.824010491371155e-06, 4.044733941555023e-06, 4.265457391738892e-06, 4.48618084192276e-06, 4.706904292106628e-06, 4.927627742290497e-06, 5.148351192474365e-06, 5.369074642658234e-06, 5.589798092842102e-06, 5.8105215430259705e-06, 6.031244993209839e-06, 6.251968443393707e-06, 6.472691893577576e-06, 6.693415343761444e-06, 6.9141387939453125e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 5.0, 5.0, 16.0, 24.0, 20.0, 33.0, 41.0, 48.0, 59.0, 108.0, 119.0, 144.0, 324.0, 319.0, 395.0, 865.0, 938.0, 1362.0, 3363.0, 4322.0, 8073.0, 31562.0, 88154.0, 828955.0, 52131.0, 11104.0, 7830.0, 2550.0, 1586.0, 1570.0, 606.0, 439.0, 545.0, 242.0, 166.0, 158.0, 84.0, 62.0, 68.0, 26.0, 28.0, 26.0, 16.0, 9.0, 24.0, 8.0, 8.0, 8.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-4.351139068603516e-06, -4.211440682411194e-06, -4.071742296218872e-06, -3.93204391002655e-06, -3.7923455238342285e-06, -3.6526471376419067e-06, -3.512948751449585e-06, -3.373250365257263e-06, -3.2335519790649414e-06, -3.0938535928726196e-06, -2.954155206680298e-06, -2.814456820487976e-06, -2.6747584342956543e-06, -2.5350600481033325e-06, -2.3953616619110107e-06, -2.255663275718689e-06, -2.115964889526367e-06, -1.9762665033340454e-06, -1.8365681171417236e-06, -1.6968697309494019e-06, -1.55717134475708e-06, -1.4174729585647583e-06, -1.2777745723724365e-06, -1.1380761861801147e-06, -9.98377799987793e-07, -8.586794137954712e-07, -7.189810276031494e-07, -5.792826414108276e-07, -4.3958425521850586e-07, -2.998858690261841e-07, -1.601874828338623e-07, -2.0489096641540527e-08, 1.1920928955078125e-07, 2.5890767574310303e-07, 3.986060619354248e-07, 5.383044481277466e-07, 6.780028343200684e-07, 8.177012205123901e-07, 9.57399606704712e-07, 1.0970979928970337e-06, 1.2367963790893555e-06, 1.3764947652816772e-06, 1.516193151473999e-06, 1.6558915376663208e-06, 1.7955899238586426e-06, 1.9352883100509644e-06, 2.074986696243286e-06, 2.214685082435608e-06, 2.3543834686279297e-06, 2.4940818548202515e-06, 2.6337802410125732e-06, 2.773478627204895e-06, 2.913177013397217e-06, 3.0528753995895386e-06, 3.1925737857818604e-06, 3.332272171974182e-06, 3.471970558166504e-06, 3.6116689443588257e-06, 3.7513673305511475e-06, 3.891065716743469e-06, 4.030764102935791e-06, 4.170462489128113e-06, 4.3101608753204346e-06, 4.449859261512756e-06, 4.589557647705078e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 8.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 28.0, 0.0, 0.0, 54.0, 0.0, 0.0, 48.0, 0.0, 0.0, 0.0, 69.0, 0.0, 0.0, 585.0, 0.0, 0.0, 0.0, 64.0, 0.0, 0.0, 68.0, 0.0, 0.0, 37.0, 0.0, 0.0, 0.0, 19.0, 0.0, 0.0, 5.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 0.0, 0.0, 2.0], "bins": [-5.960464477539062e-07, -5.783513188362122e-07, -5.606561899185181e-07, -5.42961061000824e-07, -5.252659320831299e-07, -5.075708031654358e-07, -4.898756742477417e-07, -4.721805453300476e-07, -4.544854164123535e-07, -4.367902874946594e-07, -4.1909515857696533e-07, -4.0140002965927124e-07, -3.8370490074157715e-07, -3.6600977182388306e-07, -3.4831464290618896e-07, -3.3061951398849487e-07, -3.129243850708008e-07, -2.952292561531067e-07, -2.775341272354126e-07, -2.598389983177185e-07, -2.421438694000244e-07, -2.2444874048233032e-07, -2.0675361156463623e-07, -1.8905848264694214e-07, -1.7136335372924805e-07, -1.5366822481155396e-07, -1.3597309589385986e-07, -1.1827796697616577e-07, -1.0058283805847168e-07, -8.288770914077759e-08, -6.51925802230835e-08, -4.7497451305389404e-08, -2.9802322387695312e-08, -1.210719347000122e-08, 5.587935447692871e-09, 2.3283064365386963e-08, 4.0978193283081055e-08, 5.8673322200775146e-08, 7.636845111846924e-08, 9.406358003616333e-08, 1.1175870895385742e-07, 1.2945383787155151e-07, 1.471489667892456e-07, 1.648440957069397e-07, 1.825392246246338e-07, 2.0023435354232788e-07, 2.1792948246002197e-07, 2.3562461137771606e-07, 2.5331974029541016e-07, 2.7101486921310425e-07, 2.8870999813079834e-07, 3.0640512704849243e-07, 3.241002559661865e-07, 3.417953848838806e-07, 3.594905138015747e-07, 3.771856427192688e-07, 3.948807716369629e-07, 4.12575900554657e-07, 4.302710294723511e-07, 4.4796615839004517e-07, 4.6566128730773926e-07, 4.833564162254333e-07, 5.010515451431274e-07, 5.187466740608215e-07, 5.364418029785156e-07]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 9.0, 4.0, 13.0, 17.0, 30.0, 88.0, 160.0, 332.0, 845.0, 2320.0, 10883.0, 104814.0, 895618.0, 25532.0, 5184.0, 1536.0, 698.0, 237.0, 100.0, 45.0, 22.0, 13.0, 14.0, 11.0, 5.0, 4.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.33514404296875e-05, -1.2983568012714386e-05, -1.2615695595741272e-05, -1.2247823178768158e-05, -1.1879950761795044e-05, -1.151207834482193e-05, -1.1144205927848816e-05, -1.0776333510875702e-05, -1.0408461093902588e-05, -1.0040588676929474e-05, -9.67271625995636e-06, -9.304843842983246e-06, -8.936971426010132e-06, -8.569099009037018e-06, -8.201226592063904e-06, -7.83335417509079e-06, -7.465481758117676e-06, -7.097609341144562e-06, -6.729736924171448e-06, -6.361864507198334e-06, -5.99399209022522e-06, -5.626119673252106e-06, -5.258247256278992e-06, -4.890374839305878e-06, -4.522502422332764e-06, -4.15463000535965e-06, -3.7867575883865356e-06, -3.4188851714134216e-06, -3.0510127544403076e-06, -2.6831403374671936e-06, -2.3152679204940796e-06, -1.9473955035209656e-06, -1.5795230865478516e-06, -1.2116506695747375e-06, -8.437782526016235e-07, -4.759058356285095e-07, -1.0803341865539551e-07, 2.598389983177185e-07, 6.277114152908325e-07, 9.955838322639465e-07, 1.3634562492370605e-06, 1.7313286662101746e-06, 2.0992010831832886e-06, 2.4670735001564026e-06, 2.8349459171295166e-06, 3.2028183341026306e-06, 3.5706907510757446e-06, 3.938563168048859e-06, 4.306435585021973e-06, 4.674308001995087e-06, 5.042180418968201e-06, 5.410052835941315e-06, 5.777925252914429e-06, 6.145797669887543e-06, 6.513670086860657e-06, 6.881542503833771e-06, 7.249414920806885e-06, 7.617287337779999e-06, 7.985159754753113e-06, 8.353032171726227e-06, 8.72090458869934e-06, 9.088777005672455e-06, 9.456649422645569e-06, 9.824521839618683e-06, 1.0192394256591797e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 7.0, 0.0, 3.0, 0.0, 5.0, 0.0, 8.0, 0.0, 9.0, 0.0, 18.0, 0.0, 33.0, 0.0, 60.0, 0.0, 126.0, 0.0, 448.0, 0.0, 139.0, 61.0, 0.0, 39.0, 0.0, 20.0, 0.0, 12.0, 0.0, 5.0, 0.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.940696716308594e-07, -8.633360266685486e-07, -8.326023817062378e-07, -8.01868736743927e-07, -7.711350917816162e-07, -7.404014468193054e-07, -7.096678018569946e-07, -6.789341568946838e-07, -6.48200511932373e-07, -6.174668669700623e-07, -5.867332220077515e-07, -5.559995770454407e-07, -5.252659320831299e-07, -4.945322871208191e-07, -4.637986421585083e-07, -4.330649971961975e-07, -4.023313522338867e-07, -3.7159770727157593e-07, -3.4086406230926514e-07, -3.1013041734695435e-07, -2.7939677238464355e-07, -2.4866312742233276e-07, -2.1792948246002197e-07, -1.8719583749771118e-07, -1.564621925354004e-07, -1.257285475730896e-07, -9.499490261077881e-08, -6.426125764846802e-08, -3.3527612686157227e-08, -2.7939677238464355e-09, 2.7939677238464355e-08, 5.8673322200775146e-08, 8.940696716308594e-08, 1.2014061212539673e-07, 1.5087425708770752e-07, 1.816079020500183e-07, 2.123415470123291e-07, 2.430751919746399e-07, 2.738088369369507e-07, 3.045424818992615e-07, 3.3527612686157227e-07, 3.6600977182388306e-07, 3.9674341678619385e-07, 4.2747706174850464e-07, 4.5821070671081543e-07, 4.889443516731262e-07, 5.19677996635437e-07, 5.504116415977478e-07, 5.811452865600586e-07, 6.118789315223694e-07, 6.426125764846802e-07, 6.73346221446991e-07, 7.040798664093018e-07, 7.348135113716125e-07, 7.655471563339233e-07, 7.962808012962341e-07, 8.270144462585449e-07, 8.577480912208557e-07, 8.884817361831665e-07, 9.192153811454773e-07, 9.499490261077881e-07, 9.806826710700989e-07, 1.0114163160324097e-06, 1.0421499609947205e-06, 1.0728836059570312e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 6.0, 6.0, 4.0, 9.0, 10.0, 8.0, 17.0, 23.0, 41.0, 44.0, 65.0, 100.0, 135.0, 135.0, 109.0, 81.0, 47.0, 33.0, 26.0, 22.0, 20.0, 13.0, 5.0, 12.0, 8.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6575791960349306e-05, -1.591942782397382e-05, -1.5263063687598333e-05, -1.4606698641728144e-05, -1.3950334505352657e-05, -1.329397036897717e-05, -1.2637605323106982e-05, -1.1981241186731495e-05, -1.1324877050356008e-05, -1.0668512913980521e-05, -1.0012148777605034e-05, -9.355783731734846e-06, -8.699419595359359e-06, -8.043055458983872e-06, -7.386690867861034e-06, -6.730326276738197e-06, -6.07396214036271e-06, -5.417598003987223e-06, -4.761233412864385e-06, -4.1048688217415474e-06, -3.4485046853660606e-06, -2.7921403216168983e-06, -2.135775957867736e-06, -1.4794113667448983e-06, -8.230472303694114e-07, -1.6668286662024911e-07, 4.896814971289132e-07, 1.1460458608780755e-06, 1.8024102246272378e-06, 2.4587745883764e-06, 3.1151389521255624e-06, 3.7715035432484e-06, 4.427867679623887e-06, 5.084231815999374e-06, 5.7405964071222115e-06, 6.396960998245049e-06, 7.053325134620536e-06, 7.709689270996023e-06, 8.366054316866212e-06, 9.022418453241698e-06, 9.678782589617185e-06, 1.0335146725992672e-05, 1.0991510862368159e-05, 1.1647875908238348e-05, 1.2304240044613834e-05, 1.2960604180989321e-05, 1.361696922685951e-05, 1.4273333363234997e-05, 1.4929697499610484e-05, 1.558606163598597e-05, 1.6242425772361457e-05, 1.6898789908736944e-05, 1.755515404511243e-05, 1.821152000047732e-05, 1.8867884136852808e-05, 1.9524248273228295e-05, 2.0180612409603782e-05, 2.083697654597927e-05, 2.1493340682354756e-05, 2.2149704818730243e-05, 2.2806070774095133e-05, 2.346243491047062e-05, 2.4118799046846107e-05, 2.4775163183221593e-05, 2.543152731959708e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 5.0, 2.0, 4.0, 7.0, 7.0, 13.0, 6.0, 14.0, 26.0, 19.0, 24.0, 25.0, 33.0, 26.0, 34.0, 34.0, 57.0, 48.0, 40.0, 41.0, 30.0, 35.0, 40.0, 51.0, 38.0, 39.0, 33.0, 32.0, 33.0, 39.0, 34.0, 22.0, 18.0, 15.0, 11.0, 17.0, 7.0, 5.0, 7.0, 9.0, 6.0, 2.0, 6.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3626325198856648e-05, -1.3235392543720081e-05, -1.2844458979088813e-05, -1.2453526323952246e-05, -1.206259366881568e-05, -1.1671660104184411e-05, -1.1280727449047845e-05, -1.0889794793911278e-05, -1.049886122928001e-05, -1.0107928574143443e-05, -9.716995009512175e-06, -9.326062354375608e-06, -8.935129699239042e-06, -8.544197044102475e-06, -8.153263479471207e-06, -7.76233082433464e-06, -7.3713981691980734e-06, -6.980465059314156e-06, -6.589532404177589e-06, -6.198599294293672e-06, -5.807666639157105e-06, -5.416733529273188e-06, -5.02580041938927e-06, -4.634867764252704e-06, -4.243934654368786e-06, -3.853001544484869e-06, -3.462068889348302e-06, -3.0711357794643845e-06, -2.6802028969541425e-06, -2.2892700144439004e-06, -1.898336904559983e-06, -1.5074040220497409e-06, -1.1164711395394988e-06, -7.255382001858379e-07, -3.34605260832177e-07, 5.6327735364902765e-08, 4.472606178751448e-07, 8.381935003853869e-07, 1.2291266102693044e-06, 1.6200594927795464e-06, 2.0109923752897885e-06, 2.4019252578000305e-06, 2.7928581403102726e-06, 3.18379125019419e-06, 3.574724132704432e-06, 3.965657015214674e-06, 4.356590125098592e-06, 4.747523234982509e-06, 5.138455890119076e-06, 5.529389000002993e-06, 5.92032165513956e-06, 6.311254765023477e-06, 6.702187420160044e-06, 7.0931205300439615e-06, 7.484053639927879e-06, 7.874986295064446e-06, 8.265918950201012e-06, 8.656851605337579e-06, 9.047785169968847e-06, 9.438717825105414e-06, 9.82965048024198e-06, 1.0220583135378547e-05, 1.0611516700009815e-05, 1.1002449355146382e-05, 1.139338291977765e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 19.0, 20.0, 16.0, 40.0, 53.0, 103.0, 98.0, 146.0, 270.0, 291.0, 579.0, 768.0, 1090.0, 1617.0, 2455.0, 3941.0, 5869.0, 9195.0, 14685.0, 23925.0, 44580.0, 77598.0, 156496.0, 282746.0, 196441.0, 100619.0, 49024.0, 28326.0, 17104.0, 10510.0, 7040.0, 4283.0, 2762.0, 1914.0, 1277.0, 853.0, 602.0, 365.0, 288.0, 181.0, 119.0, 91.0, 49.0, 29.0, 27.0, 21.0, 6.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.153085708618164e-05, -3.056507557630539e-05, -2.9599294066429138e-05, -2.8633512556552887e-05, -2.7667731046676636e-05, -2.6701949536800385e-05, -2.5736168026924133e-05, -2.4770386517047882e-05, -2.380460500717163e-05, -2.283882349729538e-05, -2.187304198741913e-05, -2.0907260477542877e-05, -1.9941478967666626e-05, -1.8975697457790375e-05, -1.8009915947914124e-05, -1.7044134438037872e-05, -1.607835292816162e-05, -1.511257141828537e-05, -1.4146789908409119e-05, -1.3181008398532867e-05, -1.2215226888656616e-05, -1.1249445378780365e-05, -1.0283663868904114e-05, -9.317882359027863e-06, -8.352100849151611e-06, -7.38631933927536e-06, -6.420537829399109e-06, -5.454756319522858e-06, -4.4889748096466064e-06, -3.5231932997703552e-06, -2.557411789894104e-06, -1.5916302800178528e-06, -6.258487701416016e-07, 3.3993273973464966e-07, 1.3057142496109009e-06, 2.271495759487152e-06, 3.2372772693634033e-06, 4.2030587792396545e-06, 5.168840289115906e-06, 6.134621798992157e-06, 7.100403308868408e-06, 8.06618481874466e-06, 9.03196632862091e-06, 9.997747838497162e-06, 1.0963529348373413e-05, 1.1929310858249664e-05, 1.2895092368125916e-05, 1.3860873878002167e-05, 1.4826655387878418e-05, 1.579243689775467e-05, 1.675821840763092e-05, 1.772399991750717e-05, 1.8689781427383423e-05, 1.9655562937259674e-05, 2.0621344447135925e-05, 2.1587125957012177e-05, 2.2552907466888428e-05, 2.351868897676468e-05, 2.448447048664093e-05, 2.545025199651718e-05, 2.6416033506393433e-05, 2.7381815016269684e-05, 2.8347596526145935e-05, 2.9313378036022186e-05, 3.0279159545898438e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 2.0, 4.0, 8.0, 5.0, 11.0, 9.0, 10.0, 18.0, 20.0, 23.0, 30.0, 23.0, 28.0, 35.0, 45.0, 44.0, 52.0, 52.0, 45.0, 39.0, 38.0, 40.0, 55.0, 50.0, 40.0, 31.0, 36.0, 28.0, 35.0, 21.0, 18.0, 23.0, 9.0, 9.0, 17.0, 6.0, 10.0, 5.0, 4.0, 4.0, 3.0, 6.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.2755393981933594e-05, -1.239776611328125e-05, -1.2040138244628906e-05, -1.1682510375976562e-05, -1.1324882507324219e-05, -1.0967254638671875e-05, -1.0609626770019531e-05, -1.0251998901367188e-05, -9.894371032714844e-06, -9.5367431640625e-06, -9.179115295410156e-06, -8.821487426757812e-06, -8.463859558105469e-06, -8.106231689453125e-06, -7.748603820800781e-06, -7.3909759521484375e-06, -7.033348083496094e-06, -6.67572021484375e-06, -6.318092346191406e-06, -5.9604644775390625e-06, -5.602836608886719e-06, -5.245208740234375e-06, -4.887580871582031e-06, -4.5299530029296875e-06, -4.172325134277344e-06, -3.814697265625e-06, -3.4570693969726562e-06, -3.0994415283203125e-06, -2.7418136596679688e-06, -2.384185791015625e-06, -2.0265579223632812e-06, -1.6689300537109375e-06, -1.3113021850585938e-06, -9.5367431640625e-07, -5.960464477539062e-07, -2.384185791015625e-07, 1.1920928955078125e-07, 4.76837158203125e-07, 8.344650268554688e-07, 1.1920928955078125e-06, 1.5497207641601562e-06, 1.9073486328125e-06, 2.2649765014648438e-06, 2.6226043701171875e-06, 2.9802322387695312e-06, 3.337860107421875e-06, 3.6954879760742188e-06, 4.0531158447265625e-06, 4.410743713378906e-06, 4.76837158203125e-06, 5.125999450683594e-06, 5.4836273193359375e-06, 5.841255187988281e-06, 6.198883056640625e-06, 6.556510925292969e-06, 6.9141387939453125e-06, 7.271766662597656e-06, 7.62939453125e-06, 7.987022399902344e-06, 8.344650268554688e-06, 8.702278137207031e-06, 9.059906005859375e-06, 9.417533874511719e-06, 9.775161743164062e-06, 1.0132789611816406e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 4.0, 10.0, 7.0, 17.0, 26.0, 40.0, 74.0, 116.0, 198.0, 320.0, 543.0, 1001.0, 1548.0, 2939.0, 4991.0, 9082.0, 17061.0, 31153.0, 69930.0, 193102.0, 417546.0, 165173.0, 66966.0, 30977.0, 16146.0, 8545.0, 4450.0, 2760.0, 1605.0, 922.0, 550.0, 290.0, 170.0, 116.0, 60.0, 36.0, 25.0, 16.0, 10.0, 10.0, 7.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.409385681152344e-05, -3.297440707683563e-05, -3.185495734214783e-05, -3.073550760746002e-05, -2.9616057872772217e-05, -2.849660813808441e-05, -2.7377158403396606e-05, -2.62577086687088e-05, -2.5138258934020996e-05, -2.401880919933319e-05, -2.2899359464645386e-05, -2.177990972995758e-05, -2.0660459995269775e-05, -1.954101026058197e-05, -1.8421560525894165e-05, -1.730211079120636e-05, -1.6182661056518555e-05, -1.506321132183075e-05, -1.3943761587142944e-05, -1.282431185245514e-05, -1.1704862117767334e-05, -1.0585412383079529e-05, -9.465962648391724e-06, -8.346512913703918e-06, -7.227063179016113e-06, -6.107613444328308e-06, -4.988163709640503e-06, -3.868713974952698e-06, -2.7492642402648926e-06, -1.6298145055770874e-06, -5.103647708892822e-07, 6.09084963798523e-07, 1.7285346984863281e-06, 2.8479844331741333e-06, 3.9674341678619385e-06, 5.086883902549744e-06, 6.206333637237549e-06, 7.325783371925354e-06, 8.44523310661316e-06, 9.564682841300964e-06, 1.068413257598877e-05, 1.1803582310676575e-05, 1.292303204536438e-05, 1.4042481780052185e-05, 1.516193151473999e-05, 1.6281381249427795e-05, 1.74008309841156e-05, 1.8520280718803406e-05, 1.963973045349121e-05, 2.0759180188179016e-05, 2.187862992286682e-05, 2.2998079657554626e-05, 2.411752939224243e-05, 2.5236979126930237e-05, 2.6356428861618042e-05, 2.7475878596305847e-05, 2.8595328330993652e-05, 2.9714778065681458e-05, 3.083422780036926e-05, 3.195367753505707e-05, 3.307312726974487e-05, 3.419257700443268e-05, 3.5312026739120483e-05, 3.643147647380829e-05, 3.7550926208496094e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 6.0, 4.0, 6.0, 6.0, 3.0, 13.0, 16.0, 4.0, 15.0, 12.0, 14.0, 22.0, 26.0, 30.0, 32.0, 27.0, 42.0, 34.0, 36.0, 42.0, 62.0, 50.0, 40.0, 39.0, 49.0, 49.0, 43.0, 34.0, 32.0, 36.0, 24.0, 22.0, 17.0, 24.0, 13.0, 15.0, 15.0, 13.0, 12.0, 6.0, 5.0, 3.0, 3.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.715557098388672e-06, -9.432435035705566e-06, -9.149312973022461e-06, -8.866190910339355e-06, -8.58306884765625e-06, -8.299946784973145e-06, -8.016824722290039e-06, -7.733702659606934e-06, -7.450580596923828e-06, -7.167458534240723e-06, -6.884336471557617e-06, -6.601214408874512e-06, -6.318092346191406e-06, -6.034970283508301e-06, -5.751848220825195e-06, -5.46872615814209e-06, -5.185604095458984e-06, -4.902482032775879e-06, -4.6193599700927734e-06, -4.336237907409668e-06, -4.0531158447265625e-06, -3.769993782043457e-06, -3.4868717193603516e-06, -3.203749656677246e-06, -2.9206275939941406e-06, -2.637505531311035e-06, -2.3543834686279297e-06, -2.0712614059448242e-06, -1.7881393432617188e-06, -1.5050172805786133e-06, -1.2218952178955078e-06, -9.387731552124023e-07, -6.556510925292969e-07, -3.725290298461914e-07, -8.940696716308594e-08, 1.9371509552001953e-07, 4.76837158203125e-07, 7.599592208862305e-07, 1.043081283569336e-06, 1.3262033462524414e-06, 1.6093254089355469e-06, 1.8924474716186523e-06, 2.175569534301758e-06, 2.4586915969848633e-06, 2.7418136596679688e-06, 3.0249357223510742e-06, 3.3080577850341797e-06, 3.591179847717285e-06, 3.874301910400391e-06, 4.157423973083496e-06, 4.4405460357666016e-06, 4.723668098449707e-06, 5.0067901611328125e-06, 5.289912223815918e-06, 5.5730342864990234e-06, 5.856156349182129e-06, 6.139278411865234e-06, 6.42240047454834e-06, 6.705522537231445e-06, 6.988644599914551e-06, 7.271766662597656e-06, 7.554888725280762e-06, 7.838010787963867e-06, 8.121132850646973e-06, 8.404254913330078e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 8.0, 6.0, 11.0, 17.0, 21.0, 24.0, 44.0, 54.0, 73.0, 143.0, 229.0, 314.0, 643.0, 1289.0, 2745.0, 6512.0, 18508.0, 76741.0, 833973.0, 76697.0, 18360.0, 6361.0, 2869.0, 1335.0, 616.0, 320.0, 228.0, 137.0, 59.0, 62.0, 48.0, 28.0, 20.0, 18.0, 12.0, 10.0, 6.0, 11.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6093254089355469e-06, -1.5506520867347717e-06, -1.4919787645339966e-06, -1.4333054423332214e-06, -1.3746321201324463e-06, -1.3159587979316711e-06, -1.257285475730896e-06, -1.1986121535301208e-06, -1.1399388313293457e-06, -1.0812655091285706e-06, -1.0225921869277954e-06, -9.639188647270203e-07, -9.052455425262451e-07, -8.4657222032547e-07, -7.878988981246948e-07, -7.292255759239197e-07, -6.705522537231445e-07, -6.118789315223694e-07, -5.532056093215942e-07, -4.945322871208191e-07, -4.3585896492004395e-07, -3.771856427192688e-07, -3.1851232051849365e-07, -2.598389983177185e-07, -2.0116567611694336e-07, -1.424923539161682e-07, -8.381903171539307e-08, -2.514570951461792e-08, 3.3527612686157227e-08, 9.220093488693237e-08, 1.5087425708770752e-07, 2.0954757928848267e-07, 2.682209014892578e-07, 3.2689422369003296e-07, 3.855675458908081e-07, 4.4424086809158325e-07, 5.029141902923584e-07, 5.615875124931335e-07, 6.202608346939087e-07, 6.789341568946838e-07, 7.37607479095459e-07, 7.962808012962341e-07, 8.549541234970093e-07, 9.136274456977844e-07, 9.723007678985596e-07, 1.0309740900993347e-06, 1.0896474123001099e-06, 1.148320734500885e-06, 1.2069940567016602e-06, 1.2656673789024353e-06, 1.3243407011032104e-06, 1.3830140233039856e-06, 1.4416873455047607e-06, 1.5003606677055359e-06, 1.559033989906311e-06, 1.6177073121070862e-06, 1.6763806343078613e-06, 1.7350539565086365e-06, 1.7937272787094116e-06, 1.8524006009101868e-06, 1.911073923110962e-06, 1.969747245311737e-06, 2.028420567512512e-06, 2.0870938897132874e-06, 2.1457672119140625e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 19.0, 0.0, 0.0, 0.0, 0.0, 44.0, 0.0, 0.0, 0.0, 886.0, 0.0, 0.0, 0.0, 0.0, 38.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.830079317092896e-07, -5.699694156646729e-07, -5.569308996200562e-07, -5.438923835754395e-07, -5.308538675308228e-07, -5.178153514862061e-07, -5.047768354415894e-07, -4.917383193969727e-07, -4.78699803352356e-07, -4.6566128730773926e-07, -4.5262277126312256e-07, -4.3958425521850586e-07, -4.2654573917388916e-07, -4.1350722312927246e-07, -4.0046870708465576e-07, -3.8743019104003906e-07, -3.7439167499542236e-07, -3.6135315895080566e-07, -3.4831464290618896e-07, -3.3527612686157227e-07, -3.2223761081695557e-07, -3.0919909477233887e-07, -2.9616057872772217e-07, -2.8312206268310547e-07, -2.7008354663848877e-07, -2.5704503059387207e-07, -2.4400651454925537e-07, -2.3096799850463867e-07, -2.1792948246002197e-07, -2.0489096641540527e-07, -1.9185245037078857e-07, -1.7881393432617188e-07, -1.6577541828155518e-07, -1.5273690223693848e-07, -1.3969838619232178e-07, -1.2665987014770508e-07, -1.1362135410308838e-07, -1.0058283805847168e-07, -8.754432201385498e-08, -7.450580596923828e-08, -6.146728992462158e-08, -4.842877388000488e-08, -3.5390257835388184e-08, -2.2351741790771484e-08, -9.313225746154785e-09, 3.725290298461914e-09, 1.6763806343078613e-08, 2.9802322387695312e-08, 4.284083843231201e-08, 5.587935447692871e-08, 6.891787052154541e-08, 8.195638656616211e-08, 9.499490261077881e-08, 1.0803341865539551e-07, 1.210719347000122e-07, 1.341104507446289e-07, 1.471489667892456e-07, 1.601874828338623e-07, 1.73225998878479e-07, 1.862645149230957e-07, 1.993030309677124e-07, 2.123415470123291e-07, 2.253800630569458e-07, 2.384185791015625e-07]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 3.0, 15.0, 16.0, 21.0, 33.0, 0.0, 50.0, 80.0, 162.0, 210.0, 348.0, 697.0, 1615.0, 3593.0, 15271.0, 68661.0, 866754.0, 68865.0, 0.0, 15284.0, 3682.0, 1546.0, 698.0, 354.0, 188.0, 154.0, 88.0, 56.0, 44.0, 22.0, 18.0, 0.0, 10.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0265579223632812e-06, -1.971609890460968e-06, -1.9166618585586548e-06, -1.8617138266563416e-06, -1.8067657947540283e-06, -1.751817762851715e-06, -1.6968697309494019e-06, -1.6419216990470886e-06, -1.5869736671447754e-06, -1.5320256352424622e-06, -1.477077603340149e-06, -1.4221295714378357e-06, -1.3671815395355225e-06, -1.3122335076332092e-06, -1.257285475730896e-06, -1.2023374438285828e-06, -1.1473894119262695e-06, -1.0924413800239563e-06, -1.037493348121643e-06, -9.825453162193298e-07, -9.275972843170166e-07, -8.726492524147034e-07, -8.177012205123901e-07, -7.627531886100769e-07, -7.078051567077637e-07, -6.528571248054504e-07, -5.979090929031372e-07, -5.42961061000824e-07, -4.880130290985107e-07, -4.330649971961975e-07, -3.781169652938843e-07, -3.2316893339157104e-07, -2.682209014892578e-07, -2.1327286958694458e-07, -1.5832483768463135e-07, -1.0337680578231812e-07, -4.842877388000488e-08, 6.51925802230835e-09, 6.146728992462158e-08, 1.1641532182693481e-07, 1.7136335372924805e-07, 2.2631138563156128e-07, 2.812594175338745e-07, 3.3620744943618774e-07, 3.91155481338501e-07, 4.461035132408142e-07, 5.010515451431274e-07, 5.559995770454407e-07, 6.109476089477539e-07, 6.658956408500671e-07, 7.208436727523804e-07, 7.757917046546936e-07, 8.307397365570068e-07, 8.856877684593201e-07, 9.406358003616333e-07, 9.955838322639465e-07, 1.0505318641662598e-06, 1.105479896068573e-06, 1.1604279279708862e-06, 1.2153759598731995e-06, 1.2703239917755127e-06, 1.325272023677826e-06, 1.3802200555801392e-06, 1.4351680874824524e-06, 1.4901161193847656e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 118.0, 0.0, 0.0, 0.0, 0.0, 711.0, 0.0, 0.0, 0.0, 0.0, 130.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.4458935260772705e-07, -3.3155083656311035e-07, -3.1851232051849365e-07, -3.0547380447387695e-07, -2.9243528842926025e-07, -2.7939677238464355e-07, -2.6635825634002686e-07, -2.5331974029541016e-07, -2.4028122425079346e-07, -2.2724270820617676e-07, -2.1420419216156006e-07, -2.0116567611694336e-07, -1.8812716007232666e-07, -1.7508864402770996e-07, -1.6205012798309326e-07, -1.4901161193847656e-07, -1.3597309589385986e-07, -1.2293457984924316e-07, -1.0989606380462646e-07, -9.685754776000977e-08, -8.381903171539307e-08, -7.078051567077637e-08, -5.774199962615967e-08, -4.470348358154297e-08, -3.166496753692627e-08, -1.862645149230957e-08, -5.587935447692871e-09, 7.450580596923828e-09, 2.0489096641540527e-08, 3.3527612686157227e-08, 4.6566128730773926e-08, 5.960464477539063e-08, 7.264316082000732e-08, 8.568167686462402e-08, 9.872019290924072e-08, 1.1175870895385742e-07, 1.2479722499847412e-07, 1.3783574104309082e-07, 1.5087425708770752e-07, 1.6391277313232422e-07, 1.7695128917694092e-07, 1.8998980522155762e-07, 2.0302832126617432e-07, 2.1606683731079102e-07, 2.2910535335540771e-07, 2.421438694000244e-07, 2.551823854446411e-07, 2.682209014892578e-07, 2.812594175338745e-07, 2.942979335784912e-07, 3.073364496231079e-07, 3.203749656677246e-07, 3.334134817123413e-07, 3.46451997756958e-07, 3.594905138015747e-07, 3.725290298461914e-07, 3.855675458908081e-07, 3.986060619354248e-07, 4.116445779800415e-07, 4.246830940246582e-07, 4.377216100692749e-07, 4.507601261138916e-07, 4.637986421585083e-07, 4.76837158203125e-07]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 7.0, 8.0, 14.0, 19.0, 11.0, 16.0, 25.0, 34.0, 37.0, 58.0, 79.0, 107.0, 148.0, 130.0, 93.0, 46.0, 29.0, 32.0, 14.0, 17.0, 16.0, 11.0, 7.0, 8.0, 4.0, 4.0, 3.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7423095414415002e-05, -1.688692827883642e-05, -1.6350762962247245e-05, -1.5814595826668665e-05, -1.5278428691090085e-05, -1.4742262465006206e-05, -1.4206096238922328e-05, -1.3669929103343748e-05, -1.3133762877259869e-05, -1.259759665117599e-05, -1.206142951559741e-05, -1.1525263289513532e-05, -1.0989097063429654e-05, -1.0452929927851073e-05, -9.916763701767195e-06, -9.380597475683317e-06, -8.844430340104736e-06, -8.308264114020858e-06, -7.772096978442278e-06, -7.235930752358399e-06, -6.69976407152717e-06, -6.163597390695941e-06, -5.627431164612062e-06, -5.091264483780833e-06, -4.555097802949604e-06, -4.018931122118374e-06, -3.4827646686608205e-06, -2.9465982152032666e-06, -2.4104315343720373e-06, -1.874264853540808e-06, -1.338098400083254e-06, -8.019319466257002e-07, -2.6576708478387445e-07, 2.7039948236051714e-07, 8.065660495049087e-07, 1.3427326166493003e-06, 1.878899183793692e-06, 2.4150658646249212e-06, 2.951232318082475e-06, 3.487398771540029e-06, 4.023565452371258e-06, 4.559732133202488e-06, 5.095898814033717e-06, 5.632065040117595e-06, 6.168231720948825e-06, 6.704398401780054e-06, 7.240564627863932e-06, 7.77673085394781e-06, 8.312897989526391e-06, 8.84906421561027e-06, 9.38523135118885e-06, 9.921397577272728e-06, 1.0457564712851308e-05, 1.0993730938935187e-05, 1.1529897165019065e-05, 1.2066064300597645e-05, 1.2602230526681524e-05, 1.3138396752765402e-05, 1.3674563888343982e-05, 1.421073011442786e-05, 1.474689634051174e-05, 1.528306347609032e-05, 1.58192306116689e-05, 1.6355395928258076e-05, 1.6891563063836657e-05]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 9.0, 11.0, 9.0, 9.0, 27.0, 19.0, 22.0, 16.0, 34.0, 40.0, 29.0, 30.0, 36.0, 44.0, 34.0, 48.0, 54.0, 39.0, 41.0, 47.0, 40.0, 50.0, 42.0, 35.0, 36.0, 24.0, 27.0, 23.0, 26.0, 13.0, 21.0, 17.0, 8.0, 9.0, 7.0, 9.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3146675883035641e-05, -1.2768387932737824e-05, -1.2390100891934708e-05, -1.201181294163689e-05, -1.1633524991339073e-05, -1.1255237041041255e-05, -1.087695000023814e-05, -1.0498662049940322e-05, -1.0120375009137206e-05, -9.742087058839388e-06, -9.363800018036272e-06, -8.985512067738455e-06, -8.607224117440637e-06, -8.228937076637521e-06, -7.850649126339704e-06, -7.472361176041886e-06, -7.094073225744069e-06, -6.715785730193602e-06, -6.337497779895784e-06, -5.959210284345318e-06, -5.5809223340475e-06, -5.202634838497033e-06, -4.824347342946567e-06, -4.446059392648749e-06, -4.067771897098282e-06, -3.68948417417414e-06, -3.311196451249998e-06, -2.9329089556995314e-06, -2.5546212327753892e-06, -2.176333509851247e-06, -1.7980460143007804e-06, -1.4197582913766382e-06, -1.0414696589577943e-06, -6.63181992877071e-07, -2.8489432679634774e-07, 9.339328244095668e-08, 4.7168100536509883e-07, 8.49968728289241e-07, 1.2282562238397077e-06, 1.6065439467638498e-06, 1.984831669687992e-06, 2.363119392612134e-06, 2.7414071155362763e-06, 3.119694611086743e-06, 3.497982334010885e-06, 3.876270056935027e-06, 4.254557552485494e-06, 4.632845048035961e-06, 5.011132998333778e-06, 5.389420493884245e-06, 5.7677084441820625e-06, 6.145995939732529e-06, 6.524283890030347e-06, 6.9025713855808135e-06, 7.28085888113128e-06, 7.659146831429098e-06, 8.037433872232214e-06, 8.415721822530031e-06, 8.794008863333147e-06, 9.172296813630965e-06, 9.550584763928782e-06, 9.928871804731898e-06, 1.0307159755029716e-05, 1.0685447705327533e-05, 1.106373565562535e-05]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 11.0, 16.0, 17.0, 22.0, 34.0, 41.0, 65.0, 88.0, 132.0, 205.0, 307.0, 401.0, 659.0, 1005.0, 1533.0, 2183.0, 3776.0, 6081.0, 11648.0, 24884.0, 3219990.0, 873030.0, 22081.0, 10826.0, 5468.0, 3493.0, 2105.0, 1400.0, 903.0, 618.0, 362.0, 283.0, 192.0, 120.0, 85.0, 73.0, 45.0, 29.0, 16.0, 18.0, 13.0, 10.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.023313522338867e-05, -3.901217132806778e-05, -3.779120743274689e-05, -3.6570243537425995e-05, -3.53492796421051e-05, -3.412831574678421e-05, -3.290735185146332e-05, -3.1686387956142426e-05, -3.0465424060821533e-05, -2.924446016550064e-05, -2.802349627017975e-05, -2.6802532374858856e-05, -2.5581568479537964e-05, -2.436060458421707e-05, -2.313964068889618e-05, -2.1918676793575287e-05, -2.0697712898254395e-05, -1.9476749002933502e-05, -1.825578510761261e-05, -1.7034821212291718e-05, -1.5813857316970825e-05, -1.4592893421649933e-05, -1.337192952632904e-05, -1.2150965631008148e-05, -1.0930001735687256e-05, -9.709037840366364e-06, -8.488073945045471e-06, -7.267110049724579e-06, -6.0461461544036865e-06, -4.825182259082794e-06, -3.604218363761902e-06, -2.3832544684410095e-06, -1.1622905731201172e-06, 5.8673322200775146e-08, 1.2796372175216675e-06, 2.50060111284256e-06, 3.721565008163452e-06, 4.9425289034843445e-06, 6.163492798805237e-06, 7.384456694126129e-06, 8.605420589447021e-06, 9.826384484767914e-06, 1.1047348380088806e-05, 1.2268312275409698e-05, 1.348927617073059e-05, 1.4710240066051483e-05, 1.5931203961372375e-05, 1.7152167856693268e-05, 1.837313175201416e-05, 1.9594095647335052e-05, 2.0815059542655945e-05, 2.2036023437976837e-05, 2.325698733329773e-05, 2.4477951228618622e-05, 2.5698915123939514e-05, 2.6919879019260406e-05, 2.81408429145813e-05, 2.936180680990219e-05, 3.0582770705223083e-05, 3.1803734600543976e-05, 3.302469849586487e-05, 3.424566239118576e-05, 3.546662628650665e-05, 3.6687590181827545e-05, 3.790855407714844e-05]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 3.0, 7.0, 5.0, 11.0, 9.0, 12.0, 27.0, 15.0, 16.0, 24.0, 22.0, 25.0, 42.0, 31.0, 31.0, 25.0, 54.0, 62.0, 47.0, 56.0, 29.0, 55.0, 49.0, 41.0, 40.0, 27.0, 37.0, 29.0, 25.0, 28.0, 17.0, 18.0, 19.0, 17.0, 14.0, 5.0, 5.0, 4.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.62939453125e-06, -7.403083145618439e-06, -7.1767717599868774e-06, -6.950460374355316e-06, -6.724148988723755e-06, -6.497837603092194e-06, -6.271526217460632e-06, -6.045214831829071e-06, -5.81890344619751e-06, -5.5925920605659485e-06, -5.366280674934387e-06, -5.139969289302826e-06, -4.913657903671265e-06, -4.687346518039703e-06, -4.461035132408142e-06, -4.234723746776581e-06, -4.0084123611450195e-06, -3.7821009755134583e-06, -3.555789589881897e-06, -3.3294782042503357e-06, -3.1031668186187744e-06, -2.876855432987213e-06, -2.650544047355652e-06, -2.4242326617240906e-06, -2.1979212760925293e-06, -1.971609890460968e-06, -1.7452985048294067e-06, -1.5189871191978455e-06, -1.2926757335662842e-06, -1.066364347934723e-06, -8.400529623031616e-07, -6.137415766716003e-07, -3.8743019104003906e-07, -1.6111880540847778e-07, 6.51925802230835e-08, 2.915039658546448e-07, 5.178153514862061e-07, 7.441267371177673e-07, 9.704381227493286e-07, 1.1967495083808899e-06, 1.4230608940124512e-06, 1.6493722796440125e-06, 1.8756836652755737e-06, 2.101995050907135e-06, 2.3283064365386963e-06, 2.5546178221702576e-06, 2.780929207801819e-06, 3.00724059343338e-06, 3.2335519790649414e-06, 3.4598633646965027e-06, 3.686174750328064e-06, 3.912486135959625e-06, 4.1387975215911865e-06, 4.365108907222748e-06, 4.591420292854309e-06, 4.81773167848587e-06, 5.044043064117432e-06, 5.270354449748993e-06, 5.496665835380554e-06, 5.7229772210121155e-06, 5.949288606643677e-06, 6.175599992275238e-06, 6.401911377906799e-06, 6.628222763538361e-06, 6.854534149169922e-06]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 16.0, 9.0, 17.0, 35.0, 56.0, 78.0, 150.0, 257.0, 495.0, 1013.0, 2483.0, 5709.0, 16916.0, 82932.0, 3998178.0, 61911.0, 14661.0, 5103.0, 2198.0, 945.0, 519.0, 220.0, 152.0, 66.0, 42.0, 29.0, 19.0, 14.0, 9.0, 14.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6253204345703125e-05, -4.4733285903930664e-05, -4.32133674621582e-05, -4.169344902038574e-05, -4.017353057861328e-05, -3.865361213684082e-05, -3.713369369506836e-05, -3.56137752532959e-05, -3.409385681152344e-05, -3.2573938369750977e-05, -3.1054019927978516e-05, -2.9534101486206055e-05, -2.8014183044433594e-05, -2.6494264602661133e-05, -2.4974346160888672e-05, -2.345442771911621e-05, -2.193450927734375e-05, -2.041459083557129e-05, -1.8894672393798828e-05, -1.7374753952026367e-05, -1.5854835510253906e-05, -1.4334917068481445e-05, -1.2814998626708984e-05, -1.1295080184936523e-05, -9.775161743164062e-06, -8.255243301391602e-06, -6.735324859619141e-06, -5.21540641784668e-06, -3.6954879760742188e-06, -2.175569534301758e-06, -6.556510925292969e-07, 8.642673492431641e-07, 2.384185791015625e-06, 3.904104232788086e-06, 5.424022674560547e-06, 6.943941116333008e-06, 8.463859558105469e-06, 9.98377799987793e-06, 1.150369644165039e-05, 1.3023614883422852e-05, 1.4543533325195312e-05, 1.6063451766967773e-05, 1.7583370208740234e-05, 1.9103288650512695e-05, 2.0623207092285156e-05, 2.2143125534057617e-05, 2.3663043975830078e-05, 2.518296241760254e-05, 2.6702880859375e-05, 2.822279930114746e-05, 2.9742717742919922e-05, 3.126263618469238e-05, 3.2782554626464844e-05, 3.4302473068237305e-05, 3.5822391510009766e-05, 3.7342309951782227e-05, 3.886222839355469e-05, 4.038214683532715e-05, 4.190206527709961e-05, 4.342198371887207e-05, 4.494190216064453e-05, 4.646182060241699e-05, 4.798173904418945e-05, 4.9501657485961914e-05, 5.1021575927734375e-05]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 3.0, 5.0, 3.0, 8.0, 10.0, 6.0, 13.0, 6.0, 18.0, 19.0, 33.0, 54.0, 230.0, 679.0, 2520.0, 223.0, 106.0, 28.0, 14.0, 21.0, 7.0, 16.0, 5.0, 4.0, 5.0, 5.0, 5.0, 6.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.841255187988281e-06, -5.6335702538490295e-06, -5.425885319709778e-06, -5.218200385570526e-06, -5.010515451431274e-06, -4.802830517292023e-06, -4.595145583152771e-06, -4.387460649013519e-06, -4.179775714874268e-06, -3.972090780735016e-06, -3.764405846595764e-06, -3.5567209124565125e-06, -3.3490359783172607e-06, -3.141351044178009e-06, -2.9336661100387573e-06, -2.7259811758995056e-06, -2.518296241760254e-06, -2.310611307621002e-06, -2.1029263734817505e-06, -1.8952414393424988e-06, -1.687556505203247e-06, -1.4798715710639954e-06, -1.2721866369247437e-06, -1.064501702785492e-06, -8.568167686462402e-07, -6.491318345069885e-07, -4.414469003677368e-07, -2.337619662284851e-07, -2.60770320892334e-08, 1.816079020500183e-07, 3.8929283618927e-07, 5.969777703285217e-07, 8.046627044677734e-07, 1.0123476386070251e-06, 1.2200325727462769e-06, 1.4277175068855286e-06, 1.6354024410247803e-06, 1.843087375164032e-06, 2.0507723093032837e-06, 2.2584572434425354e-06, 2.466142177581787e-06, 2.673827111721039e-06, 2.8815120458602905e-06, 3.0891969799995422e-06, 3.296881914138794e-06, 3.5045668482780457e-06, 3.7122517824172974e-06, 3.919936716556549e-06, 4.127621650695801e-06, 4.3353065848350525e-06, 4.542991518974304e-06, 4.750676453113556e-06, 4.958361387252808e-06, 5.166046321392059e-06, 5.373731255531311e-06, 5.581416189670563e-06, 5.7891011238098145e-06, 5.996786057949066e-06, 6.204470992088318e-06, 6.41215592622757e-06, 6.619840860366821e-06, 6.827525794506073e-06, 7.035210728645325e-06, 7.242895662784576e-06, 7.450580596923828e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 7.0, 9.0, 8.0, 13.0, 13.0, 21.0, 18.0, 27.0, 26.0, 49.0, 72.0, 91.0, 95.0, 115.0, 97.0, 75.0, 58.0, 37.0, 40.0, 26.0, 29.0, 18.0, 14.0, 8.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.2182227692392189e-05, -1.1837671081593726e-05, -1.1493115380289964e-05, -1.1148558769491501e-05, -1.0804002158693038e-05, -1.0459446457389276e-05, -1.0114889846590813e-05, -9.770334145287052e-06, -9.425777534488589e-06, -9.081220923690125e-06, -8.736665222386364e-06, -8.3921086115879e-06, -8.04755291028414e-06, -7.702996299485676e-06, -7.358439688687213e-06, -7.0138835326361004e-06, -6.669327376584988e-06, -6.324771220533876e-06, -5.980215064482763e-06, -5.6356584536843e-06, -5.291102297633188e-06, -4.9465461415820755e-06, -4.601989530783612e-06, -4.2574333747325e-06, -3.912877218681388e-06, -3.5683210626302753e-06, -3.2237646792054875e-06, -2.8792082957806997e-06, -2.5346521397295874e-06, -2.190095983678475e-06, -1.8455396002536872e-06, -1.5009832168288995e-06, -1.1564261512830853e-06, -8.118698815451353e-07, -4.673136118071852e-07, -1.2275734206923516e-07, 2.217989276687149e-07, 5.66355197406665e-07, 9.10911467144615e-07, 1.2554678505694028e-06, 1.6000240066205151e-06, 1.9445801626716275e-06, 2.2891365460964153e-06, 2.633692929521203e-06, 2.9782490855723154e-06, 3.3228052416234277e-06, 3.6673616250482155e-06, 4.011918008473003e-06, 4.356474164524116e-06, 4.701030320575228e-06, 5.04558647662634e-06, 5.3901430874248035e-06, 5.734699243475916e-06, 6.079255399527028e-06, 6.4238120103254914e-06, 6.768368166376604e-06, 7.112924322427716e-06, 7.4574804784788284e-06, 7.80203663452994e-06, 8.146593245328404e-06, 8.491149856126867e-06, 8.835705557430629e-06, 9.180262168229092e-06, 9.524817869532853e-06, 9.869374480331317e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 6.0, 12.0, 11.0, 19.0, 17.0, 23.0, 20.0, 26.0, 36.0, 26.0, 33.0, 34.0, 31.0, 39.0, 33.0, 49.0, 40.0, 45.0, 39.0, 41.0, 40.0, 35.0, 33.0, 32.0, 31.0, 31.0, 25.0, 17.0, 27.0, 17.0, 24.0, 19.0, 14.0, 11.0, 8.0, 14.0, 5.0, 8.0, 1.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0], "bins": [-8.500781405018643e-06, -8.262325536634307e-06, -8.023869668249972e-06, -7.785413799865637e-06, -7.546957931481302e-06, -7.308502063096967e-06, -7.070046649459982e-06, -6.831590781075647e-06, -6.593134912691312e-06, -6.354679044306977e-06, -6.1162231759226415e-06, -5.877767307538306e-06, -5.639311893901322e-06, -5.400856025516987e-06, -5.162400157132652e-06, -4.9239442887483165e-06, -4.685488420363981e-06, -4.447032551979646e-06, -4.208576683595311e-06, -3.970120815210976e-06, -3.731665174200316e-06, -3.4932093058159808e-06, -3.254753664805321e-06, -3.016297796420986e-06, -2.7778419280366506e-06, -2.5393860596523155e-06, -2.3009301912679803e-06, -2.0624745502573205e-06, -1.8240186818729853e-06, -1.5855628134886501e-06, -1.3471070587911527e-06, -1.1086513040936552e-06, -8.701945262146182e-07, -6.317387146737019e-07, -3.932829031327856e-07, -1.5482709159186925e-07, 8.362871994904708e-08, 3.2208458833338227e-07, 5.605403430308797e-07, 7.989960977283772e-07, 1.0374519661127124e-06, 1.2759078344970476e-06, 1.514363589194545e-06, 1.7528193438920425e-06, 1.9912752122763777e-06, 2.229731080660713e-06, 2.4681867216713727e-06, 2.706642590055708e-06, 2.945098458440043e-06, 3.1835543268243782e-06, 3.4220101952087134e-06, 3.660465836219373e-06, 3.898921931977384e-06, 4.137377800361719e-06, 4.375833213998703e-06, 4.6142890823830385e-06, 4.852744950767374e-06, 5.091200819151709e-06, 5.329656687536044e-06, 5.568112555920379e-06, 5.8065679695573635e-06, 6.045023837941699e-06, 6.283479706326034e-06, 6.521935574710369e-06, 6.760391443094704e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 9.0, 7.0, 10.0, 18.0, 21.0, 40.0, 36.0, 58.0, 82.0, 102.0, 142.0, 202.0, 317.0, 451.0, 676.0, 975.0, 1316.0, 2088.0, 3256.0, 5477.0, 9166.0, 16446.0, 25459.0, 55572.0, 118198.0, 315180.0, 273721.0, 106614.0, 51067.0, 25974.0, 13859.0, 8153.0, 4784.0, 3026.0, 1880.0, 1272.0, 866.0, 586.0, 411.0, 310.0, 208.0, 152.0, 116.0, 62.0, 74.0, 35.0, 29.0, 12.0, 14.0, 14.0, 2.0, 4.0, 1.0, 2.0, 3.0], "bins": [-1.6570091247558594e-05, -1.60951167345047e-05, -1.5620142221450806e-05, -1.5145167708396912e-05, -1.4670193195343018e-05, -1.4195218682289124e-05, -1.372024416923523e-05, -1.3245269656181335e-05, -1.2770295143127441e-05, -1.2295320630073547e-05, -1.1820346117019653e-05, -1.134537160396576e-05, -1.0870397090911865e-05, -1.0395422577857971e-05, -9.920448064804077e-06, -9.445473551750183e-06, -8.970499038696289e-06, -8.495524525642395e-06, -8.020550012588501e-06, -7.545575499534607e-06, -7.070600986480713e-06, -6.595626473426819e-06, -6.120651960372925e-06, -5.645677447319031e-06, -5.170702934265137e-06, -4.695728421211243e-06, -4.220753908157349e-06, -3.7457793951034546e-06, -3.2708048820495605e-06, -2.7958303689956665e-06, -2.3208558559417725e-06, -1.8458813428878784e-06, -1.3709068298339844e-06, -8.959323167800903e-07, -4.209578037261963e-07, 5.4016709327697754e-08, 5.289912223815918e-07, 1.0039657354354858e-06, 1.4789402484893799e-06, 1.953914761543274e-06, 2.428889274597168e-06, 2.903863787651062e-06, 3.378838300704956e-06, 3.85381281375885e-06, 4.328787326812744e-06, 4.803761839866638e-06, 5.278736352920532e-06, 5.753710865974426e-06, 6.22868537902832e-06, 6.703659892082214e-06, 7.178634405136108e-06, 7.653608918190002e-06, 8.128583431243896e-06, 8.60355794429779e-06, 9.078532457351685e-06, 9.553506970405579e-06, 1.0028481483459473e-05, 1.0503455996513367e-05, 1.097843050956726e-05, 1.1453405022621155e-05, 1.1928379535675049e-05, 1.2403354048728943e-05, 1.2878328561782837e-05, 1.3353303074836731e-05, 1.3828277587890625e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 5.0, 14.0, 7.0, 11.0, 13.0, 22.0, 34.0, 21.0, 27.0, 24.0, 37.0, 39.0, 25.0, 23.0, 41.0, 47.0, 52.0, 49.0, 40.0, 37.0, 43.0, 34.0, 32.0, 32.0, 28.0, 37.0, 27.0, 25.0, 25.0, 23.0, 17.0, 13.0, 15.0, 10.0, 16.0, 8.0, 7.0, 6.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-8.344650268554688e-06, -8.111819624900818e-06, -7.878988981246948e-06, -7.646158337593079e-06, -7.413327693939209e-06, -7.180497050285339e-06, -6.94766640663147e-06, -6.7148357629776e-06, -6.4820051193237305e-06, -6.249174475669861e-06, -6.016343832015991e-06, -5.783513188362122e-06, -5.550682544708252e-06, -5.317851901054382e-06, -5.085021257400513e-06, -4.852190613746643e-06, -4.6193599700927734e-06, -4.386529326438904e-06, -4.153698682785034e-06, -3.9208680391311646e-06, -3.688037395477295e-06, -3.4552067518234253e-06, -3.2223761081695557e-06, -2.989545464515686e-06, -2.7567148208618164e-06, -2.5238841772079468e-06, -2.291053533554077e-06, -2.0582228899002075e-06, -1.8253922462463379e-06, -1.5925616025924683e-06, -1.3597309589385986e-06, -1.126900315284729e-06, -8.940696716308594e-07, -6.612390279769897e-07, -4.284083843231201e-07, -1.955777406692505e-07, 3.725290298461914e-08, 2.7008354663848877e-07, 5.029141902923584e-07, 7.35744833946228e-07, 9.685754776000977e-07, 1.2014061212539673e-06, 1.434236764907837e-06, 1.6670674085617065e-06, 1.8998980522155762e-06, 2.132728695869446e-06, 2.3655593395233154e-06, 2.598389983177185e-06, 2.8312206268310547e-06, 3.0640512704849243e-06, 3.296881914138794e-06, 3.5297125577926636e-06, 3.762543201446533e-06, 3.995373845100403e-06, 4.2282044887542725e-06, 4.461035132408142e-06, 4.693865776062012e-06, 4.926696419715881e-06, 5.159527063369751e-06, 5.392357707023621e-06, 5.62518835067749e-06, 5.85801899433136e-06, 6.0908496379852295e-06, 6.323680281639099e-06, 6.556510925292969e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 11.0, 11.0, 18.0, 9.0, 18.0, 25.0, 29.0, 49.0, 70.0, 103.0, 154.0, 141.0, 241.0, 381.0, 544.0, 911.0, 1218.0, 2143.0, 3650.0, 6651.0, 13662.0, 34557.0, 100760.0, 700837.0, 113418.0, 35406.0, 16267.0, 7068.0, 3898.0, 2216.0, 1319.0, 905.0, 572.0, 388.0, 250.0, 165.0, 110.0, 101.0, 70.0, 45.0, 34.0, 28.0, 22.0, 16.0, 12.0, 9.0, 11.0, 5.0, 3.0, 5.0, 2.0, 5.0, 2.0], "bins": [-2.5093555450439453e-05, -2.436712384223938e-05, -2.3640692234039307e-05, -2.2914260625839233e-05, -2.218782901763916e-05, -2.1461397409439087e-05, -2.0734965801239014e-05, -2.000853419303894e-05, -1.9282102584838867e-05, -1.8555670976638794e-05, -1.782923936843872e-05, -1.7102807760238647e-05, -1.6376376152038574e-05, -1.56499445438385e-05, -1.4923512935638428e-05, -1.4197081327438354e-05, -1.3470649719238281e-05, -1.2744218111038208e-05, -1.2017786502838135e-05, -1.1291354894638062e-05, -1.0564923286437988e-05, -9.838491678237915e-06, -9.112060070037842e-06, -8.385628461837769e-06, -7.659196853637695e-06, -6.932765245437622e-06, -6.206333637237549e-06, -5.479902029037476e-06, -4.753470420837402e-06, -4.027038812637329e-06, -3.300607204437256e-06, -2.5741755962371826e-06, -1.8477439880371094e-06, -1.1213123798370361e-06, -3.948807716369629e-07, 3.3155083656311035e-07, 1.0579824447631836e-06, 1.7844140529632568e-06, 2.51084566116333e-06, 3.2372772693634033e-06, 3.9637088775634766e-06, 4.69014048576355e-06, 5.416572093963623e-06, 6.143003702163696e-06, 6.8694353103637695e-06, 7.595866918563843e-06, 8.322298526763916e-06, 9.04873013496399e-06, 9.775161743164062e-06, 1.0501593351364136e-05, 1.1228024959564209e-05, 1.1954456567764282e-05, 1.2680888175964355e-05, 1.3407319784164429e-05, 1.4133751392364502e-05, 1.4860183000564575e-05, 1.558661460876465e-05, 1.631304621696472e-05, 1.7039477825164795e-05, 1.7765909433364868e-05, 1.849234104156494e-05, 1.9218772649765015e-05, 1.9945204257965088e-05, 2.067163586616516e-05, 2.1398067474365234e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 2.0, 11.0, 2.0, 10.0, 7.0, 11.0, 10.0, 4.0, 19.0, 9.0, 19.0, 15.0, 35.0, 14.0, 28.0, 25.0, 45.0, 38.0, 32.0, 51.0, 177.0, 53.0, 36.0, 52.0, 26.0, 34.0, 26.0, 40.0, 18.0, 21.0, 22.0, 16.0, 16.0, 10.0, 7.0, 11.0, 10.0, 4.0, 16.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.0067901611328125e-06, -4.860572516918182e-06, -4.714354872703552e-06, -4.568137228488922e-06, -4.421919584274292e-06, -4.275701940059662e-06, -4.129484295845032e-06, -3.983266651630402e-06, -3.8370490074157715e-06, -3.6908313632011414e-06, -3.5446137189865112e-06, -3.398396074771881e-06, -3.252178430557251e-06, -3.105960786342621e-06, -2.9597431421279907e-06, -2.8135254979133606e-06, -2.6673078536987305e-06, -2.5210902094841003e-06, -2.3748725652694702e-06, -2.22865492105484e-06, -2.08243727684021e-06, -1.93621963262558e-06, -1.7900019884109497e-06, -1.6437843441963196e-06, -1.4975666999816895e-06, -1.3513490557670593e-06, -1.2051314115524292e-06, -1.058913767337799e-06, -9.126961231231689e-07, -7.664784789085388e-07, -6.202608346939087e-07, -4.7404319047927856e-07, -3.2782554626464844e-07, -1.816079020500183e-07, -3.5390257835388184e-08, 1.1082738637924194e-07, 2.5704503059387207e-07, 4.032626748085022e-07, 5.494803190231323e-07, 6.956979632377625e-07, 8.419156074523926e-07, 9.881332516670227e-07, 1.1343508958816528e-06, 1.280568540096283e-06, 1.426786184310913e-06, 1.5730038285255432e-06, 1.7192214727401733e-06, 1.8654391169548035e-06, 2.0116567611694336e-06, 2.1578744053840637e-06, 2.304092049598694e-06, 2.450309693813324e-06, 2.596527338027954e-06, 2.7427449822425842e-06, 2.8889626264572144e-06, 3.0351802706718445e-06, 3.1813979148864746e-06, 3.3276155591011047e-06, 3.473833203315735e-06, 3.620050847530365e-06, 3.766268491744995e-06, 3.912486135959625e-06, 4.058703780174255e-06, 4.2049214243888855e-06, 4.351139068603516e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 10.0, 9.0, 23.0, 29.0, 29.0, 35.0, 59.0, 77.0, 136.0, 183.0, 328.0, 487.0, 912.0, 1256.0, 2911.0, 6125.0, 11774.0, 56406.0, 887420.0, 55994.0, 11566.0, 6198.0, 2572.0, 1661.0, 844.0, 569.0, 276.0, 209.0, 93.0, 104.0, 64.0, 57.0, 47.0, 24.0, 11.0, 12.0, 3.0, 7.0, 10.0, 13.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-1.1682510375976562e-05, -1.1353753507137299e-05, -1.1024996638298035e-05, -1.069623976945877e-05, -1.0367482900619507e-05, -1.0038726031780243e-05, -9.709969162940979e-06, -9.381212294101715e-06, -9.052455425262451e-06, -8.723698556423187e-06, -8.394941687583923e-06, -8.06618481874466e-06, -7.737427949905396e-06, -7.408671081066132e-06, -7.079914212226868e-06, -6.751157343387604e-06, -6.42240047454834e-06, -6.093643605709076e-06, -5.764886736869812e-06, -5.436129868030548e-06, -5.107372999191284e-06, -4.77861613035202e-06, -4.449859261512756e-06, -4.1211023926734924e-06, -3.7923455238342285e-06, -3.4635886549949646e-06, -3.1348317861557007e-06, -2.8060749173164368e-06, -2.477318048477173e-06, -2.148561179637909e-06, -1.819804310798645e-06, -1.491047441959381e-06, -1.1622905731201172e-06, -8.335337042808533e-07, -5.047768354415894e-07, -1.7601996660232544e-07, 1.5273690223693848e-07, 4.814937710762024e-07, 8.102506399154663e-07, 1.1390075087547302e-06, 1.4677643775939941e-06, 1.796521246433258e-06, 2.125278115272522e-06, 2.454034984111786e-06, 2.78279185295105e-06, 3.1115487217903137e-06, 3.4403055906295776e-06, 3.7690624594688416e-06, 4.0978193283081055e-06, 4.426576197147369e-06, 4.755333065986633e-06, 5.084089934825897e-06, 5.412846803665161e-06, 5.741603672504425e-06, 6.070360541343689e-06, 6.399117410182953e-06, 6.727874279022217e-06, 7.056631147861481e-06, 7.385388016700745e-06, 7.714144885540009e-06, 8.042901754379272e-06, 8.371658623218536e-06, 8.7004154920578e-06, 9.029172360897064e-06, 9.357929229736328e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 2.0, 0.0, 8.0, 0.0, 9.0, 0.0, 12.0, 0.0, 17.0, 0.0, 23.0, 0.0, 38.0, 0.0, 60.0, 0.0, 78.0, 0.0, 508.0, 0.0, 98.0, 0.0, 58.0, 0.0, 25.0, 0.0, 25.0, 0.0, 18.0, 0.0, 11.0, 0.0, 6.0, 0.0, 8.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07, 9.238719940185547e-07, 9.5367431640625e-07, 9.834766387939453e-07, 1.0132789611816406e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 8.0, 5.0, 10.0, 18.0, 33.0, 50.0, 53.0, 109.0, 190.0, 315.0, 703.0, 1473.0, 2851.0, 8119.0, 21733.0, 200304.0, 769319.0, 27014.0, 9679.0, 3593.0, 1354.0, 718.0, 337.0, 205.0, 126.0, 71.0, 50.0, 28.0, 12.0, 19.0, 9.0, 8.0, 10.0, 4.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3053417205810547e-05, -1.2658536434173584e-05, -1.2263655662536621e-05, -1.1868774890899658e-05, -1.1473894119262695e-05, -1.1079013347625732e-05, -1.068413257598877e-05, -1.0289251804351807e-05, -9.894371032714844e-06, -9.499490261077881e-06, -9.104609489440918e-06, -8.709728717803955e-06, -8.314847946166992e-06, -7.91996717453003e-06, -7.525086402893066e-06, -7.1302056312561035e-06, -6.735324859619141e-06, -6.340444087982178e-06, -5.945563316345215e-06, -5.550682544708252e-06, -5.155801773071289e-06, -4.760921001434326e-06, -4.366040229797363e-06, -3.9711594581604e-06, -3.5762786865234375e-06, -3.1813979148864746e-06, -2.7865171432495117e-06, -2.391636371612549e-06, -1.996755599975586e-06, -1.601874828338623e-06, -1.2069940567016602e-06, -8.121132850646973e-07, -4.172325134277344e-07, -2.2351741790771484e-08, 3.725290298461914e-07, 7.674098014831543e-07, 1.1622905731201172e-06, 1.55717134475708e-06, 1.952052116394043e-06, 2.346932888031006e-06, 2.7418136596679688e-06, 3.1366944313049316e-06, 3.5315752029418945e-06, 3.926455974578857e-06, 4.32133674621582e-06, 4.716217517852783e-06, 5.111098289489746e-06, 5.505979061126709e-06, 5.900859832763672e-06, 6.295740604400635e-06, 6.690621376037598e-06, 7.0855021476745605e-06, 7.4803829193115234e-06, 7.875263690948486e-06, 8.27014446258545e-06, 8.665025234222412e-06, 9.059906005859375e-06, 9.454786777496338e-06, 9.8496675491333e-06, 1.0244548320770264e-05, 1.0639429092407227e-05, 1.103430986404419e-05, 1.1429190635681152e-05, 1.1824071407318115e-05, 1.2218952178955078e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 8.0, 7.0, 10.0, 0.0, 7.0, 10.0, 21.0, 23.0, 43.0, 38.0, 70.0, 477.0, 0.0, 73.0, 45.0, 43.0, 28.0, 11.0, 12.0, 17.0, 6.0, 0.0, 8.0, 5.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9073486328125e-06, -1.8542632460594177e-06, -1.8011778593063354e-06, -1.7480924725532532e-06, -1.695007085800171e-06, -1.6419216990470886e-06, -1.5888363122940063e-06, -1.535750925540924e-06, -1.4826655387878418e-06, -1.4295801520347595e-06, -1.3764947652816772e-06, -1.323409378528595e-06, -1.2703239917755127e-06, -1.2172386050224304e-06, -1.1641532182693481e-06, -1.1110678315162659e-06, -1.0579824447631836e-06, -1.0048970580101013e-06, -9.51811671257019e-07, -8.987262845039368e-07, -8.456408977508545e-07, -7.925555109977722e-07, -7.394701242446899e-07, -6.863847374916077e-07, -6.332993507385254e-07, -5.802139639854431e-07, -5.271285772323608e-07, -4.7404319047927856e-07, -4.209578037261963e-07, -3.67872416973114e-07, -3.1478703022003174e-07, -2.6170164346694946e-07, -2.086162567138672e-07, -1.555308699607849e-07, -1.0244548320770264e-07, -4.936009645462036e-08, 3.725290298461914e-09, 5.681067705154419e-08, 1.0989606380462646e-07, 1.6298145055770874e-07, 2.1606683731079102e-07, 2.691522240638733e-07, 3.2223761081695557e-07, 3.7532299757003784e-07, 4.284083843231201e-07, 4.814937710762024e-07, 5.345791578292847e-07, 5.876645445823669e-07, 6.407499313354492e-07, 6.938353180885315e-07, 7.469207048416138e-07, 8.00006091594696e-07, 8.530914783477783e-07, 9.061768651008606e-07, 9.592622518539429e-07, 1.0123476386070251e-06, 1.0654330253601074e-06, 1.1185184121131897e-06, 1.171603798866272e-06, 1.2246891856193542e-06, 1.2777745723724365e-06, 1.3308599591255188e-06, 1.383945345878601e-06, 1.4370307326316833e-06, 1.4901161193847656e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 9.0, 9.0, 9.0, 10.0, 11.0, 15.0, 33.0, 27.0, 32.0, 53.0, 61.0, 80.0, 101.0, 140.0, 101.0, 69.0, 39.0, 45.0, 35.0, 26.0, 26.0, 14.0, 14.0, 9.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.078967579815071e-05, -1.0464242222951725e-05, -1.0138809557247441e-05, -9.813375982048456e-06, -9.487943316344172e-06, -9.162509741145186e-06, -8.8370761659462e-06, -8.511643500241917e-06, -8.186210834537633e-06, -7.860777259338647e-06, -7.535344593634363e-06, -7.209911018435378e-06, -6.884478352731094e-06, -6.559044777532108e-06, -6.233611657080473e-06, -5.908178536628839e-06, -5.582744961429853e-06, -5.257311840978218e-06, -4.9318787205265835e-06, -4.606445145327598e-06, -4.281012479623314e-06, -3.955578904424328e-06, -3.6301457839726936e-06, -3.304712663521059e-06, -2.979279543069424e-06, -2.6538464226177894e-06, -2.3284133021661546e-06, -2.0029799543408444e-06, -1.6775468338892097e-06, -1.352113713437575e-06, -1.0266803656122647e-06, -7.0124724516063e-07, -3.7581321521429345e-07, -5.038003791923984e-08, 2.7505313937581377e-07, 6.004863735142862e-07, 9.25919493965921e-07, 1.2513526144175557e-06, 1.576785962242866e-06, 1.9022190826945007e-06, 2.2276522031461354e-06, 2.55308532359777e-06, 2.878518444049405e-06, 3.203951791874715e-06, 3.52938491232635e-06, 3.854817805404309e-06, 4.180251380603295e-06, 4.5056845010549296e-06, 4.831117621506564e-06, 5.156550741958199e-06, 5.481983862409834e-06, 5.8074174376088195e-06, 6.132850103313103e-06, 6.458283678512089e-06, 6.783716798963724e-06, 7.1091499194153585e-06, 7.434583039866993e-06, 7.760016160318628e-06, 8.085449735517614e-06, 8.410882401221897e-06, 8.736315976420883e-06, 9.061748642125167e-06, 9.387182217324153e-06, 9.712615792523138e-06, 1.0038048458227422e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 6.0, 5.0, 5.0, 4.0, 6.0, 10.0, 18.0, 15.0, 24.0, 23.0, 24.0, 20.0, 34.0, 36.0, 32.0, 44.0, 39.0, 34.0, 35.0, 48.0, 36.0, 53.0, 40.0, 45.0, 33.0, 31.0, 31.0, 31.0, 29.0, 27.0, 25.0, 26.0, 18.0, 21.0, 19.0, 19.0, 8.0, 16.0, 8.0, 6.0, 8.0, 1.0, 5.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.76297201809939e-06, -7.54152461013291e-06, -7.320077202166431e-06, -7.0986293394526e-06, -6.8771819314861204e-06, -6.655734523519641e-06, -6.434287115553161e-06, -6.212839252839331e-06, -5.991391844872851e-06, -5.769944436906371e-06, -5.548497028939892e-06, -5.327049166226061e-06, -5.105601758259581e-06, -4.884154350293102e-06, -4.662706942326622e-06, -4.4412590796127915e-06, -4.219811671646312e-06, -3.998364263679832e-06, -3.776916628339677e-06, -3.5554692203731975e-06, -3.3340215850330424e-06, -3.1125741770665627e-06, -2.891126769100083e-06, -2.669679133759928e-06, -2.4482319531671237e-06, -2.226784545200644e-06, -2.005336909860489e-06, -1.7838895018940093e-06, -1.5624418665538542e-06, -1.3409944585873745e-06, -1.1195469369340572e-06, -8.980994152807398e-07, -6.766517799405847e-07, -4.552042582872673e-07, -2.3375676505565934e-07, -1.2309271824051393e-08, 2.09138249829266e-07, 4.305857146391645e-07, 6.520332362924819e-07, 8.734807579457993e-07, 1.0949282795991166e-06, 1.316375801252434e-06, 1.5378233229057514e-06, 1.7592708445590688e-06, 1.9807182525255485e-06, 2.2021658878657036e-06, 2.4236132958321832e-06, 2.645060703798663e-06, 2.866508339138818e-06, 3.0879557471052976e-06, 3.3094033824454527e-06, 3.5308507904119324e-06, 3.7522984257520875e-06, 3.973746061092243e-06, 4.195193469058722e-06, 4.416640877025202e-06, 4.6380882849916816e-06, 4.859535692958161e-06, 5.080983100924641e-06, 5.3024309636384714e-06, 5.523878371604951e-06, 5.745325779571431e-06, 5.96677318753791e-06, 6.188221050251741e-06, 6.409668458218221e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 7.0, 9.0, 4.0, 9.0, 15.0, 25.0, 43.0, 52.0, 85.0, 124.0, 172.0, 291.0, 452.0, 703.0, 1185.0, 1889.0, 3297.0, 5754.0, 10552.0, 19983.0, 43725.0, 91911.0, 256484.0, 377245.0, 123349.0, 53894.0, 26167.0, 13463.0, 7322.0, 4160.0, 2493.0, 1375.0, 831.0, 524.0, 293.0, 200.0, 141.0, 92.0, 73.0, 55.0, 31.0, 23.0, 16.0, 11.0, 10.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-3.165006637573242e-05, -3.075040876865387e-05, -2.9850751161575317e-05, -2.8951093554496765e-05, -2.8051435947418213e-05, -2.715177834033966e-05, -2.625212073326111e-05, -2.5352463126182556e-05, -2.4452805519104004e-05, -2.355314791202545e-05, -2.26534903049469e-05, -2.1753832697868347e-05, -2.0854175090789795e-05, -1.9954517483711243e-05, -1.905485987663269e-05, -1.8155202269554138e-05, -1.7255544662475586e-05, -1.6355887055397034e-05, -1.545622944831848e-05, -1.455657184123993e-05, -1.3656914234161377e-05, -1.2757256627082825e-05, -1.1857599020004272e-05, -1.095794141292572e-05, -1.0058283805847168e-05, -9.158626198768616e-06, -8.258968591690063e-06, -7.359310984611511e-06, -6.459653377532959e-06, -5.559995770454407e-06, -4.6603381633758545e-06, -3.7606805562973022e-06, -2.86102294921875e-06, -1.9613653421401978e-06, -1.0617077350616455e-06, -1.6205012798309326e-07, 7.37607479095459e-07, 1.6372650861740112e-06, 2.5369226932525635e-06, 3.4365803003311157e-06, 4.336237907409668e-06, 5.23589551448822e-06, 6.1355531215667725e-06, 7.035210728645325e-06, 7.934868335723877e-06, 8.83452594280243e-06, 9.734183549880981e-06, 1.0633841156959534e-05, 1.1533498764038086e-05, 1.2433156371116638e-05, 1.333281397819519e-05, 1.4232471585273743e-05, 1.5132129192352295e-05, 1.6031786799430847e-05, 1.69314444065094e-05, 1.783110201358795e-05, 1.8730759620666504e-05, 1.9630417227745056e-05, 2.053007483482361e-05, 2.142973244190216e-05, 2.2329390048980713e-05, 2.3229047656059265e-05, 2.4128705263137817e-05, 2.502836287021637e-05, 2.5928020477294922e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 8.0, 14.0, 9.0, 9.0, 20.0, 16.0, 34.0, 12.0, 25.0, 33.0, 34.0, 43.0, 34.0, 40.0, 58.0, 30.0, 62.0, 35.0, 60.0, 34.0, 33.0, 45.0, 29.0, 36.0, 28.0, 24.0, 37.0, 16.0, 26.0, 15.0, 15.0, 16.0, 9.0, 18.0, 9.0, 4.0, 10.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.066394805908203e-06, -4.9229711294174194e-06, -4.779547452926636e-06, -4.636123776435852e-06, -4.492700099945068e-06, -4.349276423454285e-06, -4.205852746963501e-06, -4.062429070472717e-06, -3.919005393981934e-06, -3.77558171749115e-06, -3.632158041000366e-06, -3.4887343645095825e-06, -3.345310688018799e-06, -3.201887011528015e-06, -3.0584633350372314e-06, -2.9150396585464478e-06, -2.771615982055664e-06, -2.6281923055648804e-06, -2.4847686290740967e-06, -2.341344952583313e-06, -2.1979212760925293e-06, -2.0544975996017456e-06, -1.911073923110962e-06, -1.7676502466201782e-06, -1.6242265701293945e-06, -1.4808028936386108e-06, -1.3373792171478271e-06, -1.1939555406570435e-06, -1.0505318641662598e-06, -9.071081876754761e-07, -7.636845111846924e-07, -6.202608346939087e-07, -4.76837158203125e-07, -3.334134817123413e-07, -1.8998980522155762e-07, -4.6566128730773926e-08, 9.685754776000977e-08, 2.4028122425079346e-07, 3.8370490074157715e-07, 5.271285772323608e-07, 6.705522537231445e-07, 8.139759302139282e-07, 9.57399606704712e-07, 1.1008232831954956e-06, 1.2442469596862793e-06, 1.387670636177063e-06, 1.5310943126678467e-06, 1.6745179891586304e-06, 1.817941665649414e-06, 1.9613653421401978e-06, 2.1047890186309814e-06, 2.248212695121765e-06, 2.391636371612549e-06, 2.5350600481033325e-06, 2.678483724594116e-06, 2.8219074010849e-06, 2.9653310775756836e-06, 3.1087547540664673e-06, 3.252178430557251e-06, 3.3956021070480347e-06, 3.5390257835388184e-06, 3.682449460029602e-06, 3.825873136520386e-06, 3.9692968130111694e-06, 4.112720489501953e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 9.0, 17.0, 14.0, 29.0, 35.0, 60.0, 98.0, 110.0, 170.0, 274.0, 334.0, 605.0, 920.0, 1309.0, 2176.0, 3474.0, 4304.0, 7838.0, 12728.0, 21183.0, 36317.0, 65443.0, 103577.0, 296084.0, 252725.0, 104197.0, 54943.0, 27477.0, 19799.0, 11811.0, 7397.0, 4617.0, 2905.0, 1634.0, 1359.0, 870.0, 563.0, 384.0, 256.0, 133.0, 146.0, 73.0, 40.0, 38.0, 22.0, 17.0, 16.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2576580047607422e-05, -1.2169592082500458e-05, -1.1762604117393494e-05, -1.135561615228653e-05, -1.0948628187179565e-05, -1.0541640222072601e-05, -1.0134652256965637e-05, -9.727664291858673e-06, -9.320676326751709e-06, -8.913688361644745e-06, -8.50670039653778e-06, -8.099712431430817e-06, -7.692724466323853e-06, -7.2857365012168884e-06, -6.878748536109924e-06, -6.47176057100296e-06, -6.064772605895996e-06, -5.657784640789032e-06, -5.250796675682068e-06, -4.843808710575104e-06, -4.43682074546814e-06, -4.0298327803611755e-06, -3.6228448152542114e-06, -3.2158568501472473e-06, -2.808868885040283e-06, -2.401880919933319e-06, -1.994892954826355e-06, -1.5879049897193909e-06, -1.1809170246124268e-06, -7.739290595054626e-07, -3.6694109439849854e-07, 4.0046870708465576e-08, 4.470348358154297e-07, 8.540228009223938e-07, 1.261010766029358e-06, 1.667998731136322e-06, 2.074986696243286e-06, 2.4819746613502502e-06, 2.8889626264572144e-06, 3.2959505915641785e-06, 3.7029385566711426e-06, 4.109926521778107e-06, 4.516914486885071e-06, 4.923902451992035e-06, 5.330890417098999e-06, 5.737878382205963e-06, 6.144866347312927e-06, 6.551854312419891e-06, 6.9588422775268555e-06, 7.36583024263382e-06, 7.772818207740784e-06, 8.179806172847748e-06, 8.586794137954712e-06, 8.993782103061676e-06, 9.40077006816864e-06, 9.807758033275604e-06, 1.0214745998382568e-05, 1.0621733963489532e-05, 1.1028721928596497e-05, 1.143570989370346e-05, 1.1842697858810425e-05, 1.2249685823917389e-05, 1.2656673789024353e-05, 1.3063661754131317e-05, 1.3470649719238281e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 8.0, 7.0, 8.0, 2.0, 3.0, 9.0, 11.0, 16.0, 14.0, 21.0, 19.0, 30.0, 36.0, 53.0, 33.0, 41.0, 28.0, 40.0, 38.0, 59.0, 44.0, 28.0, 32.0, 38.0, 53.0, 42.0, 33.0, 35.0, 30.0, 30.0, 31.0, 18.0, 19.0, 13.0, 16.0, 16.0, 18.0, 8.0, 9.0, 2.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.993511199951172e-06, -3.86405736207962e-06, -3.734603524208069e-06, -3.6051496863365173e-06, -3.475695848464966e-06, -3.3462420105934143e-06, -3.216788172721863e-06, -3.0873343348503113e-06, -2.9578804969787598e-06, -2.8284266591072083e-06, -2.6989728212356567e-06, -2.5695189833641052e-06, -2.4400651454925537e-06, -2.310611307621002e-06, -2.1811574697494507e-06, -2.051703631877899e-06, -1.9222497940063477e-06, -1.7927959561347961e-06, -1.6633421182632446e-06, -1.5338882803916931e-06, -1.4044344425201416e-06, -1.27498060464859e-06, -1.1455267667770386e-06, -1.016072928905487e-06, -8.866190910339355e-07, -7.57165253162384e-07, -6.277114152908325e-07, -4.98257577419281e-07, -3.688037395477295e-07, -2.39349901676178e-07, -1.0989606380462646e-07, 1.955777406692505e-08, 1.4901161193847656e-07, 2.784654498100281e-07, 4.079192876815796e-07, 5.373731255531311e-07, 6.668269634246826e-07, 7.962808012962341e-07, 9.257346391677856e-07, 1.0551884770393372e-06, 1.1846423149108887e-06, 1.3140961527824402e-06, 1.4435499906539917e-06, 1.5730038285255432e-06, 1.7024576663970947e-06, 1.8319115042686462e-06, 1.9613653421401978e-06, 2.0908191800117493e-06, 2.2202730178833008e-06, 2.3497268557548523e-06, 2.479180693626404e-06, 2.6086345314979553e-06, 2.738088369369507e-06, 2.8675422072410583e-06, 2.99699604511261e-06, 3.1264498829841614e-06, 3.255903720855713e-06, 3.3853575587272644e-06, 3.514811396598816e-06, 3.6442652344703674e-06, 3.773719072341919e-06, 3.9031729102134705e-06, 4.032626748085022e-06, 4.1620805859565735e-06, 4.291534423828125e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 16.0, 0.0, 0.0, 24.0, 0.0, 0.0, 43.0, 0.0, 0.0, 64.0, 0.0, 0.0, 188.0, 0.0, 0.0, 605.0, 0.0, 0.0, 2850.0, 0.0, 0.0, 1041002.0, 0.0, 0.0, 2842.0, 0.0, 585.0, 0.0, 0.0, 198.0, 0.0, 0.0, 66.0, 0.0, 0.0, 37.0, 0.0, 0.0, 21.0, 0.0, 0.0, 13.0, 0.0, 0.0, 7.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.960464477539062e-07, -5.755573511123657e-07, -5.550682544708252e-07, -5.345791578292847e-07, -5.140900611877441e-07, -4.936009645462036e-07, -4.731118679046631e-07, -4.5262277126312256e-07, -4.3213367462158203e-07, -4.116445779800415e-07, -3.91155481338501e-07, -3.7066638469696045e-07, -3.501772880554199e-07, -3.296881914138794e-07, -3.0919909477233887e-07, -2.8870999813079834e-07, -2.682209014892578e-07, -2.477318048477173e-07, -2.2724270820617676e-07, -2.0675361156463623e-07, -1.862645149230957e-07, -1.6577541828155518e-07, -1.4528632164001465e-07, -1.2479722499847412e-07, -1.043081283569336e-07, -8.381903171539307e-08, -6.332993507385254e-08, -4.284083843231201e-08, -2.2351741790771484e-08, -1.862645149230957e-09, 1.862645149230957e-08, 3.91155481338501e-08, 5.960464477539063e-08, 8.009374141693115e-08, 1.0058283805847168e-07, 1.210719347000122e-07, 1.4156103134155273e-07, 1.6205012798309326e-07, 1.825392246246338e-07, 2.0302832126617432e-07, 2.2351741790771484e-07, 2.4400651454925537e-07, 2.644956111907959e-07, 2.849847078323364e-07, 3.0547380447387695e-07, 3.259629011154175e-07, 3.46451997756958e-07, 3.6694109439849854e-07, 3.8743019104003906e-07, 4.079192876815796e-07, 4.284083843231201e-07, 4.4889748096466064e-07, 4.6938657760620117e-07, 4.898756742477417e-07, 5.103647708892822e-07, 5.308538675308228e-07, 5.513429641723633e-07, 5.718320608139038e-07, 5.923211574554443e-07, 6.128102540969849e-07, 6.332993507385254e-07, 6.537884473800659e-07, 6.742775440216064e-07, 6.94766640663147e-07, 7.152557373046875e-07]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 408.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2688.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1042228.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2772.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 408.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1012.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 5.0, 7.0, 7.0, 15.0, 27.0, 18.0, 32.0, 52.0, 74.0, 85.0, 194.0, 171.0, 87.0, 48.0, 41.0, 26.0, 23.0, 21.0, 9.0, 10.0, 7.0, 11.0, 8.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0594035302347038e-05, -1.03144875538419e-05, -1.0034939805336762e-05, -9.755392966326326e-06, -9.475845217821188e-06, -9.19629746931605e-06, -8.916749720810913e-06, -8.637201972305775e-06, -8.357655133295339e-06, -8.0781073847902e-06, -7.798559636285063e-06, -7.519012342527276e-06, -7.239465048769489e-06, -6.959917300264351e-06, -6.680369551759213e-06, -6.400822258001426e-06, -6.121274509496288e-06, -5.8417267609911505e-06, -5.5621794672333635e-06, -5.282631718728226e-06, -5.003084424970439e-06, -4.723536676465301e-06, -4.443989382707514e-06, -4.164441634202376e-06, -3.884893885697238e-06, -3.6053463645657757e-06, -3.3257988434343133e-06, -3.0462510949291755e-06, -2.7667038011713885e-06, -2.4871560526662506e-06, -2.207608531534788e-06, -1.9280610104033258e-06, -1.6485137166455388e-06, -1.3689661955140764e-06, -1.089418674382614e-06, -8.098710395643138e-07, -5.303235184328514e-07, -2.50775997301389e-07, 2.877163751691114e-08, 3.0831915864837356e-07, 5.87866679779836e-07, 8.674142009112984e-07, 1.1469617220427608e-06, 1.426509356861061e-06, 1.7060568779925234e-06, 1.985604285437148e-06, 2.265152033942286e-06, 2.5446995550737483e-06, 2.8242470762052108e-06, 3.103794597336673e-06, 3.3833421184681356e-06, 3.6628898669732735e-06, 3.9424371607310604e-06, 4.221984909236198e-06, 4.501532202993985e-06, 4.781079951499123e-06, 5.060627700004261e-06, 5.340175448509399e-06, 5.619722742267186e-06, 5.899270490772324e-06, 6.178817784530111e-06, 6.4583655330352485e-06, 6.737913281540386e-06, 7.017460575298173e-06, 7.29700786905596e-06]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 6.0, 4.0, 7.0, 13.0, 12.0, 10.0, 9.0, 9.0, 20.0, 22.0, 18.0, 19.0, 27.0, 35.0, 36.0, 35.0, 40.0, 23.0, 46.0, 39.0, 45.0, 37.0, 36.0, 33.0, 37.0, 39.0, 33.0, 48.0, 21.0, 36.0, 32.0, 22.0, 20.0, 23.0, 21.0, 21.0, 13.0, 13.0, 6.0, 4.0, 5.0, 6.0, 6.0, 3.0, 0.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-4.13698853662936e-06, -4.000267381343292e-06, -3.863546226057224e-06, -3.7268255255185068e-06, -3.5901043702324387e-06, -3.4533832149463706e-06, -3.316662287033978e-06, -3.1799413591215853e-06, -3.043220203835517e-06, -2.906499048549449e-06, -2.7697781206370564e-06, -2.6330571927246638e-06, -2.4963360374385957e-06, -2.3596148821525276e-06, -2.222893954240135e-06, -2.0861730263277423e-06, -1.949451871041674e-06, -1.8127308294424438e-06, -1.6760097878432134e-06, -1.539288746243983e-06, -1.4025677046447527e-06, -1.2658466630455223e-06, -1.129125621446292e-06, -9.924045798470615e-07, -8.556835382478312e-07, -7.189624966486008e-07, -5.822414550493704e-07, -4.4552041345014004e-07, -3.0879937185090967e-07, -1.720783302516793e-07, -3.5357288652448915e-08, 1.0136375294678146e-07, 2.3808433979866095e-07, 3.748053813978913e-07, 5.115264229971217e-07, 6.482474645963521e-07, 7.849685061955824e-07, 9.216895477948128e-07, 1.0584105893940432e-06, 1.1951316309932736e-06, 1.331852672592504e-06, 1.4685737141917343e-06, 1.6052947557909647e-06, 1.742015797390195e-06, 1.8787368389894255e-06, 2.0154579942754935e-06, 2.152178922187886e-06, 2.288899850100279e-06, 2.425621005386347e-06, 2.562342160672415e-06, 2.6990630885848077e-06, 2.8357840164972004e-06, 2.9725051717832685e-06, 3.1092263270693365e-06, 3.245947254981729e-06, 3.382668182894122e-06, 3.51938933818019e-06, 3.656110493466258e-06, 3.7928314213786507e-06, 3.929552349291043e-06, 4.0662735045771115e-06, 4.2029946598631795e-06, 4.339715815149248e-06, 4.476436515687965e-06, 4.613157670974033e-06]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 2.0, 11.0, 19.0, 16.0, 29.0, 46.0, 67.0, 122.0, 106.0, 265.0, 234.0, 438.0, 933.0, 774.0, 1843.0, 2650.0, 3212.0, 6534.0, 7918.0, 17260.0, 31117.0, 41807.0, 105747.0, 170159.0, 2832891.0, 649929.0, 138816.0, 86370.0, 34874.0, 25148.0, 13685.0, 6398.0, 5345.0, 2700.0, 2315.0, 1457.0, 712.0, 800.0, 421.0, 257.0, 262.0, 140.0, 163.0, 79.0, 53.0, 48.0, 32.0, 25.0, 15.0, 10.0, 14.0, 6.0, 4.0, 2.0, 2.0, 2.0, 4.0], "bins": [-6.854534149169922e-06, -6.639398634433746e-06, -6.424263119697571e-06, -6.209127604961395e-06, -5.99399209022522e-06, -5.778856575489044e-06, -5.563721060752869e-06, -5.348585546016693e-06, -5.133450031280518e-06, -4.918314516544342e-06, -4.7031790018081665e-06, -4.488043487071991e-06, -4.2729079723358154e-06, -4.05777245759964e-06, -3.842636942863464e-06, -3.627501428127289e-06, -3.4123659133911133e-06, -3.1972303986549377e-06, -2.982094883918762e-06, -2.7669593691825867e-06, -2.551823854446411e-06, -2.3366883397102356e-06, -2.12155282497406e-06, -1.9064173102378845e-06, -1.691281795501709e-06, -1.4761462807655334e-06, -1.261010766029358e-06, -1.0458752512931824e-06, -8.307397365570068e-07, -6.156042218208313e-07, -4.0046870708465576e-07, -1.8533319234848022e-07, 2.9802322387695312e-08, 2.4493783712387085e-07, 4.600733518600464e-07, 6.752088665962219e-07, 8.903443813323975e-07, 1.105479896068573e-06, 1.3206154108047485e-06, 1.535750925540924e-06, 1.7508864402770996e-06, 1.966021955013275e-06, 2.1811574697494507e-06, 2.3962929844856262e-06, 2.6114284992218018e-06, 2.8265640139579773e-06, 3.041699528694153e-06, 3.2568350434303284e-06, 3.471970558166504e-06, 3.6871060729026794e-06, 3.902241587638855e-06, 4.1173771023750305e-06, 4.332512617111206e-06, 4.547648131847382e-06, 4.762783646583557e-06, 4.977919161319733e-06, 5.193054676055908e-06, 5.408190190792084e-06, 5.623325705528259e-06, 5.838461220264435e-06, 6.05359673500061e-06, 6.268732249736786e-06, 6.4838677644729614e-06, 6.699003279209137e-06, 6.9141387939453125e-06]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 11.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 48.0, 0.0, 0.0, 65.0, 0.0, 0.0, 123.0, 0.0, 0.0, 136.0, 0.0, 0.0, 0.0, 145.0, 0.0, 0.0, 156.0, 0.0, 0.0, 124.0, 0.0, 0.0, 74.0, 0.0, 0.0, 45.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 10.0, 0.0, 0.0, 7.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0], "bins": [-5.960464477539062e-07, -5.774199962615967e-07, -5.587935447692871e-07, -5.401670932769775e-07, -5.21540641784668e-07, -5.029141902923584e-07, -4.842877388000488e-07, -4.6566128730773926e-07, -4.470348358154297e-07, -4.284083843231201e-07, -4.0978193283081055e-07, -3.91155481338501e-07, -3.725290298461914e-07, -3.5390257835388184e-07, -3.3527612686157227e-07, -3.166496753692627e-07, -2.980232238769531e-07, -2.7939677238464355e-07, -2.60770320892334e-07, -2.421438694000244e-07, -2.2351741790771484e-07, -2.0489096641540527e-07, -1.862645149230957e-07, -1.6763806343078613e-07, -1.4901161193847656e-07, -1.30385160446167e-07, -1.1175870895385742e-07, -9.313225746154785e-08, -7.450580596923828e-08, -5.587935447692871e-08, -3.725290298461914e-08, -1.862645149230957e-08, 0.0, 1.862645149230957e-08, 3.725290298461914e-08, 5.587935447692871e-08, 7.450580596923828e-08, 9.313225746154785e-08, 1.1175870895385742e-07, 1.30385160446167e-07, 1.4901161193847656e-07, 1.6763806343078613e-07, 1.862645149230957e-07, 2.0489096641540527e-07, 2.2351741790771484e-07, 2.421438694000244e-07, 2.60770320892334e-07, 2.7939677238464355e-07, 2.980232238769531e-07, 3.166496753692627e-07, 3.3527612686157227e-07, 3.5390257835388184e-07, 3.725290298461914e-07, 3.91155481338501e-07, 4.0978193283081055e-07, 4.284083843231201e-07, 4.470348358154297e-07, 4.6566128730773926e-07, 4.842877388000488e-07, 5.029141902923584e-07, 5.21540641784668e-07, 5.401670932769775e-07, 5.587935447692871e-07, 5.774199962615967e-07, 5.960464477539062e-07]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 7.0, 2.0, 11.0, 7.0, 20.0, 10.0, 23.0, 41.0, 21.0, 69.0, 64.0, 161.0, 177.0, 534.0, 815.0, 1709.0, 6324.0, 13875.0, 41515.0, 242890.0, 2953094.0, 732129.0, 154995.0, 28198.0, 11664.0, 3070.0, 1273.0, 827.0, 233.0, 180.0, 143.0, 56.0, 51.0, 27.0, 27.0, 6.0, 19.0, 4.0, 6.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.139278411865234e-06, -5.939975380897522e-06, -5.7406723499298096e-06, -5.541369318962097e-06, -5.342066287994385e-06, -5.142763257026672e-06, -4.94346022605896e-06, -4.7441571950912476e-06, -4.544854164123535e-06, -4.345551133155823e-06, -4.14624810218811e-06, -3.946945071220398e-06, -3.7476420402526855e-06, -3.548339009284973e-06, -3.3490359783172607e-06, -3.1497329473495483e-06, -2.950429916381836e-06, -2.7511268854141235e-06, -2.551823854446411e-06, -2.3525208234786987e-06, -2.1532177925109863e-06, -1.953914761543274e-06, -1.7546117305755615e-06, -1.5553086996078491e-06, -1.3560056686401367e-06, -1.1567026376724243e-06, -9.57399606704712e-07, -7.580965757369995e-07, -5.587935447692871e-07, -3.594905138015747e-07, -1.601874828338623e-07, 3.91155481338501e-08, 2.384185791015625e-07, 4.377216100692749e-07, 6.370246410369873e-07, 8.363276720046997e-07, 1.0356307029724121e-06, 1.2349337339401245e-06, 1.434236764907837e-06, 1.6335397958755493e-06, 1.8328428268432617e-06, 2.032145857810974e-06, 2.2314488887786865e-06, 2.430751919746399e-06, 2.6300549507141113e-06, 2.8293579816818237e-06, 3.028661012649536e-06, 3.2279640436172485e-06, 3.427267074584961e-06, 3.6265701055526733e-06, 3.825873136520386e-06, 4.025176167488098e-06, 4.2244791984558105e-06, 4.423782229423523e-06, 4.623085260391235e-06, 4.822388291358948e-06, 5.02169132232666e-06, 5.2209943532943726e-06, 5.420297384262085e-06, 5.619600415229797e-06, 5.81890344619751e-06, 6.018206477165222e-06, 6.2175095081329346e-06, 6.416812539100647e-06, 6.616115570068359e-06]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 7.0, 0.0, 7.0, 0.0, 0.0, 20.0, 0.0, 39.0, 0.0, 66.0, 0.0, 143.0, 0.0, 167.0, 0.0, 243.0, 0.0, 427.0, 0.0, 0.0, 1824.0, 0.0, 425.0, 0.0, 254.0, 0.0, 164.0, 0.0, 122.0, 0.0, 64.0, 0.0, 52.0, 0.0, 27.0, 0.0, 0.0, 17.0, 0.0, 10.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.940696716308594e-07, -8.66129994392395e-07, -8.381903171539307e-07, -8.102506399154663e-07, -7.82310962677002e-07, -7.543712854385376e-07, -7.264316082000732e-07, -6.984919309616089e-07, -6.705522537231445e-07, -6.426125764846802e-07, -6.146728992462158e-07, -5.867332220077515e-07, -5.587935447692871e-07, -5.308538675308228e-07, -5.029141902923584e-07, -4.7497451305389404e-07, -4.470348358154297e-07, -4.1909515857696533e-07, -3.91155481338501e-07, -3.632158041000366e-07, -3.3527612686157227e-07, -3.073364496231079e-07, -2.7939677238464355e-07, -2.514570951461792e-07, -2.2351741790771484e-07, -1.955777406692505e-07, -1.6763806343078613e-07, -1.3969838619232178e-07, -1.1175870895385742e-07, -8.381903171539307e-08, -5.587935447692871e-08, -2.7939677238464355e-08, 0.0, 2.7939677238464355e-08, 5.587935447692871e-08, 8.381903171539307e-08, 1.1175870895385742e-07, 1.3969838619232178e-07, 1.6763806343078613e-07, 1.955777406692505e-07, 2.2351741790771484e-07, 2.514570951461792e-07, 2.7939677238464355e-07, 3.073364496231079e-07, 3.3527612686157227e-07, 3.632158041000366e-07, 3.91155481338501e-07, 4.1909515857696533e-07, 4.470348358154297e-07, 4.7497451305389404e-07, 5.029141902923584e-07, 5.308538675308228e-07, 5.587935447692871e-07, 5.867332220077515e-07, 6.146728992462158e-07, 6.426125764846802e-07, 6.705522537231445e-07, 6.984919309616089e-07, 7.264316082000732e-07, 7.543712854385376e-07, 7.82310962677002e-07, 8.102506399154663e-07, 8.381903171539307e-07, 8.66129994392395e-07, 8.940696716308594e-07]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 5.0, 7.0, 1.0, 11.0, 21.0, 23.0, 23.0, 27.0, 62.0, 73.0, 122.0, 195.0, 143.0, 77.0, 49.0, 35.0, 32.0, 30.0, 15.0, 13.0, 10.0, 6.0, 7.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.476279405527748e-06, -2.3832872102502733e-06, -2.290295242346474e-06, -2.197303047068999e-06, -2.1043108517915243e-06, -2.0113186565140495e-06, -1.91832668861025e-06, -1.8253344933327753e-06, -1.7323422980553005e-06, -1.6393502164646634e-06, -1.5463580211871886e-06, -1.4533659395965515e-06, -1.3603737443190766e-06, -1.2673816627284396e-06, -1.1743895811378025e-06, -1.0813973858603276e-06, -9.884053042696905e-07, -8.954131658356346e-07, -8.024210274015786e-07, -7.094289458109415e-07, -6.164367505334667e-07, -5.234446689428296e-07, -4.3045253050877363e-07, -3.374603920747177e-07, -2.444682536406617e-07, -1.5147611520660575e-07, -5.848399098340451e-08, 3.4508133239796734e-08, 1.275002716738527e-07, 2.2049241010790865e-07, 3.134845201202552e-07, 4.0647665855431114e-07, 4.994687969883671e-07, 5.924609354224231e-07, 6.85453073856479e-07, 7.784451554471161e-07, 8.714373507245909e-07, 9.64429432315228e-07, 1.0574215139058651e-06, 1.15041370918334e-06, 1.2434059044608148e-06, 1.3363979860514519e-06, 1.4293901813289267e-06, 1.5223822629195638e-06, 1.6153744581970386e-06, 1.7083665397876757e-06, 1.8013586213783128e-06, 1.8943508166557876e-06, 1.987342784559587e-06, 2.080334979837062e-06, 2.1733269477408612e-06, 2.266319143018336e-06, 2.359311338295811e-06, 2.4523035335732857e-06, 2.545295501477085e-06, 2.63828769675456e-06, 2.7312798920320347e-06, 2.8242720873095095e-06, 2.917264055213309e-06, 3.0102562504907837e-06, 3.1032484457682585e-06, 3.1962406410457334e-06, 3.2892326089495327e-06, 3.3822248042270076e-06, 3.4752169995044824e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 7.0, 3.0, 7.0, 6.0, 5.0, 8.0, 12.0, 14.0, 10.0, 18.0, 19.0, 21.0, 20.0, 31.0, 19.0, 40.0, 25.0, 39.0, 28.0, 27.0, 36.0, 38.0, 35.0, 46.0, 36.0, 50.0, 35.0, 30.0, 47.0, 28.0, 34.0, 25.0, 31.0, 24.0, 26.0, 17.0, 21.0, 22.0, 12.0, 7.0, 10.0, 8.0, 7.0, 9.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0], "bins": [-1.4540173651766963e-06, -1.4105760328675387e-06, -1.3671345868715434e-06, -1.3236932545623858e-06, -1.2802519222532283e-06, -1.236810476257233e-06, -1.1933691439480754e-06, -1.1499278116389178e-06, -1.1064864793297602e-06, -1.0630451470206026e-06, -1.0196037010246073e-06, -9.761623687154497e-07, -9.327210364062921e-07, -8.892796472537157e-07, -8.458382581011392e-07, -8.023969257919816e-07, -7.589554797959863e-07, -7.155140906434099e-07, -6.720727583342523e-07, -6.286313691816758e-07, -5.851900368725182e-07, -5.417486477199418e-07, -4.983072585673654e-07, -4.5486589783649833e-07, -4.114245371056313e-07, -3.679831763747643e-07, -3.245418156438973e-07, -2.8110042649132083e-07, -2.3765906576045381e-07, -1.942177050295868e-07, -1.5077631587701035e-07, -1.0733495514614333e-07, -6.389348072843859e-08, -2.0452112892144214e-08, 2.298925494415016e-08, 6.64306298858719e-08, 1.0987199061673891e-07, 1.5331335134760593e-07, 1.9675474050018238e-07, 2.401961012310494e-07, 2.836374619619164e-07, 3.2707882269278343e-07, 3.7052018342365045e-07, 4.139615725762269e-07, 4.574029333070939e-07, 5.008442940379609e-07, 5.442856831905374e-07, 5.877270723431138e-07, 6.311684046522714e-07, 6.746097938048479e-07, 7.180511261140055e-07, 7.614925152665819e-07, 8.049338475757395e-07, 8.483752367283159e-07, 8.918166258808924e-07, 9.3525795819005e-07, 9.786992904992076e-07, 1.0221406228083652e-06, 1.0655820688043605e-06, 1.109023401113518e-06, 1.1524647334226756e-06, 1.195906179418671e-06, 1.2393475117278285e-06, 1.2827888440369861e-06, 1.3262302900329814e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 6.0, 13.0, 15.0, 22.0, 37.0, 36.0, 62.0, 73.0, 95.0, 116.0, 399.0, 328.0, 441.0, 597.0, 815.0, 1087.0, 1568.0, 2231.0, 3173.0, 4674.0, 6755.0, 10432.0, 16180.0, 26312.0, 44510.0, 80646.0, 481833.0, 165280.0, 80900.0, 44679.0, 26149.0, 16214.0, 10338.0, 6873.0, 4665.0, 3044.0, 2200.0, 1586.0, 1164.0, 777.0, 561.0, 411.0, 576.0, 205.0, 117.0, 97.0, 55.0, 46.0, 45.0, 36.0, 30.0, 18.0, 13.0, 5.0, 7.0, 2.0, 3.0, 6.0], "bins": [-2.086162567138672e-06, -2.0228326320648193e-06, -1.959502696990967e-06, -1.8961727619171143e-06, -1.8328428268432617e-06, -1.7695128917694092e-06, -1.7061829566955566e-06, -1.642853021621704e-06, -1.5795230865478516e-06, -1.516193151473999e-06, -1.4528632164001465e-06, -1.389533281326294e-06, -1.3262033462524414e-06, -1.2628734111785889e-06, -1.1995434761047363e-06, -1.1362135410308838e-06, -1.0728836059570312e-06, -1.0095536708831787e-06, -9.462237358093262e-07, -8.828938007354736e-07, -8.195638656616211e-07, -7.562339305877686e-07, -6.92903995513916e-07, -6.295740604400635e-07, -5.662441253662109e-07, -5.029141902923584e-07, -4.3958425521850586e-07, -3.762543201446533e-07, -3.129243850708008e-07, -2.4959444999694824e-07, -1.862645149230957e-07, -1.2293457984924316e-07, -5.960464477539063e-08, 3.725290298461914e-09, 6.705522537231445e-08, 1.30385160446167e-07, 1.9371509552001953e-07, 2.5704503059387207e-07, 3.203749656677246e-07, 3.8370490074157715e-07, 4.470348358154297e-07, 5.103647708892822e-07, 5.736947059631348e-07, 6.370246410369873e-07, 7.003545761108398e-07, 7.636845111846924e-07, 8.270144462585449e-07, 8.903443813323975e-07, 9.5367431640625e-07, 1.0170042514801025e-06, 1.080334186553955e-06, 1.1436641216278076e-06, 1.2069940567016602e-06, 1.2703239917755127e-06, 1.3336539268493652e-06, 1.3969838619232178e-06, 1.4603137969970703e-06, 1.5236437320709229e-06, 1.5869736671447754e-06, 1.650303602218628e-06, 1.7136335372924805e-06, 1.776963472366333e-06, 1.8402934074401855e-06, 1.903623342514038e-06, 1.9669532775878906e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 0.0, 5.0, 5.0, 5.0, 0.0, 7.0, 18.0, 16.0, 18.0, 0.0, 20.0, 32.0, 30.0, 0.0, 37.0, 42.0, 37.0, 42.0, 0.0, 38.0, 48.0, 51.0, 0.0, 53.0, 61.0, 56.0, 62.0, 0.0, 40.0, 42.0, 52.0, 28.0, 0.0, 32.0, 20.0, 22.0, 0.0, 16.0, 13.0, 18.0, 9.0, 0.0, 9.0, 5.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4435499906539917e-06, -1.3969838619232178e-06, -1.3504177331924438e-06, -1.30385160446167e-06, -1.257285475730896e-06, -1.210719347000122e-06, -1.1641532182693481e-06, -1.1175870895385742e-06, -1.0710209608078003e-06, -1.0244548320770264e-06, -9.778887033462524e-07, -9.313225746154785e-07, -8.847564458847046e-07, -8.381903171539307e-07, -7.916241884231567e-07, -7.450580596923828e-07, -6.984919309616089e-07, -6.51925802230835e-07, -6.05359673500061e-07, -5.587935447692871e-07, -5.122274160385132e-07, -4.6566128730773926e-07, -4.1909515857696533e-07, -3.725290298461914e-07, -3.259629011154175e-07, -2.7939677238464355e-07, -2.3283064365386963e-07, -1.862645149230957e-07, -1.3969838619232178e-07, -9.313225746154785e-08, -4.6566128730773926e-08, 0.0, 4.6566128730773926e-08, 9.313225746154785e-08, 1.3969838619232178e-07, 1.862645149230957e-07, 2.3283064365386963e-07, 2.7939677238464355e-07, 3.259629011154175e-07, 3.725290298461914e-07, 4.1909515857696533e-07, 4.6566128730773926e-07, 5.122274160385132e-07, 5.587935447692871e-07, 6.05359673500061e-07, 6.51925802230835e-07, 6.984919309616089e-07, 7.450580596923828e-07, 7.916241884231567e-07, 8.381903171539307e-07, 8.847564458847046e-07, 9.313225746154785e-07, 9.778887033462524e-07, 1.0244548320770264e-06, 1.0710209608078003e-06, 1.1175870895385742e-06, 1.1641532182693481e-06, 1.210719347000122e-06, 1.257285475730896e-06, 1.30385160446167e-06, 1.3504177331924438e-06, 1.3969838619232178e-06, 1.4435499906539917e-06, 1.4901161193847656e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 9.0, 2.0, 9.0, 18.0, 10.0, 31.0, 18.0, 14.0, 47.0, 30.0, 79.0, 64.0, 74.0, 181.0, 105.0, 128.0, 357.0, 243.0, 690.0, 513.0, 673.0, 1895.0, 1410.0, 5038.0, 4691.0, 8382.0, 980421.0, 18555.0, 13125.0, 3018.0, 1991.0, 2480.0, 813.0, 1222.0, 384.0, 315.0, 438.0, 179.0, 137.0, 252.0, 82.0, 132.0, 43.0, 38.0, 47.0, 23.0, 33.0, 14.0, 19.0, 31.0, 11.0, 16.0, 7.0, 6.0, 9.0, 2.0, 4.0], "bins": [-2.8014183044433594e-06, -2.7185305953025818e-06, -2.635642886161804e-06, -2.5527551770210266e-06, -2.469867467880249e-06, -2.3869797587394714e-06, -2.304092049598694e-06, -2.2212043404579163e-06, -2.1383166313171387e-06, -2.055428922176361e-06, -1.9725412130355835e-06, -1.889653503894806e-06, -1.8067657947540283e-06, -1.7238780856132507e-06, -1.6409903764724731e-06, -1.5581026673316956e-06, -1.475214958190918e-06, -1.3923272490501404e-06, -1.3094395399093628e-06, -1.2265518307685852e-06, -1.1436641216278076e-06, -1.06077641248703e-06, -9.778887033462524e-07, -8.950009942054749e-07, -8.121132850646973e-07, -7.292255759239197e-07, -6.463378667831421e-07, -5.634501576423645e-07, -4.805624485015869e-07, -3.976747393608093e-07, -3.1478703022003174e-07, -2.3189932107925415e-07, -1.4901161193847656e-07, -6.612390279769897e-08, 1.6763806343078613e-08, 9.96515154838562e-08, 1.825392246246338e-07, 2.654269337654114e-07, 3.4831464290618896e-07, 4.3120235204696655e-07, 5.140900611877441e-07, 5.969777703285217e-07, 6.798654794692993e-07, 7.627531886100769e-07, 8.456408977508545e-07, 9.285286068916321e-07, 1.0114163160324097e-06, 1.0943040251731873e-06, 1.1771917343139648e-06, 1.2600794434547424e-06, 1.34296715259552e-06, 1.4258548617362976e-06, 1.5087425708770752e-06, 1.5916302800178528e-06, 1.6745179891586304e-06, 1.757405698299408e-06, 1.8402934074401855e-06, 1.923181116580963e-06, 2.0060688257217407e-06, 2.0889565348625183e-06, 2.171844244003296e-06, 2.2547319531440735e-06, 2.337619662284851e-06, 2.4205073714256287e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 0.0, 0.0, 9.0, 0.0, 7.0, 0.0, 10.0, 0.0, 0.0, 16.0, 0.0, 887.0, 0.0, 12.0, 0.0, 22.0, 0.0, 0.0, 8.0, 0.0, 7.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.940696716308594e-07, -8.67992639541626e-07, -8.419156074523926e-07, -8.158385753631592e-07, -7.897615432739258e-07, -7.636845111846924e-07, -7.37607479095459e-07, -7.115304470062256e-07, -6.854534149169922e-07, -6.593763828277588e-07, -6.332993507385254e-07, -6.07222318649292e-07, -5.811452865600586e-07, -5.550682544708252e-07, -5.289912223815918e-07, -5.029141902923584e-07, -4.76837158203125e-07, -4.507601261138916e-07, -4.246830940246582e-07, -3.986060619354248e-07, -3.725290298461914e-07, -3.46451997756958e-07, -3.203749656677246e-07, -2.942979335784912e-07, -2.682209014892578e-07, -2.421438694000244e-07, -2.1606683731079102e-07, -1.8998980522155762e-07, -1.6391277313232422e-07, -1.3783574104309082e-07, -1.1175870895385742e-07, -8.568167686462402e-08, -5.960464477539063e-08, -3.3527612686157227e-08, -7.450580596923828e-09, 1.862645149230957e-08, 4.470348358154297e-08, 7.078051567077637e-08, 9.685754776000977e-08, 1.2293457984924316e-07, 1.4901161193847656e-07, 1.7508864402770996e-07, 2.0116567611694336e-07, 2.2724270820617676e-07, 2.5331974029541016e-07, 2.7939677238464355e-07, 3.0547380447387695e-07, 3.3155083656311035e-07, 3.5762786865234375e-07, 3.8370490074157715e-07, 4.0978193283081055e-07, 4.3585896492004395e-07, 4.6193599700927734e-07, 4.880130290985107e-07, 5.140900611877441e-07, 5.401670932769775e-07, 5.662441253662109e-07, 5.923211574554443e-07, 6.183981895446777e-07, 6.444752216339111e-07, 6.705522537231445e-07, 6.966292858123779e-07, 7.227063179016113e-07, 7.487833499908447e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 4.0, 3.0, 6.0, 7.0, 15.0, 12.0, 20.0, 22.0, 25.0, 47.0, 45.0, 64.0, 124.0, 159.0, 114.0, 71.0, 44.0, 45.0, 25.0, 33.0, 27.0, 20.0, 11.0, 11.0, 10.0, 2.0, 4.0, 1.0, 6.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9813198832707712e-06, -1.9119959233648842e-06, -1.8426719634589972e-06, -1.7733480035531102e-06, -1.7040240436472232e-06, -1.6347000837413361e-06, -1.5653761238354491e-06, -1.496052163929562e-06, -1.426728204023675e-06, -1.357404244117788e-06, -1.288080284211901e-06, -1.218756324306014e-06, -1.149432364400127e-06, -1.08010840449424e-06, -1.010784444588353e-06, -9.414605415258848e-07, -8.721366384634166e-07, -8.028126785575296e-07, -7.334887186516426e-07, -6.641647587457555e-07, -5.948407988398685e-07, -5.255168389339815e-07, -4.5619293587151333e-07, -3.868689759656263e-07, -3.175450160597393e-07, -2.4822105615385226e-07, -1.7889711045881995e-07, -1.0957316476378764e-07, -4.024920485790062e-08, 2.90747550479864e-08, 9.839868653216399e-08, 1.6772264643805102e-07, 2.3704660634393804e-07, 3.0637056624982506e-07, 3.756945261557121e-07, 4.450184576398897e-07, 5.143424459674861e-07, 5.836664058733732e-07, 6.529903089358413e-07, 7.223142688417283e-07, 7.916382287476154e-07, 8.609621886535024e-07, 9.302861485593894e-07, 9.996100516218576e-07, 1.0689340115277446e-06, 1.1382579714336316e-06, 1.2075819313395186e-06, 1.2769058912454057e-06, 1.3462298511512927e-06, 1.4155538110571797e-06, 1.4848777709630667e-06, 1.5542017308689537e-06, 1.6235256907748408e-06, 1.6928496506807278e-06, 1.762173496899777e-06, 1.8314974568056641e-06, 1.9008214167115511e-06, 1.970145376617438e-06, 2.039469336523325e-06, 2.108793296429212e-06, 2.1781172563350992e-06, 2.2474412162409863e-06, 2.3167651761468733e-06, 2.3860891360527603e-06, 2.4554130959586473e-06]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 4.0, 7.0, 5.0, 5.0, 8.0, 13.0, 14.0, 9.0, 18.0, 19.0, 19.0, 23.0, 28.0, 19.0, 42.0, 30.0, 33.0, 32.0, 27.0, 31.0, 40.0, 33.0, 47.0, 35.0, 49.0, 37.0, 32.0, 49.0, 26.0, 30.0, 29.0, 29.0, 25.0, 27.0, 16.0, 20.0, 21.0, 12.0, 9.0, 10.0, 8.0, 7.0, 8.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0], "bins": [-1.3961376907900558e-06, -1.3544873809223645e-06, -1.312837184741511e-06, -1.2711868748738198e-06, -1.2295365650061285e-06, -1.187886368825275e-06, -1.1462360589575837e-06, -1.1045858627767302e-06, -1.062935552909039e-06, -1.0212852430413477e-06, -9.796350468604942e-07, -9.379847369928029e-07, -8.963344839685305e-07, -8.546842309442582e-07, -8.130339210765669e-07, -7.713836680522945e-07, -7.297334150280221e-07, -6.880831620037497e-07, -6.464329089794774e-07, -6.047825991117861e-07, -5.631323460875137e-07, -5.214820930632413e-07, -4.798317831955501e-07, -4.381815301712777e-07, -3.965312771470053e-07, -3.548810241227329e-07, -3.132307426767511e-07, -2.715804612307693e-07, -2.299302082064969e-07, -1.882799409713698e-07, -1.466296737362427e-07, -1.0497939229026088e-07, -6.332925295282621e-08, -2.1678985717699106e-08, 1.9971281517427997e-08, 6.16215487525551e-08, 1.032718159876822e-07, 1.449220832228093e-07, 1.865723504579364e-07, 2.2822263190391823e-07, 2.698728849281906e-07, 3.11523137952463e-07, 3.531734193984448e-07, 3.9482370084442664e-07, 4.3647395386869903e-07, 4.781242068929714e-07, 5.197745167606627e-07, 5.61424769784935e-07, 6.030750228092074e-07, 6.447252758334798e-07, 6.863755288577522e-07, 7.280258387254435e-07, 7.696760917497159e-07, 8.113263447739882e-07, 8.529766546416795e-07, 8.946269076659519e-07, 9.362771606902243e-07, 9.779274705579155e-07, 1.019577666738769e-06, 1.0612279766064603e-06, 1.1028782864741515e-06, 1.144528482655005e-06, 1.1861787925226963e-06, 1.2278289887035498e-06, 1.269479298571241e-06]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 2.0, 0.0, 11.0, 6.0, 13.0, 10.0, 15.0, 49.0, 48.0, 51.0, 133.0, 143.0, 254.0, 223.0, 479.0, 826.0, 1185.0, 1215.0, 2944.0, 4961.0, 8421.0, 9356.0, 24391.0, 49333.0, 113228.0, 202028.0, 412411.0, 112523.0, 49277.0, 18018.0, 15864.0, 8611.0, 4876.0, 2116.0, 2062.0, 1199.0, 804.0, 366.0, 333.0, 273.0, 148.0, 93.0, 90.0, 54.0, 50.0, 12.0, 11.0, 14.0, 5.0, 5.0, 6.0, 0.0, 9.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.245208740234375e-06, -5.081295967102051e-06, -4.9173831939697266e-06, -4.753470420837402e-06, -4.589557647705078e-06, -4.425644874572754e-06, -4.26173210144043e-06, -4.0978193283081055e-06, -3.933906555175781e-06, -3.769993782043457e-06, -3.606081008911133e-06, -3.4421682357788086e-06, -3.2782554626464844e-06, -3.11434268951416e-06, -2.950429916381836e-06, -2.7865171432495117e-06, -2.6226043701171875e-06, -2.4586915969848633e-06, -2.294778823852539e-06, -2.130866050720215e-06, -1.9669532775878906e-06, -1.8030405044555664e-06, -1.6391277313232422e-06, -1.475214958190918e-06, -1.3113021850585938e-06, -1.1473894119262695e-06, -9.834766387939453e-07, -8.195638656616211e-07, -6.556510925292969e-07, -4.917383193969727e-07, -3.2782554626464844e-07, -1.6391277313232422e-07, 0.0, 1.6391277313232422e-07, 3.2782554626464844e-07, 4.917383193969727e-07, 6.556510925292969e-07, 8.195638656616211e-07, 9.834766387939453e-07, 1.1473894119262695e-06, 1.3113021850585938e-06, 1.475214958190918e-06, 1.6391277313232422e-06, 1.8030405044555664e-06, 1.9669532775878906e-06, 2.130866050720215e-06, 2.294778823852539e-06, 2.4586915969848633e-06, 2.6226043701171875e-06, 2.7865171432495117e-06, 2.950429916381836e-06, 3.11434268951416e-06, 3.2782554626464844e-06, 3.4421682357788086e-06, 3.606081008911133e-06, 3.769993782043457e-06, 3.933906555175781e-06, 4.0978193283081055e-06, 4.26173210144043e-06, 4.425644874572754e-06, 4.589557647705078e-06, 4.753470420837402e-06, 4.9173831939697266e-06, 5.081295967102051e-06, 5.245208740234375e-06]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 8.0, 0.0, 0.0, 5.0, 0.0, 11.0, 0.0, 0.0, 12.0, 0.0, 0.0, 27.0, 0.0, 40.0, 0.0, 0.0, 66.0, 0.0, 0.0, 73.0, 0.0, 84.0, 0.0, 0.0, 128.0, 0.0, 0.0, 123.0, 0.0, 108.0, 0.0, 0.0, 83.0, 0.0, 0.0, 71.0, 0.0, 59.0, 0.0, 0.0, 49.0, 0.0, 0.0, 29.0, 0.0, 17.0, 0.0, 0.0, 8.0, 0.0, 0.0, 7.0, 0.0, 7.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-7.152557373046875e-07, -6.92903995513916e-07, -6.705522537231445e-07, -6.48200511932373e-07, -6.258487701416016e-07, -6.034970283508301e-07, -5.811452865600586e-07, -5.587935447692871e-07, -5.364418029785156e-07, -5.140900611877441e-07, -4.917383193969727e-07, -4.6938657760620117e-07, -4.470348358154297e-07, -4.246830940246582e-07, -4.023313522338867e-07, -3.7997961044311523e-07, -3.5762786865234375e-07, -3.3527612686157227e-07, -3.129243850708008e-07, -2.905726432800293e-07, -2.682209014892578e-07, -2.4586915969848633e-07, -2.2351741790771484e-07, -2.0116567611694336e-07, -1.7881393432617188e-07, -1.564621925354004e-07, -1.341104507446289e-07, -1.1175870895385742e-07, -8.940696716308594e-08, -6.705522537231445e-08, -4.470348358154297e-08, -2.2351741790771484e-08, 0.0, 2.2351741790771484e-08, 4.470348358154297e-08, 6.705522537231445e-08, 8.940696716308594e-08, 1.1175870895385742e-07, 1.341104507446289e-07, 1.564621925354004e-07, 1.7881393432617188e-07, 2.0116567611694336e-07, 2.2351741790771484e-07, 2.4586915969848633e-07, 2.682209014892578e-07, 2.905726432800293e-07, 3.129243850708008e-07, 3.3527612686157227e-07, 3.5762786865234375e-07, 3.7997961044311523e-07, 4.023313522338867e-07, 4.246830940246582e-07, 4.470348358154297e-07, 4.6938657760620117e-07, 4.917383193969727e-07, 5.140900611877441e-07, 5.364418029785156e-07, 5.587935447692871e-07, 5.811452865600586e-07, 6.034970283508301e-07, 6.258487701416016e-07, 6.48200511932373e-07, 6.705522537231445e-07, 6.92903995513916e-07, 7.152557373046875e-07]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 11.0, 23.0, 38.0, 40.0, 87.0, 100.0, 199.0, 330.0, 575.0, 413.0, 1326.0, 2098.0, 3732.0, 6816.0, 12878.0, 23781.0, 50348.0, 124354.0, 451752.0, 141866.0, 124138.0, 50574.0, 24276.0, 12944.0, 6974.0, 3715.0, 2124.0, 1326.0, 696.0, 419.0, 120.0, 175.0, 119.0, 59.0, 42.0, 33.0, 15.0, 9.0, 10.0, 7.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.516674041748047e-06, -3.4030526876449585e-06, -3.28943133354187e-06, -3.1758099794387817e-06, -3.0621886253356934e-06, -2.948567271232605e-06, -2.8349459171295166e-06, -2.7213245630264282e-06, -2.60770320892334e-06, -2.4940818548202515e-06, -2.380460500717163e-06, -2.2668391466140747e-06, -2.1532177925109863e-06, -2.039596438407898e-06, -1.9259750843048096e-06, -1.8123537302017212e-06, -1.6987323760986328e-06, -1.5851110219955444e-06, -1.471489667892456e-06, -1.3578683137893677e-06, -1.2442469596862793e-06, -1.130625605583191e-06, -1.0170042514801025e-06, -9.033828973770142e-07, -7.897615432739258e-07, -6.761401891708374e-07, -5.62518835067749e-07, -4.4889748096466064e-07, -3.3527612686157227e-07, -2.2165477275848389e-07, -1.0803341865539551e-07, 5.587935447692871e-09, 1.1920928955078125e-07, 2.3283064365386963e-07, 3.46451997756958e-07, 4.600733518600464e-07, 5.736947059631348e-07, 6.873160600662231e-07, 8.009374141693115e-07, 9.145587682723999e-07, 1.0281801223754883e-06, 1.1418014764785767e-06, 1.255422830581665e-06, 1.3690441846847534e-06, 1.4826655387878418e-06, 1.5962868928909302e-06, 1.7099082469940186e-06, 1.823529601097107e-06, 1.9371509552001953e-06, 2.0507723093032837e-06, 2.164393663406372e-06, 2.2780150175094604e-06, 2.391636371612549e-06, 2.505257725715637e-06, 2.6188790798187256e-06, 2.732500433921814e-06, 2.8461217880249023e-06, 2.9597431421279907e-06, 3.073364496231079e-06, 3.1869858503341675e-06, 3.300607204437256e-06, 3.4142285585403442e-06, 3.5278499126434326e-06, 3.641471266746521e-06, 3.7550926208496094e-06]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 6.0, 0.0, 7.0, 0.0, 0.0, 13.0, 0.0, 18.0, 0.0, 34.0, 0.0, 34.0, 0.0, 51.0, 0.0, 0.0, 67.0, 0.0, 99.0, 0.0, 111.0, 0.0, 112.0, 0.0, 100.0, 0.0, 0.0, 92.0, 0.0, 65.0, 0.0, 72.0, 0.0, 51.0, 0.0, 27.0, 0.0, 0.0, 25.0, 0.0, 11.0, 0.0, 13.0, 0.0, 5.0, 0.0, 2.0], "bins": [-1.0728836059570312e-06, -1.0458752512931824e-06, -1.0188668966293335e-06, -9.918585419654846e-07, -9.648501873016357e-07, -9.378418326377869e-07, -9.10833477973938e-07, -8.838251233100891e-07, -8.568167686462402e-07, -8.298084139823914e-07, -8.028000593185425e-07, -7.757917046546936e-07, -7.487833499908447e-07, -7.217749953269958e-07, -6.94766640663147e-07, -6.677582859992981e-07, -6.407499313354492e-07, -6.137415766716003e-07, -5.867332220077515e-07, -5.597248673439026e-07, -5.327165126800537e-07, -5.057081580162048e-07, -4.78699803352356e-07, -4.516914486885071e-07, -4.246830940246582e-07, -3.976747393608093e-07, -3.7066638469696045e-07, -3.4365803003311157e-07, -3.166496753692627e-07, -2.896413207054138e-07, -2.6263296604156494e-07, -2.3562461137771606e-07, -2.086162567138672e-07, -1.816079020500183e-07, -1.5459954738616943e-07, -1.2759119272232056e-07, -1.0058283805847168e-07, -7.35744833946228e-08, -4.6566128730773926e-08, -1.955777406692505e-08, 7.450580596923828e-09, 3.4458935260772705e-08, 6.146728992462158e-08, 8.847564458847046e-08, 1.1548399925231934e-07, 1.424923539161682e-07, 1.695007085800171e-07, 1.9650906324386597e-07, 2.2351741790771484e-07, 2.505257725715637e-07, 2.775341272354126e-07, 3.045424818992615e-07, 3.3155083656311035e-07, 3.5855919122695923e-07, 3.855675458908081e-07, 4.12575900554657e-07, 4.3958425521850586e-07, 4.6659260988235474e-07, 4.936009645462036e-07, 5.206093192100525e-07, 5.476176738739014e-07, 5.746260285377502e-07, 6.016343832015991e-07, 6.28642737865448e-07, 6.556510925292969e-07]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 4.0, 7.0, 17.0, 20.0, 17.0, 26.0, 33.0, 62.0, 94.0, 151.0, 222.0, 88.0, 65.0, 46.0, 34.0, 21.0, 24.0, 19.0, 11.0, 9.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8178758409703732e-06, -1.763027853485255e-06, -1.7081799796869745e-06, -1.6533319922018563e-06, -1.5984841184035758e-06, -1.5436361309184576e-06, -1.4887882571201771e-06, -1.433940269635059e-06, -1.3790922821499407e-06, -1.3242442946648225e-06, -1.269396420866542e-06, -1.2145484333814238e-06, -1.1597005595831433e-06, -1.1048525720980251e-06, -1.050004584612907e-06, -9.951567108146264e-07, -9.403088370163459e-07, -8.854609063746466e-07, -8.306129757329472e-07, -7.75764988247829e-07, -7.209171144495485e-07, -6.660691269644303e-07, -6.11221196322731e-07, -5.563732656810316e-07, -5.015253350393323e-07, -4.4667740439763293e-07, -3.918294737559336e-07, -3.369815146925248e-07, -2.8213358405082545e-07, -2.272856534091261e-07, -1.7243769434571732e-07, -1.1758976370401797e-07, -6.274183306231862e-08, -7.893895315191912e-09, 4.6954042431934795e-08, 1.0180198728448886e-07, 1.566499179261882e-07, 2.1149784856788756e-07, 2.6634580763129634e-07, 3.211937382729957e-07, 3.7604166891469504e-07, 4.308895995563944e-07, 4.857375301980937e-07, 5.405854608397931e-07, 5.954334483249113e-07, 6.502813221231918e-07, 7.0512930960831e-07, 7.599772402500093e-07, 8.148251708917087e-07, 8.69673101533408e-07, 9.245210321751074e-07, 9.793690196602256e-07, 1.034216893458506e-06, 1.0890648809436243e-06, 1.1439128684287425e-06, 1.198760742227023e-06, 1.2536086160253035e-06, 1.3084566035104217e-06, 1.3633044773087022e-06, 1.4181524647938204e-06, 1.4730003385921009e-06, 1.527848326077219e-06, 1.5826963135623373e-06, 1.6375441873606178e-06, 1.692392174845736e-06]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 3.0, 7.0, 4.0, 7.0, 9.0, 7.0, 17.0, 9.0, 13.0, 17.0, 21.0, 24.0, 19.0, 20.0, 27.0, 37.0, 24.0, 30.0, 30.0, 31.0, 28.0, 45.0, 40.0, 44.0, 32.0, 31.0, 36.0, 41.0, 22.0, 40.0, 31.0, 24.0, 27.0, 18.0, 22.0, 27.0, 15.0, 11.0, 10.0, 16.0, 12.0, 12.0, 14.0, 7.0, 6.0, 10.0, 5.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-7.86760267601494e-07, -7.631307425981504e-07, -7.395011607513879e-07, -7.158716357480444e-07, -6.922420539012819e-07, -6.686125288979383e-07, -6.449829470511759e-07, -6.213534220478323e-07, -5.977238402010698e-07, -5.740943151977262e-07, -5.504647333509638e-07, -5.268352083476202e-07, -5.032056265008578e-07, -4.795761014975142e-07, -4.559465196507517e-07, -4.3231699464740814e-07, -4.086874412223551e-07, -3.850578877973021e-07, -3.614283343722491e-07, -3.3779878094719606e-07, -3.1416922752214305e-07, -2.9053967409709003e-07, -2.6691014909374644e-07, -2.43280567246984e-07, -2.196510280327857e-07, -1.9602147460773267e-07, -1.7239192118267965e-07, -1.4876238196848135e-07, -1.2513282854342833e-07, -1.0150326801294796e-07, -7.78737216933223e-08, -5.424416826826928e-08, -3.061461484321626e-08, -6.98506319452008e-09, 1.66444884541761e-08, 4.027403832651544e-08, 6.390359175156846e-08, 8.753314517662147e-08, 1.1116269149624713e-07, 1.3479224492130015e-07, 1.5842179834635317e-07, 1.820513517714062e-07, 2.056809051964592e-07, 2.293104444106575e-07, 2.5293999783571053e-07, 2.7656955126076355e-07, 3.0019910468581656e-07, 3.238286581108696e-07, 3.474582115359226e-07, 3.710877649609756e-07, 3.9471731838602864e-07, 4.1834687181108166e-07, 4.4197642523613467e-07, 4.656059786611877e-07, 4.892355036645313e-07, 5.128650855112937e-07, 5.364946105146373e-07, 5.601241355179809e-07, 5.837537173647434e-07, 6.073832423680869e-07, 6.310128242148494e-07, 6.54642349218193e-07, 6.782719310649554e-07, 7.01901456068299e-07, 7.255310379150615e-07]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [17.0, 0.0, 17.0, 0.0, 0.0, 238.0, 0.0, 0.0, 459.0, 0.0, 935.0, 0.0, 0.0, 2329.0, 0.0, 0.0, 3910.0, 0.0, 5423.0, 0.0, 0.0, 9010.0, 0.0, 0.0, 11254.0, 0.0, 11220.0, 0.0, 0.0, 10948.0, 0.0, 0.0, 4066384.0, 0.0, 14168.0, 0.0, 0.0, 14520.0, 0.0, 0.0, 14564.0, 0.0, 11660.0, 0.0, 0.0, 7018.0, 0.0, 0.0, 5060.0, 0.0, 3014.0, 0.0, 0.0, 1210.0, 0.0, 0.0, 594.0, 0.0, 308.0, 0.0, 0.0, 22.0, 0.0, 22.0], "bins": [-7.152557373046875e-07, -6.92903995513916e-07, -6.705522537231445e-07, -6.48200511932373e-07, -6.258487701416016e-07, -6.034970283508301e-07, -5.811452865600586e-07, -5.587935447692871e-07, -5.364418029785156e-07, -5.140900611877441e-07, -4.917383193969727e-07, -4.6938657760620117e-07, -4.470348358154297e-07, -4.246830940246582e-07, -4.023313522338867e-07, -3.7997961044311523e-07, -3.5762786865234375e-07, -3.3527612686157227e-07, -3.129243850708008e-07, -2.905726432800293e-07, -2.682209014892578e-07, -2.4586915969848633e-07, -2.2351741790771484e-07, -2.0116567611694336e-07, -1.7881393432617188e-07, -1.564621925354004e-07, -1.341104507446289e-07, -1.1175870895385742e-07, -8.940696716308594e-08, -6.705522537231445e-08, -4.470348358154297e-08, -2.2351741790771484e-08, 0.0, 2.2351741790771484e-08, 4.470348358154297e-08, 6.705522537231445e-08, 8.940696716308594e-08, 1.1175870895385742e-07, 1.341104507446289e-07, 1.564621925354004e-07, 1.7881393432617188e-07, 2.0116567611694336e-07, 2.2351741790771484e-07, 2.4586915969848633e-07, 2.682209014892578e-07, 2.905726432800293e-07, 3.129243850708008e-07, 3.3527612686157227e-07, 3.5762786865234375e-07, 3.7997961044311523e-07, 4.023313522338867e-07, 4.246830940246582e-07, 4.470348358154297e-07, 4.6938657760620117e-07, 4.917383193969727e-07, 5.140900611877441e-07, 5.364418029785156e-07, 5.587935447692871e-07, 5.811452865600586e-07, 6.034970283508301e-07, 6.258487701416016e-07, 6.48200511932373e-07, 6.705522537231445e-07, 6.92903995513916e-07, 7.152557373046875e-07]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [17.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 985.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [79.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.0, 0.0, 0.0, 582.0, 0.0, 0.0, 5584.0, 0.0, 0.0, 26697.0, 0.0, 0.0, 0.0, 4127029.0, 0.0, 0.0, 28503.0, 0.0, 0.0, 5111.0, 0.0, 0.0, 453.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.0], "bins": [-5.960464477539062e-07, -5.774199962615967e-07, -5.587935447692871e-07, -5.401670932769775e-07, -5.21540641784668e-07, -5.029141902923584e-07, -4.842877388000488e-07, -4.6566128730773926e-07, -4.470348358154297e-07, -4.284083843231201e-07, -4.0978193283081055e-07, -3.91155481338501e-07, -3.725290298461914e-07, -3.5390257835388184e-07, -3.3527612686157227e-07, -3.166496753692627e-07, -2.980232238769531e-07, -2.7939677238464355e-07, -2.60770320892334e-07, -2.421438694000244e-07, -2.2351741790771484e-07, -2.0489096641540527e-07, -1.862645149230957e-07, -1.6763806343078613e-07, -1.4901161193847656e-07, -1.30385160446167e-07, -1.1175870895385742e-07, -9.313225746154785e-08, -7.450580596923828e-08, -5.587935447692871e-08, -3.725290298461914e-08, -1.862645149230957e-08, 0.0, 1.862645149230957e-08, 3.725290298461914e-08, 5.587935447692871e-08, 7.450580596923828e-08, 9.313225746154785e-08, 1.1175870895385742e-07, 1.30385160446167e-07, 1.4901161193847656e-07, 1.6763806343078613e-07, 1.862645149230957e-07, 2.0489096641540527e-07, 2.2351741790771484e-07, 2.421438694000244e-07, 2.60770320892334e-07, 2.7939677238464355e-07, 2.980232238769531e-07, 3.166496753692627e-07, 3.3527612686157227e-07, 3.5390257835388184e-07, 3.725290298461914e-07, 3.91155481338501e-07, 4.0978193283081055e-07, 4.284083843231201e-07, 4.470348358154297e-07, 4.6566128730773926e-07, 4.842877388000488e-07, 5.029141902923584e-07, 5.21540641784668e-07, 5.401670932769775e-07, 5.587935447692871e-07, 5.774199962615967e-07, 5.960464477539062e-07]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [36.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3981.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 5.0, 4.0, 5.0, 10.0, 3.0, 15.0, 16.0, 21.0, 32.0, 56.0, 106.0, 165.0, 205.0, 131.0, 67.0, 42.0, 35.0, 18.0, 15.0, 15.0, 12.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4478546006557735e-07, -1.407831433652973e-07, -1.3678081245416251e-07, -1.3277849575388245e-07, -1.287761790536024e-07, -1.2477386235332233e-07, -1.2077153144218755e-07, -1.1676921474190749e-07, -1.1276689093620007e-07, -1.0876456713049265e-07, -1.0476225043021259e-07, -1.0075992662450517e-07, -9.675760281879775e-08, -9.275528611851769e-08, -8.875296231281027e-08, -8.475063850710285e-08, -8.074832180682279e-08, -7.674599800111537e-08, -7.27436813008353e-08, -6.874135749512789e-08, -6.473904079484782e-08, -6.07367169891404e-08, -5.6734393183432985e-08, -5.2732072930439244e-08, -4.8729752677445504e-08, -4.472743242445176e-08, -4.072511217145802e-08, -3.67227883657506e-08, -3.272046811275686e-08, -2.871814785976312e-08, -2.471582583041254e-08, -2.071350380106196e-08, -1.6711190653495578e-08, -1.2708869512323417e-08, -8.706548371151257e-09, -4.704227229979097e-09, -7.019060888069362e-10, 3.3004141641868046e-09, 7.302736193537385e-09, 1.1305058222887965e-08, 1.5307378475881706e-08, 1.9309698728875446e-08, 2.3312020758226026e-08, 2.7314342787576606e-08, 3.131666304057035e-08, 3.531898329356409e-08, 3.932130709927151e-08, 4.332362735226525e-08, 4.732594760525899e-08, 5.132826785825273e-08, 5.533058811124647e-08, 5.933291191695389e-08, 6.333523572266131e-08, 6.733755242294137e-08, 7.133987622864879e-08, 7.534220003435621e-08, 7.934451673463627e-08, 8.334684054034369e-08, 8.734915724062375e-08, 9.135148104633117e-08, 9.535379774661124e-08, 9.935612155231865e-08, 1.0335844535802607e-07, 1.0736076205830614e-07, 1.1136308586401356e-07]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 13.0, 11.0, 9.0, 26.0, 29.0, 38.0, 45.0, 66.0, 57.0, 68.0, 90.0, 74.0, 82.0, 74.0, 66.0, 44.0, 47.0, 36.0, 26.0, 23.0, 15.0, 14.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.897478747689092e-08, -9.582619497905398e-08, -9.267759537578968e-08, -8.952900287795273e-08, -8.638041038011579e-08, -8.323181077685149e-08, -8.008321827901455e-08, -7.69346257811776e-08, -7.37860261779133e-08, -7.063743368007636e-08, -6.748883407681205e-08, -6.434024157897511e-08, -6.119164197571081e-08, -5.8043049477873865e-08, -5.489445698003692e-08, -5.17458609294863e-08, -4.8597264878935675e-08, -4.544866882838505e-08, -4.230007277783443e-08, -3.9151480279997486e-08, -3.600288422944686e-08, -3.285428817889624e-08, -2.9705693904702457e-08, -2.6557099630508674e-08, -2.340850357995805e-08, -2.0259907529407428e-08, -1.7111313255213645e-08, -1.3962718092841442e-08, -1.0814122930469239e-08, -7.665526879918616e-09, -4.516932605724833e-09, -1.3683383315310493e-09, 1.7802577190195734e-09, 4.9288528813917765e-09, 8.07744804376398e-09, 1.1226043206136183e-08, 1.4374638368508386e-08, 1.752323441905901e-08, 2.0671828693252792e-08, 2.3820422967446575e-08, 2.6969019017997198e-08, 3.011761506854782e-08, 3.326621111909844e-08, 3.641480361693539e-08, 3.956339966748601e-08, 4.271199571803663e-08, 4.586058821587358e-08, 4.90091842664242e-08, 5.215778031697482e-08, 5.5306376367525445e-08, 5.845497241807607e-08, 6.160356491591301e-08, 6.475215741374996e-08, 6.790075701701426e-08, 7.10493495148512e-08, 7.419794201268815e-08, 7.734654161595245e-08, 8.049513411378939e-08, 8.364373371705369e-08, 8.679232621489064e-08, 8.994092581815494e-08, 9.308951831599188e-08, 9.623811081382883e-08, 9.938671041709313e-08, 1.0253530291493007e-07]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [36.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4932.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1038636.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4938.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [36.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 954.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 8.0, 17.0, 19.0, 22.0, 25.0, 67.0, 88.0, 186.0, 221.0, 116.0, 61.0, 48.0, 29.0, 24.0, 17.0, 9.0, 6.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1262915222687298e-07, -1.0876061651288182e-07, -1.0489208079889067e-07, -1.0102354508489952e-07, -9.715500937090837e-08, -9.328647365691722e-08, -8.941794504835343e-08, -8.554940933436228e-08, -8.168087362037113e-08, -7.781233790637998e-08, -7.394380219238883e-08, -7.007526647839768e-08, -6.620673786983389e-08, -6.233820215584274e-08, -5.8469666441851587e-08, -5.4601130727860436e-08, -5.0732595013869286e-08, -4.6864059299878136e-08, -4.2995523585886986e-08, -3.9126991424609514e-08, -3.5258455710618364e-08, -3.1389919996627214e-08, -2.7521386058992903e-08, -2.3652852121358592e-08, -1.978431640736744e-08, -1.591578069337629e-08, -1.204724675574198e-08, -8.17871192992925e-09, -4.310177104116519e-09, -4.4164139012536907e-10, 3.4268925475089418e-09, 7.295426485143253e-09, 1.1163947988279688e-08, 1.5032483702270838e-08, 1.890101763990515e-08, 2.276955157753946e-08, 2.663808729153061e-08, 3.050662300552176e-08, 3.437515516679923e-08, 3.824369088079038e-08, 4.211222659478153e-08, 4.598076230877268e-08, 4.984929802276383e-08, 5.3717830184041304e-08, 5.7586365898032454e-08, 6.145489805930993e-08, 6.532343377330108e-08, 6.919196948729223e-08, 7.306050520128338e-08, 7.692904091527453e-08, 8.079757662926568e-08, 8.466611234325683e-08, 8.853464805724798e-08, 9.240318377123913e-08, 9.627171237980292e-08, 1.0014024809379407e-07, 1.0400878380778522e-07, 1.0787731952177637e-07, 1.1174585523576752e-07, 1.1561439094975867e-07, 1.1948291955832246e-07, 1.2335145527231361e-07, 1.2721999098630477e-07, 1.3108852670029592e-07, 1.3495706241428707e-07]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 14.0, 10.0, 8.0, 27.0, 29.0, 39.0, 48.0, 60.0, 64.0, 64.0, 94.0, 72.0, 85.0, 72.0, 63.0, 45.0, 46.0, 34.0, 29.0, 20.0, 18.0, 12.0, 8.0, 1.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.814005525437096e-08, -8.532660444870999e-08, -8.251315364304901e-08, -7.969970283738803e-08, -7.688625203172705e-08, -7.407279412063872e-08, -7.125934331497774e-08, -6.844589250931676e-08, -6.563244170365579e-08, -6.281899089799481e-08, -6.000554009233383e-08, -5.7192085733959175e-08, -5.43786349282982e-08, -5.156518412263722e-08, -4.8751729764262564e-08, -4.5938278958601586e-08, -4.312482815294061e-08, -4.031137734727963e-08, -3.7497926541618654e-08, -3.4684472183244e-08, -3.187102137758302e-08, -2.9057570571922042e-08, -2.6244117989904225e-08, -2.343066540788641e-08, -2.061721460222543e-08, -1.7803763796564454e-08, -1.4990311214546637e-08, -1.217685952070724e-08, -9.363407826867842e-09, -6.549956133028445e-09, -3.736504439189048e-09, -9.23051857171231e-10, 1.8903989484897465e-09, 4.703850642329144e-09, 7.517302336168541e-09, 1.0330754030007938e-08, 1.3144205723847335e-08, 1.5957656529508313e-08, 1.877110911152613e-08, 2.1584561693543947e-08, 2.4398012499204924e-08, 2.72114633048659e-08, 3.002491411052688e-08, 3.2838368468901535e-08, 3.565181927456251e-08, 3.846527008022349e-08, 4.1278724438598147e-08, 4.4092175244259124e-08, 4.69056260499201e-08, 4.971907685558108e-08, 5.2532527661242057e-08, 5.534598201961671e-08, 5.815943282527769e-08, 6.097288718365235e-08, 6.378633798931332e-08, 6.65997887949743e-08, 6.941323960063528e-08, 7.222669040629626e-08, 7.504014121195723e-08, 7.785359201761821e-08, 8.066704992870655e-08, 8.348050073436752e-08, 8.62939515400285e-08, 8.910740234568948e-08, 9.192085315135046e-08]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [10.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 44.0, 0.0, 0.0, 183.0, 0.0, 0.0, 0.0, 396.0, 0.0, 0.0, 1521.0, 0.0, 0.0, 0.0, 3932.0, 0.0, 0.0, 0.0, 1036234.0, 0.0, 0.0, 3956.0, 0.0, 0.0, 0.0, 1539.0, 0.0, 0.0, 420.0, 0.0, 0.0, 0.0, 174.0, 0.0, 0.0, 41.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 7.0], "bins": [-5.364418029785156e-07, -5.19677996635437e-07, -5.029141902923584e-07, -4.861503839492798e-07, -4.6938657760620117e-07, -4.5262277126312256e-07, -4.3585896492004395e-07, -4.1909515857696533e-07, -4.023313522338867e-07, -3.855675458908081e-07, -3.688037395477295e-07, -3.520399332046509e-07, -3.3527612686157227e-07, -3.1851232051849365e-07, -3.0174851417541504e-07, -2.849847078323364e-07, -2.682209014892578e-07, -2.514570951461792e-07, -2.3469328880310059e-07, -2.1792948246002197e-07, -2.0116567611694336e-07, -1.8440186977386475e-07, -1.6763806343078613e-07, -1.5087425708770752e-07, -1.341104507446289e-07, -1.1734664440155029e-07, -1.0058283805847168e-07, -8.381903171539307e-08, -6.705522537231445e-08, -5.029141902923584e-08, -3.3527612686157227e-08, -1.6763806343078613e-08, 0.0, 1.6763806343078613e-08, 3.3527612686157227e-08, 5.029141902923584e-08, 6.705522537231445e-08, 8.381903171539307e-08, 1.0058283805847168e-07, 1.1734664440155029e-07, 1.341104507446289e-07, 1.5087425708770752e-07, 1.6763806343078613e-07, 1.8440186977386475e-07, 2.0116567611694336e-07, 2.1792948246002197e-07, 2.3469328880310059e-07, 2.514570951461792e-07, 2.682209014892578e-07, 2.849847078323364e-07, 3.0174851417541504e-07, 3.1851232051849365e-07, 3.3527612686157227e-07, 3.520399332046509e-07, 3.688037395477295e-07, 3.855675458908081e-07, 4.023313522338867e-07, 4.1909515857696533e-07, 4.3585896492004395e-07, 4.5262277126312256e-07, 4.6938657760620117e-07, 4.861503839492798e-07, 5.029141902923584e-07, 5.19677996635437e-07, 5.364418029785156e-07]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1007.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 1.0, 9.0, 9.0, 6.0, 17.0, 27.0, 45.0, 85.0, 157.0, 275.0, 131.0, 87.0, 43.0, 25.0, 20.0, 14.0, 12.0, 11.0, 6.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8463750346172674e-08, -4.648336116019891e-08, -4.450296842151147e-08, -4.2522579235537705e-08, -4.054219004956394e-08, -3.85617973108765e-08, -3.658140812490274e-08, -3.4601015386215295e-08, -3.262062620024153e-08, -3.064023701426777e-08, -2.8659844275580326e-08, -2.6679455089606563e-08, -2.469906412727596e-08, -2.2718673164945358e-08, -2.0738283978971594e-08, -1.8757893016640992e-08, -1.677750205431039e-08, -1.4797111091979787e-08, -1.2816721017827604e-08, -1.083633094367542e-08, -8.855939981344818e-09, -6.8755490190142154e-09, -4.8951589448620325e-09, -2.9147688707098496e-09, -9.34377908379247e-10, 1.0460126098621458e-09, 3.0264031281035386e-09, 5.006793646344931e-09, 6.987184164586324e-09, 8.967575126916927e-09, 1.094796520106911e-08, 1.2928355275221293e-08, 1.4908742684838217e-08, 1.688913364716882e-08, 1.8869524609499422e-08, 2.0849913795473185e-08, 2.2830304757803788e-08, 2.481069572013439e-08, 2.6791084906108154e-08, 2.8771475868438756e-08, 3.075186683076936e-08, 3.273225601674312e-08, 3.4712648755430564e-08, 3.669303794140433e-08, 3.867342712737809e-08, 4.065381986606553e-08, 4.2634209052039296e-08, 4.461460179072674e-08, 4.65949909767005e-08, 4.8575380162674264e-08, 5.0555772901361706e-08, 5.253616208733547e-08, 5.451655482602291e-08, 5.6496944011996675e-08, 5.847733319797044e-08, 6.04577223839442e-08, 6.243811867534532e-08, 6.441850786131909e-08, 6.639889704729285e-08, 6.837929333869397e-08, 7.035968252466773e-08, 7.23400717106415e-08, 7.432046089661526e-08, 7.630085008258902e-08, 7.828123926856279e-08]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 12.0, 12.0, 16.0, 25.0, 34.0, 44.0, 54.0, 60.0, 71.0, 76.0, 96.0, 74.0, 83.0, 74.0, 43.0, 52.0, 39.0, 30.0, 21.0, 21.0, 12.0, 9.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.018497179458791e-08, -3.8881783126498703e-08, -3.75785944584095e-08, -3.627540934303397e-08, -3.4972220674944765e-08, -3.366903200685556e-08, -3.2365843338766354e-08, -3.106265467067715e-08, -2.9759466002587942e-08, -2.8456277334498736e-08, -2.715309044276637e-08, -2.5849901774677164e-08, -2.454671310658796e-08, -2.3243526214855592e-08, -2.1940337546766386e-08, -2.063714887867718e-08, -1.9333961986944814e-08, -1.803077331885561e-08, -1.6727586427123242e-08, -1.5424397759034036e-08, -1.412120909094483e-08, -1.2818021311034045e-08, -1.1514833531123259e-08, -1.0211644863034053e-08, -8.908457083123267e-09, -7.60526930321248e-09, -6.302080635123275e-09, -4.998892855212489e-09, -3.695704631212493e-09, -2.392516407212497e-09, -1.089328627301711e-09, 2.1386004078749465e-10, 1.5170478206982807e-09, 2.8202360446982766e-09, 4.1234242686982725e-09, 5.4266120486090585e-09, 6.7298002726090544e-09, 8.03298849660905e-09, 9.336176276519836e-09, 1.0639364944609042e-08, 1.1942552724519828e-08, 1.3245740504430614e-08, 1.454892917251982e-08, 1.5852116064252186e-08, 1.7155304732341392e-08, 1.8458493400430598e-08, 1.9761682068519804e-08, 2.106487073660901e-08, 2.2368057628341376e-08, 2.367124629643058e-08, 2.4974433188162948e-08, 2.6277621856252154e-08, 2.758081052434136e-08, 2.8883999192430565e-08, 3.018718786051977e-08, 3.14903729758953e-08, 3.2793561643984503e-08, 3.409675031207371e-08, 3.5399938980162915e-08, 3.670312764825212e-08, 3.800631276362765e-08, 3.9309501431716853e-08, 4.061269009980606e-08, 4.1915878767895265e-08, 4.321906743598447e-08]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4096.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 9.0, 3.0, 6.0, 13.0, 27.0, 28.0, 46.0, 77.0, 107.0, 198.0, 181.0, 123.0, 62.0, 38.0, 16.0, 14.0, 14.0, 14.0, 8.0, 3.0, 8.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.477832466458608e-09, -3.3574829583216115e-09, -3.237133450184615e-09, -3.1167839420476184e-09, -2.996434655955227e-09, -2.8760851478182303e-09, -2.755735639681234e-09, -2.6353861315442373e-09, -2.5150366234072408e-09, -2.3946871152702442e-09, -2.2743376071332477e-09, -2.1539880989962512e-09, -2.0336385908592547e-09, -1.913289082722258e-09, -1.7929397966298666e-09, -1.67259028849287e-09, -1.5522407803558735e-09, -1.431891272218877e-09, -1.3115417640818805e-09, -1.1911923669671864e-09, -1.07084285883019e-09, -9.504933506931934e-10, -8.301438980673481e-10, -7.097944454415028e-10, -5.894449373045063e-10, -4.690954291675098e-10, -3.487459765416645e-10, -2.283964961602436e-10, -1.080470157788227e-10, 1.2302492358173822e-11, 1.326519449840191e-10, 2.530013976098644e-10, 3.7335112779146584e-10, 4.937006359284624e-10, 6.140500885543076e-10, 7.343995411801529e-10, 8.547490493171495e-10, 9.75098557454146e-10, 1.09544795456884e-09, 1.2157974627058366e-09, 1.336146970842833e-09, 1.4564964789798296e-09, 1.5768459871168261e-09, 1.6971953842315202e-09, 1.8175448923685167e-09, 1.9378942894832107e-09, 2.0582437976202073e-09, 2.1785933057572038e-09, 2.2989428138942003e-09, 2.419292322031197e-09, 2.5396418301681933e-09, 2.65999133830519e-09, 2.7803408464421864e-09, 2.900690354579183e-09, 3.0210396406715745e-09, 3.141389148808571e-09, 3.2617386569455675e-09, 3.382088165082564e-09, 3.5024376732195606e-09, 3.622787181356557e-09, 3.743136467448949e-09, 3.863485975585945e-09, 3.983835483722942e-09, 4.104184991859938e-09, 4.224534499996935e-09]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 1.0, 11.0, 18.0, 17.0, 24.0, 37.0, 48.0, 48.0, 50.0, 80.0, 73.0, 78.0, 92.0, 85.0, 59.0, 51.0, 50.0, 43.0, 33.0, 19.0, 19.0, 10.0, 10.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1426115043586833e-09, -3.043745921971208e-09, -2.944880339583733e-09, -2.846014757196258e-09, -2.747149174808783e-09, -2.6482835924213077e-09, -2.5494180100338326e-09, -2.4505524276463575e-09, -2.3516868452588824e-09, -2.2528212628714073e-09, -2.153955680483932e-09, -2.055090098096457e-09, -1.956224515708982e-09, -1.8573589333215068e-09, -1.7584933509340317e-09, -1.6596277685465566e-09, -1.560762075136779e-09, -1.4618964927493039e-09, -1.3630309103618288e-09, -1.2641653279743537e-09, -1.1652997455868785e-09, -1.066434052177101e-09, -9.675684697896259e-10, -8.68702942913302e-10, -7.698373605258269e-10, -6.709717781383517e-10, -5.721061957508766e-10, -4.732405578522503e-10, -3.743750032203508e-10, -2.7550939307730005e-10, -1.7664381068982493e-10, -7.777822830234982e-11, 2.1087354085125298e-11, 1.1995293647260041e-10, 2.1881853273786334e-10, 3.1768412900312626e-10, 4.1654971139060137e-10, 5.154153215336521e-10, 6.142809039211272e-10, 7.131464863086023e-10, 8.120120686960774e-10, 9.108776510835526e-10, 1.009743288982179e-09, 1.108608871369654e-09, 1.2074744537571291e-09, 1.3063400361446043e-09, 1.4052056185320794e-09, 1.5040712009195545e-09, 1.6029367833070296e-09, 1.7018023656945047e-09, 1.8006679480819798e-09, 1.8995336414917574e-09, 1.9983992238792325e-09, 2.0972648062667076e-09, 2.1961303886541828e-09, 2.294995971041658e-09, 2.393861553429133e-09, 2.492727135816608e-09, 2.5915927182040832e-09, 2.6904583005915583e-09, 2.7893238829790334e-09, 2.8881894653665086e-09, 2.9870550477539837e-09, 3.0859206301414588e-09, 3.184786212528934e-09]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 1.0, 5.0, 12.0, 20.0, 23.0, 45.0, 66.0, 109.0, 204.0, 210.0, 117.0, 65.0, 30.0, 21.0, 16.0, 16.0, 8.0, 5.0, 9.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.357676803261711e-09, -3.241576562729165e-09, -3.1254761001520137e-09, -3.0093758596194675e-09, -2.8932753970423164e-09, -2.77717515650977e-09, -2.661074693932619e-09, -2.544974453400073e-09, -2.4288739908229218e-09, -2.3127737502903756e-09, -2.1966732877132245e-09, -2.0805730471806783e-09, -1.964472584603527e-09, -1.848372344070981e-09, -1.7322718814938298e-09, -1.6161716409612836e-09, -1.500071289406435e-09, -1.3839709378515863e-09, -1.2678705862967377e-09, -1.151770234741889e-09, -1.0356698831870403e-09, -9.195695871433429e-10, -8.034692355884943e-10, -6.873688840336456e-10, -5.712685324787969e-10, -4.551681809239483e-10, -3.3906782936909963e-10, -2.2296750556982659e-10, -1.0686715401497793e-10, 9.233169784295114e-12, 1.2533352133914377e-10, 2.4143387289399243e-10, 3.575342244488411e-10, 4.736345760036897e-10, 5.897349275585384e-10, 7.058352791133871e-10, 8.219356306682357e-10, 9.38035871200782e-10, 1.054136333777933e-09, 1.1702365743104792e-09, 1.2863370368876303e-09, 1.402437388442479e-09, 1.5185377399973277e-09, 1.6346380915521763e-09, 1.750738443107025e-09, 1.866838683639571e-09, 1.9829391462167223e-09, 2.0990393867492685e-09, 2.2151396272818147e-09, 2.331239867814361e-09, 2.447340330391512e-09, 2.563440570924058e-09, 2.6795410335012093e-09, 2.7956412740337555e-09, 2.9117417366109066e-09, 3.027841977143453e-09, 3.143942439720604e-09, 3.26004268025315e-09, 3.3761431428303013e-09, 3.4922433833628475e-09, 3.6083438459399986e-09, 3.7244440864725448e-09, 3.840544327005091e-09, 3.956644789582242e-09, 4.072745252159393e-09]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 3.0, 9.0, 19.0, 20.0, 22.0, 32.0, 50.0, 51.0, 46.0, 88.0, 67.0, 82.0, 88.0, 83.0, 61.0, 53.0, 49.0, 43.0, 33.0, 21.0, 18.0, 9.0, 10.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5321738039707498e-09, -2.4524811070847363e-09, -2.372788410198723e-09, -2.2930957133127094e-09, -2.213402794382091e-09, -2.1337100974960777e-09, -2.0540174006100642e-09, -1.9743247037240508e-09, -1.8946320068380373e-09, -1.814939309952024e-09, -1.7352466130660105e-09, -1.6555538051576946e-09, -1.5758611082716811e-09, -1.4961684113856677e-09, -1.4164756034773518e-09, -1.3367829065913384e-09, -1.257090209705325e-09, -1.1773975128193115e-09, -1.097704815933298e-09, -1.0180120080249822e-09, -9.383193111389687e-10, -8.586266142529553e-10, -7.789338618557906e-10, -6.992411094586259e-10, -6.195484125726125e-10, -5.398557156865991e-10, -4.601629632894344e-10, -3.8047023864784535e-10, -3.007775140062563e-10, -2.2108478936466724e-10, -1.413920647230782e-10, -6.169931232591352e-11, 1.7993606604704837e-11, 9.768633124629389e-11, 1.7737905588788294e-10, 2.57071780529472e-10, 3.3676450517106105e-10, 4.164572298126501e-10, 4.961499544542392e-10, 5.758427068514038e-10, 6.555354037374173e-10, 7.352281006234307e-10, 8.149208530205954e-10, 8.9461360541776e-10, 9.743063023037735e-10, 1.053998999189787e-09, 1.1336918070981028e-09, 1.2133845039841162e-09, 1.2930772008701297e-09, 1.3727698977561431e-09, 1.4524625946421565e-09, 1.5321554025504724e-09, 1.6118480994364859e-09, 1.6915407963224993e-09, 1.7712336042308152e-09, 1.8509263011168287e-09, 1.930618998002842e-09, 2.0103116948888555e-09, 2.090004391774869e-09, 2.1696970886608824e-09, 2.2493900075915008e-09, 2.329082704477514e-09, 2.4087754013635276e-09, 2.488468098249541e-09, 2.5681607951355545e-09]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 9.0, 7.0, 6.0, 12.0, 20.0, 32.0, 49.0, 126.0, 192.0, 202.0, 126.0, 92.0, 39.0, 25.0, 14.0, 10.0, 13.0, 8.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7531853746532988e-09, -1.6804161395711503e-09, -1.6076469044890018e-09, -1.5348777804291558e-09, -1.4621085453470073e-09, -1.3893393102648588e-09, -1.3165701862050128e-09, -1.2438009511228643e-09, -1.1710317160407158e-09, -1.0982624809585673e-09, -1.0254932458764188e-09, -9.527241218165727e-10, -8.799548867344242e-10, -8.071856516522757e-10, -7.344164720812785e-10, -6.616472925102812e-10, -5.888780574281327e-10, -5.161088223459842e-10, -4.4333964277498694e-10, -3.7057043544841406e-10, -2.978012281218412e-10, -2.250320207952683e-10, -1.522628134686954e-10, -7.949363389769815e-11, -6.724398815549648e-12, 6.604480851102323e-11, 1.3881401583759612e-10, 2.11583223164169e-10, 2.843524304907419e-10, 3.5712163781731476e-10, 4.2989084514388765e-10, 5.026600247148849e-10, 5.754290377524285e-10, 6.48198272834577e-10, 7.209674524055742e-10, 7.937366319765715e-10, 8.6650586705872e-10, 9.392751021408685e-10, 1.0120442262007145e-09, 1.084813461282863e-09, 1.1575826963650115e-09, 1.23035193144716e-09, 1.3031211665293085e-09, 1.3758902905891546e-09, 1.448659525671303e-09, 1.5214287607534516e-09, 1.5941978848132976e-09, 1.666967119895446e-09, 1.7397363549775946e-09, 1.812505590059743e-09, 1.8852748251418916e-09, 1.9580439492017376e-09, 2.0308132953061886e-09, 2.1035824193660346e-09, 2.1763515434258807e-09, 2.2491208895303316e-09, 2.3218900135901777e-09, 2.3946591376500237e-09, 2.4674284837544747e-09, 2.5401976078143207e-09, 2.6129667318741667e-09, 2.6857360779786177e-09, 2.7585052020384637e-09, 2.8312743260983098e-09, 2.9040436722027607e-09]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 5.0, 2.0, 7.0, 3.0, 6.0, 25.0, 17.0, 22.0, 38.0, 58.0, 38.0, 62.0, 75.0, 68.0, 96.0, 88.0, 80.0, 56.0, 49.0, 54.0, 41.0, 29.0, 21.0, 14.0, 11.0, 9.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.45125311767913e-09, -1.4053689323390017e-09, -1.3594847469988736e-09, -1.3136005616587454e-09, -1.2677164873409197e-09, -1.2218323020007915e-09, -1.1759481166606633e-09, -1.1300639313205352e-09, -1.0841798570027095e-09, -1.0382956716625813e-09, -9.924114863224531e-10, -9.46527300982325e-10, -9.006432266644993e-10, -8.547590413243711e-10, -8.088748559842429e-10, -7.629906706441147e-10, -7.171064853039866e-10, -6.712222999638584e-10, -6.253381701348815e-10, -5.794539847947533e-10, -5.335698549657764e-10, -4.876856696256482e-10, -4.4180148428552e-10, -3.9591732670096746e-10, -3.500331691164149e-10, -3.0414901153186236e-10, -2.582648539473098e-10, -2.1238066860718163e-10, -1.6649651102262908e-10, -1.2061235343807652e-10, -7.472816809794836e-11, -2.88440105133958e-11, 1.7040147071156753e-11, 6.292431159460321e-11, 1.0880847611804967e-10, 1.5469264758039003e-10, 2.0057680516494258e-10, 2.4646096274949514e-10, 2.923451480896233e-10, 3.3822930567417586e-10, 3.841134632587284e-10, 4.2999762084328097e-10, 4.758817784278335e-10, 5.217659637679617e-10, 5.676501491080899e-10, 6.135342789370668e-10, 6.59418464277195e-10, 7.053025941061719e-10, 7.511867794463001e-10, 7.970709647864282e-10, 8.429550946154052e-10, 8.888392799555334e-10, 9.347234097845103e-10, 9.806075951246385e-10, 1.0264917804647666e-09, 1.0723759658048948e-09, 1.118260151145023e-09, 1.1641443364851511e-09, 1.2100285218252793e-09, 1.2559127071654075e-09, 1.3017967814832332e-09, 1.3476809668233614e-09, 1.3935651521634895e-09, 1.4394493375036177e-09, 1.4853334118214434e-09]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4096.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 11.0, 20.0, 12.0, 44.0, 111.0, 315.0, 311.0, 106.0, 48.0, 16.0, 11.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.893536160148869e-09, -3.810822768457456e-09, -3.728109376766042e-09, -3.6453957630300238e-09, -3.5626821492940053e-09, -3.4799687576025917e-09, -3.397255365911178e-09, -3.3145417521751597e-09, -3.231828138439141e-09, -3.1491147467477276e-09, -3.066401133011709e-09, -2.9836877413202956e-09, -2.900974127584277e-09, -2.8182607358928635e-09, -2.73554734420145e-09, -2.6528337304654315e-09, -2.570120338774018e-09, -2.4874069470826043e-09, -2.404693333346586e-09, -2.3219799416551723e-09, -2.239266327919154e-09, -2.1565529362277402e-09, -2.0738393224917218e-09, -1.991125930800308e-09, -1.9084125391088946e-09, -1.8256990363951786e-09, -1.7429855336814626e-09, -1.660272141990049e-09, -1.5775585282540305e-09, -1.494845136562617e-09, -1.412131633848901e-09, -1.329418131135185e-09, -1.2467047394437714e-09, -1.1639912367300553e-09, -1.0812777340163393e-09, -9.985643423249257e-10, -9.158507841000585e-10, -8.331372813863425e-10, -7.504238341837777e-10, -6.677103314700616e-10, -5.849968287563456e-10, -5.022833260426296e-10, -4.195698510844892e-10, -3.368563761263488e-10, -2.5414287341263275e-10, -1.7142937069891673e-10, -8.871592349635193e-11, -6.002420782635909e-12, 7.671108193108012e-11, 1.5942457076700833e-10, 2.4213805960293655e-10, 3.2485153456107696e-10, 4.07565037274793e-10, 4.90278539988509e-10, 5.729919871910738e-10, 6.557054899047898e-10, 7.384189926185059e-10, 8.211324953322219e-10, 9.038459980459379e-10, 9.86559500759654e-10, 1.0692728924510675e-09, 1.151986506187086e-09, 1.2346998978784995e-09, 1.3174134005922156e-09, 1.4001269033059316e-09]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 10.0, 17.0, 21.0, 20.0, 37.0, 51.0, 43.0, 59.0, 78.0, 80.0, 79.0, 92.0, 80.0, 64.0, 47.0, 57.0, 38.0, 37.0, 19.0, 11.0, 9.0, 9.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.026623674960092e-09, -9.9521246799128e-10, -9.638011500001653e-10, -9.323899430313531e-10, -9.009786250402385e-10, -8.695674180714263e-10, -8.381561555914629e-10, -8.067448931114996e-10, -7.753336306315362e-10, -7.439223681515728e-10, -7.125111056716094e-10, -6.81099843191646e-10, -6.496886362228338e-10, -6.182773182317192e-10, -5.86866111262907e-10, -5.554548487829436e-10, -5.240435863029802e-10, -4.926323238230168e-10, -4.612210613430534e-10, -4.298098266186656e-10, -3.9839856413870223e-10, -3.6698730165873883e-10, -3.3557606693435105e-10, -3.0416480445438765e-10, -2.7275354197442425e-10, -2.4134227949446085e-10, -2.0993103089228526e-10, -1.7851978229010967e-10, -1.4710851981014628e-10, -1.1569725733018288e-10, -8.428600872800729e-11, -5.28747601258317e-11, -2.14634976458683e-11, 9.947757895201192e-12, 4.1359013436270686e-11, 7.277026897734018e-11, 1.0418152451840967e-10, 1.3559278699837307e-10, 1.6700403560054866e-10, 1.9841528420272425e-10, 2.2982654668268765e-10, 2.6123780916265105e-10, 2.9264907164261444e-10, 3.2406030636700223e-10, 3.554715688469656e-10, 3.86882831326929e-10, 4.182940660513168e-10, 4.497053285312802e-10, 4.811165910112436e-10, 5.12527853491207e-10, 5.439391159711704e-10, 5.753503784511338e-10, 6.067616409310972e-10, 6.381728478999094e-10, 6.695841103798728e-10, 7.009953728598362e-10, 7.324066353397995e-10, 7.638178978197629e-10, 7.952291602997263e-10, 8.266404227796897e-10, 8.580516297485019e-10, 8.894629477396165e-10, 9.208741547084287e-10, 9.522853616772409e-10, 9.836966796683555e-10]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 10.0, 9.0, 15.0, 29.0, 38.0, 79.0, 154.0, 245.0, 181.0, 103.0, 46.0, 36.0, 22.0, 10.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2761546264172807e-09, -1.2316531128320207e-09, -1.1871517102690632e-09, -1.1426501966838032e-09, -1.0981486830985432e-09, -1.0536472805355857e-09, -1.0091457669503257e-09, -9.646443643873681e-10, -9.201428508021081e-10, -8.756413927279993e-10, -8.311399346538906e-10, -7.866384210686306e-10, -7.421369629945218e-10, -6.97635504920413e-10, -6.53133991335153e-10, -6.086325332610443e-10, -5.641310751869355e-10, -5.196296171128267e-10, -4.75128159038718e-10, -4.3062664545345797e-10, -3.861251873793492e-10, -3.4162372930524043e-10, -2.9712224347555605e-10, -2.5262075764587166e-10, -2.081192995717629e-10, -1.6361782761986632e-10, -1.1911635566796974e-10, -7.461488371607317e-11, -3.011341176417659e-11, 1.4388060187719987e-11, 5.888953213961656e-11, 1.0339101796930095e-10, 1.4789247604340972e-10, 1.923939479953063e-10, 2.3689541994720287e-10, 2.8139690577688725e-10, 3.25898363850996e-10, 3.703998219251048e-10, 4.1490130775478917e-10, 4.5940279358447356e-10, 5.039042516585823e-10, 5.484057097326911e-10, 5.929071678067999e-10, 6.374086813920599e-10, 6.819101394661686e-10, 7.264115975402774e-10, 7.709131111255374e-10, 8.154145691996462e-10, 8.599160272737549e-10, 9.044174853478637e-10, 9.489189434219725e-10, 9.934204570072325e-10, 1.0379219705924925e-09, 1.08242337315545e-09, 1.12692488674071e-09, 1.1714262893036675e-09, 1.2159278028889275e-09, 1.2604293164741875e-09, 1.304930719037145e-09, 1.349432232622405e-09, 1.3939336351853626e-09, 1.4384351487706226e-09, 1.4829366623558826e-09, 1.5274381759411426e-09, 1.5719395785041002e-09]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 5.0, 4.0, 8.0, 18.0, 24.0, 17.0, 36.0, 50.0, 46.0, 48.0, 77.0, 71.0, 85.0, 91.0, 79.0, 71.0, 53.0, 46.0, 44.0, 32.0, 26.0, 13.0, 9.0, 11.0, 9.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.681490998834306e-10, -7.448070493687453e-10, -7.2146499885406e-10, -6.981229483393747e-10, -6.747808978246894e-10, -6.514389028211554e-10, -6.280968523064701e-10, -6.047548017917848e-10, -5.814127512770995e-10, -5.580707007624142e-10, -5.347286502477289e-10, -5.113865997330436e-10, -4.880446047295095e-10, -4.647025264592486e-10, -4.413605037001389e-10, -4.180184531854536e-10, -3.946764026707683e-10, -3.71334352156083e-10, -3.479923016413977e-10, -3.2465027888228803e-10, -3.0130822836760274e-10, -2.7796617785291744e-10, -2.5462415509380776e-10, -2.3128210457912246e-10, -2.0794005406443716e-10, -1.8459800354975187e-10, -1.6125596691285438e-10, -1.3791393027595689e-10, -1.1457187976127159e-10, -9.122982924658629e-11, -6.78877926096888e-11, -4.454575597279131e-11, -2.1203705458106015e-11, 2.138338117685379e-12, 2.5480381693476772e-11, 4.8822425269268166e-11, 7.216446884505956e-11, 9.550651935974486e-11, 1.1884855599664235e-10, 1.4219059263353984e-10, 1.6553264314822513e-10, 1.8887469366291043e-10, 2.1221673029980792e-10, 2.355587669367054e-10, 2.589008174513907e-10, 2.82242867966076e-10, 3.055848907251857e-10, 3.28926941239871e-10, 3.522689917545563e-10, 3.756110422692416e-10, 3.989530927839269e-10, 4.2229511554303656e-10, 4.4563716605772186e-10, 4.689791888168315e-10, 4.923212393315168e-10, 5.156632898462021e-10, 5.390053403608874e-10, 5.623473908755727e-10, 5.85689441390258e-10, 6.090314919049433e-10, 6.323734869084774e-10, 6.557155929343139e-10, 6.79057587937848e-10, 7.023996384525333e-10, 7.257416889672186e-10]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 11.0, 32.0, 153.0, 578.0, 200.0, 30.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0199350253259354e-09, -9.232645203915979e-10, -8.265940154572604e-10, -7.299234550117717e-10, -6.332529500774342e-10, -5.365824451430967e-10, -4.39911884697608e-10, -3.432413797632705e-10, -2.4657087482893303e-10, -1.4990035601680773e-10, -5.322983720468244e-11, 4.344069548523066e-11, 1.4011120041956815e-10, 2.3678170535390564e-10, 3.3345226579939435e-10, 4.3012277073373184e-10, 5.267932756680693e-10, 6.234637806024068e-10, 7.201342855367443e-10, 8.16804845982233e-10, 9.134753509165705e-10, 1.010145855850908e-09, 1.1068164162963967e-09, 1.203486865719583e-09, 1.3001574261650717e-09, 1.3968279866105604e-09, 1.4934984360337467e-09, 1.5901689964792354e-09, 1.686839556924724e-09, 1.7835100063479103e-09, 1.8801804557710966e-09, 1.9768511272388878e-09, 2.073521354617469e-09, 2.1701918040406554e-09, 2.2668624755084466e-09, 2.363532924931633e-09, 2.460203374354819e-09, 2.5568738237780053e-09, 2.6535444952457965e-09, 2.7502149446689828e-09, 2.846885394092169e-09, 2.9435558435153553e-09, 3.0402265149831464e-09, 3.1368969644063327e-09, 3.233567413829519e-09, 3.3302378632527052e-09, 3.4269085347204964e-09, 3.5235789841436826e-09, 3.620249655611474e-09, 3.71692010503466e-09, 3.813590776502451e-09, 3.9102614479702424e-09, 4.006931675348824e-09, 4.103602346816615e-09, 4.200273018284406e-09, 4.2969432456629875e-09, 4.393613917130779e-09, 4.49028458859857e-09, 4.586954815977151e-09, 4.683625487444942e-09, 4.7802961589127335e-09, 4.876966386291315e-09, 4.973637057759106e-09, 5.070307729226897e-09, 5.1669779566054785e-09]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 0.0, 5.0, 4.0, 8.0, 27.0, 17.0, 21.0, 36.0, 57.0, 46.0, 56.0, 88.0, 71.0, 92.0, 86.0, 84.0, 57.0, 47.0, 59.0, 27.0, 31.0, 21.0, 11.0, 9.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.82423442807567e-10, -5.64511659639777e-10, -5.46599876471987e-10, -5.286880933041971e-10, -5.107763101364071e-10, -4.928645269686172e-10, -4.749527438008272e-10, -4.5704098838861285e-10, -4.391292052208229e-10, -4.212174220530329e-10, -4.0330563888524296e-10, -3.85393855717453e-10, -3.6748210030523865e-10, -3.495703171374487e-10, -3.316585339696587e-10, -3.1374675080186876e-10, -2.958349676340788e-10, -2.7792318446628883e-10, -2.6001140129849887e-10, -2.420996181307089e-10, -2.2418784884070675e-10, -2.0627606567291679e-10, -1.8836429638291463e-10, -1.7045251321512467e-10, -1.525407300473347e-10, -1.3462894687954474e-10, -1.1671716371175478e-10, -9.880539442175262e-11, -8.089361125396266e-11, -6.29818280861727e-11, -4.507005185727664e-11, -2.715827562838058e-11, -9.246492460590616e-12, 8.665287237752395e-12, 2.6577066936095406e-11, 4.448884663443842e-11, 6.240062633278143e-11, 8.031240950057139e-11, 9.822418572946745e-11, 1.1613596195836351e-10, 1.3404774512615347e-10, 1.5195952829394344e-10, 1.698713114617334e-10, 1.8778308075173555e-10, 2.0569486391952552e-10, 2.2360664708731548e-10, 2.4151841637731764e-10, 2.594301995451076e-10, 2.7734198271289756e-10, 2.952537658806875e-10, 3.131655490484775e-10, 3.3107733221626745e-10, 3.489891153840574e-10, 3.669008985518474e-10, 3.848126539640617e-10, 4.027244371318517e-10, 4.2063622029964165e-10, 4.385480034674316e-10, 4.564597866352216e-10, 4.743715420474359e-10, 4.922833252152259e-10, 5.101951083830158e-10, 5.281068915508058e-10, 5.460186747185958e-10, 5.639304578863857e-10]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4096.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 9.0, 52.0, 400.0, 485.0, 58.0, 9.0, 5.0], "bins": [-1.5754921811605982e-09, -1.549255501664959e-09, -1.5230188221693197e-09, -1.496782031651378e-09, -1.4705453521557388e-09, -1.4443086726600995e-09, -1.4180718821421578e-09, -1.3918352026465186e-09, -1.3655985231508794e-09, -1.3393618436552401e-09, -1.313125164159601e-09, -1.2868883736416592e-09, -1.26065169414602e-09, -1.2344150146503807e-09, -1.208178224132439e-09, -1.1819415446367998e-09, -1.1557048651411606e-09, -1.1294681856455213e-09, -1.103231506149882e-09, -1.0769947156319404e-09, -1.0507580361363011e-09, -1.024521356640662e-09, -9.982845661227202e-10, -9.72047886627081e-10, -9.458112071314417e-10, -9.195745276358025e-10, -8.93337792629012e-10, -8.671010576222216e-10, -8.408643781265823e-10, -8.146276986309431e-10, -7.883909636241526e-10, -7.621542286173622e-10, -7.359176046328741e-10, -7.096808696260837e-10, -6.834441901304444e-10, -6.572075106348052e-10, -6.309707756280147e-10, -6.047340406212243e-10, -5.78497361125585e-10, -5.522606816299458e-10, -5.260239466231553e-10, -4.997872116163649e-10, -4.735505321207256e-10, -4.4731382486951077e-10, -4.210771176182959e-10, -3.9484041036708106e-10, -3.686037031158662e-10, -3.4236699586465136e-10, -3.161302608578609e-10, -2.8989355360664604e-10, -2.636568463554312e-10, -2.3742013910421633e-10, -2.1118343185300148e-10, -1.8494672460178663e-10, -1.5871001735057177e-10, -1.3247331009935692e-10, -1.0623660978703597e-10, -7.999990253582112e-11, -5.376319528460627e-11, -2.7526488033391416e-11, -1.2897807821765639e-12, 2.494692646903829e-11, 5.118363372025314e-11, 7.7420340971468e-11, 1.0365704822268285e-10]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 7.0, 1.0, 10.0, 8.0, 12.0, 13.0, 25.0, 37.0, 38.0, 33.0, 29.0, 42.0, 60.0, 51.0, 69.0, 58.0, 72.0, 50.0, 59.0, 50.0, 41.0, 41.0, 27.0, 38.0, 30.0, 19.0, 16.0, 11.0, 8.0, 9.0, 11.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.549673445122579e-10, -1.4959426752891858e-10, -1.4422120442336706e-10, -1.3884812744002772e-10, -1.334750643344762e-10, -1.2810198735113687e-10, -1.2272891036779754e-10, -1.1735584726224602e-10, -1.1198277027890668e-10, -1.0660970023446126e-10, -1.0123663019001583e-10, -9.58635532066765e-11, -9.049048316223107e-11, -8.511741311778565e-11, -7.974433613444631e-11, -7.437126609000089e-11, -6.899819604555546e-11, -6.362512600111003e-11, -5.82520559566646e-11, -5.2878978973325275e-11, -4.750590892887985e-11, -4.213283888443442e-11, -3.675976537054204e-11, -3.138669185664966e-11, -2.6013621812204235e-11, -2.0640550033035332e-11, -1.526747825386643e-11, -9.894406474697526e-12, -4.521334695528623e-12, 8.517370836402804e-13, 6.2248088628091836e-12, 1.1597882376701563e-11, 1.6970966298934798e-11, 2.23440380781037e-11, 2.7717109857272604e-11, 3.309018337116498e-11, 3.846325341561041e-11, 4.383632346005584e-11, 4.9209396973948216e-11, 5.4582470487840595e-11, 5.995554053228602e-11, 6.532861057673145e-11, 7.070168062117688e-11, 7.607475760451621e-11, 8.144782764896163e-11, 8.682089769340706e-11, 9.219397467674639e-11, 9.756704472119182e-11, 1.0294011476563725e-10, 1.0831318481008267e-10, 1.136862548545281e-10, 1.1905933183786743e-10, 1.2443240882120676e-10, 1.2980547192675829e-10, 1.3517854891009762e-10, 1.4055162589343695e-10, 1.4592468899898847e-10, 1.512977659823278e-10, 1.5667082908787933e-10, 1.6204390607121866e-10, 1.6741696917677018e-10, 1.727900461601095e-10, 1.7816312314344884e-10, 1.8353618624900037e-10, 1.889092632323397e-10]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 1.0, 7.0, 9.0, 4.0, 10.0, 15.0, 16.0, 34.0, 33.0, 56.0, 65.0, 87.0, 138.0, 121.0, 101.0, 80.0, 56.0, 43.0, 30.0, 21.0, 16.0, 9.0, 11.0, 14.0, 9.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.0216351375991195e-10, -9.917876242493406e-11, -9.619401108995618e-11, -9.320925975497829e-11, -9.02245084200004e-11, -8.723975708502252e-11, -8.425500575004463e-11, -8.127025441506674e-11, -7.828550308008886e-11, -7.530075174511097e-11, -7.231600041013309e-11, -6.93312490751552e-11, -6.634649774017731e-11, -6.336174640519943e-11, -6.037699507022154e-11, -5.739224373524365e-11, -5.4407492400265767e-11, -5.142274106528788e-11, -4.8437989730309994e-11, -4.545323839533211e-11, -4.246848706035422e-11, -3.9483735725376334e-11, -3.649898439039845e-11, -3.351423305542056e-11, -3.0529481720442675e-11, -2.754473038546479e-11, -2.4559979050486902e-11, -2.1575227715509016e-11, -1.859047638053113e-11, -1.5605725045553243e-11, -1.2620973710575356e-11, -9.63622237559747e-12, -6.651477979513487e-12, -3.666726644535601e-12, -6.819753095577141e-13, 2.3027760254201723e-12, 5.287527360398059e-12, 8.272278695375945e-12, 1.1257030030353832e-11, 1.4241781365331718e-11, 1.7226532700309605e-11, 2.021128403528749e-11, 2.3196035370265378e-11, 2.6180786705243264e-11, 2.916553804022115e-11, 3.215028937519904e-11, 3.5135040710176924e-11, 3.811979204515481e-11, 4.1104543380132696e-11, 4.408929471511058e-11, 4.707404605008847e-11, 5.0058797385066356e-11, 5.304354872004424e-11, 5.602830005502213e-11, 5.901305139000002e-11, 6.19978027249779e-11, 6.498255405995579e-11, 6.796730539493367e-11, 7.095205672991156e-11, 7.393680806488945e-11, 7.692155939986733e-11, 7.990631073484522e-11, 8.289106206982311e-11, 8.5875813404801e-11, 8.886056473977888e-11]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 2.0, 5.0, 8.0, 8.0, 7.0, 6.0, 16.0, 18.0, 35.0, 36.0, 30.0, 36.0, 42.0, 48.0, 48.0, 69.0, 54.0, 67.0, 68.0, 62.0, 46.0, 49.0, 41.0, 33.0, 23.0, 36.0, 23.0, 21.0, 14.0, 7.0, 8.0, 12.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.03905761403989e-11, -7.754510922275415e-11, -7.469963536621549e-11, -7.185416844857073e-11, -6.900870153092598e-11, -6.616323461328122e-11, -6.331776769563646e-11, -6.04722938390978e-11, -5.7626826921453045e-11, -5.478136000380829e-11, -5.193588961671658e-11, -4.909041922962487e-11, -4.6244952311980114e-11, -4.339948539433536e-11, -4.055401500724365e-11, -3.770854462015194e-11, -3.4863077702507184e-11, -3.201761078486243e-11, -2.917214039777072e-11, -2.6326671745402486e-11, -2.3481203093034253e-11, -2.063573444066602e-11, -1.7790265788297788e-11, -1.4944797135929555e-11, -1.2099328483561322e-11, -9.25385983119309e-12, -6.408391178824857e-12, -3.5629225264566244e-12, -7.174538740883918e-13, 2.128014778279841e-12, 4.9734834306480735e-12, 7.818952083016306e-12, 1.0664427674278443e-11, 1.3509896326646675e-11, 1.6355364979014908e-11, 1.920083363138314e-11, 2.2046302283751373e-11, 2.4891770936119606e-11, 2.773723958848784e-11, 3.058270997557955e-11, 3.3428176893224304e-11, 3.627364381086906e-11, 3.911911419796077e-11, 4.196458458505248e-11, 4.4810051502697235e-11, 4.765551842034199e-11, 5.05009888074337e-11, 5.334645919452541e-11, 5.6191926112170165e-11, 5.903739302981492e-11, 6.188285994745968e-11, 6.472833380399834e-11, 6.75738007216431e-11, 7.041926763928785e-11, 7.326474149582651e-11, 7.611020841347127e-11, 7.895567533111603e-11, 8.180114224876078e-11, 8.464660916640554e-11, 8.74920830229442e-11, 9.033754994058896e-11, 9.318301685823371e-11, 9.602849071477237e-11, 9.887395763241713e-11, 1.0171942455006189e-10]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 5.0, 0.0, 5.0, 6.0, 8.0, 13.0, 15.0, 42.0, 44.0, 58.0, 81.0, 121.0, 174.0, 121.0, 99.0, 64.0, 30.0, 28.0, 19.0, 22.0, 14.0, 5.0, 11.0, 6.0, 6.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.352927377552888e-11, -8.069812873490179e-11, -7.78669906331686e-11, -7.50358455925415e-11, -7.220470055191441e-11, -6.937356245018123e-11, -6.654241740955413e-11, -6.371127236892704e-11, -6.088013426719385e-11, -5.804899269601371e-11, -5.521785112483357e-11, -5.238670608420648e-11, -4.955556451302634e-11, -4.67244229418462e-11, -4.389327790121911e-11, -4.106213633003897e-11, -3.823099475885883e-11, -3.539985318767869e-11, -3.256871161649855e-11, -2.9737566575871455e-11, -2.6906425004691314e-11, -2.4075283433511174e-11, -2.1244140127607558e-11, -1.8412996821703942e-11, -1.5581855250523802e-11, -1.2750712811981924e-11, -9.919570373440045e-12, -7.088427934898167e-12, -4.257285496356289e-12, -1.4261430578144108e-12, 1.4049993807274674e-12, 4.236142686631084e-12, 7.067291196705128e-12, 9.898433635247006e-12, 1.2729576073788884e-11, 1.55607193796925e-11, 1.839186095087264e-11, 2.122300252205278e-11, 2.4054145827956397e-11, 2.6885289133860013e-11, 2.9716430705040153e-11, 3.2547572276220293e-11, 3.5378713847400434e-11, 3.8209858888027526e-11, 4.1041000459207666e-11, 4.3872142030387806e-11, 4.67032870710149e-11, 4.953442864219504e-11, 5.236557021337518e-11, 5.519671178455532e-11, 5.802785335573546e-11, 6.085899839636255e-11, 6.369013649809574e-11, 6.652128153872283e-11, 6.935242657934992e-11, 7.218356468108311e-11, 7.50147097217102e-11, 7.78458547623373e-11, 8.067699286407048e-11, 8.350813790469758e-11, 8.633928294532467e-11, 8.917042104705786e-11, 9.200156608768495e-11, 9.483271112831204e-11, 9.766384923004523e-11]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 5.0, 9.0, 14.0, 20.0, 33.0, 35.0, 34.0, 38.0, 37.0, 46.0, 55.0, 56.0, 71.0, 67.0, 64.0, 60.0, 48.0, 41.0, 45.0, 38.0, 23.0, 35.0, 17.0, 21.0, 16.0, 8.0, 8.0, 14.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.606374739453024e-11, -5.407851597083457e-11, -5.2093281077691955e-11, -5.010804965399629e-11, -4.812281476085367e-11, -4.6137583337158006e-11, -4.415234844401539e-11, -4.216711702031972e-11, -4.0181885596624056e-11, -3.819665417292839e-11, -3.621141927978577e-11, -3.4226187856090107e-11, -3.224095296294749e-11, -3.025572153925182e-11, -2.827048838083268e-11, -2.628525522241354e-11, -2.430002032927092e-11, -2.231478717085178e-11, -2.0329554012432638e-11, -1.8344322588736972e-11, -1.6359087695594354e-11, -1.437385540453695e-11, -1.2388623113479547e-11, -1.0403389955060405e-11, -8.418156796641263e-12, -6.432923638222121e-12, -4.447690913483848e-12, -2.4624581887455754e-12, -4.772250303264336e-13, 1.5080081280927082e-12, 3.493240419150112e-12, 5.478473577569254e-12, 7.463710205435348e-12, 9.44894336385449e-12, 1.1434176522273631e-11, 1.3419408813331035e-11, 1.5404642839111915e-11, 1.738987426280758e-11, 1.9375107421226723e-11, 2.1360340579645865e-11, 2.3345573738065006e-11, 2.5330806896484148e-11, 2.731604005490329e-11, 2.930127321332243e-11, 3.12865046370181e-11, 3.3271739530160716e-11, 3.525697095385638e-11, 3.724220237755205e-11, 3.9227437270694665e-11, 4.121266869439033e-11, 4.319790358753295e-11, 4.5183135011228615e-11, 4.716836990437123e-11, 4.91536013280669e-11, 5.1138836221209516e-11, 5.312406764490518e-11, 5.510929906860085e-11, 5.7094530492296514e-11, 5.907976191599218e-11, 6.106500027858175e-11, 6.305023170227742e-11, 6.503546312597308e-11, 6.702069454966875e-11, 6.900592597336441e-11, 7.099116433595398e-11]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4096.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 5.0, 4.0, 8.0, 6.0, 10.0, 19.0, 18.0, 35.0, 52.0, 66.0, 120.0, 218.0, 157.0, 92.0, 64.0, 44.0, 28.0, 17.0, 15.0, 9.0, 3.0, 7.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.939718425966966e-11, -4.778989703968506e-11, -4.618261328914741e-11, -4.457532606916281e-11, -4.2968042318625166e-11, -4.136075509864057e-11, -3.975347134810292e-11, -3.814618412811832e-11, -3.653889690813372e-11, -3.4931609688149123e-11, -3.3324325937611476e-11, -3.171703871762688e-11, -3.010975496708923e-11, -2.8502467747104632e-11, -2.689518226184351e-11, -2.5287896776582386e-11, -2.368061302604474e-11, -2.2073327540783616e-11, -2.0466042055522493e-11, -1.8858754835537894e-11, -1.7251471085000247e-11, -1.564418386501565e-11, -1.4036898379754525e-11, -1.2429612894493403e-11, -1.082232740923228e-11, -9.215041923971157e-12, -7.607756438710034e-12, -6.000470086087173e-12, -4.39318460082605e-12, -2.785899115564927e-12, -1.1786127629420662e-12, 4.2867272231905673e-13, 2.0359547381332277e-12, 3.643240223394351e-12, 5.2505261423363425e-12, 6.8578120612783344e-12, 8.465097546539457e-12, 1.007238303180058e-11, 1.1679669384423441e-11, 1.3286954869684564e-11, 1.4894240354945687e-11, 1.650152584020681e-11, 1.8108811325467933e-11, 1.9716096810729056e-11, 2.1323384030713655e-11, 2.29306677812513e-11, 2.45379550012359e-11, 2.6145240486497023e-11, 2.7752525971758146e-11, 2.9359813191742745e-11, 3.096709694228039e-11, 3.257438416226499e-11, 3.418166791280264e-11, 3.578895513278724e-11, 3.7396238883324884e-11, 3.900352610330948e-11, 4.061081332329408e-11, 4.221810054327868e-11, 4.382538429381633e-11, 4.5432671513800926e-11, 4.703995526433857e-11, 4.864724248432317e-11, 5.025452970430777e-11, 5.186181345484542e-11, 5.3469097205383065e-11]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 3.0, 7.0, 4.0, 5.0, 10.0, 9.0, 11.0, 22.0, 23.0, 24.0, 32.0, 32.0, 37.0, 45.0, 71.0, 80.0, 73.0, 77.0, 73.0, 56.0, 46.0, 42.0, 39.0, 29.0, 38.0, 29.0, 20.0, 20.0, 18.0, 12.0, 7.0, 8.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0945523921133145e-11, -2.9720462202398323e-11, -2.849539701421655e-11, -2.727033529548173e-11, -2.6045270107299956e-11, -2.4820208388565135e-11, -2.3595144935106838e-11, -2.237008148164854e-11, -2.1145018028190243e-11, -1.9919954574731946e-11, -1.869489112127365e-11, -1.7469827667815352e-11, -1.624476594908053e-11, -1.5019700760898758e-11, -1.3794639042163936e-11, -1.256957558870564e-11, -1.1344512135247342e-11, -1.0119448681789045e-11, -8.894385228330748e-12, -7.669322642234189e-12, -6.4442591887758915e-12, -5.219195735317594e-12, -3.994133149221035e-12, -2.769069695762738e-12, -1.544006242304441e-12, -3.189430056865783e-13, 9.061202309312844e-13, 2.1311832507087125e-12, 3.3562467041670097e-12, 4.581310157625307e-12, 5.806372743721866e-12, 7.031436197180163e-12, 8.256496181191508e-12, 9.481559634649805e-12, 1.0706623088108103e-11, 1.1931685674204662e-11, 1.3156749127662959e-11, 1.4381812581121256e-11, 1.5606875167217815e-11, 1.6831938620676112e-11, 1.805700207413441e-11, 1.9282065527592707e-11, 2.0507128981051004e-11, 2.17321924345093e-11, 2.2957254153244122e-11, 2.4182319341425895e-11, 2.5407381060160716e-11, 2.6632444513619014e-11, 2.785750796707731e-11, 2.9082571420535608e-11, 3.0307634873993905e-11, 3.1532696592728726e-11, 3.27577617809105e-11, 3.398282349964532e-11, 3.520788521838014e-11, 3.6432950406561915e-11, 3.765801559474369e-11, 3.888307731347851e-11, 4.010814250166028e-11, 4.1333204220395103e-11, 4.2558269408576876e-11, 4.37833311273117e-11, 4.500839284604652e-11, 4.623345803422829e-11, 4.745851975296311e-11]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 5.0, 17.0, 15.0, 19.0, 22.0, 23.0, 32.0, 61.0, 66.0, 139.0, 178.0, 107.0, 80.0, 58.0, 38.0, 26.0, 27.0, 15.0, 8.0, 8.0, 5.0, 7.0, 10.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.8765310406141396e-11, -3.7670196822992e-11, -3.65750832398426e-11, -3.547996618724625e-11, -3.438485260409685e-11, -3.328973902094745e-11, -3.219462543779805e-11, -3.1099511854648654e-11, -3.0004398271499255e-11, -2.8909284688349857e-11, -2.7814169370476982e-11, -2.6719055787327584e-11, -2.5623942204178185e-11, -2.452882688630531e-11, -2.3433713303155912e-11, -2.2338599720006513e-11, -2.124348440213364e-11, -2.014837081898424e-11, -1.9053255501111366e-11, -1.7958141917961967e-11, -1.686302833481257e-11, -1.576791475166317e-11, -1.4672799433790296e-11, -1.3577685850640897e-11, -1.248257140012976e-11, -1.1387456949618624e-11, -1.0292343366469225e-11, -9.197228915958089e-12, -8.102114465446952e-12, -7.007000882297554e-12, -5.911886431786417e-12, -4.816772848637019e-12, -3.721658398125882e-12, -2.6265443812956146e-12, -1.5314301476249126e-12, -4.3631591395421054e-13, 6.58798102876057e-13, 1.7539121197063245e-12, 2.849026570217461e-12, 3.94414015336686e-12, 5.039254603877996e-12, 6.134368620708264e-12, 7.229482637538531e-12, 8.324597088049668e-12, 9.419711538560804e-12, 1.0514825121710203e-11, 1.160993957222134e-11, 1.2705053155370738e-11, 1.3800167605881875e-11, 1.4895281189031273e-11, 1.5990396506904148e-11, 1.7085510090053546e-11, 1.8180623673202945e-11, 1.9275737256352343e-11, 2.0370852574225218e-11, 2.1465966157374616e-11, 2.256108147524749e-11, 2.365619505839689e-11, 2.4751310376269764e-11, 2.5846423959419162e-11, 2.694153754256856e-11, 2.8036652860441436e-11, 2.9131766443590834e-11, 3.022688002674023e-11, 3.132199360988963e-11]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 5.0, 4.0, 8.0, 11.0, 6.0, 23.0, 20.0, 28.0, 26.0, 33.0, 40.0, 43.0, 56.0, 73.0, 72.0, 86.0, 72.0, 65.0, 50.0, 34.0, 37.0, 37.0, 38.0, 30.0, 26.0, 18.0, 17.0, 15.0, 10.0, 6.0, 7.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3901033929796256e-11, -2.296635798204605e-11, -2.203168203429584e-11, -2.1097006086545633e-11, -2.016232840407195e-11, -1.9227652456321742e-11, -1.8292976508571535e-11, -1.7358300560821327e-11, -1.6423622878347643e-11, -1.5488946930597436e-11, -1.4554270982847228e-11, -1.3619594167735283e-11, -1.2684917352623337e-11, -1.175024140487313e-11, -1.0815565457122922e-11, -9.880889509372714e-12, -8.946213561622507e-12, -8.0115376138723e-12, -7.076860798760354e-12, -6.142184851010146e-12, -5.20750846957907e-12, -4.272832088147993e-12, -3.3381561403977855e-12, -2.403479758966709e-12, -1.4688033775356324e-12, -5.341271045247731e-13, 4.0054916848608624e-13, 1.3352253330767283e-12, 2.269901714507805e-12, 3.2045780959388814e-12, 4.139254043689089e-12, 5.0739304251201656e-12, 6.008606806551242e-12, 6.943283187982319e-12, 7.877959569413395e-12, 8.812635517163603e-12, 9.747312332275548e-12, 1.0681988280025756e-11, 1.1616664227775964e-11, 1.2551340175526171e-11, 1.3486016990638117e-11, 1.4420692938388324e-11, 1.535536975350027e-11, 1.6290045701250477e-11, 1.7224721649000685e-11, 1.8159397596750892e-11, 1.90940735445011e-11, 2.0028751226974784e-11, 2.096342717472499e-11, 2.18981031224752e-11, 2.2832779070225406e-11, 2.376745675269909e-11, 2.4702132700449297e-11, 2.5636808648199505e-11, 2.6571484595949713e-11, 2.750616054369992e-11, 2.8440836491450128e-11, 2.9375512439200335e-11, 3.031018838695054e-11, 3.124486433470075e-11, 3.217954028245096e-11, 3.311421969964812e-11, 3.4048895647398325e-11, 3.498357159514853e-11, 3.591824754289874e-11]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 5.0, 5.0, 5.0, 9.0, 11.0, 18.0, 13.0, 21.0, 37.0, 35.0, 56.0, 84.0, 140.0, 206.0, 111.0, 52.0, 51.0, 31.0, 26.0, 27.0, 14.0, 11.0, 11.0, 6.0, 8.0, 4.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.3412978900935215e-11, -5.2051599142011185e-11, -5.0690219383087154e-11, -4.9328839624163123e-11, -4.7967463334686045e-11, -4.6606083575762014e-11, -4.5244703816837983e-11, -4.388332405791395e-11, -4.252194429898992e-11, -4.116056454006589e-11, -3.979918478114186e-11, -3.843780849166478e-11, -3.707642873274075e-11, -3.571504897381672e-11, -3.435366921489269e-11, -3.299228945596866e-11, -3.163091316649158e-11, -3.026953340756755e-11, -2.8908155383366996e-11, -2.7546775624442965e-11, -2.618539760024241e-11, -2.482401784131838e-11, -2.346263808239435e-11, -2.210125832347032e-11, -2.0739880299269764e-11, -1.9378500540345733e-11, -1.801712251614518e-11, -1.6655742757221148e-11, -1.5294362998297117e-11, -1.3932984974096563e-11, -1.2571605215172532e-11, -1.121022632361024e-11, -9.848850901494899e-12, -8.487472009932606e-12, -7.1260926846894446e-12, -5.764713359446283e-12, -4.40333446788399e-12, -3.0419555763216977e-12, -1.680575817397667e-12, -3.191969258353744e-13, 1.0421819657269182e-12, 2.4035610741296454e-12, 3.7649401825323725e-12, 5.126319507775534e-12, 6.487698399337827e-12, 7.84907729090012e-12, 9.21045704982415e-12, 1.0571835941386443e-11, 1.1933214832948735e-11, 1.3294593724511028e-11, 1.465597261607332e-11, 1.601735237499735e-11, 1.7378730399197906e-11, 1.8740110158121936e-11, 2.0101489917045967e-11, 2.1462869675969998e-11, 2.2824247700170552e-11, 2.4185627459094583e-11, 2.5547005483295138e-11, 2.6908385242219168e-11, 2.82697650011432e-11, 2.963114476006723e-11, 3.099252104954431e-11, 3.235390080846834e-11, 3.371528056739237e-11]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 4.0, 6.0, 10.0, 8.0, 13.0, 27.0, 25.0, 24.0, 32.0, 36.0, 49.0, 66.0, 72.0, 103.0, 109.0, 73.0, 62.0, 36.0, 51.0, 34.0, 35.0, 18.0, 32.0, 15.0, 22.0, 10.0, 11.0, 4.0, 8.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.673344350392128e-11, -4.480192952738271e-11, -4.2870419020291095e-11, -4.093890504375253e-11, -3.900739453666091e-11, -3.707588056012234e-11, -3.5144366583583775e-11, -3.321285607649216e-11, -3.128134209995359e-11, -2.934982812341502e-11, -2.7418317616323407e-11, -2.548680363978484e-11, -2.3555291397969746e-11, -2.1623779156154654e-11, -1.9692265179616086e-11, -1.7760752937800994e-11, -1.5829240695985902e-11, -1.389772845417081e-11, -1.196621534499398e-11, -1.003470223581715e-11, -8.103189994002058e-12, -6.171677752186966e-12, -4.240164643010136e-12, -2.3086515338333058e-12, -3.771392920182137e-13, 1.5543733834777473e-12, 3.4858860589737084e-12, 5.4173987344696695e-12, 7.34891140996563e-12, 9.280423651780723e-12, 1.1211936760957553e-11, 1.3143449870134383e-11, 1.507495517305557e-11, 1.7006467414870663e-11, 1.8937979656685755e-11, 2.0869493633224323e-11, 2.2801005875039415e-11, 2.4732518116854507e-11, 2.6664032093393075e-11, 2.8595544335208167e-11, 3.052705657702326e-11, 3.245857055356183e-11, 3.4390081060653444e-11, 3.632159503719201e-11, 3.825310901373058e-11, 4.0184619520822196e-11, 4.2116133497360764e-11, 4.404764747389933e-11, 4.597915798099095e-11, 4.7910671957529516e-11, 4.984218246462113e-11, 5.17736964411597e-11, 5.3705206948251316e-11, 5.5636720924789884e-11, 5.756823490132845e-11, 5.949974540842007e-11, 6.143126285440559e-11, 6.33627733614972e-11, 6.529429080748272e-11, 6.722580131457434e-11, 6.915731182166596e-11, 7.108882926765148e-11, 7.302033977474309e-11, 7.495185028183471e-11, 7.688336078892632e-11]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 3.0, 5.0, 4.0, 9.0, 6.0, 9.0, 13.0, 22.0, 16.0, 26.0, 24.0, 31.0, 59.0, 57.0, 108.0, 453.0, 522707.0, 344.0, 76.0, 54.0, 50.0, 34.0, 37.0, 40.0, 22.0, 17.0, 8.0, 14.0, 12.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.414084346457628e-10, -7.098016618911629e-10, -6.781948336254118e-10, -6.465880608708119e-10, -6.14981288116212e-10, -5.833744598504609e-10, -5.51767687095861e-10, -5.201609143412611e-10, -4.8855408607551e-10, -4.569472855653345e-10, -4.25340485055159e-10, -3.937337123005591e-10, -3.621269117903836e-10, -3.305201112802081e-10, -2.989133385256082e-10, -2.673065380154327e-10, -2.356997375052572e-10, -2.0409293699508169e-10, -1.72486150362694e-10, -1.408793637303063e-10, -1.0927256322013079e-10, -7.766576270995529e-11, -4.605897607756759e-11, -1.4452189445179897e-11, 1.7154611064995606e-11, 4.8761404636277206e-11, 8.03681982075588e-11, 1.119749917788404e-10, 1.43581785350122e-10, 1.751885858602975e-10, 2.067953724926852e-10, 2.384021591250729e-10, 2.7000890412409717e-10, 3.016157046342727e-10, 3.332225051444482e-10, 3.6482927789904807e-10, 3.9643607840922357e-10, 4.2804287891939907e-10, 4.5964965167399896e-10, 4.912564799397501e-10, 5.2286325269435e-10, 5.544700254489499e-10, 5.86076853714701e-10, 6.176836264693009e-10, 6.492903992239007e-10, 6.808972274896519e-10, 7.125040002442518e-10, 7.441107729988516e-10, 7.757176012646028e-10, 8.073243740192027e-10, 8.389312022849538e-10, 8.705379750395537e-10, 9.021448033053048e-10, 9.337515205487534e-10, 9.653583488145046e-10, 9.969651770802557e-10, 1.0285718943237043e-09, 1.0601787225894554e-09, 1.091785439832904e-09, 1.1233922680986552e-09, 1.1549990963644063e-09, 1.1866059246301575e-09, 1.2182126418736061e-09, 1.2498194701393572e-09, 1.2814262984051084e-09]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 6.0, 5.0, 7.0, 11.0, 16.0, 22.0, 29.0, 22.0, 33.0, 40.0, 57.0, 59.0, 99.0, 1173.0, 86.0, 71.0, 44.0, 42.0, 47.0, 34.0, 30.0, 20.0, 24.0, 17.0, 9.0, 9.0, 9.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.765658116554164e-10, -7.438202831444585e-10, -7.110747546335006e-10, -6.783292261225427e-10, -6.455836976115847e-10, -6.128382246117781e-10, -5.800926961008201e-10, -5.473471675898622e-10, -5.146016390789043e-10, -4.818561105679464e-10, -4.491105820569885e-10, -4.163650813016062e-10, -3.836195527906483e-10, -3.508740242796904e-10, -3.181285235243081e-10, -2.853829950133502e-10, -2.5263746650239227e-10, -2.1989193799143436e-10, -1.8714642335826426e-10, -1.5440090872509415e-10, -1.2165538021413624e-10, -8.890985170317833e-11, -5.616433707000823e-11, -2.3418822436838127e-11, 9.326706074119784e-12, 4.207222764618379e-11, 7.48177492182478e-11, 1.075632707903118e-10, 1.403087923623758e-10, 1.7305432087333372e-10, 2.0579983550650383e-10, 2.3854535013967393e-10, 2.712909896729343e-10, 3.040365181838922e-10, 3.367820466948501e-10, 3.695275474502324e-10, 4.0227307596119033e-10, 4.3501860447214824e-10, 4.677641052275305e-10, 5.005096337384884e-10, 5.332551622494464e-10, 5.660006907604043e-10, 5.987462192713622e-10, 6.314917477823201e-10, 6.642372207821268e-10, 6.969828048042359e-10, 7.297282778040426e-10, 7.624738063150005e-10, 7.952193348259584e-10, 8.279648633369163e-10, 8.607103918478742e-10, 8.934559203588321e-10, 9.262014488697901e-10, 9.589469218695967e-10, 9.916925058917059e-10, 1.0244379788915126e-09, 1.0571834518913192e-09, 1.089928924891126e-09, 1.122674508913235e-09, 1.1554199819130417e-09, 1.1881655659351509e-09, 1.2209110389349576e-09, 1.2536566229570667e-09, 1.2864020959568734e-09, 1.3191476799789825e-09]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 9.0, 6.0, 16.0, 33.0, 57.0, 91.0, 138.0, 245.0, 470.0, 995.0, 2507.0, 7569.0, 19679.0, 46938.0, 31126680.0, 30108.0, 13919.0, 3348.0, 769.0, 369.0, 248.0, 113.0, 77.0, 46.0, 23.0, 12.0, 21.0, 10.0, 5.0, 3.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-193.875, -187.021484375, -180.16796875, -173.314453125, -166.4609375, -159.607421875, -152.75390625, -145.900390625, -139.046875, -132.193359375, -125.33984375, -118.486328125, -111.6328125, -104.779296875, -97.92578125, -91.072265625, -84.21875, -77.365234375, -70.51171875, -63.658203125, -56.8046875, -49.951171875, -43.09765625, -36.244140625, -29.390625, -22.537109375, -15.68359375, -8.830078125, -1.9765625, 4.876953125, 11.73046875, 18.583984375, 25.4375, 32.291015625, 39.14453125, 45.998046875, 52.8515625, 59.705078125, 66.55859375, 73.412109375, 80.265625, 87.119140625, 93.97265625, 100.826171875, 107.6796875, 114.533203125, 121.38671875, 128.240234375, 135.09375, 141.947265625, 148.80078125, 155.654296875, 162.5078125, 169.361328125, 176.21484375, 183.068359375, 189.921875, 196.775390625, 203.62890625, 210.482421875, 217.3359375, 224.189453125, 231.04296875, 237.896484375, 244.75]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 4.0, 3.0, 6.0, 8.0, 16.0, 15.0, 25.0, 42.0, 75.0, 111.0, 185.0, 301.0, 474.0, 819.0, 1677.0, 3138.0, 6876.0, 15462.0, 36698.0, 100709.0, 376013.0, 4069180.0, 1346866.0, 216092.0, 68224.0, 26170.0, 11187.0, 5374.0, 2598.0, 1325.0, 705.0, 433.0, 222.0, 150.0, 90.0, 54.0, 28.0, 26.0, 23.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.625, -18.057373046875, -17.48974609375, -16.922119140625, -16.3544921875, -15.786865234375, -15.21923828125, -14.651611328125, -14.083984375, -13.516357421875, -12.94873046875, -12.381103515625, -11.8134765625, -11.245849609375, -10.67822265625, -10.110595703125, -9.54296875, -8.975341796875, -8.40771484375, -7.840087890625, -7.2724609375, -6.704833984375, -6.13720703125, -5.569580078125, -5.001953125, -4.434326171875, -3.86669921875, -3.299072265625, -2.7314453125, -2.163818359375, -1.59619140625, -1.028564453125, -0.4609375, 0.106689453125, 0.67431640625, 1.241943359375, 1.8095703125, 2.377197265625, 2.94482421875, 3.512451171875, 4.080078125, 4.647705078125, 5.21533203125, 5.782958984375, 6.3505859375, 6.918212890625, 7.48583984375, 8.053466796875, 8.62109375, 9.188720703125, 9.75634765625, 10.323974609375, 10.8916015625, 11.459228515625, 12.02685546875, 12.594482421875, 13.162109375, 13.729736328125, 14.29736328125, 14.864990234375, 15.4326171875, 16.000244140625, 16.56787109375, 17.135498046875, 17.703125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 3.0, 11.0, 5.0, 11.0, 14.0, 14.0, 26.0, 21.0, 29.0, 31.0, 40.0, 49.0, 60.0, 60.0, 81.0, 92.0, 114.0, 171.0, 184.0, 197.0, 162.0, 126.0, 107.0, 82.0, 64.0, 57.0, 41.0, 33.0, 29.0, 17.0, 13.0, 10.0, 17.0, 6.0, 7.0, 2.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.03125, -4.88262939453125, -4.7340087890625, -4.58538818359375, -4.436767578125, -4.28814697265625, -4.1395263671875, -3.99090576171875, -3.84228515625, -3.69366455078125, -3.5450439453125, -3.39642333984375, -3.247802734375, -3.09918212890625, -2.9505615234375, -2.80194091796875, -2.6533203125, -2.50469970703125, -2.3560791015625, -2.20745849609375, -2.058837890625, -1.91021728515625, -1.7615966796875, -1.61297607421875, -1.46435546875, -1.31573486328125, -1.1671142578125, -1.01849365234375, -0.869873046875, -0.72125244140625, -0.5726318359375, -0.42401123046875, -0.275390625, -0.12677001953125, 0.0218505859375, 0.17047119140625, 0.319091796875, 0.46771240234375, 0.6163330078125, 0.76495361328125, 0.91357421875, 1.06219482421875, 1.2108154296875, 1.35943603515625, 1.508056640625, 1.65667724609375, 1.8052978515625, 1.95391845703125, 2.1025390625, 2.25115966796875, 2.3997802734375, 2.54840087890625, 2.697021484375, 2.84564208984375, 2.9942626953125, 3.14288330078125, 3.29150390625, 3.44012451171875, 3.5887451171875, 3.73736572265625, 3.885986328125, 4.03460693359375, 4.1832275390625, 4.33184814453125, 4.48046875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 5.0, 6.0, 10.0, 16.0, 21.0, 22.0, 36.0, 66.0, 86.0, 104.0, 166.0, 284.0, 433.0, 618.0, 965.0, 1415.0, 2241.0, 3674.0, 6201.0, 10579.0, 18868.0, 35787.0, 70750.0, 154471.0, 411552.0, 2160923.0, 2649637.0, 442519.0, 162071.0, 73604.0, 36742.0, 19951.0, 10844.0, 6331.0, 3795.0, 2314.0, 1475.0, 954.0, 545.0, 390.0, 294.0, 204.0, 137.0, 118.0, 56.0, 46.0, 33.0, 22.0, 16.0, 9.0, 5.0, 7.0, 3.0, 2.0, 4.0, 5.0, 2.0], "bins": [-6.25390625, -6.0645751953125, -5.875244140625, -5.6859130859375, -5.49658203125, -5.3072509765625, -5.117919921875, -4.9285888671875, -4.7392578125, -4.5499267578125, -4.360595703125, -4.1712646484375, -3.98193359375, -3.7926025390625, -3.603271484375, -3.4139404296875, -3.224609375, -3.0352783203125, -2.845947265625, -2.6566162109375, -2.46728515625, -2.2779541015625, -2.088623046875, -1.8992919921875, -1.7099609375, -1.5206298828125, -1.331298828125, -1.1419677734375, -0.95263671875, -0.7633056640625, -0.573974609375, -0.3846435546875, -0.1953125, -0.0059814453125, 0.183349609375, 0.3726806640625, 0.56201171875, 0.7513427734375, 0.940673828125, 1.1300048828125, 1.3193359375, 1.5086669921875, 1.697998046875, 1.8873291015625, 2.07666015625, 2.2659912109375, 2.455322265625, 2.6446533203125, 2.833984375, 3.0233154296875, 3.212646484375, 3.4019775390625, 3.59130859375, 3.7806396484375, 3.969970703125, 4.1593017578125, 4.3486328125, 4.5379638671875, 4.727294921875, 4.9166259765625, 5.10595703125, 5.2952880859375, 5.484619140625, 5.6739501953125, 5.86328125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 9.0, 6.0, 8.0, 10.0, 18.0, 21.0, 30.0, 31.0, 60.0, 53.0, 72.0, 105.0, 127.0, 185.0, 285.0, 284.0, 182.0, 129.0, 90.0, 52.0, 52.0, 43.0, 34.0, 34.0, 19.0, 17.0, 13.0, 12.0, 11.0, 6.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.31640625, -5.12518310546875, -4.9339599609375, -4.74273681640625, -4.551513671875, -4.36029052734375, -4.1690673828125, -3.97784423828125, -3.78662109375, -3.59539794921875, -3.4041748046875, -3.21295166015625, -3.021728515625, -2.83050537109375, -2.6392822265625, -2.44805908203125, -2.2568359375, -2.06561279296875, -1.8743896484375, -1.68316650390625, -1.491943359375, -1.30072021484375, -1.1094970703125, -0.91827392578125, -0.72705078125, -0.53582763671875, -0.3446044921875, -0.15338134765625, 0.037841796875, 0.22906494140625, 0.4202880859375, 0.61151123046875, 0.802734375, 0.99395751953125, 1.1851806640625, 1.37640380859375, 1.567626953125, 1.75885009765625, 1.9500732421875, 2.14129638671875, 2.33251953125, 2.52374267578125, 2.7149658203125, 2.90618896484375, 3.097412109375, 3.28863525390625, 3.4798583984375, 3.67108154296875, 3.8623046875, 4.05352783203125, 4.2447509765625, 4.43597412109375, 4.627197265625, 4.81842041015625, 5.0096435546875, 5.20086669921875, 5.39208984375, 5.58331298828125, 5.7745361328125, 5.96575927734375, 6.156982421875, 6.34820556640625, 6.5394287109375, 6.73065185546875, 6.921875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 10.0, 11.0, 5.0, 10.0, 31.0, 27.0, 44.0, 73.0, 80.0, 109.0, 170.0, 221.0, 330.0, 560.0, 921.0, 1580.0, 3276.0, 7821.0, 25309.0, 192439.0, 5986860.0, 49649.0, 12156.0, 4479.0, 2118.0, 1157.0, 641.0, 404.0, 287.0, 166.0, 129.0, 97.0, 70.0, 66.0, 35.0, 35.0, 9.0, 11.0, 11.0, 10.0, 5.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.609375, -29.628662109375, -28.64794921875, -27.667236328125, -26.6865234375, -25.705810546875, -24.72509765625, -23.744384765625, -22.763671875, -21.782958984375, -20.80224609375, -19.821533203125, -18.8408203125, -17.860107421875, -16.87939453125, -15.898681640625, -14.91796875, -13.937255859375, -12.95654296875, -11.975830078125, -10.9951171875, -10.014404296875, -9.03369140625, -8.052978515625, -7.072265625, -6.091552734375, -5.11083984375, -4.130126953125, -3.1494140625, -2.168701171875, -1.18798828125, -0.207275390625, 0.7734375, 1.754150390625, 2.73486328125, 3.715576171875, 4.6962890625, 5.677001953125, 6.65771484375, 7.638427734375, 8.619140625, 9.599853515625, 10.58056640625, 11.561279296875, 12.5419921875, 13.522705078125, 14.50341796875, 15.484130859375, 16.46484375, 17.445556640625, 18.42626953125, 19.406982421875, 20.3876953125, 21.368408203125, 22.34912109375, 23.329833984375, 24.310546875, 25.291259765625, 26.27197265625, 27.252685546875, 28.2333984375, 29.214111328125, 30.19482421875, 31.175537109375, 32.15625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 2.0, 7.0, 6.0, 3.0, 17.0, 17.0, 10.0, 14.0, 17.0, 25.0, 22.0, 27.0, 28.0, 44.0, 56.0, 53.0, 118.0, 206.0, 402.0, 417.0, 120.0, 71.0, 52.0, 42.0, 24.0, 42.0, 24.0, 27.0, 27.0, 17.0, 11.0, 17.0, 11.0, 12.0, 10.0, 4.0, 8.0, 1.0, 4.0, 2.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-8.8046875, -8.56097412109375, -8.3172607421875, -8.07354736328125, -7.829833984375, -7.58612060546875, -7.3424072265625, -7.09869384765625, -6.85498046875, -6.61126708984375, -6.3675537109375, -6.12384033203125, -5.880126953125, -5.63641357421875, -5.3927001953125, -5.14898681640625, -4.9052734375, -4.66156005859375, -4.4178466796875, -4.17413330078125, -3.930419921875, -3.68670654296875, -3.4429931640625, -3.19927978515625, -2.95556640625, -2.71185302734375, -2.4681396484375, -2.22442626953125, -1.980712890625, -1.73699951171875, -1.4932861328125, -1.24957275390625, -1.005859375, -0.76214599609375, -0.5184326171875, -0.27471923828125, -0.031005859375, 0.21270751953125, 0.4564208984375, 0.70013427734375, 0.94384765625, 1.18756103515625, 1.4312744140625, 1.67498779296875, 1.918701171875, 2.16241455078125, 2.4061279296875, 2.64984130859375, 2.8935546875, 3.13726806640625, 3.3809814453125, 3.62469482421875, 3.868408203125, 4.11212158203125, 4.3558349609375, 4.59954833984375, 4.84326171875, 5.08697509765625, 5.3306884765625, 5.57440185546875, 5.818115234375, 6.06182861328125, 6.3055419921875, 6.54925537109375, 6.79296875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 18.0, 57.0, 899.0, 20.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-562.325927734375, -552.0142211914062, -541.7025146484375, -531.3907470703125, -521.0790405273438, -510.767333984375, -500.4555969238281, -490.14385986328125, -479.8321533203125, -469.52044677734375, -459.2087097167969, -448.89697265625, -438.58526611328125, -428.2735595703125, -417.9618225097656, -407.65008544921875, -397.33837890625, -387.02667236328125, -376.7149353027344, -366.4031982421875, -356.09149169921875, -345.77978515625, -335.4680480957031, -325.15631103515625, -314.8446044921875, -304.53289794921875, -294.2211608886719, -283.909423828125, -273.59771728515625, -263.2860107421875, -252.97427368164062, -242.6625518798828, -232.35081481933594, -222.03909301757812, -211.7273712158203, -201.4156494140625, -191.1039276123047, -180.79220581054688, -170.48048400878906, -160.16876220703125, -149.85704040527344, -139.54531860351562, -129.2335968017578, -118.921875, -108.61015319824219, -98.29843139648438, -87.98670959472656, -77.67498779296875, -67.36326599121094, -57.051544189453125, -46.73982238769531, -36.4281005859375, -26.116378784179688, -15.804656982421875, -5.4929351806640625, 4.81878662109375, 15.130508422851562, 25.442230224609375, 35.75395202636719, 46.065673828125, 56.37739562988281, 66.68911743164062, 77.00083923339844, 87.31256103515625, 97.62428283691406]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 8.0, 5.0, 19.0, 46.0, 574.0, 276.0, 34.0, 21.0, 13.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.41301727294922, -114.61406707763672, -109.81511688232422, -105.01616668701172, -100.21721649169922, -95.41826629638672, -90.61932373046875, -85.82037353515625, -81.02142333984375, -76.22247314453125, -71.42352294921875, -66.62457275390625, -61.82562255859375, -57.02667236328125, -52.227725982666016, -47.428775787353516, -42.62982177734375, -37.83087158203125, -33.03192138671875, -28.232973098754883, -23.434022903442383, -18.635072708129883, -13.836124420166016, -9.037174224853516, -4.238224029541016, 0.5607256889343262, 5.359675407409668, 10.158624649047852, 14.957574844360352, 19.75652503967285, 24.55547332763672, 29.35442352294922, 34.15336608886719, 38.95231628417969, 43.75126647949219, 48.55021667480469, 53.34916687011719, 58.14811706542969, 62.94706344604492, 67.74601745605469, 72.54496765136719, 77.34391784667969, 82.14286804199219, 86.94181823730469, 91.74076843261719, 96.53971862792969, 101.33866882324219, 106.13761901855469, 110.93656158447266, 115.73551177978516, 120.53446197509766, 125.33341217041016, 130.13235473632812, 134.93130493164062, 139.73025512695312, 144.52920532226562, 149.32815551757812, 154.12710571289062, 158.92605590820312, 163.72500610351562, 168.52395629882812, 173.32290649414062, 178.12185668945312, 182.92080688476562, 187.71975708007812]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 4.0, 6.0, 8.0, 7.0, 23.0, 15.0, 21.0, 37.0, 56.0, 80.0, 108.0, 149.0, 257.0, 349.0, 511.0, 856.0, 1490.0, 2808.0, 6156.0, 16609.0, 120660.0, 3954836.0, 61746.0, 14434.0, 5952.0, 3008.0, 1550.0, 868.0, 471.0, 304.0, 204.0, 147.0, 98.0, 92.0, 60.0, 50.0, 48.0, 31.0, 29.0, 33.0, 21.0, 17.0, 12.0, 14.0, 16.0, 11.0, 7.0, 2.0, 4.0, 6.0, 3.0, 0.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1854248046875, -0.1778240203857422, -0.17022323608398438, -0.16262245178222656, -0.15502166748046875, -0.14742088317871094, -0.13982009887695312, -0.1322193145751953, -0.1246185302734375, -0.11701774597167969, -0.10941696166992188, -0.10181617736816406, -0.09421539306640625, -0.08661460876464844, -0.07901382446289062, -0.07141304016113281, -0.063812255859375, -0.05621147155761719, -0.048610687255859375, -0.04100990295410156, -0.03340911865234375, -0.025808334350585938, -0.018207550048828125, -0.010606765747070312, -0.0030059814453125, 0.0045948028564453125, 0.012195587158203125, 0.019796371459960938, 0.02739715576171875, 0.03499794006347656, 0.042598724365234375, 0.05019950866699219, 0.05780029296875, 0.06540107727050781, 0.07300186157226562, 0.08060264587402344, 0.08820343017578125, 0.09580421447753906, 0.10340499877929688, 0.11100578308105469, 0.1186065673828125, 0.1262073516845703, 0.13380813598632812, 0.14140892028808594, 0.14900970458984375, 0.15661048889160156, 0.16421127319335938, 0.1718120574951172, 0.179412841796875, 0.1870136260986328, 0.19461441040039062, 0.20221519470214844, 0.20981597900390625, 0.21741676330566406, 0.22501754760742188, 0.2326183319091797, 0.2402191162109375, 0.2478199005126953, 0.2554206848144531, 0.26302146911621094, 0.27062225341796875, 0.27822303771972656, 0.2858238220214844, 0.2934246063232422, 0.301025390625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 8.0, 4.0, 10.0, 23.0, 32.0, 226.0, 476.0, 144.0, 24.0, 5.0, 11.0, 12.0, 2.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0188446044921875, -0.0180051326751709, -0.017165660858154297, -0.016326189041137695, -0.015486717224121094, -0.014647245407104492, -0.01380777359008789, -0.012968301773071289, -0.012128829956054688, -0.011289358139038086, -0.010449886322021484, -0.009610414505004883, -0.008770942687988281, -0.00793147087097168, -0.007091999053955078, -0.0062525272369384766, -0.005413055419921875, -0.0045735836029052734, -0.003734111785888672, -0.0028946399688720703, -0.0020551681518554688, -0.0012156963348388672, -0.0003762245178222656, 0.00046324729919433594, 0.0013027191162109375, 0.002142190933227539, 0.0029816627502441406, 0.003821134567260742, 0.004660606384277344, 0.005500078201293945, 0.006339550018310547, 0.0071790218353271484, 0.00801849365234375, 0.008857965469360352, 0.009697437286376953, 0.010536909103393555, 0.011376380920410156, 0.012215852737426758, 0.01305532455444336, 0.013894796371459961, 0.014734268188476562, 0.015573740005493164, 0.016413211822509766, 0.017252683639526367, 0.01809215545654297, 0.01893162727355957, 0.019771099090576172, 0.020610570907592773, 0.021450042724609375, 0.022289514541625977, 0.023128986358642578, 0.02396845817565918, 0.02480792999267578, 0.025647401809692383, 0.026486873626708984, 0.027326345443725586, 0.028165817260742188, 0.02900528907775879, 0.02984476089477539, 0.030684232711791992, 0.031523704528808594, 0.032363176345825195, 0.0332026481628418, 0.0340421199798584, 0.034881591796875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 14.0, 5.0, 23.0, 37.0, 45.0, 77.0, 122.0, 254.0, 674.0, 1728.0, 6485.0, 40349.0, 3249781.0, 857695.0, 29094.0, 5066.0, 1475.0, 593.0, 259.0, 165.0, 101.0, 54.0, 46.0, 29.0, 27.0, 11.0, 12.0, 13.0, 7.0, 5.0, 8.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2880859375, -0.2765388488769531, -0.26499176025390625, -0.2534446716308594, -0.2418975830078125, -0.23035049438476562, -0.21880340576171875, -0.20725631713867188, -0.195709228515625, -0.18416213989257812, -0.17261505126953125, -0.16106796264648438, -0.1495208740234375, -0.13797378540039062, -0.12642669677734375, -0.11487960815429688, -0.10333251953125, -0.09178543090820312, -0.08023834228515625, -0.06869125366210938, -0.0571441650390625, -0.045597076416015625, -0.03404998779296875, -0.022502899169921875, -0.010955810546875, 0.000591278076171875, 0.01213836669921875, 0.023685455322265625, 0.0352325439453125, 0.046779632568359375, 0.05832672119140625, 0.06987380981445312, 0.0814208984375, 0.09296798706054688, 0.10451507568359375, 0.11606216430664062, 0.1276092529296875, 0.13915634155273438, 0.15070343017578125, 0.16225051879882812, 0.173797607421875, 0.18534469604492188, 0.19689178466796875, 0.20843887329101562, 0.2199859619140625, 0.23153305053710938, 0.24308013916015625, 0.2546272277832031, 0.26617431640625, 0.2777214050292969, 0.28926849365234375, 0.3008155822753906, 0.3123626708984375, 0.3239097595214844, 0.33545684814453125, 0.3470039367675781, 0.358551025390625, 0.3700981140136719, 0.38164520263671875, 0.3931922912597656, 0.4047393798828125, 0.4162864685058594, 0.42783355712890625, 0.4393806457519531, 0.450927734375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 5.0, 2.0, 5.0, 8.0, 11.0, 15.0, 20.0, 24.0, 35.0, 33.0, 43.0, 66.0, 70.0, 80.0, 113.0, 134.0, 229.0, 337.0, 819.0, 1160.0, 249.0, 171.0, 99.0, 84.0, 80.0, 50.0, 29.0, 26.0, 20.0, 15.0, 11.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.038482666015625, -0.0374455451965332, -0.036408424377441406, -0.03537130355834961, -0.03433418273925781, -0.033297061920166016, -0.03225994110107422, -0.031222820281982422, -0.030185699462890625, -0.029148578643798828, -0.02811145782470703, -0.027074337005615234, -0.026037216186523438, -0.02500009536743164, -0.023962974548339844, -0.022925853729248047, -0.02188873291015625, -0.020851612091064453, -0.019814491271972656, -0.01877737045288086, -0.017740249633789062, -0.016703128814697266, -0.01566600799560547, -0.014628887176513672, -0.013591766357421875, -0.012554645538330078, -0.011517524719238281, -0.010480403900146484, -0.009443283081054688, -0.00840616226196289, -0.007369041442871094, -0.006331920623779297, -0.0052947998046875, -0.004257678985595703, -0.0032205581665039062, -0.0021834373474121094, -0.0011463165283203125, -0.00010919570922851562, 0.0009279251098632812, 0.001965045928955078, 0.003002166748046875, 0.004039287567138672, 0.005076408386230469, 0.006113529205322266, 0.0071506500244140625, 0.00818777084350586, 0.009224891662597656, 0.010262012481689453, 0.01129913330078125, 0.012336254119873047, 0.013373374938964844, 0.01441049575805664, 0.015447616577148438, 0.016484737396240234, 0.01752185821533203, 0.018558979034423828, 0.019596099853515625, 0.020633220672607422, 0.02167034149169922, 0.022707462310791016, 0.023744583129882812, 0.02478170394897461, 0.025818824768066406, 0.026855945587158203, 0.02789306640625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 11.0, 25.0, 56.0, 218.0, 542.0, 126.0, 22.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5480759143829346, -1.4975101947784424, -1.4469445943832397, -1.3963788747787476, -1.3458131551742554, -1.2952475547790527, -1.2446818351745605, -1.1941161155700684, -1.1435503959655762, -1.092984676361084, -1.0424190759658813, -0.9918533563613892, -0.941287636756897, -0.8907219767570496, -0.8401563167572021, -0.78959059715271, -0.7390249967575073, -0.6884593367576599, -0.6378936171531677, -0.5873279571533203, -0.5367622375488281, -0.4861965775489807, -0.4356309175491333, -0.3850652277469635, -0.3344995379447937, -0.2839338481426239, -0.2333681732416153, -0.1828024983406067, -0.1322368085384369, -0.08167111873626709, -0.031105458736419678, 0.019460231065750122, 0.07002592086791992, 0.12059160321950912, 0.17115728557109833, 0.22172296047210693, 0.27228865027427673, 0.32285434007644653, 0.37342000007629395, 0.42398568987846375, 0.47455137968063354, 0.525117039680481, 0.5756827592849731, 0.6262484192848206, 0.676814079284668, 0.7273797988891602, 0.7779454588890076, 0.828511118888855, 0.8790768384933472, 0.9296424984931946, 0.9802082180976868, 1.0307738780975342, 1.0813395977020264, 1.1319053173065186, 1.1824709177017212, 1.2330366373062134, 1.283602237701416, 1.3341679573059082, 1.3847335577011108, 1.435299277305603, 1.4858649969100952, 1.5364305973052979, 1.58699631690979, 1.6375620365142822, 1.6881277561187744]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 9.0, 16.0, 19.0, 43.0, 46.0, 43.0, 56.0, 92.0, 100.0, 75.0, 87.0, 86.0, 77.0, 69.0, 49.0, 41.0, 28.0, 23.0, 13.0, 7.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4925731420516968, -0.4781525135040283, -0.4637318551540375, -0.449311226606369, -0.4348905682563782, -0.4204699397087097, -0.40604931116104126, -0.3916286826133728, -0.37720802426338196, -0.3627873957157135, -0.34836673736572266, -0.3339461088180542, -0.31952548027038574, -0.3051048219203949, -0.29068419337272644, -0.2762635350227356, -0.26184290647506714, -0.2474222630262375, -0.23300161957740784, -0.21858099102973938, -0.20416034758090973, -0.18973970413208008, -0.17531907558441162, -0.16089843213558197, -0.14647778868675232, -0.13205714523792267, -0.11763650923967361, -0.10321587324142456, -0.08879522979259491, -0.07437458634376526, -0.059953950345516205, -0.04553331434726715, -0.0311126708984375, -0.016692031174898148, -0.002271391451358795, 0.012149248272180557, 0.02656988799571991, 0.04099053144454956, 0.055411167442798615, 0.06983180344104767, 0.08425244688987732, 0.09867309033870697, 0.11309372633695602, 0.12751436233520508, 0.14193500578403473, 0.15635564923286438, 0.17077627778053284, 0.1851969212293625, 0.19961756467819214, 0.2140382081270218, 0.22845885157585144, 0.2428794801235199, 0.25730013847351074, 0.2717207670211792, 0.28614139556884766, 0.3005620241165161, 0.31498268246650696, 0.3294033110141754, 0.34382396936416626, 0.3582445979118347, 0.3726652264595032, 0.387085884809494, 0.4015065133571625, 0.4159271717071533, 0.4303478002548218]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 8.0, 4.0, 6.0, 11.0, 6.0, 12.0, 13.0, 13.0, 19.0, 14.0, 29.0, 29.0, 44.0, 84.0, 108.0, 158.0, 193.0, 298.0, 391.0, 689.0, 1139.0, 2135.0, 4600.0, 11840.0, 66490.0, 881425.0, 58016.0, 11193.0, 4244.0, 2064.0, 1156.0, 685.0, 408.0, 278.0, 221.0, 138.0, 100.0, 72.0, 58.0, 32.0, 27.0, 22.0, 16.0, 8.0, 11.0, 13.0, 12.0, 3.0, 7.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.2125244140625, -0.20577239990234375, -0.1990203857421875, -0.19226837158203125, -0.185516357421875, -0.17876434326171875, -0.1720123291015625, -0.16526031494140625, -0.15850830078125, -0.15175628662109375, -0.1450042724609375, -0.13825225830078125, -0.131500244140625, -0.12474822998046875, -0.1179962158203125, -0.11124420166015625, -0.1044921875, -0.09774017333984375, -0.0909881591796875, -0.08423614501953125, -0.077484130859375, -0.07073211669921875, -0.0639801025390625, -0.05722808837890625, -0.05047607421875, -0.04372406005859375, -0.0369720458984375, -0.03022003173828125, -0.023468017578125, -0.01671600341796875, -0.0099639892578125, -0.00321197509765625, 0.0035400390625, 0.01029205322265625, 0.0170440673828125, 0.02379608154296875, 0.030548095703125, 0.03730010986328125, 0.0440521240234375, 0.05080413818359375, 0.05755615234375, 0.06430816650390625, 0.0710601806640625, 0.07781219482421875, 0.084564208984375, 0.09131622314453125, 0.0980682373046875, 0.10482025146484375, 0.111572265625, 0.11832427978515625, 0.1250762939453125, 0.13182830810546875, 0.138580322265625, 0.14533233642578125, 0.1520843505859375, 0.15883636474609375, 0.16558837890625, 0.17234039306640625, 0.1790924072265625, 0.18584442138671875, 0.192596435546875, 0.19934844970703125, 0.2061004638671875, 0.21285247802734375, 0.2196044921875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 8.0, 7.0, 7.0, 14.0, 22.0, 65.0, 151.0, 210.0, 209.0, 161.0, 54.0, 24.0, 13.0, 2.0, 8.0, 4.0, 8.0, 2.0, 3.0, 7.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0200347900390625, -0.01944565773010254, -0.018856525421142578, -0.018267393112182617, -0.017678260803222656, -0.017089128494262695, -0.016499996185302734, -0.015910863876342773, -0.015321731567382812, -0.014732599258422852, -0.01414346694946289, -0.01355433464050293, -0.012965202331542969, -0.012376070022583008, -0.011786937713623047, -0.011197805404663086, -0.010608673095703125, -0.010019540786743164, -0.009430408477783203, -0.008841276168823242, -0.008252143859863281, -0.00766301155090332, -0.007073879241943359, -0.0064847469329833984, -0.0058956146240234375, -0.0053064823150634766, -0.004717350006103516, -0.004128217697143555, -0.0035390853881835938, -0.002949953079223633, -0.002360820770263672, -0.001771688461303711, -0.00118255615234375, -0.0005934238433837891, -4.291534423828125e-06, 0.0005848407745361328, 0.0011739730834960938, 0.0017631053924560547, 0.0023522377014160156, 0.0029413700103759766, 0.0035305023193359375, 0.0041196346282958984, 0.004708766937255859, 0.00529789924621582, 0.005887031555175781, 0.006476163864135742, 0.007065296173095703, 0.007654428482055664, 0.008243560791015625, 0.008832693099975586, 0.009421825408935547, 0.010010957717895508, 0.010600090026855469, 0.01118922233581543, 0.01177835464477539, 0.012367486953735352, 0.012956619262695312, 0.013545751571655273, 0.014134883880615234, 0.014724016189575195, 0.015313148498535156, 0.015902280807495117, 0.016491413116455078, 0.01708054542541504, 0.017669677734375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 10.0, 7.0, 10.0, 9.0, 13.0, 17.0, 26.0, 33.0, 55.0, 57.0, 107.0, 164.0, 231.0, 374.0, 720.0, 1356.0, 3316.0, 10414.0, 67818.0, 855603.0, 89196.0, 12029.0, 3652.0, 1496.0, 716.0, 390.0, 196.0, 150.0, 96.0, 74.0, 42.0, 45.0, 30.0, 28.0, 18.0, 19.0, 9.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.27392578125, -0.26465606689453125, -0.2553863525390625, -0.24611663818359375, -0.236846923828125, -0.22757720947265625, -0.2183074951171875, -0.20903778076171875, -0.19976806640625, -0.19049835205078125, -0.1812286376953125, -0.17195892333984375, -0.162689208984375, -0.15341949462890625, -0.1441497802734375, -0.13488006591796875, -0.1256103515625, -0.11634063720703125, -0.1070709228515625, -0.09780120849609375, -0.088531494140625, -0.07926177978515625, -0.0699920654296875, -0.06072235107421875, -0.05145263671875, -0.04218292236328125, -0.0329132080078125, -0.02364349365234375, -0.014373779296875, -0.00510406494140625, 0.0041656494140625, 0.01343536376953125, 0.022705078125, 0.03197479248046875, 0.0412445068359375, 0.05051422119140625, 0.059783935546875, 0.06905364990234375, 0.0783233642578125, 0.08759307861328125, 0.09686279296875, 0.10613250732421875, 0.1154022216796875, 0.12467193603515625, 0.133941650390625, 0.14321136474609375, 0.1524810791015625, 0.16175079345703125, 0.1710205078125, 0.18029022216796875, 0.1895599365234375, 0.19882965087890625, 0.208099365234375, 0.21736907958984375, 0.2266387939453125, 0.23590850830078125, 0.24517822265625, 0.25444793701171875, 0.2637176513671875, 0.27298736572265625, 0.282257080078125, 0.29152679443359375, 0.3007965087890625, 0.31006622314453125, 0.3193359375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 3.0, 6.0, 4.0, 5.0, 6.0, 8.0, 9.0, 14.0, 11.0, 11.0, 19.0, 25.0, 20.0, 19.0, 45.0, 31.0, 35.0, 36.0, 25.0, 39.0, 52.0, 43.0, 41.0, 36.0, 44.0, 37.0, 38.0, 41.0, 38.0, 31.0, 34.0, 35.0, 21.0, 23.0, 22.0, 13.0, 21.0, 14.0, 6.0, 14.0, 7.0, 7.0, 2.0, 2.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.0758056640625, -0.07359504699707031, -0.07138442993164062, -0.06917381286621094, -0.06696319580078125, -0.06475257873535156, -0.06254196166992188, -0.06033134460449219, -0.0581207275390625, -0.05591011047363281, -0.053699493408203125, -0.05148887634277344, -0.04927825927734375, -0.04706764221191406, -0.044857025146484375, -0.04264640808105469, -0.040435791015625, -0.03822517395019531, -0.036014556884765625, -0.03380393981933594, -0.03159332275390625, -0.029382705688476562, -0.027172088623046875, -0.024961471557617188, -0.0227508544921875, -0.020540237426757812, -0.018329620361328125, -0.016119003295898438, -0.01390838623046875, -0.011697769165039062, -0.009487152099609375, -0.0072765350341796875, -0.00506591796875, -0.0028553009033203125, -0.000644683837890625, 0.0015659332275390625, 0.00377655029296875, 0.0059871673583984375, 0.008197784423828125, 0.010408401489257812, 0.0126190185546875, 0.014829635620117188, 0.017040252685546875, 0.019250869750976562, 0.02146148681640625, 0.023672103881835938, 0.025882720947265625, 0.028093338012695312, 0.030303955078125, 0.03251457214355469, 0.034725189208984375, 0.03693580627441406, 0.03914642333984375, 0.04135704040527344, 0.043567657470703125, 0.04577827453613281, 0.0479888916015625, 0.05019950866699219, 0.052410125732421875, 0.05462074279785156, 0.05683135986328125, 0.05904197692871094, 0.061252593994140625, 0.06346321105957031, 0.065673828125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 12.0, 31.0, 34.0, 91.0, 275.0, 1006.0, 8241.0, 1021915.0, 15017.0, 1327.0, 360.0, 109.0, 46.0, 28.0, 17.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96533203125, -0.9337692260742188, -0.9022064208984375, -0.8706436157226562, -0.839080810546875, -0.8075180053710938, -0.7759552001953125, -0.7443923950195312, -0.71282958984375, -0.6812667846679688, -0.6497039794921875, -0.6181411743164062, -0.586578369140625, -0.5550155639648438, -0.5234527587890625, -0.49188995361328125, -0.4603271484375, -0.42876434326171875, -0.3972015380859375, -0.36563873291015625, -0.334075927734375, -0.30251312255859375, -0.2709503173828125, -0.23938751220703125, -0.20782470703125, -0.17626190185546875, -0.1446990966796875, -0.11313629150390625, -0.081573486328125, -0.05001068115234375, -0.0184478759765625, 0.01311492919921875, 0.044677734375, 0.07624053955078125, 0.1078033447265625, 0.13936614990234375, 0.170928955078125, 0.20249176025390625, 0.2340545654296875, 0.26561737060546875, 0.29718017578125, 0.32874298095703125, 0.3603057861328125, 0.39186859130859375, 0.423431396484375, 0.45499420166015625, 0.4865570068359375, 0.5181198120117188, 0.5496826171875, 0.5812454223632812, 0.6128082275390625, 0.6443710327148438, 0.675933837890625, 0.7074966430664062, 0.7390594482421875, 0.7706222534179688, 0.80218505859375, 0.8337478637695312, 0.8653106689453125, 0.8968734741210938, 0.928436279296875, 0.9599990844726562, 0.9915618896484375, 1.0231246948242188, 1.0546875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 6.0, 2.0, 0.0, 0.0, 6.0, 9.0, 8.0, 11.0, 10.0, 18.0, 29.0, 32.0, 45.0, 83.0, 103.0, 225.0, 151.0, 76.0, 54.0, 34.0, 25.0, 21.0, 13.0, 13.0, 8.0, 10.0, 4.0, 1.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015592575073242188, -0.00015178881585597992, -0.00014765188097953796, -0.000143514946103096, -0.00013937801122665405, -0.0001352410763502121, -0.00013110414147377014, -0.00012696720659732819, -0.00012283027172088623, -0.00011869333684444427, -0.00011455640196800232, -0.00011041946709156036, -0.00010628253221511841, -0.00010214559733867645, -9.80086624622345e-05, -9.387172758579254e-05, -8.973479270935059e-05, -8.559785783290863e-05, -8.146092295646667e-05, -7.732398808002472e-05, -7.318705320358276e-05, -6.905011832714081e-05, -6.491318345069885e-05, -6.07762485742569e-05, -5.663931369781494e-05, -5.2502378821372986e-05, -4.836544394493103e-05, -4.4228509068489075e-05, -4.009157419204712e-05, -3.5954639315605164e-05, -3.181770443916321e-05, -2.7680769562721252e-05, -2.3543834686279297e-05, -1.940689980983734e-05, -1.5269964933395386e-05, -1.113303005695343e-05, -6.996095180511475e-06, -2.859160304069519e-06, 1.2777745723724365e-06, 5.414709448814392e-06, 9.551644325256348e-06, 1.3688579201698303e-05, 1.782551407814026e-05, 2.1962448954582214e-05, 2.609938383102417e-05, 3.0236318707466125e-05, 3.437325358390808e-05, 3.851018846035004e-05, 4.264712333679199e-05, 4.678405821323395e-05, 5.09209930896759e-05, 5.505792796611786e-05, 5.9194862842559814e-05, 6.333179771900177e-05, 6.746873259544373e-05, 7.160566747188568e-05, 7.574260234832764e-05, 7.987953722476959e-05, 8.401647210121155e-05, 8.81534069776535e-05, 9.229034185409546e-05, 9.642727673053741e-05, 0.00010056421160697937, 0.00010470114648342133, 0.00010883808135986328]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 6.0, 3.0, 13.0, 25.0, 29.0, 44.0, 93.0, 155.0, 317.0, 1029.0, 5976.0, 993255.0, 44182.0, 2275.0, 615.0, 238.0, 109.0, 61.0, 34.0, 29.0, 9.0, 15.0, 16.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0458984375, -1.010772705078125, -0.97564697265625, -0.940521240234375, -0.9053955078125, -0.870269775390625, -0.83514404296875, -0.800018310546875, -0.764892578125, -0.729766845703125, -0.69464111328125, -0.659515380859375, -0.6243896484375, -0.589263916015625, -0.55413818359375, -0.519012451171875, -0.48388671875, -0.448760986328125, -0.41363525390625, -0.378509521484375, -0.3433837890625, -0.308258056640625, -0.27313232421875, -0.238006591796875, -0.202880859375, -0.167755126953125, -0.13262939453125, -0.097503662109375, -0.0623779296875, -0.027252197265625, 0.00787353515625, 0.042999267578125, 0.078125, 0.113250732421875, 0.14837646484375, 0.183502197265625, 0.2186279296875, 0.253753662109375, 0.28887939453125, 0.324005126953125, 0.359130859375, 0.394256591796875, 0.42938232421875, 0.464508056640625, 0.4996337890625, 0.534759521484375, 0.56988525390625, 0.605010986328125, 0.64013671875, 0.675262451171875, 0.71038818359375, 0.745513916015625, 0.7806396484375, 0.815765380859375, 0.85089111328125, 0.886016845703125, 0.921142578125, 0.956268310546875, 0.99139404296875, 1.026519775390625, 1.0616455078125, 1.096771240234375, 1.13189697265625, 1.167022705078125, 1.2021484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 10.0, 4.0, 13.0, 7.0, 13.0, 24.0, 26.0, 33.0, 53.0, 100.0, 229.0, 206.0, 119.0, 64.0, 28.0, 21.0, 17.0, 5.0, 4.0, 10.0, 4.0, 8.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.217041015625, -0.21085166931152344, -0.20466232299804688, -0.1984729766845703, -0.19228363037109375, -0.1860942840576172, -0.17990493774414062, -0.17371559143066406, -0.1675262451171875, -0.16133689880371094, -0.15514755249023438, -0.1489582061767578, -0.14276885986328125, -0.1365795135498047, -0.13039016723632812, -0.12420082092285156, -0.118011474609375, -0.11182212829589844, -0.10563278198242188, -0.09944343566894531, -0.09325408935546875, -0.08706474304199219, -0.08087539672851562, -0.07468605041503906, -0.0684967041015625, -0.06230735778808594, -0.056118011474609375, -0.04992866516113281, -0.04373931884765625, -0.03754997253417969, -0.031360626220703125, -0.025171279907226562, -0.01898193359375, -0.012792587280273438, -0.006603240966796875, -0.0004138946533203125, 0.00577545166015625, 0.011964797973632812, 0.018154144287109375, 0.024343490600585938, 0.0305328369140625, 0.03672218322753906, 0.042911529541015625, 0.04910087585449219, 0.05529022216796875, 0.06147956848144531, 0.06766891479492188, 0.07385826110839844, 0.080047607421875, 0.08623695373535156, 0.09242630004882812, 0.09861564636230469, 0.10480499267578125, 0.11099433898925781, 0.11718368530273438, 0.12337303161621094, 0.1295623779296875, 0.13575172424316406, 0.14194107055664062, 0.1481304168701172, 0.15431976318359375, 0.1605091094970703, 0.16669845581054688, 0.17288780212402344, 0.1790771484375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 6.0, 8.0, 14.0, 15.0, 42.0, 97.0, 258.0, 366.0, 116.0, 36.0, 13.0, 5.0, 4.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0346312522888184, -2.9611363410949707, -2.887641429901123, -2.8141462802886963, -2.7406513690948486, -2.667156457901001, -2.593661308288574, -2.5201663970947266, -2.446671485900879, -2.3731765747070312, -2.2996816635131836, -2.226186513900757, -2.152691602706909, -2.0791966915130615, -2.0057015419006348, -1.932206630706787, -1.8587117195129395, -1.7852168083190918, -1.7117217779159546, -1.6382267475128174, -1.5647318363189697, -1.491236925125122, -1.4177418947219849, -1.3442468643188477, -1.270751953125, -1.1972570419311523, -1.1237620115280151, -1.050266981124878, -0.9767720699310303, -0.9032770991325378, -0.8297821283340454, -0.756287157535553, -0.6827919483184814, -0.609296977519989, -0.5358020067214966, -0.46230703592300415, -0.3888120651245117, -0.3153170943260193, -0.24182212352752686, -0.16832715272903442, -0.09483218193054199, -0.02133721113204956, 0.05215775966644287, 0.1256527304649353, 0.19914770126342773, 0.27264267206192017, 0.3461376428604126, 0.41963261365890503, 0.49312758445739746, 0.5666225552558899, 0.6401175260543823, 0.7136124968528748, 0.7871074676513672, 0.8606024384498596, 0.934097409248352, 1.0075924396514893, 1.081087350845337, 1.1545822620391846, 1.2280772924423218, 1.301572322845459, 1.3750672340393066, 1.4485621452331543, 1.5220571756362915, 1.5955522060394287, 1.6690471172332764]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 4.0, 3.0, 1.0, 6.0, 5.0, 7.0, 4.0, 10.0, 5.0, 24.0, 39.0, 50.0, 70.0, 87.0, 90.0, 96.0, 94.0, 104.0, 67.0, 67.0, 53.0, 30.0, 15.0, 18.0, 9.0, 10.0, 9.0, 7.0, 4.0, 3.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3302381038665771, -1.2897822856903076, -1.249326467514038, -1.2088706493377686, -1.168414831161499, -1.1279590129852295, -1.08750319480896, -1.04704749584198, -1.0065916776657104, -0.9661358594894409, -0.9256800413131714, -0.8852242231369019, -0.8447684645652771, -0.8043126463890076, -0.763856828212738, -0.7234010696411133, -0.682945191860199, -0.6424893736839294, -0.6020335555076599, -0.5615777969360352, -0.5211219787597656, -0.4806661605834961, -0.44021034240722656, -0.3997545540332794, -0.3592987358570099, -0.31884291768074036, -0.2783871293067932, -0.23793131113052368, -0.19747550785541534, -0.157019704580307, -0.11656388640403748, -0.07610809803009033, -0.0356522798538208, 0.004803527146577835, 0.04525933414697647, 0.0857151448726654, 0.12617094814777374, 0.16662675142288208, 0.2070825695991516, 0.24753835797309875, 0.2879941761493683, 0.3284499943256378, 0.36890578269958496, 0.4093616008758545, 0.449817419052124, 0.49027320742607117, 0.5307290554046631, 0.5711848139762878, 0.6116406321525574, 0.6520964503288269, 0.6925522685050964, 0.7330080270767212, 0.7734638452529907, 0.8139196634292603, 0.8543754816055298, 0.8948312997817993, 0.9352871179580688, 0.9757429361343384, 1.016198754310608, 1.0566545724868774, 1.097110390663147, 1.137566089630127, 1.1780219078063965, 1.218477725982666, 1.2589335441589355]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 2.0, 6.0, 12.0, 18.0, 19.0, 47.0, 97.0, 1190.0, 4173175.0, 19108.0, 400.0, 81.0, 39.0, 26.0, 14.0, 16.0, 6.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9453125, -13.3819580078125, -12.818603515625, -12.2552490234375, -11.69189453125, -11.1285400390625, -10.565185546875, -10.0018310546875, -9.4384765625, -8.8751220703125, -8.311767578125, -7.7484130859375, -7.18505859375, -6.6217041015625, -6.058349609375, -5.4949951171875, -4.931640625, -4.3682861328125, -3.804931640625, -3.2415771484375, -2.67822265625, -2.1148681640625, -1.551513671875, -0.9881591796875, -0.4248046875, 0.1385498046875, 0.701904296875, 1.2652587890625, 1.82861328125, 2.3919677734375, 2.955322265625, 3.5186767578125, 4.08203125, 4.6453857421875, 5.208740234375, 5.7720947265625, 6.33544921875, 6.8988037109375, 7.462158203125, 8.0255126953125, 8.5888671875, 9.1522216796875, 9.715576171875, 10.2789306640625, 10.84228515625, 11.4056396484375, 11.968994140625, 12.5323486328125, 13.095703125, 13.6590576171875, 14.222412109375, 14.7857666015625, 15.34912109375, 15.9124755859375, 16.475830078125, 17.0391845703125, 17.6025390625, 18.1658935546875, 18.729248046875, 19.2926025390625, 19.85595703125, 20.4193115234375, 20.982666015625, 21.5460205078125, 22.109375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 4.0, 9.0, 11.0, 20.0, 51.0, 90.0, 136.0, 150.0, 145.0, 151.0, 81.0, 47.0, 26.0, 20.0, 7.0, 2.0, 7.0, 8.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0134429931640625, -0.012964963912963867, -0.012486934661865234, -0.012008905410766602, -0.011530876159667969, -0.011052846908569336, -0.010574817657470703, -0.01009678840637207, -0.009618759155273438, -0.009140729904174805, -0.008662700653076172, -0.008184671401977539, -0.007706642150878906, -0.0072286128997802734, -0.006750583648681641, -0.006272554397583008, -0.005794525146484375, -0.005316495895385742, -0.004838466644287109, -0.0043604373931884766, -0.0038824081420898438, -0.003404378890991211, -0.002926349639892578, -0.0024483203887939453, -0.0019702911376953125, -0.0014922618865966797, -0.0010142326354980469, -0.0005362033843994141, -5.817413330078125e-05, 0.00041985511779785156, 0.0008978843688964844, 0.0013759136199951172, 0.00185394287109375, 0.002331972122192383, 0.0028100013732910156, 0.0032880306243896484, 0.0037660598754882812, 0.004244089126586914, 0.004722118377685547, 0.00520014762878418, 0.0056781768798828125, 0.006156206130981445, 0.006634235382080078, 0.007112264633178711, 0.007590293884277344, 0.008068323135375977, 0.00854635238647461, 0.009024381637573242, 0.009502410888671875, 0.009980440139770508, 0.01045846939086914, 0.010936498641967773, 0.011414527893066406, 0.011892557144165039, 0.012370586395263672, 0.012848615646362305, 0.013326644897460938, 0.01380467414855957, 0.014282703399658203, 0.014760732650756836, 0.015238761901855469, 0.0157167911529541, 0.016194820404052734, 0.016672849655151367, 0.01715087890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 3.0, 1.0, 7.0, 8.0, 2.0, 3.0, 9.0, 8.0, 10.0, 6.0, 15.0, 18.0, 15.0, 15.0, 20.0, 35.0, 41.0, 54.0, 89.0, 92.0, 127.0, 129.0, 212.0, 445.0, 2275.0, 154223.0, 4032514.0, 3239.0, 366.0, 119.0, 64.0, 51.0, 22.0, 15.0, 5.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.578125, -4.466827392578125, -4.35552978515625, -4.244232177734375, -4.1329345703125, -4.021636962890625, -3.91033935546875, -3.799041748046875, -3.687744140625, -3.576446533203125, -3.46514892578125, -3.353851318359375, -3.2425537109375, -3.131256103515625, -3.01995849609375, -2.908660888671875, -2.79736328125, -2.686065673828125, -2.57476806640625, -2.463470458984375, -2.3521728515625, -2.240875244140625, -2.12957763671875, -2.018280029296875, -1.906982421875, -1.795684814453125, -1.68438720703125, -1.573089599609375, -1.4617919921875, -1.350494384765625, -1.23919677734375, -1.127899169921875, -1.0166015625, -0.905303955078125, -0.79400634765625, -0.682708740234375, -0.5714111328125, -0.460113525390625, -0.34881591796875, -0.237518310546875, -0.126220703125, -0.014923095703125, 0.09637451171875, 0.207672119140625, 0.3189697265625, 0.430267333984375, 0.54156494140625, 0.652862548828125, 0.76416015625, 0.875457763671875, 0.98675537109375, 1.098052978515625, 1.2093505859375, 1.320648193359375, 1.43194580078125, 1.543243408203125, 1.654541015625, 1.765838623046875, 1.87713623046875, 1.988433837890625, 2.0997314453125, 2.211029052734375, 2.32232666015625, 2.433624267578125, 2.544921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 2.0, 9.0, 12.0, 8.0, 18.0, 22.0, 30.0, 40.0, 50.0, 89.0, 156.0, 244.0, 354.0, 623.0, 1434.0, 468.0, 243.0, 106.0, 52.0, 35.0, 21.0, 9.0, 9.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.084716796875, -0.08272171020507812, -0.08072662353515625, -0.07873153686523438, -0.0767364501953125, -0.07474136352539062, -0.07274627685546875, -0.07075119018554688, -0.068756103515625, -0.06676101684570312, -0.06476593017578125, -0.06277084350585938, -0.0607757568359375, -0.058780670166015625, -0.05678558349609375, -0.054790496826171875, -0.05279541015625, -0.050800323486328125, -0.04880523681640625, -0.046810150146484375, -0.0448150634765625, -0.042819976806640625, -0.04082489013671875, -0.038829803466796875, -0.036834716796875, -0.034839630126953125, -0.03284454345703125, -0.030849456787109375, -0.0288543701171875, -0.026859283447265625, -0.02486419677734375, -0.022869110107421875, -0.0208740234375, -0.018878936767578125, -0.01688385009765625, -0.014888763427734375, -0.0128936767578125, -0.010898590087890625, -0.00890350341796875, -0.006908416748046875, -0.004913330078125, -0.002918243408203125, -0.00092315673828125, 0.001071929931640625, 0.0030670166015625, 0.005062103271484375, 0.00705718994140625, 0.009052276611328125, 0.01104736328125, 0.013042449951171875, 0.01503753662109375, 0.017032623291015625, 0.0190277099609375, 0.021022796630859375, 0.02301788330078125, 0.025012969970703125, 0.027008056640625, 0.029003143310546875, 0.03099822998046875, 0.032993316650390625, 0.0349884033203125, 0.036983489990234375, 0.03897857666015625, 0.040973663330078125, 0.04296875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 4.0, 4.0, 7.0, 13.0, 19.0, 15.0, 34.0, 63.0, 78.0, 139.0, 326.0, 193.0, 65.0, 17.0, 7.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.295771837234497, -2.2316861152648926, -2.167600393295288, -2.1035146713256836, -2.0394287109375, -1.9753429889678955, -1.911257266998291, -1.8471715450286865, -1.783085823059082, -1.7190001010894775, -1.6549142599105835, -1.590828537940979, -1.5267428159713745, -1.4626569747924805, -1.398571252822876, -1.3344855308532715, -1.2703996896743774, -1.206313967704773, -1.142228126525879, -1.0781424045562744, -1.01405668258667, -0.9499709010124207, -0.8858851194381714, -0.8217993974685669, -0.7577136158943176, -0.6936278343200684, -0.6295421123504639, -0.5654563307762146, -0.5013705492019653, -0.43728482723236084, -0.3731990456581116, -0.3091132938861847, -0.24502742290496826, -0.18094167113304138, -0.11685590445995331, -0.052770137786865234, 0.011315613985061646, 0.07540136575698853, 0.1394871473312378, 0.20357289910316467, 0.26765865087509155, 0.33174440264701843, 0.3958301544189453, 0.4599159359931946, 0.5240017175674438, 0.5880874395370483, 0.6521732211112976, 0.7162590026855469, 0.7803447246551514, 0.8444305062294006, 0.9085162281990051, 0.9726020097732544, 1.0366877317428589, 1.100773572921753, 1.1648592948913574, 1.228945016860962, 1.2930307388305664, 1.357116460800171, 1.421202301979065, 1.4852880239486694, 1.549373745918274, 1.613459587097168, 1.6775453090667725, 1.741631031036377, 1.805716872215271]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 11.0, 7.0, 8.0, 13.0, 21.0, 20.0, 26.0, 39.0, 44.0, 50.0, 71.0, 61.0, 67.0, 66.0, 69.0, 63.0, 66.0, 57.0, 48.0, 30.0, 36.0, 24.0, 24.0, 14.0, 9.0, 11.0, 7.0, 7.0, 2.0, 7.0, 3.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8349093794822693, -0.7996223568916321, -0.7643353343009949, -0.7290483117103577, -0.6937612891197205, -0.6584742665290833, -0.6231873035430908, -0.5879002809524536, -0.5526132583618164, -0.5173262357711792, -0.482039213180542, -0.4467521905899048, -0.4114651679992676, -0.37617814540863037, -0.34089115262031555, -0.30560413002967834, -0.27031707763671875, -0.23503005504608154, -0.19974303245544434, -0.16445602476596832, -0.12916900217533112, -0.09388197958469391, -0.058594971895217896, -0.02330794930458069, 0.011979073286056519, 0.04726609215140343, 0.08255311101675034, 0.11784012615680695, 0.15312714874744415, 0.18841417133808136, 0.22370117902755737, 0.2589882016181946, 0.294275164604187, 0.3295621871948242, 0.3648492097854614, 0.40013623237609863, 0.43542325496673584, 0.47071027755737305, 0.5059973001480103, 0.5412843227386475, 0.5765713453292847, 0.6118583679199219, 0.6471453905105591, 0.6824324131011963, 0.7177194356918335, 0.7530064582824707, 0.7882934808731079, 0.8235805034637451, 0.8588674664497375, 0.8941544890403748, 0.929441511631012, 0.9647285342216492, 1.0000154972076416, 1.0353025197982788, 1.070589542388916, 1.1058765649795532, 1.1411635875701904, 1.1764506101608276, 1.2117376327514648, 1.247024655342102, 1.2823116779327393, 1.3175987005233765, 1.3528857231140137, 1.3881727457046509, 1.423459768295288]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 9.0, 9.0, 11.0, 9.0, 12.0, 21.0, 24.0, 34.0, 48.0, 70.0, 86.0, 128.0, 197.0, 304.0, 499.0, 856.0, 1488.0, 2743.0, 5039.0, 11057.0, 27104.0, 85720.0, 484511.0, 319894.0, 66565.0, 22183.0, 9480.0, 4493.0, 2458.0, 1338.0, 790.0, 462.0, 280.0, 188.0, 127.0, 92.0, 61.0, 42.0, 34.0, 25.0, 16.0, 10.0, 10.0, 8.0, 10.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.39111328125, -0.3792266845703125, -0.367340087890625, -0.3554534912109375, -0.34356689453125, -0.3316802978515625, -0.319793701171875, -0.3079071044921875, -0.2960205078125, -0.2841339111328125, -0.272247314453125, -0.2603607177734375, -0.24847412109375, -0.2365875244140625, -0.224700927734375, -0.2128143310546875, -0.200927734375, -0.1890411376953125, -0.177154541015625, -0.1652679443359375, -0.15338134765625, -0.1414947509765625, -0.129608154296875, -0.1177215576171875, -0.1058349609375, -0.0939483642578125, -0.082061767578125, -0.0701751708984375, -0.05828857421875, -0.0464019775390625, -0.034515380859375, -0.0226287841796875, -0.0107421875, 0.0011444091796875, 0.013031005859375, 0.0249176025390625, 0.03680419921875, 0.0486907958984375, 0.060577392578125, 0.0724639892578125, 0.0843505859375, 0.0962371826171875, 0.108123779296875, 0.1200103759765625, 0.13189697265625, 0.1437835693359375, 0.155670166015625, 0.1675567626953125, 0.179443359375, 0.1913299560546875, 0.203216552734375, 0.2151031494140625, 0.22698974609375, 0.2388763427734375, 0.250762939453125, 0.2626495361328125, 0.2745361328125, 0.2864227294921875, 0.298309326171875, 0.3101959228515625, 0.32208251953125, 0.3339691162109375, 0.345855712890625, 0.3577423095703125, 0.36962890625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 10.0, 7.0, 9.0, 11.0, 23.0, 26.0, 29.0, 54.0, 79.0, 115.0, 88.0, 101.0, 113.0, 65.0, 86.0, 52.0, 46.0, 26.0, 12.0, 7.0, 11.0, 14.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0170135498046875, -0.01631641387939453, -0.015619277954101562, -0.014922142028808594, -0.014225006103515625, -0.013527870178222656, -0.012830734252929688, -0.012133598327636719, -0.01143646240234375, -0.010739326477050781, -0.010042190551757812, -0.009345054626464844, -0.008647918701171875, -0.007950782775878906, -0.0072536468505859375, -0.006556510925292969, -0.005859375, -0.005162239074707031, -0.0044651031494140625, -0.0037679672241210938, -0.003070831298828125, -0.0023736953735351562, -0.0016765594482421875, -0.0009794235229492188, -0.00028228759765625, 0.00041484832763671875, 0.0011119842529296875, 0.0018091201782226562, 0.002506256103515625, 0.0032033920288085938, 0.0039005279541015625, 0.004597663879394531, 0.0052947998046875, 0.005991935729980469, 0.0066890716552734375, 0.007386207580566406, 0.008083343505859375, 0.008780479431152344, 0.009477615356445312, 0.010174751281738281, 0.01087188720703125, 0.011569023132324219, 0.012266159057617188, 0.012963294982910156, 0.013660430908203125, 0.014357566833496094, 0.015054702758789062, 0.01575183868408203, 0.016448974609375, 0.01714611053466797, 0.017843246459960938, 0.018540382385253906, 0.019237518310546875, 0.019934654235839844, 0.020631790161132812, 0.02132892608642578, 0.02202606201171875, 0.02272319793701172, 0.023420333862304688, 0.024117469787597656, 0.024814605712890625, 0.025511741638183594, 0.026208877563476562, 0.02690601348876953, 0.0276031494140625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 5.0, 6.0, 6.0, 16.0, 13.0, 17.0, 23.0, 19.0, 35.0, 36.0, 57.0, 100.0, 359.0, 5770.0, 1013646.0, 27126.0, 826.0, 163.0, 72.0, 58.0, 42.0, 35.0, 31.0, 19.0, 17.0, 13.0, 6.0, 15.0, 7.0, 7.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.580078125, -1.526824951171875, -1.47357177734375, -1.420318603515625, -1.3670654296875, -1.313812255859375, -1.26055908203125, -1.207305908203125, -1.154052734375, -1.100799560546875, -1.04754638671875, -0.994293212890625, -0.9410400390625, -0.887786865234375, -0.83453369140625, -0.781280517578125, -0.72802734375, -0.674774169921875, -0.62152099609375, -0.568267822265625, -0.5150146484375, -0.461761474609375, -0.40850830078125, -0.355255126953125, -0.302001953125, -0.248748779296875, -0.19549560546875, -0.142242431640625, -0.0889892578125, -0.035736083984375, 0.01751708984375, 0.070770263671875, 0.1240234375, 0.177276611328125, 0.23052978515625, 0.283782958984375, 0.3370361328125, 0.390289306640625, 0.44354248046875, 0.496795654296875, 0.550048828125, 0.603302001953125, 0.65655517578125, 0.709808349609375, 0.7630615234375, 0.816314697265625, 0.86956787109375, 0.922821044921875, 0.97607421875, 1.029327392578125, 1.08258056640625, 1.135833740234375, 1.1890869140625, 1.242340087890625, 1.29559326171875, 1.348846435546875, 1.402099609375, 1.455352783203125, 1.50860595703125, 1.561859130859375, 1.6151123046875, 1.668365478515625, 1.72161865234375, 1.774871826171875, 1.828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 7.0, 13.0, 19.0, 15.0, 20.0, 19.0, 33.0, 26.0, 43.0, 48.0, 50.0, 49.0, 52.0, 57.0, 56.0, 50.0, 57.0, 56.0, 46.0, 43.0, 45.0, 37.0, 28.0, 27.0, 14.0, 22.0, 18.0, 9.0, 12.0, 5.0, 4.0, 7.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08477783203125, -0.08186912536621094, -0.07896041870117188, -0.07605171203613281, -0.07314300537109375, -0.07023429870605469, -0.06732559204101562, -0.06441688537597656, -0.0615081787109375, -0.05859947204589844, -0.055690765380859375, -0.05278205871582031, -0.04987335205078125, -0.04696464538574219, -0.044055938720703125, -0.04114723205566406, -0.038238525390625, -0.03532981872558594, -0.032421112060546875, -0.029512405395507812, -0.02660369873046875, -0.023694992065429688, -0.020786285400390625, -0.017877578735351562, -0.0149688720703125, -0.012060165405273438, -0.009151458740234375, -0.0062427520751953125, -0.00333404541015625, -0.0004253387451171875, 0.002483367919921875, 0.0053920745849609375, 0.00830078125, 0.011209487915039062, 0.014118194580078125, 0.017026901245117188, 0.01993560791015625, 0.022844314575195312, 0.025753021240234375, 0.028661727905273438, 0.0315704345703125, 0.03447914123535156, 0.037387847900390625, 0.04029655456542969, 0.04320526123046875, 0.04611396789550781, 0.049022674560546875, 0.05193138122558594, 0.054840087890625, 0.05774879455566406, 0.060657501220703125, 0.06356620788574219, 0.06647491455078125, 0.06938362121582031, 0.07229232788085938, 0.07520103454589844, 0.0781097412109375, 0.08101844787597656, 0.08392715454101562, 0.08683586120605469, 0.08974456787109375, 0.09265327453613281, 0.09556198120117188, 0.09847068786621094, 0.10137939453125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 2.0, 4.0, 15.0, 36.0, 116.0, 596.0, 9998.0, 1035103.0, 2285.0, 244.0, 63.0, 25.0, 18.0, 7.0, 3.0, 7.0, 3.0, 6.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.1953125, -4.007080078125, -3.81884765625, -3.630615234375, -3.4423828125, -3.254150390625, -3.06591796875, -2.877685546875, -2.689453125, -2.501220703125, -2.31298828125, -2.124755859375, -1.9365234375, -1.748291015625, -1.56005859375, -1.371826171875, -1.18359375, -0.995361328125, -0.80712890625, -0.618896484375, -0.4306640625, -0.242431640625, -0.05419921875, 0.134033203125, 0.322265625, 0.510498046875, 0.69873046875, 0.886962890625, 1.0751953125, 1.263427734375, 1.45166015625, 1.639892578125, 1.828125, 2.016357421875, 2.20458984375, 2.392822265625, 2.5810546875, 2.769287109375, 2.95751953125, 3.145751953125, 3.333984375, 3.522216796875, 3.71044921875, 3.898681640625, 4.0869140625, 4.275146484375, 4.46337890625, 4.651611328125, 4.83984375, 5.028076171875, 5.21630859375, 5.404541015625, 5.5927734375, 5.781005859375, 5.96923828125, 6.157470703125, 6.345703125, 6.533935546875, 6.72216796875, 6.910400390625, 7.0986328125, 7.286865234375, 7.47509765625, 7.663330078125, 7.8515625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 4.0, 1.0, 15.0, 7.0, 9.0, 12.0, 12.0, 28.0, 26.0, 34.0, 41.0, 66.0, 79.0, 144.0, 161.0, 85.0, 57.0, 37.0, 23.0, 30.0, 18.0, 20.0, 10.0, 13.0, 10.0, 8.0, 5.0, 7.0, 4.0, 3.0, 5.0, 2.0, 6.0, 1.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020313262939453125, -0.00019588693976402283, -0.0001886412501335144, -0.00018139556050300598, -0.00017414987087249756, -0.00016690418124198914, -0.0001596584916114807, -0.0001524128019809723, -0.00014516711235046387, -0.00013792142271995544, -0.00013067573308944702, -0.0001234300434589386, -0.00011618435382843018, -0.00010893866419792175, -0.00010169297456741333, -9.444728493690491e-05, -8.720159530639648e-05, -7.995590567588806e-05, -7.271021604537964e-05, -6.546452641487122e-05, -5.821883678436279e-05, -5.097314715385437e-05, -4.372745752334595e-05, -3.6481767892837524e-05, -2.92360782623291e-05, -2.199038863182068e-05, -1.4744699001312256e-05, -7.499009370803833e-06, -2.5331974029541016e-07, 6.992369890213013e-06, 1.4238059520721436e-05, 2.148374915122986e-05, 2.872943878173828e-05, 3.5975128412246704e-05, 4.322081804275513e-05, 5.046650767326355e-05, 5.771219730377197e-05, 6.49578869342804e-05, 7.220357656478882e-05, 7.944926619529724e-05, 8.669495582580566e-05, 9.394064545631409e-05, 0.00010118633508682251, 0.00010843202471733093, 0.00011567771434783936, 0.00012292340397834778, 0.0001301690936088562, 0.00013741478323936462, 0.00014466047286987305, 0.00015190616250038147, 0.0001591518521308899, 0.00016639754176139832, 0.00017364323139190674, 0.00018088892102241516, 0.00018813461065292358, 0.000195380300283432, 0.00020262598991394043, 0.00020987167954444885, 0.00021711736917495728, 0.0002243630588054657, 0.00023160874843597412, 0.00023885443806648254, 0.00024610012769699097, 0.0002533458173274994, 0.0002605915069580078]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 12.0, 22.0, 22.0, 60.0, 68.0, 125.0, 226.0, 428.0, 882.0, 1973.0, 4581.0, 12044.0, 46142.0, 944599.0, 23476.0, 7975.0, 3134.0, 1344.0, 641.0, 348.0, 167.0, 92.0, 67.0, 38.0, 26.0, 21.0, 5.0, 13.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7822265625, -1.7344207763671875, -1.686614990234375, -1.6388092041015625, -1.59100341796875, -1.5431976318359375, -1.495391845703125, -1.4475860595703125, -1.3997802734375, -1.3519744873046875, -1.304168701171875, -1.2563629150390625, -1.20855712890625, -1.1607513427734375, -1.112945556640625, -1.0651397705078125, -1.017333984375, -0.9695281982421875, -0.921722412109375, -0.8739166259765625, -0.82611083984375, -0.7783050537109375, -0.730499267578125, -0.6826934814453125, -0.6348876953125, -0.5870819091796875, -0.539276123046875, -0.4914703369140625, -0.44366455078125, -0.3958587646484375, -0.348052978515625, -0.3002471923828125, -0.25244140625, -0.2046356201171875, -0.156829833984375, -0.1090240478515625, -0.06121826171875, -0.0134124755859375, 0.034393310546875, 0.0821990966796875, 0.1300048828125, 0.1778106689453125, 0.225616455078125, 0.2734222412109375, 0.32122802734375, 0.3690338134765625, 0.416839599609375, 0.4646453857421875, 0.512451171875, 0.5602569580078125, 0.608062744140625, 0.6558685302734375, 0.70367431640625, 0.7514801025390625, 0.799285888671875, 0.8470916748046875, 0.8948974609375, 0.9427032470703125, 0.990509033203125, 1.0383148193359375, 1.08612060546875, 1.1339263916015625, 1.181732177734375, 1.2295379638671875, 1.27734375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 2.0, 6.0, 4.0, 1.0, 8.0, 3.0, 8.0, 3.0, 15.0, 54.0, 708.0, 80.0, 29.0, 9.0, 7.0, 11.0, 7.0, 1.0, 6.0, 10.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47216796875, -0.45223236083984375, -0.4322967529296875, -0.41236114501953125, -0.392425537109375, -0.37248992919921875, -0.3525543212890625, -0.33261871337890625, -0.31268310546875, -0.29274749755859375, -0.2728118896484375, -0.25287628173828125, -0.232940673828125, -0.21300506591796875, -0.1930694580078125, -0.17313385009765625, -0.1531982421875, -0.13326263427734375, -0.1133270263671875, -0.09339141845703125, -0.073455810546875, -0.05352020263671875, -0.0335845947265625, -0.01364898681640625, 0.00628662109375, 0.02622222900390625, 0.0461578369140625, 0.06609344482421875, 0.086029052734375, 0.10596466064453125, 0.1259002685546875, 0.14583587646484375, 0.165771484375, 0.18570709228515625, 0.2056427001953125, 0.22557830810546875, 0.245513916015625, 0.26544952392578125, 0.2853851318359375, 0.30532073974609375, 0.32525634765625, 0.34519195556640625, 0.3651275634765625, 0.38506317138671875, 0.404998779296875, 0.42493438720703125, 0.4448699951171875, 0.46480560302734375, 0.4847412109375, 0.5046768188476562, 0.5246124267578125, 0.5445480346679688, 0.564483642578125, 0.5844192504882812, 0.6043548583984375, 0.6242904663085938, 0.64422607421875, 0.6641616821289062, 0.6840972900390625, 0.7040328979492188, 0.723968505859375, 0.7439041137695312, 0.7638397216796875, 0.7837753295898438, 0.8037109375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 12.0, 61.0, 298.0, 511.0, 87.0, 22.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.186628818511963, -5.959205150604248, -5.731781482696533, -5.50435733795166, -5.276933670043945, -5.0495100021362305, -4.822086334228516, -4.594662666320801, -4.367238998413086, -4.139815330505371, -3.912391424179077, -3.6849677562713623, -3.4575438499450684, -3.2301201820373535, -3.0026965141296387, -2.775272846221924, -2.547848701477051, -2.320425033569336, -2.093001127243042, -1.8655774593353271, -1.6381536722183228, -1.4107298851013184, -1.1833062171936035, -0.9558824300765991, -0.7284586429595947, -0.5010348558425903, -0.2736111283302307, -0.046187400817871094, 0.1812363862991333, 0.4086601734161377, 0.6360838413238525, 0.8635076284408569, 1.0909309387207031, 1.3183547258377075, 1.545778512954712, 1.7732021808624268, 2.0006260871887207, 2.2280497550964355, 2.4554734230041504, 2.6828970909118652, 2.910320997238159, 3.137744665145874, 3.365168571472168, 3.592592239379883, 3.8200159072875977, 4.0474395751953125, 4.274863243103027, 4.5022873878479, 4.729711055755615, 4.95713472366333, 5.184558391571045, 5.411982536315918, 5.639406204223633, 5.866829872131348, 6.0942535400390625, 6.321677207946777, 6.549100875854492, 6.776524543762207, 7.003948211669922, 7.231371879577637, 7.45879602432251, 7.686219692230225, 7.9136433601379395, 8.141067504882812, 8.368491172790527]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 3.0, 10.0, 10.0, 16.0, 35.0, 37.0, 57.0, 77.0, 121.0, 137.0, 108.0, 109.0, 92.0, 68.0, 55.0, 31.0, 13.0, 16.0, 6.0, 3.0, 0.0, 2.0, 1.0, 3.0], "bins": [-2.9749350547790527, -2.9143307209014893, -2.853726387023926, -2.7931220531463623, -2.732517719268799, -2.6719133853912354, -2.611309051513672, -2.5507044792175293, -2.490100383758545, -2.4294960498809814, -2.368891716003418, -2.3082873821258545, -2.247683048248291, -2.1870787143707275, -2.126474380493164, -2.0658698081970215, -2.005265474319458, -1.9446611404418945, -1.884056806564331, -1.8234524726867676, -1.762848138809204, -1.7022438049316406, -1.6416393518447876, -1.5810350179672241, -1.5204306840896606, -1.4598263502120972, -1.3992220163345337, -1.3386176824569702, -1.2780132293701172, -1.2174088954925537, -1.1568045616149902, -1.0962002277374268, -1.0355957746505737, -0.9749914407730103, -0.9143871068954468, -0.8537827134132385, -0.793178379535675, -0.7325740456581116, -0.6719696521759033, -0.6113653182983398, -0.5507609844207764, -0.4901566505432129, -0.429552286863327, -0.36894792318344116, -0.3083435893058777, -0.2477392554283142, -0.18713489174842834, -0.12653052806854248, -0.065926194190979, -0.0053218454122543335, 0.05528250336647034, 0.11588685214519501, 0.17649120092391968, 0.23709553480148315, 0.297699898481369, 0.3583042621612549, 0.41890859603881836, 0.47951292991638184, 0.5401172637939453, 0.6007216572761536, 0.661325991153717, 0.7219303250312805, 0.7825347185134888, 0.8431390523910522, 0.9037433862686157]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 10.0, 4.0, 9.0, 6.0, 19.0, 25.0, 47.0, 41.0, 73.0, 118.0, 181.0, 226.0, 346.0, 1105.0, 273430.0, 3916873.0, 1170.0, 175.0, 144.0, 74.0, 49.0, 55.0, 20.0, 25.0, 14.0, 10.0, 10.0, 6.0, 0.0, 8.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-4.21875, -4.09844970703125, -3.9781494140625, -3.85784912109375, -3.737548828125, -3.61724853515625, -3.4969482421875, -3.37664794921875, -3.25634765625, -3.13604736328125, -3.0157470703125, -2.89544677734375, -2.775146484375, -2.65484619140625, -2.5345458984375, -2.41424560546875, -2.2939453125, -2.17364501953125, -2.0533447265625, -1.93304443359375, -1.812744140625, -1.69244384765625, -1.5721435546875, -1.45184326171875, -1.33154296875, -1.21124267578125, -1.0909423828125, -0.97064208984375, -0.850341796875, -0.73004150390625, -0.6097412109375, -0.48944091796875, -0.369140625, -0.24884033203125, -0.1285400390625, -0.00823974609375, 0.112060546875, 0.23236083984375, 0.3526611328125, 0.47296142578125, 0.59326171875, 0.71356201171875, 0.8338623046875, 0.95416259765625, 1.074462890625, 1.19476318359375, 1.3150634765625, 1.43536376953125, 1.5556640625, 1.67596435546875, 1.7962646484375, 1.91656494140625, 2.036865234375, 2.15716552734375, 2.2774658203125, 2.39776611328125, 2.51806640625, 2.63836669921875, 2.7586669921875, 2.87896728515625, 2.999267578125, 3.11956787109375, 3.2398681640625, 3.36016845703125, 3.48046875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 7.0, 8.0, 26.0, 50.0, 122.0, 187.0, 212.0, 224.0, 97.0, 53.0, 19.0, 6.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0965576171875, -0.09474873542785645, -0.09293985366821289, -0.09113097190856934, -0.08932209014892578, -0.08751320838928223, -0.08570432662963867, -0.08389544486999512, -0.08208656311035156, -0.08027768135070801, -0.07846879959106445, -0.0766599178314209, -0.07485103607177734, -0.07304215431213379, -0.07123327255249023, -0.06942439079284668, -0.06761550903320312, -0.06580662727355957, -0.06399774551391602, -0.06218886375427246, -0.060379981994628906, -0.05857110023498535, -0.0567622184753418, -0.05495333671569824, -0.05314445495605469, -0.05133557319641113, -0.04952669143676758, -0.04771780967712402, -0.04590892791748047, -0.044100046157836914, -0.04229116439819336, -0.040482282638549805, -0.03867340087890625, -0.036864519119262695, -0.03505563735961914, -0.033246755599975586, -0.03143787384033203, -0.029628992080688477, -0.027820110321044922, -0.026011228561401367, -0.024202346801757812, -0.022393465042114258, -0.020584583282470703, -0.01877570152282715, -0.016966819763183594, -0.015157938003540039, -0.013349056243896484, -0.01154017448425293, -0.009731292724609375, -0.00792241096496582, -0.006113529205322266, -0.004304647445678711, -0.0024957656860351562, -0.0006868839263916016, 0.0011219978332519531, 0.002930879592895508, 0.0047397613525390625, 0.006548643112182617, 0.008357524871826172, 0.010166406631469727, 0.011975288391113281, 0.013784170150756836, 0.01559305191040039, 0.017401933670043945, 0.0192108154296875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 3.0, 2.0, 7.0, 2.0, 6.0, 6.0, 10.0, 6.0, 8.0, 7.0, 16.0, 23.0, 20.0, 25.0, 32.0, 39.0, 32.0, 46.0, 47.0, 78.0, 101.0, 140.0, 235.0, 450.0, 995.0, 1301541.0, 2889001.0, 750.0, 317.0, 161.0, 81.0, 41.0, 16.0, 16.0, 8.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.03125, -8.7872314453125, -8.543212890625, -8.2991943359375, -8.05517578125, -7.8111572265625, -7.567138671875, -7.3231201171875, -7.0791015625, -6.8350830078125, -6.591064453125, -6.3470458984375, -6.10302734375, -5.8590087890625, -5.614990234375, -5.3709716796875, -5.126953125, -4.8829345703125, -4.638916015625, -4.3948974609375, -4.15087890625, -3.9068603515625, -3.662841796875, -3.4188232421875, -3.1748046875, -2.9307861328125, -2.686767578125, -2.4427490234375, -2.19873046875, -1.9547119140625, -1.710693359375, -1.4666748046875, -1.22265625, -0.9786376953125, -0.734619140625, -0.4906005859375, -0.24658203125, -0.0025634765625, 0.241455078125, 0.4854736328125, 0.7294921875, 0.9735107421875, 1.217529296875, 1.4615478515625, 1.70556640625, 1.9495849609375, 2.193603515625, 2.4376220703125, 2.681640625, 2.9256591796875, 3.169677734375, 3.4136962890625, 3.65771484375, 3.9017333984375, 4.145751953125, 4.3897705078125, 4.6337890625, 4.8778076171875, 5.121826171875, 5.3658447265625, 5.60986328125, 5.8538818359375, 6.097900390625, 6.3419189453125, 6.5859375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 10.0, 13.0, 25.0, 30.0, 56.0, 115.0, 198.0, 387.0, 911.0, 1631.0, 367.0, 166.0, 80.0, 41.0, 18.0, 14.0, 13.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14892578125, -0.14383316040039062, -0.13874053955078125, -0.13364791870117188, -0.1285552978515625, -0.12346267700195312, -0.11837005615234375, -0.11327743530273438, -0.108184814453125, -0.10309219360351562, -0.09799957275390625, -0.09290695190429688, -0.0878143310546875, -0.08272171020507812, -0.07762908935546875, -0.07253646850585938, -0.06744384765625, -0.062351226806640625, -0.05725860595703125, -0.052165985107421875, -0.0470733642578125, -0.041980743408203125, -0.03688812255859375, -0.031795501708984375, -0.026702880859375, -0.021610260009765625, -0.01651763916015625, -0.011425018310546875, -0.0063323974609375, -0.001239776611328125, 0.00385284423828125, 0.008945465087890625, 0.0140380859375, 0.019130706787109375, 0.02422332763671875, 0.029315948486328125, 0.0344085693359375, 0.039501190185546875, 0.04459381103515625, 0.049686431884765625, 0.054779052734375, 0.059871673583984375, 0.06496429443359375, 0.07005691528320312, 0.0751495361328125, 0.08024215698242188, 0.08533477783203125, 0.09042739868164062, 0.09552001953125, 0.10061264038085938, 0.10570526123046875, 0.11079788208007812, 0.1158905029296875, 0.12098312377929688, 0.12607574462890625, 0.13116836547851562, 0.136260986328125, 0.14135360717773438, 0.14644622802734375, 0.15153884887695312, 0.1566314697265625, 0.16172409057617188, 0.16681671142578125, 0.17190933227539062, 0.177001953125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 4.0, 14.0, 20.0, 62.0, 225.0, 446.0, 160.0, 51.0, 14.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.671817779541016, -8.355196952819824, -8.03857707977295, -7.721956253051758, -7.405335903167725, -7.088715553283691, -6.7720947265625, -6.455474376678467, -6.138854026794434, -5.8222336769104, -5.505613327026367, -5.188992500305176, -4.872372150421143, -4.555751800537109, -4.239130973815918, -3.9225106239318848, -3.6058902740478516, -3.2892699241638184, -2.972649335861206, -2.6560287475585938, -2.3394083976745605, -2.0227880477905273, -1.706167459487915, -1.3895468711853027, -1.0729265213012695, -0.7563060522079468, -0.439685583114624, -0.12306511402130127, 0.19355535507202148, 0.5101758241653442, 0.826796293258667, 1.1434168815612793, 1.460036277770996, 1.7766567468643188, 2.0932772159576416, 2.409897804260254, 2.726518154144287, 3.0431385040283203, 3.3597590923309326, 3.676379680633545, 3.993000030517578, 4.309620380401611, 4.6262407302856445, 4.942861557006836, 5.259481906890869, 5.576102256774902, 5.892723083496094, 6.209343433380127, 6.52596378326416, 6.842584133148193, 7.159204483032227, 7.475825309753418, 7.792445659637451, 8.109066009521484, 8.425686836242676, 8.742307662963867, 9.058927536010742, 9.375548362731934, 9.692168235778809, 10.0087890625, 10.325408935546875, 10.642029762268066, 10.958650588989258, 11.275270462036133, 11.591891288757324]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 7.0, 13.0, 18.0, 22.0, 36.0, 49.0, 75.0, 67.0, 89.0, 97.0, 106.0, 72.0, 73.0, 77.0, 56.0, 59.0, 29.0, 24.0, 8.0, 11.0, 11.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.849369525909424, -2.7880735397338867, -2.7267773151397705, -2.6654813289642334, -2.6041853427886963, -2.542889356613159, -2.481593132019043, -2.420297145843506, -2.3590011596679688, -2.2977051734924316, -2.2364089488983154, -2.1751129627227783, -2.113816976547241, -2.052520990371704, -1.9912248849868774, -1.9299287796020508, -1.8686327934265137, -1.807336688041687, -1.74604070186615, -1.6847445964813232, -1.6234486103057861, -1.5621525049209595, -1.5008565187454224, -1.4395604133605957, -1.378264307975769, -1.3169682025909424, -1.2556722164154053, -1.1943761110305786, -1.1330801248550415, -1.0717840194702148, -1.0104880332946777, -0.9491919279098511, -0.887895941734314, -0.8265998959541321, -0.7653038501739502, -0.7040078043937683, -0.6427117586135864, -0.5814156532287598, -0.5201196670532227, -0.4588235914707184, -0.3975275456905365, -0.3362314999103546, -0.27493545413017273, -0.21363939344882965, -0.15234334766864777, -0.09104728698730469, -0.029751241207122803, 0.03154480457305908, 0.09284085035324097, 0.15413689613342285, 0.21543294191360474, 0.2767289876937866, 0.3380250334739685, 0.3993211090564728, 0.46061715483665466, 0.5219131708145142, 0.5832092761993408, 0.6445053219795227, 0.7058013677597046, 0.7670974135398865, 0.8283934593200684, 0.889689564704895, 0.9509855508804321, 1.0122816562652588, 1.073577642440796]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 8.0, 7.0, 7.0, 8.0, 13.0, 13.0, 16.0, 26.0, 27.0, 47.0, 48.0, 40.0, 64.0, 131.0, 4940.0, 1040175.0, 2562.0, 94.0, 53.0, 54.0, 34.0, 38.0, 27.0, 22.0, 19.0, 13.0, 9.0, 10.0, 12.0, 12.0, 5.0, 1.0, 4.0, 0.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.21875, -15.7188720703125, -15.218994140625, -14.7191162109375, -14.21923828125, -13.7193603515625, -13.219482421875, -12.7196044921875, -12.2197265625, -11.7198486328125, -11.219970703125, -10.7200927734375, -10.22021484375, -9.7203369140625, -9.220458984375, -8.7205810546875, -8.220703125, -7.7208251953125, -7.220947265625, -6.7210693359375, -6.22119140625, -5.7213134765625, -5.221435546875, -4.7215576171875, -4.2216796875, -3.7218017578125, -3.221923828125, -2.7220458984375, -2.22216796875, -1.7222900390625, -1.222412109375, -0.7225341796875, -0.22265625, 0.2772216796875, 0.777099609375, 1.2769775390625, 1.77685546875, 2.2767333984375, 2.776611328125, 3.2764892578125, 3.7763671875, 4.2762451171875, 4.776123046875, 5.2760009765625, 5.77587890625, 6.2757568359375, 6.775634765625, 7.2755126953125, 7.775390625, 8.2752685546875, 8.775146484375, 9.2750244140625, 9.77490234375, 10.2747802734375, 10.774658203125, 11.2745361328125, 11.7744140625, 12.2742919921875, 12.774169921875, 13.2740478515625, 13.77392578125, 14.2738037109375, 14.773681640625, 15.2735595703125, 15.7734375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 11.0, 51.0, 115.0, 229.0, 270.0, 211.0, 97.0, 21.0, 10.0, 2.0, 1.0], "bins": [-0.43603515625, -0.4284243583679199, -0.42081356048583984, -0.41320276260375977, -0.4055919647216797, -0.3979811668395996, -0.39037036895751953, -0.38275957107543945, -0.3751487731933594, -0.3675379753112793, -0.3599271774291992, -0.35231637954711914, -0.34470558166503906, -0.337094783782959, -0.3294839859008789, -0.32187318801879883, -0.31426239013671875, -0.30665159225463867, -0.2990407943725586, -0.2914299964904785, -0.28381919860839844, -0.27620840072631836, -0.2685976028442383, -0.2609868049621582, -0.2533760070800781, -0.24576520919799805, -0.23815441131591797, -0.2305436134338379, -0.2229328155517578, -0.21532201766967773, -0.20771121978759766, -0.20010042190551758, -0.1924896240234375, -0.18487882614135742, -0.17726802825927734, -0.16965723037719727, -0.1620464324951172, -0.1544356346130371, -0.14682483673095703, -0.13921403884887695, -0.13160324096679688, -0.1239924430847168, -0.11638164520263672, -0.10877084732055664, -0.10116004943847656, -0.09354925155639648, -0.0859384536743164, -0.07832765579223633, -0.07071685791015625, -0.06310606002807617, -0.055495262145996094, -0.047884464263916016, -0.04027366638183594, -0.03266286849975586, -0.02505207061767578, -0.017441272735595703, -0.009830474853515625, -0.002219676971435547, 0.005391120910644531, 0.01300191879272461, 0.020612716674804688, 0.028223514556884766, 0.035834312438964844, 0.04344511032104492, 0.051055908203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 4.0, 10.0, 19.0, 21.0, 24.0, 44.0, 64.0, 78.0, 156.0, 328.0, 691.0, 1644.0, 4527.0, 17003.0, 96315.0, 665196.0, 220628.0, 30279.0, 7167.0, 2386.0, 942.0, 455.0, 224.0, 98.0, 85.0, 53.0, 30.0, 23.0, 12.0, 9.0, 11.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.970703125, -2.8634033203125, -2.756103515625, -2.6488037109375, -2.54150390625, -2.4342041015625, -2.326904296875, -2.2196044921875, -2.1123046875, -2.0050048828125, -1.897705078125, -1.7904052734375, -1.68310546875, -1.5758056640625, -1.468505859375, -1.3612060546875, -1.25390625, -1.1466064453125, -1.039306640625, -0.9320068359375, -0.82470703125, -0.7174072265625, -0.610107421875, -0.5028076171875, -0.3955078125, -0.2882080078125, -0.180908203125, -0.0736083984375, 0.03369140625, 0.1409912109375, 0.248291015625, 0.3555908203125, 0.462890625, 0.5701904296875, 0.677490234375, 0.7847900390625, 0.89208984375, 0.9993896484375, 1.106689453125, 1.2139892578125, 1.3212890625, 1.4285888671875, 1.535888671875, 1.6431884765625, 1.75048828125, 1.8577880859375, 1.965087890625, 2.0723876953125, 2.1796875, 2.2869873046875, 2.394287109375, 2.5015869140625, 2.60888671875, 2.7161865234375, 2.823486328125, 2.9307861328125, 3.0380859375, 3.1453857421875, 3.252685546875, 3.3599853515625, 3.46728515625, 3.5745849609375, 3.681884765625, 3.7891845703125, 3.896484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 10.0, 7.0, 14.0, 18.0, 23.0, 24.0, 22.0, 41.0, 46.0, 47.0, 38.0, 57.0, 56.0, 72.0, 63.0, 67.0, 58.0, 47.0, 48.0, 43.0, 40.0, 30.0, 24.0, 21.0, 27.0, 8.0, 8.0, 13.0, 9.0, 4.0, 0.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389404296875, -0.3743400573730469, -0.35927581787109375, -0.3442115783691406, -0.3291473388671875, -0.3140830993652344, -0.29901885986328125, -0.2839546203613281, -0.268890380859375, -0.2538261413574219, -0.23876190185546875, -0.22369766235351562, -0.2086334228515625, -0.19356918334960938, -0.17850494384765625, -0.16344070434570312, -0.14837646484375, -0.13331222534179688, -0.11824798583984375, -0.10318374633789062, -0.0881195068359375, -0.07305526733398438, -0.05799102783203125, -0.042926788330078125, -0.027862548828125, -0.012798309326171875, 0.00226593017578125, 0.017330169677734375, 0.0323944091796875, 0.047458648681640625, 0.06252288818359375, 0.07758712768554688, 0.0926513671875, 0.10771560668945312, 0.12277984619140625, 0.13784408569335938, 0.1529083251953125, 0.16797256469726562, 0.18303680419921875, 0.19810104370117188, 0.213165283203125, 0.22822952270507812, 0.24329376220703125, 0.2583580017089844, 0.2734222412109375, 0.2884864807128906, 0.30355072021484375, 0.3186149597167969, 0.33367919921875, 0.3487434387207031, 0.36380767822265625, 0.3788719177246094, 0.3939361572265625, 0.4090003967285156, 0.42406463623046875, 0.4391288757324219, 0.454193115234375, 0.4692573547363281, 0.48432159423828125, 0.4993858337402344, 0.5144500732421875, 0.5295143127441406, 0.5445785522460938, 0.5596427917480469, 0.57470703125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 4.0, 10.0, 20.0, 22.0, 26.0, 48.0, 79.0, 160.0, 319.0, 634.0, 1433.0, 4020.0, 14313.0, 83559.0, 639272.0, 261139.0, 31930.0, 7366.0, 2350.0, 854.0, 407.0, 256.0, 150.0, 76.0, 41.0, 23.0, 14.0, 10.0, 8.0, 4.0, 10.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.46875, -4.353424072265625, -4.23809814453125, -4.122772216796875, -4.0074462890625, -3.892120361328125, -3.77679443359375, -3.661468505859375, -3.546142578125, -3.430816650390625, -3.31549072265625, -3.200164794921875, -3.0848388671875, -2.969512939453125, -2.85418701171875, -2.738861083984375, -2.62353515625, -2.508209228515625, -2.39288330078125, -2.277557373046875, -2.1622314453125, -2.046905517578125, -1.93157958984375, -1.816253662109375, -1.700927734375, -1.585601806640625, -1.47027587890625, -1.354949951171875, -1.2396240234375, -1.124298095703125, -1.00897216796875, -0.893646240234375, -0.7783203125, -0.662994384765625, -0.54766845703125, -0.432342529296875, -0.3170166015625, -0.201690673828125, -0.08636474609375, 0.028961181640625, 0.144287109375, 0.259613037109375, 0.37493896484375, 0.490264892578125, 0.6055908203125, 0.720916748046875, 0.83624267578125, 0.951568603515625, 1.06689453125, 1.182220458984375, 1.29754638671875, 1.412872314453125, 1.5281982421875, 1.643524169921875, 1.75885009765625, 1.874176025390625, 1.989501953125, 2.104827880859375, 2.22015380859375, 2.335479736328125, 2.4508056640625, 2.566131591796875, 2.68145751953125, 2.796783447265625, 2.912109375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 9.0, 9.0, 9.0, 14.0, 15.0, 35.0, 37.0, 40.0, 64.0, 78.0, 87.0, 100.0, 117.0, 95.0, 70.0, 53.0, 32.0, 31.0, 15.0, 21.0, 17.0, 8.0, 5.0, 5.0, 5.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003669261932373047, -0.00035719946026802063, -0.00034747272729873657, -0.0003377459943294525, -0.00032801926136016846, -0.0003182925283908844, -0.00030856579542160034, -0.0002988390624523163, -0.0002891123294830322, -0.00027938559651374817, -0.0002696588635444641, -0.00025993213057518005, -0.000250205397605896, -0.00024047866463661194, -0.00023075193166732788, -0.00022102519869804382, -0.00021129846572875977, -0.0002015717327594757, -0.00019184499979019165, -0.0001821182668209076, -0.00017239153385162354, -0.00016266480088233948, -0.00015293806791305542, -0.00014321133494377136, -0.0001334846019744873, -0.00012375786900520325, -0.00011403113603591919, -0.00010430440306663513, -9.457767009735107e-05, -8.485093712806702e-05, -7.512420415878296e-05, -6.53974711894989e-05, -5.5670738220214844e-05, -4.5944005250930786e-05, -3.621727228164673e-05, -2.649053931236267e-05, -1.6763806343078613e-05, -7.037073373794556e-06, 2.689659595489502e-06, 1.241639256477356e-05, 2.2143125534057617e-05, 3.1869858503341675e-05, 4.159659147262573e-05, 5.132332444190979e-05, 6.105005741119385e-05, 7.07767903804779e-05, 8.050352334976196e-05, 9.023025631904602e-05, 9.995698928833008e-05, 0.00010968372225761414, 0.0001194104552268982, 0.00012913718819618225, 0.0001388639211654663, 0.00014859065413475037, 0.00015831738710403442, 0.00016804412007331848, 0.00017777085304260254, 0.0001874975860118866, 0.00019722431898117065, 0.0002069510519504547, 0.00021667778491973877, 0.00022640451788902283, 0.00023613125085830688, 0.00024585798382759094, 0.000255584716796875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 6.0, 9.0, 7.0, 15.0, 21.0, 26.0, 61.0, 101.0, 259.0, 758.0, 3870.0, 44508.0, 850955.0, 138014.0, 8003.0, 1333.0, 342.0, 127.0, 58.0, 32.0, 15.0, 13.0, 4.0, 3.0, 7.0, 6.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-8.671875, -8.4686279296875, -8.265380859375, -8.0621337890625, -7.85888671875, -7.6556396484375, -7.452392578125, -7.2491455078125, -7.0458984375, -6.8426513671875, -6.639404296875, -6.4361572265625, -6.23291015625, -6.0296630859375, -5.826416015625, -5.6231689453125, -5.419921875, -5.2166748046875, -5.013427734375, -4.8101806640625, -4.60693359375, -4.4036865234375, -4.200439453125, -3.9971923828125, -3.7939453125, -3.5906982421875, -3.387451171875, -3.1842041015625, -2.98095703125, -2.7777099609375, -2.574462890625, -2.3712158203125, -2.16796875, -1.9647216796875, -1.761474609375, -1.5582275390625, -1.35498046875, -1.1517333984375, -0.948486328125, -0.7452392578125, -0.5419921875, -0.3387451171875, -0.135498046875, 0.0677490234375, 0.27099609375, 0.4742431640625, 0.677490234375, 0.8807373046875, 1.083984375, 1.2872314453125, 1.490478515625, 1.6937255859375, 1.89697265625, 2.1002197265625, 2.303466796875, 2.5067138671875, 2.7099609375, 2.9132080078125, 3.116455078125, 3.3197021484375, 3.52294921875, 3.7261962890625, 3.929443359375, 4.1326904296875, 4.3359375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 12.0, 8.0, 18.0, 19.0, 40.0, 25.0, 40.0, 48.0, 75.0, 84.0, 102.0, 102.0, 96.0, 77.0, 55.0, 38.0, 30.0, 37.0, 20.0, 17.0, 15.0, 3.0, 7.0, 7.0, 7.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.486328125, -1.445037841796875, -1.40374755859375, -1.362457275390625, -1.3211669921875, -1.279876708984375, -1.23858642578125, -1.197296142578125, -1.156005859375, -1.114715576171875, -1.07342529296875, -1.032135009765625, -0.9908447265625, -0.949554443359375, -0.90826416015625, -0.866973876953125, -0.82568359375, -0.784393310546875, -0.74310302734375, -0.701812744140625, -0.6605224609375, -0.619232177734375, -0.57794189453125, -0.536651611328125, -0.495361328125, -0.454071044921875, -0.41278076171875, -0.371490478515625, -0.3302001953125, -0.288909912109375, -0.24761962890625, -0.206329345703125, -0.1650390625, -0.123748779296875, -0.08245849609375, -0.041168212890625, 0.0001220703125, 0.041412353515625, 0.08270263671875, 0.123992919921875, 0.165283203125, 0.206573486328125, 0.24786376953125, 0.289154052734375, 0.3304443359375, 0.371734619140625, 0.41302490234375, 0.454315185546875, 0.49560546875, 0.536895751953125, 0.57818603515625, 0.619476318359375, 0.6607666015625, 0.702056884765625, 0.74334716796875, 0.784637451171875, 0.825927734375, 0.867218017578125, 0.90850830078125, 0.949798583984375, 0.9910888671875, 1.032379150390625, 1.07366943359375, 1.114959716796875, 1.15625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 48.0, 200.0, 476.0, 217.0, 45.0, 11.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.837984085083008, -15.495183944702148, -14.152382850646973, -12.809581756591797, -11.466781616210938, -10.123981475830078, -8.781180381774902, -7.438379287719727, -6.095579147338867, -4.75277853012085, -3.409977912902832, -2.0671772956848145, -0.7243766784667969, 0.6184239387512207, 1.9612245559692383, 3.304025650024414, 4.646825790405273, 5.989626407623291, 7.332427024841309, 8.675228118896484, 10.018028259277344, 11.360828399658203, 12.703629493713379, 14.046430587768555, 15.389230728149414, 16.732030868530273, 18.074832916259766, 19.417633056640625, 20.760433197021484, 22.103233337402344, 23.446033477783203, 24.788835525512695, 26.131637573242188, 27.474437713623047, 28.817237854003906, 30.1600399017334, 31.502840042114258, 32.84564208984375, 34.18844223022461, 35.53124237060547, 36.87404251098633, 38.21684265136719, 39.55964279174805, 40.902442932128906, 42.24524688720703, 43.58804702758789, 44.93084716796875, 46.27364730834961, 47.61644744873047, 48.95924758911133, 50.30204772949219, 51.64484786987305, 52.987648010253906, 54.33045196533203, 55.67325210571289, 57.01605224609375, 58.35885238647461, 59.70165252685547, 61.04445266723633, 62.38725280761719, 63.73005676269531, 65.0728530883789, 66.41565704345703, 67.75845336914062, 69.10125732421875]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 10.0, 16.0, 20.0, 31.0, 24.0, 30.0, 27.0, 34.0, 53.0, 46.0, 48.0, 60.0, 66.0, 50.0, 52.0, 53.0, 52.0, 33.0, 37.0, 39.0, 36.0, 36.0, 18.0, 19.0, 15.0, 12.0, 19.0, 16.0, 7.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.588022232055664, -3.4592678546905518, -3.3305134773254395, -3.201759099960327, -3.073004722595215, -2.9442505836486816, -2.8154962062835693, -2.686741828918457, -2.5579874515533447, -2.4292330741882324, -2.30047869682312, -2.171724319458008, -2.0429701805114746, -1.9142156839370728, -1.78546142578125, -1.6567070484161377, -1.5279526710510254, -1.399198293685913, -1.2704439163208008, -1.141689658164978, -1.0129352807998657, -0.8841809034347534, -0.7554265856742859, -0.6266722679138184, -0.49791789054870605, -0.36916354298591614, -0.24040919542312622, -0.1116548478603363, 0.017099499702453613, 0.14585387706756592, 0.27460819482803345, 0.403362512588501, 0.5321173667907715, 0.6608717441558838, 0.7896260619163513, 0.9183803796768188, 1.0471347570419312, 1.1758891344070435, 1.3046433925628662, 1.4333977699279785, 1.5621521472930908, 1.6909065246582031, 1.8196609020233154, 1.9484151601791382, 2.077169418334961, 2.2059240341186523, 2.3346781730651855, 2.463432550430298, 2.59218692779541, 2.7209413051605225, 2.8496956825256348, 2.978450059890747, 3.1072044372558594, 3.2359585762023926, 3.364712953567505, 3.493467330932617, 3.6222217082977295, 3.750976085662842, 3.879730463027954, 4.008484840393066, 4.1372389793396, 4.265993595123291, 4.394747734069824, 4.523502349853516, 4.652256488800049]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 6.0, 6.0, 4.0, 5.0, 4.0, 7.0, 9.0, 7.0, 10.0, 15.0, 11.0, 12.0, 15.0, 15.0, 26.0, 25.0, 30.0, 24.0, 15.0, 24.0, 51.0, 169.0, 1012.0, 3586670.0, 604373.0, 1233.0, 250.0, 103.0, 50.0, 24.0, 24.0, 18.0, 11.0, 5.0, 10.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-31.859375, -31.18115234375, -30.5029296875, -29.82470703125, -29.146484375, -28.46826171875, -27.7900390625, -27.11181640625, -26.43359375, -25.75537109375, -25.0771484375, -24.39892578125, -23.720703125, -23.04248046875, -22.3642578125, -21.68603515625, -21.0078125, -20.32958984375, -19.6513671875, -18.97314453125, -18.294921875, -17.61669921875, -16.9384765625, -16.26025390625, -15.58203125, -14.90380859375, -14.2255859375, -13.54736328125, -12.869140625, -12.19091796875, -11.5126953125, -10.83447265625, -10.15625, -9.47802734375, -8.7998046875, -8.12158203125, -7.443359375, -6.76513671875, -6.0869140625, -5.40869140625, -4.73046875, -4.05224609375, -3.3740234375, -2.69580078125, -2.017578125, -1.33935546875, -0.6611328125, 0.01708984375, 0.6953125, 1.37353515625, 2.0517578125, 2.72998046875, 3.408203125, 4.08642578125, 4.7646484375, 5.44287109375, 6.12109375, 6.79931640625, 7.4775390625, 8.15576171875, 8.833984375, 9.51220703125, 10.1904296875, 10.86865234375, 11.546875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 7.0, 25.0, 62.0, 98.0, 133.0, 215.0, 171.0, 133.0, 75.0, 55.0, 19.0, 10.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.461669921875, -0.4527578353881836, -0.4438457489013672, -0.4349336624145508, -0.4260215759277344, -0.41710948944091797, -0.40819740295410156, -0.39928531646728516, -0.39037322998046875, -0.38146114349365234, -0.37254905700683594, -0.36363697052001953, -0.3547248840332031, -0.3458127975463867, -0.3369007110595703, -0.3279886245727539, -0.3190765380859375, -0.3101644515991211, -0.3012523651123047, -0.2923402786254883, -0.2834281921386719, -0.27451610565185547, -0.26560401916503906, -0.25669193267822266, -0.24777984619140625, -0.23886775970458984, -0.22995567321777344, -0.22104358673095703, -0.21213150024414062, -0.20321941375732422, -0.1943073272705078, -0.1853952407836914, -0.176483154296875, -0.1675710678100586, -0.1586589813232422, -0.14974689483642578, -0.14083480834960938, -0.13192272186279297, -0.12301063537597656, -0.11409854888916016, -0.10518646240234375, -0.09627437591552734, -0.08736228942871094, -0.07845020294189453, -0.06953811645507812, -0.06062602996826172, -0.05171394348144531, -0.042801856994628906, -0.0338897705078125, -0.024977684020996094, -0.016065597534179688, -0.007153511047363281, 0.001758575439453125, 0.010670661926269531, 0.019582748413085938, 0.028494834899902344, 0.03740692138671875, 0.046319007873535156, 0.05523109436035156, 0.06414318084716797, 0.07305526733398438, 0.08196735382080078, 0.09087944030761719, 0.0997915267944336, 0.10870361328125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 8.0, 17.0, 32.0, 34.0, 48.0, 66.0, 106.0, 132.0, 186.0, 378.0, 844.0, 2656.0, 13647.0, 193328.0, 3929207.0, 44034.0, 6256.0, 1688.0, 660.0, 338.0, 202.0, 126.0, 100.0, 57.0, 41.0, 30.0, 19.0, 13.0, 10.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.1875, -14.768798828125, -14.35009765625, -13.931396484375, -13.5126953125, -13.093994140625, -12.67529296875, -12.256591796875, -11.837890625, -11.419189453125, -11.00048828125, -10.581787109375, -10.1630859375, -9.744384765625, -9.32568359375, -8.906982421875, -8.48828125, -8.069580078125, -7.65087890625, -7.232177734375, -6.8134765625, -6.394775390625, -5.97607421875, -5.557373046875, -5.138671875, -4.719970703125, -4.30126953125, -3.882568359375, -3.4638671875, -3.045166015625, -2.62646484375, -2.207763671875, -1.7890625, -1.370361328125, -0.95166015625, -0.532958984375, -0.1142578125, 0.304443359375, 0.72314453125, 1.141845703125, 1.560546875, 1.979248046875, 2.39794921875, 2.816650390625, 3.2353515625, 3.654052734375, 4.07275390625, 4.491455078125, 4.91015625, 5.328857421875, 5.74755859375, 6.166259765625, 6.5849609375, 7.003662109375, 7.42236328125, 7.841064453125, 8.259765625, 8.678466796875, 9.09716796875, 9.515869140625, 9.9345703125, 10.353271484375, 10.77197265625, 11.190673828125, 11.609375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 4.0, 1.0, 8.0, 6.0, 9.0, 12.0, 26.0, 26.0, 36.0, 61.0, 89.0, 145.0, 258.0, 1190.0, 1510.0, 269.0, 149.0, 77.0, 55.0, 42.0, 23.0, 19.0, 10.0, 15.0, 12.0, 4.0, 6.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63232421875, -0.6035995483398438, -0.5748748779296875, -0.5461502075195312, -0.517425537109375, -0.48870086669921875, -0.4599761962890625, -0.43125152587890625, -0.40252685546875, -0.37380218505859375, -0.3450775146484375, -0.31635284423828125, -0.287628173828125, -0.25890350341796875, -0.2301788330078125, -0.20145416259765625, -0.1727294921875, -0.14400482177734375, -0.1152801513671875, -0.08655548095703125, -0.057830810546875, -0.02910614013671875, -0.0003814697265625, 0.02834320068359375, 0.05706787109375, 0.08579254150390625, 0.1145172119140625, 0.14324188232421875, 0.171966552734375, 0.20069122314453125, 0.2294158935546875, 0.25814056396484375, 0.286865234375, 0.31558990478515625, 0.3443145751953125, 0.37303924560546875, 0.401763916015625, 0.43048858642578125, 0.4592132568359375, 0.48793792724609375, 0.51666259765625, 0.5453872680664062, 0.5741119384765625, 0.6028366088867188, 0.631561279296875, 0.6602859497070312, 0.6890106201171875, 0.7177352905273438, 0.7464599609375, 0.7751846313476562, 0.8039093017578125, 0.8326339721679688, 0.861358642578125, 0.8900833129882812, 0.9188079833984375, 0.9475326538085938, 0.97625732421875, 1.0049819946289062, 1.0337066650390625, 1.0624313354492188, 1.091156005859375, 1.1198806762695312, 1.1486053466796875, 1.1773300170898438, 1.2060546875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 18.0, 55.0, 168.0, 396.0, 233.0, 84.0, 26.0, 13.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.98967361450195, -33.15276336669922, -32.31584930419922, -31.47893714904785, -30.642024993896484, -29.80511474609375, -28.968202590942383, -28.131290435791016, -27.29437828063965, -26.45746612548828, -25.620553970336914, -24.783641815185547, -23.946731567382812, -23.109817504882812, -22.272907257080078, -21.43599510192871, -20.599082946777344, -19.762170791625977, -18.92525863647461, -18.088346481323242, -17.251434326171875, -16.41452407836914, -15.577611923217773, -14.740699768066406, -13.903787612915039, -13.066875457763672, -12.229963302612305, -11.393052101135254, -10.556139945983887, -9.71922779083252, -8.882316589355469, -8.045404434204102, -7.208492279052734, -6.371580123901367, -5.534668445587158, -4.697756767272949, -3.860844612121582, -3.023932456970215, -2.187020778656006, -1.3501091003417969, -0.5131969451904297, 0.3237149715423584, 1.1606268882751465, 1.9975388050079346, 2.8344507217407227, 3.67136287689209, 4.508274555206299, 5.345186233520508, 6.182098388671875, 7.019010543823242, 7.855922222137451, 8.69283390045166, 9.529746055603027, 10.366658210754395, 11.203569412231445, 12.040481567382812, 12.87739372253418, 13.714305877685547, 14.551218032836914, 15.388129234313965, 16.225040435791016, 17.061954498291016, 17.89886474609375, 18.735776901245117, 19.572689056396484]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 7.0, 5.0, 12.0, 15.0, 16.0, 22.0, 38.0, 37.0, 52.0, 55.0, 52.0, 58.0, 66.0, 61.0, 69.0, 64.0, 71.0, 51.0, 44.0, 48.0, 36.0, 25.0, 23.0, 18.0, 17.0, 13.0, 8.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.166264533996582, -3.0437369346618652, -2.9212093353271484, -2.7986817359924316, -2.676154375076294, -2.553626775741577, -2.4310991764068604, -2.3085715770721436, -2.1860439777374268, -2.06351637840271, -1.9409888982772827, -1.818461298942566, -1.6959336996078491, -1.5734062194824219, -1.450878620147705, -1.3283510208129883, -1.205823540687561, -1.0832959413528442, -0.9607684016227722, -0.8382408618927002, -0.7157132625579834, -0.5931857228279114, -0.47065818309783936, -0.34813058376312256, -0.22560304403305054, -0.10307548195123672, 0.019452080130577087, 0.1419796347618103, 0.2645072042942047, 0.3870347738265991, 0.5095623135566711, 0.6320899128913879, 0.75461745262146, 0.877144992351532, 0.9996725916862488, 1.1222001314163208, 1.2447277307510376, 1.3672552108764648, 1.4897828102111816, 1.6123104095458984, 1.7348380088806152, 1.857365608215332, 1.9798930883407593, 2.1024208068847656, 2.2249481678009033, 2.34747576713562, 2.470003366470337, 2.5925309658050537, 2.7150583267211914, 2.837585926055908, 2.960113525390625, 3.082641124725342, 3.2051684856414795, 3.3276960849761963, 3.450223684310913, 3.57275128364563, 3.6952788829803467, 3.8178064823150635, 3.9403340816497803, 4.062861442565918, 4.185389041900635, 4.307916641235352, 4.430444240570068, 4.552971839904785, 4.675499439239502]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 10.0, 12.0, 14.0, 12.0, 14.0, 17.0, 23.0, 31.0, 36.0, 35.0, 36.0, 44.0, 112.0, 407.0, 5801.0, 581808.0, 454674.0, 4689.0, 367.0, 99.0, 47.0, 34.0, 34.0, 37.0, 28.0, 25.0, 24.0, 14.0, 14.0, 12.0, 9.0, 5.0, 2.0, 7.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.4375, -12.0224609375, -11.607421875, -11.1923828125, -10.77734375, -10.3623046875, -9.947265625, -9.5322265625, -9.1171875, -8.7021484375, -8.287109375, -7.8720703125, -7.45703125, -7.0419921875, -6.626953125, -6.2119140625, -5.796875, -5.3818359375, -4.966796875, -4.5517578125, -4.13671875, -3.7216796875, -3.306640625, -2.8916015625, -2.4765625, -2.0615234375, -1.646484375, -1.2314453125, -0.81640625, -0.4013671875, 0.013671875, 0.4287109375, 0.84375, 1.2587890625, 1.673828125, 2.0888671875, 2.50390625, 2.9189453125, 3.333984375, 3.7490234375, 4.1640625, 4.5791015625, 4.994140625, 5.4091796875, 5.82421875, 6.2392578125, 6.654296875, 7.0693359375, 7.484375, 7.8994140625, 8.314453125, 8.7294921875, 9.14453125, 9.5595703125, 9.974609375, 10.3896484375, 10.8046875, 11.2197265625, 11.634765625, 12.0498046875, 12.46484375, 12.8798828125, 13.294921875, 13.7099609375, 14.125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 9.0, 14.0, 19.0, 43.0, 57.0, 83.0, 125.0, 134.0, 111.0, 117.0, 92.0, 86.0, 48.0, 32.0, 20.0, 10.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.495849609375, -0.4853515625, -0.474853515625, -0.46435546875, -0.453857421875, -0.443359375, -0.432861328125, -0.42236328125, -0.411865234375, -0.4013671875, -0.390869140625, -0.38037109375, -0.369873046875, -0.359375, -0.348876953125, -0.33837890625, -0.327880859375, -0.3173828125, -0.306884765625, -0.29638671875, -0.285888671875, -0.275390625, -0.264892578125, -0.25439453125, -0.243896484375, -0.2333984375, -0.222900390625, -0.21240234375, -0.201904296875, -0.19140625, -0.180908203125, -0.17041015625, -0.159912109375, -0.1494140625, -0.138916015625, -0.12841796875, -0.117919921875, -0.107421875, -0.096923828125, -0.08642578125, -0.075927734375, -0.0654296875, -0.054931640625, -0.04443359375, -0.033935546875, -0.0234375, -0.012939453125, -0.00244140625, 0.008056640625, 0.0185546875, 0.029052734375, 0.03955078125, 0.050048828125, 0.060546875, 0.071044921875, 0.08154296875, 0.092041015625, 0.1025390625, 0.113037109375, 0.12353515625, 0.134033203125, 0.14453125, 0.155029296875, 0.16552734375, 0.176025390625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 4.0, 7.0, 13.0, 18.0, 24.0, 33.0, 51.0, 93.0, 159.0, 303.0, 482.0, 989.0, 2411.0, 7024.0, 31821.0, 230191.0, 610228.0, 135047.0, 20663.0, 5239.0, 1885.0, 842.0, 402.0, 229.0, 134.0, 82.0, 58.0, 20.0, 28.0, 16.0, 7.0, 8.0, 9.0, 7.0, 2.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.94921875, -4.79632568359375, -4.6434326171875, -4.49053955078125, -4.337646484375, -4.18475341796875, -4.0318603515625, -3.87896728515625, -3.72607421875, -3.57318115234375, -3.4202880859375, -3.26739501953125, -3.114501953125, -2.96160888671875, -2.8087158203125, -2.65582275390625, -2.5029296875, -2.35003662109375, -2.1971435546875, -2.04425048828125, -1.891357421875, -1.73846435546875, -1.5855712890625, -1.43267822265625, -1.27978515625, -1.12689208984375, -0.9739990234375, -0.82110595703125, -0.668212890625, -0.51531982421875, -0.3624267578125, -0.20953369140625, -0.056640625, 0.09625244140625, 0.2491455078125, 0.40203857421875, 0.554931640625, 0.70782470703125, 0.8607177734375, 1.01361083984375, 1.16650390625, 1.31939697265625, 1.4722900390625, 1.62518310546875, 1.778076171875, 1.93096923828125, 2.0838623046875, 2.23675537109375, 2.3896484375, 2.54254150390625, 2.6954345703125, 2.84832763671875, 3.001220703125, 3.15411376953125, 3.3070068359375, 3.45989990234375, 3.61279296875, 3.76568603515625, 3.9185791015625, 4.07147216796875, 4.224365234375, 4.37725830078125, 4.5301513671875, 4.68304443359375, 4.8359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 3.0, 4.0, 4.0, 9.0, 9.0, 8.0, 6.0, 8.0, 10.0, 10.0, 16.0, 16.0, 20.0, 40.0, 37.0, 27.0, 44.0, 44.0, 41.0, 34.0, 40.0, 43.0, 39.0, 53.0, 46.0, 53.0, 33.0, 35.0, 30.0, 31.0, 36.0, 27.0, 20.0, 22.0, 21.0, 16.0, 16.0, 8.0, 10.0, 8.0, 8.0, 8.0, 5.0, 4.0, 0.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6962890625, -0.669158935546875, -0.64202880859375, -0.614898681640625, -0.5877685546875, -0.560638427734375, -0.53350830078125, -0.506378173828125, -0.479248046875, -0.452117919921875, -0.42498779296875, -0.397857666015625, -0.3707275390625, -0.343597412109375, -0.31646728515625, -0.289337158203125, -0.26220703125, -0.235076904296875, -0.20794677734375, -0.180816650390625, -0.1536865234375, -0.126556396484375, -0.09942626953125, -0.072296142578125, -0.045166015625, -0.018035888671875, 0.00909423828125, 0.036224365234375, 0.0633544921875, 0.090484619140625, 0.11761474609375, 0.144744873046875, 0.171875, 0.199005126953125, 0.22613525390625, 0.253265380859375, 0.2803955078125, 0.307525634765625, 0.33465576171875, 0.361785888671875, 0.388916015625, 0.416046142578125, 0.44317626953125, 0.470306396484375, 0.4974365234375, 0.524566650390625, 0.55169677734375, 0.578826904296875, 0.60595703125, 0.633087158203125, 0.66021728515625, 0.687347412109375, 0.7144775390625, 0.741607666015625, 0.76873779296875, 0.795867919921875, 0.822998046875, 0.850128173828125, 0.87725830078125, 0.904388427734375, 0.9315185546875, 0.958648681640625, 0.98577880859375, 1.012908935546875, 1.0400390625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 2.0, 3.0, 3.0, 14.0, 22.0, 28.0, 35.0, 37.0, 82.0, 123.0, 191.0, 387.0, 646.0, 1471.0, 3691.0, 12376.0, 53679.0, 311520.0, 527572.0, 105037.0, 21382.0, 5957.0, 2191.0, 921.0, 494.0, 258.0, 150.0, 92.0, 67.0, 29.0, 28.0, 16.0, 8.0, 11.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.61328125, -4.48583984375, -4.3583984375, -4.23095703125, -4.103515625, -3.97607421875, -3.8486328125, -3.72119140625, -3.59375, -3.46630859375, -3.3388671875, -3.21142578125, -3.083984375, -2.95654296875, -2.8291015625, -2.70166015625, -2.57421875, -2.44677734375, -2.3193359375, -2.19189453125, -2.064453125, -1.93701171875, -1.8095703125, -1.68212890625, -1.5546875, -1.42724609375, -1.2998046875, -1.17236328125, -1.044921875, -0.91748046875, -0.7900390625, -0.66259765625, -0.53515625, -0.40771484375, -0.2802734375, -0.15283203125, -0.025390625, 0.10205078125, 0.2294921875, 0.35693359375, 0.484375, 0.61181640625, 0.7392578125, 0.86669921875, 0.994140625, 1.12158203125, 1.2490234375, 1.37646484375, 1.50390625, 1.63134765625, 1.7587890625, 1.88623046875, 2.013671875, 2.14111328125, 2.2685546875, 2.39599609375, 2.5234375, 2.65087890625, 2.7783203125, 2.90576171875, 3.033203125, 3.16064453125, 3.2880859375, 3.41552734375, 3.54296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 9.0, 4.0, 12.0, 17.0, 24.0, 47.0, 66.0, 98.0, 123.0, 156.0, 147.0, 95.0, 72.0, 59.0, 28.0, 15.0, 8.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004620552062988281, -0.0004406645894050598, -0.0004192739725112915, -0.0003978833556175232, -0.0003764927387237549, -0.00035510212182998657, -0.00033371150493621826, -0.00031232088804244995, -0.00029093027114868164, -0.00026953965425491333, -0.000248149037361145, -0.0002267584204673767, -0.0002053678035736084, -0.0001839771866798401, -0.00016258656978607178, -0.00014119595289230347, -0.00011980533599853516, -9.841471910476685e-05, -7.702410221099854e-05, -5.5633485317230225e-05, -3.4242868423461914e-05, -1.2852251529693604e-05, 8.538365364074707e-06, 2.9928982257843018e-05, 5.131959915161133e-05, 7.271021604537964e-05, 9.410083293914795e-05, 0.00011549144983291626, 0.00013688206672668457, 0.00015827268362045288, 0.0001796633005142212, 0.0002010539174079895, 0.0002224445343017578, 0.00024383515119552612, 0.00026522576808929443, 0.00028661638498306274, 0.00030800700187683105, 0.00032939761877059937, 0.0003507882356643677, 0.000372178852558136, 0.0003935694694519043, 0.0004149600863456726, 0.0004363507032394409, 0.00045774132013320923, 0.00047913193702697754, 0.0005005225539207458, 0.0005219131708145142, 0.0005433037877082825, 0.0005646944046020508, 0.0005860850214958191, 0.0006074756383895874, 0.0006288662552833557, 0.000650256872177124, 0.0006716474890708923, 0.0006930381059646606, 0.000714428722858429, 0.0007358193397521973, 0.0007572099566459656, 0.0007786005735397339, 0.0007999911904335022, 0.0008213818073272705, 0.0008427724242210388, 0.0008641630411148071, 0.0008855536580085754, 0.0009069442749023438]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 9.0, 6.0, 10.0, 19.0, 24.0, 46.0, 110.0, 221.0, 565.0, 1633.0, 6336.0, 46885.0, 737165.0, 233767.0, 16847.0, 3199.0, 978.0, 385.0, 153.0, 94.0, 46.0, 18.0, 15.0, 4.0, 6.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.4921875, -8.24072265625, -7.9892578125, -7.73779296875, -7.486328125, -7.23486328125, -6.9833984375, -6.73193359375, -6.48046875, -6.22900390625, -5.9775390625, -5.72607421875, -5.474609375, -5.22314453125, -4.9716796875, -4.72021484375, -4.46875, -4.21728515625, -3.9658203125, -3.71435546875, -3.462890625, -3.21142578125, -2.9599609375, -2.70849609375, -2.45703125, -2.20556640625, -1.9541015625, -1.70263671875, -1.451171875, -1.19970703125, -0.9482421875, -0.69677734375, -0.4453125, -0.19384765625, 0.0576171875, 0.30908203125, 0.560546875, 0.81201171875, 1.0634765625, 1.31494140625, 1.56640625, 1.81787109375, 2.0693359375, 2.32080078125, 2.572265625, 2.82373046875, 3.0751953125, 3.32666015625, 3.578125, 3.82958984375, 4.0810546875, 4.33251953125, 4.583984375, 4.83544921875, 5.0869140625, 5.33837890625, 5.58984375, 5.84130859375, 6.0927734375, 6.34423828125, 6.595703125, 6.84716796875, 7.0986328125, 7.35009765625, 7.6015625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 9.0, 5.0, 10.0, 4.0, 13.0, 13.0, 18.0, 29.0, 45.0, 57.0, 79.0, 80.0, 90.0, 107.0, 88.0, 87.0, 58.0, 50.0, 32.0, 29.0, 27.0, 11.0, 16.0, 8.0, 11.0, 1.0, 10.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.337890625, -2.267486572265625, -2.19708251953125, -2.126678466796875, -2.0562744140625, -1.985870361328125, -1.91546630859375, -1.845062255859375, -1.774658203125, -1.704254150390625, -1.63385009765625, -1.563446044921875, -1.4930419921875, -1.422637939453125, -1.35223388671875, -1.281829833984375, -1.21142578125, -1.141021728515625, -1.07061767578125, -1.000213623046875, -0.9298095703125, -0.859405517578125, -0.78900146484375, -0.718597412109375, -0.648193359375, -0.577789306640625, -0.50738525390625, -0.436981201171875, -0.3665771484375, -0.296173095703125, -0.22576904296875, -0.155364990234375, -0.0849609375, -0.014556884765625, 0.05584716796875, 0.126251220703125, 0.1966552734375, 0.267059326171875, 0.33746337890625, 0.407867431640625, 0.478271484375, 0.548675537109375, 0.61907958984375, 0.689483642578125, 0.7598876953125, 0.830291748046875, 0.90069580078125, 0.971099853515625, 1.04150390625, 1.111907958984375, 1.18231201171875, 1.252716064453125, 1.3231201171875, 1.393524169921875, 1.46392822265625, 1.534332275390625, 1.604736328125, 1.675140380859375, 1.74554443359375, 1.815948486328125, 1.8863525390625, 1.956756591796875, 2.02716064453125, 2.097564697265625, 2.16796875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 21.0, 74.0, 229.0, 365.0, 210.0, 70.0, 21.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.436071395874023, -28.695798873901367, -26.95552635192871, -25.215255737304688, -23.47498321533203, -21.734710693359375, -19.99443817138672, -18.254165649414062, -16.513893127441406, -14.77362060546875, -13.033348083496094, -11.293076515197754, -9.552803993225098, -7.812531471252441, -6.072259902954102, -4.331987380981445, -2.591714859008789, -0.8514425754547119, 0.8888297080993652, 2.6291017532348633, 4.3693742752075195, 6.109646797180176, 7.849918365478516, 9.590190887451172, 11.330463409423828, 13.070735931396484, 14.81100845336914, 16.551280975341797, 18.291553497314453, 20.03182601928711, 21.772096633911133, 23.51236915588379, 25.252639770507812, 26.99291229248047, 28.733184814453125, 30.47345733642578, 32.21372985839844, 33.954002380371094, 35.69427490234375, 37.434547424316406, 39.17481994628906, 40.91509246826172, 42.655364990234375, 44.39563751220703, 46.13591003417969, 47.876182556152344, 49.616455078125, 51.356727600097656, 53.09699630737305, 54.8372688293457, 56.57754135131836, 58.317813873291016, 60.05808639526367, 61.79835891723633, 63.53862762451172, 65.27890014648438, 67.01917266845703, 68.75944519042969, 70.49971771240234, 72.239990234375, 73.98026275634766, 75.72053527832031, 77.46080780029297, 79.20108032226562, 80.94135284423828]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 10.0, 3.0, 8.0, 15.0, 15.0, 20.0, 23.0, 24.0, 35.0, 42.0, 30.0, 42.0, 60.0, 56.0, 50.0, 67.0, 56.0, 48.0, 50.0, 55.0, 41.0, 45.0, 28.0, 30.0, 26.0, 27.0, 24.0, 14.0, 12.0, 9.0, 9.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.133524894714355, -8.853841781616211, -8.57415771484375, -8.294474601745605, -8.014791488647461, -7.735107898712158, -7.4554243087768555, -7.175741195678711, -6.896057605743408, -6.6163740158081055, -6.336690902709961, -6.057007312774658, -5.7773237228393555, -5.497640609741211, -5.217957019805908, -4.9382734298706055, -4.658590316772461, -4.378906726837158, -4.099223613739014, -3.819540023803711, -3.5398566722869873, -3.2601733207702637, -2.980489730834961, -2.7008063793182373, -2.4211230278015137, -2.14143967628479, -1.8617562055587769, -1.5820727348327637, -1.30238938331604, -1.0227060317993164, -0.7430225610733032, -0.46333909034729004, -0.1836566925048828, 0.0960267186164856, 0.375710129737854, 0.6553935408592224, 0.9350769519805908, 1.2147603034973145, 1.4944437742233276, 1.7741272449493408, 2.0538105964660645, 2.333493947982788, 2.6131772994995117, 2.8928608894348145, 3.172544240951538, 3.4522275924682617, 3.7319111824035645, 4.011594772338867, 4.291277885437012, 4.5709614753723145, 4.850644588470459, 5.130328178405762, 5.410011291503906, 5.689694881439209, 5.969378471374512, 6.249061584472656, 6.528745174407959, 6.808428764343262, 7.088111877441406, 7.367795467376709, 7.647479057312012, 7.927162170410156, 8.2068452835083, 8.486529350280762, 8.766212463378906]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 9.0, 3.0, 1.0, 7.0, 6.0, 11.0, 8.0, 16.0, 7.0, 17.0, 12.0, 17.0, 28.0, 36.0, 38.0, 123.0, 527.0, 12845.0, 4121683.0, 57041.0, 1421.0, 256.0, 89.0, 37.0, 19.0, 11.0, 4.0, 1.0, 3.0, 3.0, 2.0, 3.0], "bins": [-34.375, -33.6961669921875, -33.017333984375, -32.3385009765625, -31.65966796875, -30.9808349609375, -30.302001953125, -29.6231689453125, -28.9443359375, -28.2655029296875, -27.586669921875, -26.9078369140625, -26.22900390625, -25.5501708984375, -24.871337890625, -24.1925048828125, -23.513671875, -22.8348388671875, -22.156005859375, -21.4771728515625, -20.79833984375, -20.1195068359375, -19.440673828125, -18.7618408203125, -18.0830078125, -17.4041748046875, -16.725341796875, -16.0465087890625, -15.36767578125, -14.6888427734375, -14.010009765625, -13.3311767578125, -12.65234375, -11.9735107421875, -11.294677734375, -10.6158447265625, -9.93701171875, -9.2581787109375, -8.579345703125, -7.9005126953125, -7.2216796875, -6.5428466796875, -5.864013671875, -5.1851806640625, -4.50634765625, -3.8275146484375, -3.148681640625, -2.4698486328125, -1.791015625, -1.1121826171875, -0.433349609375, 0.2454833984375, 0.92431640625, 1.6031494140625, 2.281982421875, 2.9608154296875, 3.6396484375, 4.3184814453125, 4.997314453125, 5.6761474609375, 6.35498046875, 7.0338134765625, 7.712646484375, 8.3914794921875, 9.0703125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 10.0, 16.0, 32.0, 48.0, 52.0, 75.0, 88.0, 110.0, 100.0, 92.0, 101.0, 75.0, 67.0, 48.0, 26.0, 25.0, 10.0, 9.0, 9.0, 7.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.487060546875, -0.47567176818847656, -0.4642829895019531, -0.4528942108154297, -0.44150543212890625, -0.4301166534423828, -0.4187278747558594, -0.40733909606933594, -0.3959503173828125, -0.38456153869628906, -0.3731727600097656, -0.3617839813232422, -0.35039520263671875, -0.3390064239501953, -0.3276176452636719, -0.31622886657714844, -0.304840087890625, -0.29345130920410156, -0.2820625305175781, -0.2706737518310547, -0.25928497314453125, -0.2478961944580078, -0.23650741577148438, -0.22511863708496094, -0.2137298583984375, -0.20234107971191406, -0.19095230102539062, -0.1795635223388672, -0.16817474365234375, -0.1567859649658203, -0.14539718627929688, -0.13400840759277344, -0.12261962890625, -0.11123085021972656, -0.09984207153320312, -0.08845329284667969, -0.07706451416015625, -0.06567573547363281, -0.054286956787109375, -0.04289817810058594, -0.0315093994140625, -0.020120620727539062, -0.008731842041015625, 0.0026569366455078125, 0.01404571533203125, 0.025434494018554688, 0.036823272705078125, 0.04821205139160156, 0.059600830078125, 0.07098960876464844, 0.08237838745117188, 0.09376716613769531, 0.10515594482421875, 0.11654472351074219, 0.12793350219726562, 0.13932228088378906, 0.1507110595703125, 0.16209983825683594, 0.17348861694335938, 0.1848773956298828, 0.19626617431640625, 0.2076549530029297, 0.21904373168945312, 0.23043251037597656, 0.2418212890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 11.0, 12.0, 28.0, 38.0, 62.0, 78.0, 159.0, 292.0, 1105.0, 10672.0, 3820274.0, 354772.0, 5457.0, 761.0, 207.0, 150.0, 79.0, 48.0, 34.0, 21.0, 13.0, 5.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.375, -19.521484375, -18.66796875, -17.814453125, -16.9609375, -16.107421875, -15.25390625, -14.400390625, -13.546875, -12.693359375, -11.83984375, -10.986328125, -10.1328125, -9.279296875, -8.42578125, -7.572265625, -6.71875, -5.865234375, -5.01171875, -4.158203125, -3.3046875, -2.451171875, -1.59765625, -0.744140625, 0.109375, 0.962890625, 1.81640625, 2.669921875, 3.5234375, 4.376953125, 5.23046875, 6.083984375, 6.9375, 7.791015625, 8.64453125, 9.498046875, 10.3515625, 11.205078125, 12.05859375, 12.912109375, 13.765625, 14.619140625, 15.47265625, 16.326171875, 17.1796875, 18.033203125, 18.88671875, 19.740234375, 20.59375, 21.447265625, 22.30078125, 23.154296875, 24.0078125, 24.861328125, 25.71484375, 26.568359375, 27.421875, 28.275390625, 29.12890625, 29.982421875, 30.8359375, 31.689453125, 32.54296875, 33.396484375, 34.25]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 11.0, 17.0, 44.0, 71.0, 195.0, 505.0, 2221.0, 637.0, 182.0, 83.0, 51.0, 16.0, 17.0, 5.0, 2.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.931640625, -1.84222412109375, -1.7528076171875, -1.66339111328125, -1.573974609375, -1.48455810546875, -1.3951416015625, -1.30572509765625, -1.21630859375, -1.12689208984375, -1.0374755859375, -0.94805908203125, -0.858642578125, -0.76922607421875, -0.6798095703125, -0.59039306640625, -0.5009765625, -0.41156005859375, -0.3221435546875, -0.23272705078125, -0.143310546875, -0.05389404296875, 0.0355224609375, 0.12493896484375, 0.21435546875, 0.30377197265625, 0.3931884765625, 0.48260498046875, 0.572021484375, 0.66143798828125, 0.7508544921875, 0.84027099609375, 0.9296875, 1.01910400390625, 1.1085205078125, 1.19793701171875, 1.287353515625, 1.37677001953125, 1.4661865234375, 1.55560302734375, 1.64501953125, 1.73443603515625, 1.8238525390625, 1.91326904296875, 2.002685546875, 2.09210205078125, 2.1815185546875, 2.27093505859375, 2.3603515625, 2.44976806640625, 2.5391845703125, 2.62860107421875, 2.718017578125, 2.80743408203125, 2.8968505859375, 2.98626708984375, 3.07568359375, 3.16510009765625, 3.2545166015625, 3.34393310546875, 3.433349609375, 3.52276611328125, 3.6121826171875, 3.70159912109375, 3.791015625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 8.0, 9.0, 22.0, 42.0, 114.0, 260.0, 310.0, 163.0, 51.0, 22.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.90584182739258, -47.96759796142578, -47.029354095458984, -46.09111404418945, -45.152870178222656, -44.21462631225586, -43.27638244628906, -42.338138580322266, -41.39989471435547, -40.46165084838867, -39.523406982421875, -38.585166931152344, -37.64692306518555, -36.70867919921875, -35.77043533325195, -34.832191467285156, -33.893951416015625, -32.95570755004883, -32.01746368408203, -31.079221725463867, -30.140979766845703, -29.202735900878906, -28.26449203491211, -27.326248168945312, -26.38800621032715, -25.44976234436035, -24.511520385742188, -23.57327651977539, -22.635032653808594, -21.69679069519043, -20.758546829223633, -19.82030487060547, -18.882061004638672, -17.943817138671875, -17.00557518005371, -16.067331314086914, -15.129088401794434, -14.190845489501953, -13.252601623535156, -12.314358711242676, -11.376116752624512, -10.437873840332031, -9.499629974365234, -8.561387062072754, -7.623144149780273, -6.684901237487793, -5.746657848358154, -4.808414459228516, -3.870171546936035, -2.9319283962249756, -1.993685245513916, -1.0554420948028564, -0.11719894409179688, 0.8210439682006836, 1.7592873573303223, 2.697530746459961, 3.6357736587524414, 4.574016571044922, 5.5122599601745605, 6.450503349304199, 7.38874626159668, 8.32698917388916, 9.26523208618164, 10.203475952148438, 11.141718864440918]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 9.0, 12.0, 15.0, 18.0, 19.0, 42.0, 31.0, 53.0, 68.0, 66.0, 62.0, 74.0, 88.0, 72.0, 72.0, 55.0, 59.0, 49.0, 32.0, 27.0, 17.0, 20.0, 13.0, 8.0, 10.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.685787200927734, -10.42631721496582, -10.166848182678223, -9.907379150390625, -9.647909164428711, -9.388439178466797, -9.1289701461792, -8.869501113891602, -8.610031127929688, -8.350561141967773, -8.091092109680176, -7.83162260055542, -7.572153091430664, -7.312683582305908, -7.053214073181152, -6.7937445640563965, -6.534275054931641, -6.274805545806885, -6.015336036682129, -5.755866527557373, -5.496397018432617, -5.236927509307861, -4.9774580001831055, -4.71798849105835, -4.458518981933594, -4.199049472808838, -3.939579963684082, -3.680110454559326, -3.4206409454345703, -3.1611714363098145, -2.9017019271850586, -2.6422324180603027, -2.382762908935547, -2.123293399810791, -1.8638238906860352, -1.6043543815612793, -1.3448848724365234, -1.0854153633117676, -0.8259458541870117, -0.5664763450622559, -0.3070068359375, -0.04753732681274414, 0.21193218231201172, 0.4714016914367676, 0.7308712005615234, 0.9903407096862793, 1.2498102188110352, 1.509279727935791, 1.7687492370605469, 2.0282187461853027, 2.2876882553100586, 2.5471577644348145, 2.8066272735595703, 3.066096782684326, 3.325566291809082, 3.585035800933838, 3.8445053100585938, 4.10397481918335, 4.3634443283081055, 4.622913837432861, 4.882383346557617, 5.141852855682373, 5.401322364807129, 5.660791873931885, 5.920261383056641]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 8.0, 17.0, 21.0, 25.0, 29.0, 59.0, 84.0, 280.0, 1242.0, 10949.0, 236827.0, 745441.0, 49008.0, 3608.0, 551.0, 153.0, 83.0, 44.0, 24.0, 19.0, 16.0, 13.0, 11.0, 7.0, 6.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.078125, -8.732421875, -8.38671875, -8.041015625, -7.6953125, -7.349609375, -7.00390625, -6.658203125, -6.3125, -5.966796875, -5.62109375, -5.275390625, -4.9296875, -4.583984375, -4.23828125, -3.892578125, -3.546875, -3.201171875, -2.85546875, -2.509765625, -2.1640625, -1.818359375, -1.47265625, -1.126953125, -0.78125, -0.435546875, -0.08984375, 0.255859375, 0.6015625, 0.947265625, 1.29296875, 1.638671875, 1.984375, 2.330078125, 2.67578125, 3.021484375, 3.3671875, 3.712890625, 4.05859375, 4.404296875, 4.75, 5.095703125, 5.44140625, 5.787109375, 6.1328125, 6.478515625, 6.82421875, 7.169921875, 7.515625, 7.861328125, 8.20703125, 8.552734375, 8.8984375, 9.244140625, 9.58984375, 9.935546875, 10.28125, 10.626953125, 10.97265625, 11.318359375, 11.6640625, 12.009765625, 12.35546875, 12.701171875, 13.046875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 3.0, 12.0, 12.0, 17.0, 15.0, 42.0, 38.0, 45.0, 56.0, 62.0, 61.0, 59.0, 68.0, 75.0, 63.0, 62.0, 63.0, 45.0, 43.0, 28.0, 31.0, 37.0, 20.0, 13.0, 9.0, 3.0, 3.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.449951171875, -0.4377861022949219, -0.42562103271484375, -0.4134559631347656, -0.4012908935546875, -0.3891258239746094, -0.37696075439453125, -0.3647956848144531, -0.352630615234375, -0.3404655456542969, -0.32830047607421875, -0.3161354064941406, -0.3039703369140625, -0.2918052673339844, -0.27964019775390625, -0.2674751281738281, -0.25531005859375, -0.24314498901367188, -0.23097991943359375, -0.21881484985351562, -0.2066497802734375, -0.19448471069335938, -0.18231964111328125, -0.17015457153320312, -0.157989501953125, -0.14582443237304688, -0.13365936279296875, -0.12149429321289062, -0.1093292236328125, -0.09716415405273438, -0.08499908447265625, -0.07283401489257812, -0.0606689453125, -0.048503875732421875, -0.03633880615234375, -0.024173736572265625, -0.0120086669921875, 0.000156402587890625, 0.01232147216796875, 0.024486541748046875, 0.036651611328125, 0.048816680908203125, 0.06098175048828125, 0.07314682006835938, 0.0853118896484375, 0.09747695922851562, 0.10964202880859375, 0.12180709838867188, 0.13397216796875, 0.14613723754882812, 0.15830230712890625, 0.17046737670898438, 0.1826324462890625, 0.19479751586914062, 0.20696258544921875, 0.21912765502929688, 0.231292724609375, 0.24345779418945312, 0.25562286376953125, 0.2677879333496094, 0.2799530029296875, 0.2921180725097656, 0.30428314208984375, 0.3164482116699219, 0.32861328125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 0.0, 3.0, 5.0, 12.0, 8.0, 12.0, 18.0, 19.0, 38.0, 36.0, 52.0, 94.0, 127.0, 241.0, 491.0, 1152.0, 3194.0, 12444.0, 70489.0, 408178.0, 449802.0, 81912.0, 14148.0, 3599.0, 1187.0, 531.0, 292.0, 159.0, 87.0, 57.0, 53.0, 29.0, 23.0, 13.0, 14.0, 9.0, 11.0, 2.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44921875, -5.267822265625, -5.08642578125, -4.905029296875, -4.7236328125, -4.542236328125, -4.36083984375, -4.179443359375, -3.998046875, -3.816650390625, -3.63525390625, -3.453857421875, -3.2724609375, -3.091064453125, -2.90966796875, -2.728271484375, -2.546875, -2.365478515625, -2.18408203125, -2.002685546875, -1.8212890625, -1.639892578125, -1.45849609375, -1.277099609375, -1.095703125, -0.914306640625, -0.73291015625, -0.551513671875, -0.3701171875, -0.188720703125, -0.00732421875, 0.174072265625, 0.35546875, 0.536865234375, 0.71826171875, 0.899658203125, 1.0810546875, 1.262451171875, 1.44384765625, 1.625244140625, 1.806640625, 1.988037109375, 2.16943359375, 2.350830078125, 2.5322265625, 2.713623046875, 2.89501953125, 3.076416015625, 3.2578125, 3.439208984375, 3.62060546875, 3.802001953125, 3.9833984375, 4.164794921875, 4.34619140625, 4.527587890625, 4.708984375, 4.890380859375, 5.07177734375, 5.253173828125, 5.4345703125, 5.615966796875, 5.79736328125, 5.978759765625, 6.16015625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 2.0, 3.0, 11.0, 8.0, 14.0, 12.0, 25.0, 26.0, 25.0, 26.0, 28.0, 30.0, 42.0, 41.0, 45.0, 47.0, 51.0, 38.0, 42.0, 54.0, 45.0, 48.0, 42.0, 46.0, 39.0, 35.0, 34.0, 21.0, 11.0, 23.0, 25.0, 13.0, 12.0, 13.0, 8.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.92578125, -1.8679656982421875, -1.810150146484375, -1.7523345947265625, -1.69451904296875, -1.6367034912109375, -1.578887939453125, -1.5210723876953125, -1.4632568359375, -1.4054412841796875, -1.347625732421875, -1.2898101806640625, -1.23199462890625, -1.1741790771484375, -1.116363525390625, -1.0585479736328125, -1.000732421875, -0.9429168701171875, -0.885101318359375, -0.8272857666015625, -0.76947021484375, -0.7116546630859375, -0.653839111328125, -0.5960235595703125, -0.5382080078125, -0.4803924560546875, -0.422576904296875, -0.3647613525390625, -0.30694580078125, -0.2491302490234375, -0.191314697265625, -0.1334991455078125, -0.07568359375, -0.0178680419921875, 0.039947509765625, 0.0977630615234375, 0.15557861328125, 0.2133941650390625, 0.271209716796875, 0.3290252685546875, 0.3868408203125, 0.4446563720703125, 0.502471923828125, 0.5602874755859375, 0.61810302734375, 0.6759185791015625, 0.733734130859375, 0.7915496826171875, 0.849365234375, 0.9071807861328125, 0.964996337890625, 1.0228118896484375, 1.08062744140625, 1.1384429931640625, 1.196258544921875, 1.2540740966796875, 1.3118896484375, 1.3697052001953125, 1.427520751953125, 1.4853363037109375, 1.54315185546875, 1.6009674072265625, 1.658782958984375, 1.7165985107421875, 1.7744140625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 8.0, 11.0, 11.0, 15.0, 27.0, 34.0, 44.0, 66.0, 101.0, 128.0, 199.0, 316.0, 535.0, 1013.0, 1749.0, 3325.0, 6724.0, 16975.0, 56588.0, 258692.0, 492280.0, 150810.0, 35389.0, 12130.0, 5240.0, 2572.0, 1423.0, 814.0, 471.0, 288.0, 173.0, 110.0, 74.0, 70.0, 31.0, 22.0, 30.0, 21.0, 6.0, 5.0, 5.0, 9.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.130859375, -3.030914306640625, -2.93096923828125, -2.831024169921875, -2.7310791015625, -2.631134033203125, -2.53118896484375, -2.431243896484375, -2.331298828125, -2.231353759765625, -2.13140869140625, -2.031463623046875, -1.9315185546875, -1.831573486328125, -1.73162841796875, -1.631683349609375, -1.53173828125, -1.431793212890625, -1.33184814453125, -1.231903076171875, -1.1319580078125, -1.032012939453125, -0.93206787109375, -0.832122802734375, -0.732177734375, -0.632232666015625, -0.53228759765625, -0.432342529296875, -0.3323974609375, -0.232452392578125, -0.13250732421875, -0.032562255859375, 0.0673828125, 0.167327880859375, 0.26727294921875, 0.367218017578125, 0.4671630859375, 0.567108154296875, 0.66705322265625, 0.766998291015625, 0.866943359375, 0.966888427734375, 1.06683349609375, 1.166778564453125, 1.2667236328125, 1.366668701171875, 1.46661376953125, 1.566558837890625, 1.66650390625, 1.766448974609375, 1.86639404296875, 1.966339111328125, 2.0662841796875, 2.166229248046875, 2.26617431640625, 2.366119384765625, 2.466064453125, 2.566009521484375, 2.66595458984375, 2.765899658203125, 2.8658447265625, 2.965789794921875, 3.06573486328125, 3.165679931640625, 3.265625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 12.0, 18.0, 19.0, 35.0, 57.0, 81.0, 115.0, 139.0, 165.0, 120.0, 91.0, 50.0, 34.0, 20.0, 13.0, 11.0, 3.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008091926574707031, -0.0007839277386665344, -0.0007586628198623657, -0.000733397901058197, -0.0007081329822540283, -0.0006828680634498596, -0.0006576031446456909, -0.0006323382258415222, -0.0006070733070373535, -0.0005818083882331848, -0.0005565434694290161, -0.0005312785506248474, -0.0005060136318206787, -0.00048074871301651, -0.0004554837942123413, -0.0004302188754081726, -0.0004049539566040039, -0.0003796890377998352, -0.0003544241189956665, -0.0003291592001914978, -0.0003038942813873291, -0.0002786293625831604, -0.0002533644437789917, -0.000228099524974823, -0.0002028346061706543, -0.0001775696873664856, -0.0001523047685623169, -0.0001270398497581482, -0.00010177493095397949, -7.651001214981079e-05, -5.124509334564209e-05, -2.598017454147339e-05, -7.152557373046875e-07, 2.4549663066864014e-05, 4.9814581871032715e-05, 7.507950067520142e-05, 0.00010034441947937012, 0.00012560933828353882, 0.00015087425708770752, 0.00017613917589187622, 0.00020140409469604492, 0.00022666901350021362, 0.0002519339323043823, 0.000277198851108551, 0.0003024637699127197, 0.00032772868871688843, 0.00035299360752105713, 0.00037825852632522583, 0.00040352344512939453, 0.00042878836393356323, 0.00045405328273773193, 0.00047931820154190063, 0.0005045831203460693, 0.000529848039150238, 0.0005551129579544067, 0.0005803778767585754, 0.0006056427955627441, 0.0006309077143669128, 0.0006561726331710815, 0.0006814375519752502, 0.0007067024707794189, 0.0007319673895835876, 0.0007572323083877563, 0.000782497227191925, 0.0008077621459960938]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 5.0, 2.0, 4.0, 3.0, 7.0, 6.0, 11.0, 14.0, 12.0, 19.0, 21.0, 42.0, 50.0, 93.0, 171.0, 234.0, 390.0, 664.0, 1203.0, 2251.0, 4358.0, 9798.0, 30080.0, 173031.0, 622972.0, 156785.0, 27871.0, 9181.0, 4106.0, 2243.0, 1147.0, 704.0, 388.0, 223.0, 148.0, 103.0, 71.0, 47.0, 27.0, 23.0, 13.0, 6.0, 4.0, 11.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0], "bins": [-4.65234375, -4.51739501953125, -4.3824462890625, -4.24749755859375, -4.112548828125, -3.97760009765625, -3.8426513671875, -3.70770263671875, -3.57275390625, -3.43780517578125, -3.3028564453125, -3.16790771484375, -3.032958984375, -2.89801025390625, -2.7630615234375, -2.62811279296875, -2.4931640625, -2.35821533203125, -2.2232666015625, -2.08831787109375, -1.953369140625, -1.81842041015625, -1.6834716796875, -1.54852294921875, -1.41357421875, -1.27862548828125, -1.1436767578125, -1.00872802734375, -0.873779296875, -0.73883056640625, -0.6038818359375, -0.46893310546875, -0.333984375, -0.19903564453125, -0.0640869140625, 0.07086181640625, 0.205810546875, 0.34075927734375, 0.4757080078125, 0.61065673828125, 0.74560546875, 0.88055419921875, 1.0155029296875, 1.15045166015625, 1.285400390625, 1.42034912109375, 1.5552978515625, 1.69024658203125, 1.8251953125, 1.96014404296875, 2.0950927734375, 2.23004150390625, 2.364990234375, 2.49993896484375, 2.6348876953125, 2.76983642578125, 2.90478515625, 3.03973388671875, 3.1746826171875, 3.30963134765625, 3.444580078125, 3.57952880859375, 3.7144775390625, 3.84942626953125, 3.984375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 6.0, 9.0, 9.0, 9.0, 26.0, 41.0, 60.0, 86.0, 111.0, 136.0, 136.0, 113.0, 83.0, 57.0, 32.0, 27.0, 15.0, 13.0, 5.0, 5.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86328125, -2.767364501953125, -2.67144775390625, -2.575531005859375, -2.4796142578125, -2.383697509765625, -2.28778076171875, -2.191864013671875, -2.095947265625, -2.000030517578125, -1.90411376953125, -1.808197021484375, -1.7122802734375, -1.616363525390625, -1.52044677734375, -1.424530029296875, -1.32861328125, -1.232696533203125, -1.13677978515625, -1.040863037109375, -0.9449462890625, -0.849029541015625, -0.75311279296875, -0.657196044921875, -0.561279296875, -0.465362548828125, -0.36944580078125, -0.273529052734375, -0.1776123046875, -0.081695556640625, 0.01422119140625, 0.110137939453125, 0.2060546875, 0.301971435546875, 0.39788818359375, 0.493804931640625, 0.5897216796875, 0.685638427734375, 0.78155517578125, 0.877471923828125, 0.973388671875, 1.069305419921875, 1.16522216796875, 1.261138916015625, 1.3570556640625, 1.452972412109375, 1.54888916015625, 1.644805908203125, 1.74072265625, 1.836639404296875, 1.93255615234375, 2.028472900390625, 2.1243896484375, 2.220306396484375, 2.31622314453125, 2.412139892578125, 2.508056640625, 2.603973388671875, 2.69989013671875, 2.795806884765625, 2.8917236328125, 2.987640380859375, 3.08355712890625, 3.179473876953125, 3.275390625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 10.0, 30.0, 67.0, 181.0, 226.0, 242.0, 148.0, 60.0, 27.0, 9.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.62193298339844, -50.85947799682617, -49.09702682495117, -47.334571838378906, -45.57211685180664, -43.809661865234375, -42.047210693359375, -40.28475570678711, -38.522300720214844, -36.75984573364258, -34.99739456176758, -33.23493957519531, -31.472484588623047, -29.710031509399414, -27.94757843017578, -26.185123443603516, -24.422670364379883, -22.66021728515625, -20.897762298583984, -19.13530921936035, -17.372854232788086, -15.610401153564453, -13.847947120666504, -12.085493087768555, -10.323039054870605, -8.560585021972656, -6.798130989074707, -5.035677433013916, -3.273223400115967, -1.5107698440551758, 0.25168418884277344, 2.0141382217407227, 3.776592254638672, 5.539046287536621, 7.30150032043457, 9.063953399658203, 10.826408386230469, 12.588861465454102, 14.35131549835205, 16.11376953125, 17.876224517822266, 19.6386775970459, 21.401132583618164, 23.163585662841797, 24.926040649414062, 26.688493728637695, 28.450946807861328, 30.213401794433594, 31.975854873657227, 33.73830795288086, 35.500762939453125, 37.26321792602539, 39.02566909790039, 40.788124084472656, 42.55057907104492, 44.31303405761719, 46.07548522949219, 47.83794021606445, 49.60039138793945, 51.36284637451172, 53.125301361083984, 54.88775634765625, 56.65020751953125, 58.412662506103516, 60.17511749267578]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 9.0, 8.0, 15.0, 21.0, 32.0, 33.0, 34.0, 40.0, 54.0, 67.0, 66.0, 58.0, 60.0, 68.0, 61.0, 50.0, 51.0, 53.0, 44.0, 37.0, 30.0, 19.0, 17.0, 17.0, 13.0, 6.0, 8.0, 8.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.976604461669922, -12.451470375061035, -11.926336288452148, -11.401202201843262, -10.876068115234375, -10.350934028625488, -9.825799942016602, -9.300666809082031, -8.775531768798828, -8.250397682189941, -7.725263595581055, -7.200129508972168, -6.674995422363281, -6.1498613357543945, -5.624727725982666, -5.099593639373779, -4.574460029602051, -4.049325942993164, -3.5241918563842773, -2.9990580081939697, -2.473923921585083, -1.9487898349761963, -1.4236559867858887, -0.898521900177002, -0.37338781356811523, 0.1517462134361267, 0.6768802404403687, 1.2020142078399658, 1.7271482944488525, 2.2522823810577393, 2.777416229248047, 3.3025503158569336, 3.8276844024658203, 4.352818489074707, 4.877952575683594, 5.4030866622924805, 5.928220748901367, 6.453354835510254, 6.978488445281982, 7.503622531890869, 8.028757095336914, 8.5538911819458, 9.079025268554688, 9.604159355163574, 10.129293441772461, 10.654427528381348, 11.179561614990234, 11.704694747924805, 12.229828834533691, 12.754962921142578, 13.280097007751465, 13.805231094360352, 14.330365180969238, 14.855499267578125, 15.380632400512695, 15.905767440795898, 16.43090057373047, 16.95603370666504, 17.481168746948242, 18.006301879882812, 18.531436920166016, 19.056570053100586, 19.58170509338379, 20.10683822631836, 20.631973266601562]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 6.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 5.0, 4.0, 7.0, 17.0, 19.0, 20.0, 25.0, 65.0, 90.0, 208.0, 627.0, 2153.0, 13223.0, 228213.0, 3872626.0, 67927.0, 6696.0, 1345.0, 466.0, 185.0, 113.0, 75.0, 35.0, 39.0, 17.0, 13.0, 5.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.109375, -12.7843017578125, -12.459228515625, -12.1341552734375, -11.80908203125, -11.4840087890625, -11.158935546875, -10.8338623046875, -10.5087890625, -10.1837158203125, -9.858642578125, -9.5335693359375, -9.20849609375, -8.8834228515625, -8.558349609375, -8.2332763671875, -7.908203125, -7.5831298828125, -7.258056640625, -6.9329833984375, -6.60791015625, -6.2828369140625, -5.957763671875, -5.6326904296875, -5.3076171875, -4.9825439453125, -4.657470703125, -4.3323974609375, -4.00732421875, -3.6822509765625, -3.357177734375, -3.0321044921875, -2.70703125, -2.3819580078125, -2.056884765625, -1.7318115234375, -1.40673828125, -1.0816650390625, -0.756591796875, -0.4315185546875, -0.1064453125, 0.2186279296875, 0.543701171875, 0.8687744140625, 1.19384765625, 1.5189208984375, 1.843994140625, 2.1690673828125, 2.494140625, 2.8192138671875, 3.144287109375, 3.4693603515625, 3.79443359375, 4.1195068359375, 4.444580078125, 4.7696533203125, 5.0947265625, 5.4197998046875, 5.744873046875, 6.0699462890625, 6.39501953125, 6.7200927734375, 7.045166015625, 7.3702392578125, 7.6953125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 10.0, 22.0, 37.0, 49.0, 74.0, 69.0, 102.0, 119.0, 97.0, 99.0, 87.0, 75.0, 58.0, 35.0, 20.0, 24.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447265625, -0.42710113525390625, -0.4069366455078125, -0.38677215576171875, -0.366607666015625, -0.34644317626953125, -0.3262786865234375, -0.30611419677734375, -0.28594970703125, -0.26578521728515625, -0.2456207275390625, -0.22545623779296875, -0.205291748046875, -0.18512725830078125, -0.1649627685546875, -0.14479827880859375, -0.1246337890625, -0.10446929931640625, -0.0843048095703125, -0.06414031982421875, -0.043975830078125, -0.02381134033203125, -0.0036468505859375, 0.01651763916015625, 0.03668212890625, 0.05684661865234375, 0.0770111083984375, 0.09717559814453125, 0.117340087890625, 0.13750457763671875, 0.1576690673828125, 0.17783355712890625, 0.197998046875, 0.21816253662109375, 0.2383270263671875, 0.25849151611328125, 0.278656005859375, 0.29882049560546875, 0.3189849853515625, 0.33914947509765625, 0.35931396484375, 0.37947845458984375, 0.3996429443359375, 0.41980743408203125, 0.439971923828125, 0.46013641357421875, 0.4803009033203125, 0.5004653930664062, 0.5206298828125, 0.5407943725585938, 0.5609588623046875, 0.5811233520507812, 0.601287841796875, 0.6214523315429688, 0.6416168212890625, 0.6617813110351562, 0.68194580078125, 0.7021102905273438, 0.7222747802734375, 0.7424392700195312, 0.762603759765625, 0.7827682495117188, 0.8029327392578125, 0.8230972290039062, 0.84326171875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 9.0, 12.0, 7.0, 23.0, 13.0, 42.0, 42.0, 82.0, 120.0, 212.0, 485.0, 1127.0, 4025.0, 19587.0, 207062.0, 3789270.0, 150057.0, 16382.0, 3640.0, 1106.0, 422.0, 196.0, 123.0, 72.0, 39.0, 39.0, 22.0, 25.0, 9.0, 9.0, 4.0, 8.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6953125, -11.2841796875, -10.873046875, -10.4619140625, -10.05078125, -9.6396484375, -9.228515625, -8.8173828125, -8.40625, -7.9951171875, -7.583984375, -7.1728515625, -6.76171875, -6.3505859375, -5.939453125, -5.5283203125, -5.1171875, -4.7060546875, -4.294921875, -3.8837890625, -3.47265625, -3.0615234375, -2.650390625, -2.2392578125, -1.828125, -1.4169921875, -1.005859375, -0.5947265625, -0.18359375, 0.2275390625, 0.638671875, 1.0498046875, 1.4609375, 1.8720703125, 2.283203125, 2.6943359375, 3.10546875, 3.5166015625, 3.927734375, 4.3388671875, 4.75, 5.1611328125, 5.572265625, 5.9833984375, 6.39453125, 6.8056640625, 7.216796875, 7.6279296875, 8.0390625, 8.4501953125, 8.861328125, 9.2724609375, 9.68359375, 10.0947265625, 10.505859375, 10.9169921875, 11.328125, 11.7392578125, 12.150390625, 12.5615234375, 12.97265625, 13.3837890625, 13.794921875, 14.2060546875, 14.6171875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 2.0, 4.0, 5.0, 6.0, 11.0, 12.0, 10.0, 15.0, 28.0, 50.0, 41.0, 94.0, 146.0, 205.0, 360.0, 903.0, 1056.0, 449.0, 229.0, 137.0, 95.0, 56.0, 37.0, 34.0, 15.0, 21.0, 17.0, 11.0, 6.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5556640625, -1.503936767578125, -1.45220947265625, -1.400482177734375, -1.3487548828125, -1.297027587890625, -1.24530029296875, -1.193572998046875, -1.141845703125, -1.090118408203125, -1.03839111328125, -0.986663818359375, -0.9349365234375, -0.883209228515625, -0.83148193359375, -0.779754638671875, -0.72802734375, -0.676300048828125, -0.62457275390625, -0.572845458984375, -0.5211181640625, -0.469390869140625, -0.41766357421875, -0.365936279296875, -0.314208984375, -0.262481689453125, -0.21075439453125, -0.159027099609375, -0.1072998046875, -0.055572509765625, -0.00384521484375, 0.047882080078125, 0.099609375, 0.151336669921875, 0.20306396484375, 0.254791259765625, 0.3065185546875, 0.358245849609375, 0.40997314453125, 0.461700439453125, 0.513427734375, 0.565155029296875, 0.61688232421875, 0.668609619140625, 0.7203369140625, 0.772064208984375, 0.82379150390625, 0.875518798828125, 0.92724609375, 0.978973388671875, 1.03070068359375, 1.082427978515625, 1.1341552734375, 1.185882568359375, 1.23760986328125, 1.289337158203125, 1.341064453125, 1.392791748046875, 1.44451904296875, 1.496246337890625, 1.5479736328125, 1.599700927734375, 1.65142822265625, 1.703155517578125, 1.7548828125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 16.0, 20.0, 50.0, 95.0, 182.0, 200.0, 176.0, 125.0, 69.0, 25.0, 12.0, 11.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.029675483703613, -13.30925178527832, -12.588827133178711, -11.868403434753418, -11.147979736328125, -10.427555084228516, -9.707131385803223, -8.98670768737793, -8.26628303527832, -7.545858860015869, -6.825435161590576, -6.105010986328125, -5.384587287902832, -4.664163112640381, -3.9437389373779297, -3.2233152389526367, -2.5028915405273438, -1.7824676036834717, -1.06204354763031, -0.34161949157714844, 0.37880444526672363, 1.0992283821105957, 1.8196525573730469, 2.54007625579834, 3.260500431060791, 3.980924367904663, 4.701348304748535, 5.421772480010986, 6.1421966552734375, 6.8626203536987305, 7.583044528961182, 8.303468704223633, 9.023893356323242, 9.744317054748535, 10.464741706848145, 11.185165405273438, 11.90558910369873, 12.626012802124023, 13.346437454223633, 14.066861152648926, 14.787284851074219, 15.507708549499512, 16.228132247924805, 16.948556900024414, 17.668981552124023, 18.389404296875, 19.10982894897461, 19.83025360107422, 20.550678253173828, 21.271102905273438, 21.991525650024414, 22.711950302124023, 23.432374954223633, 24.15279769897461, 24.87322235107422, 25.593647003173828, 26.314069747924805, 27.034494400024414, 27.75491714477539, 28.475341796875, 29.19576644897461, 29.916189193725586, 30.636613845825195, 31.357036590576172, 32.07746124267578]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 2.0, 7.0, 10.0, 17.0, 13.0, 21.0, 21.0, 20.0, 26.0, 27.0, 37.0, 41.0, 39.0, 40.0, 32.0, 45.0, 41.0, 45.0, 37.0, 42.0, 35.0, 32.0, 36.0, 42.0, 34.0, 31.0, 36.0, 25.0, 28.0, 21.0, 24.0, 17.0, 15.0, 13.0, 8.0, 2.0, 3.0, 7.0, 3.0, 10.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.819750785827637, -5.639033794403076, -5.458316802978516, -5.277599811553955, -5.0968828201293945, -4.916165351867676, -4.735448360443115, -4.554731369018555, -4.374014377593994, -4.193297386169434, -4.012580394744873, -3.8318631649017334, -3.651146173477173, -3.4704291820526123, -3.2897119522094727, -3.108994960784912, -2.9282779693603516, -2.747560977935791, -2.5668439865112305, -2.386126756668091, -2.2054097652435303, -2.0246927738189697, -1.8439756631851196, -1.6632585525512695, -1.482541561126709, -1.3018245697021484, -1.1211074590682983, -0.940390408039093, -0.7596733570098877, -0.5789563059806824, -0.39823925495147705, -0.21752214431762695, -0.036805152893066406, 0.14391189813613892, 0.32462894916534424, 0.5053460001945496, 0.6860630512237549, 0.8667801022529602, 1.0474971532821655, 1.2282142639160156, 1.4089312553405762, 1.5896482467651367, 1.7703653573989868, 1.951082468032837, 2.1317994594573975, 2.312516450881958, 2.4932336807250977, 2.673950672149658, 2.8546676635742188, 3.0353846549987793, 3.21610164642334, 3.3968188762664795, 3.57753586769104, 3.7582528591156006, 3.9389700889587402, 4.119687080383301, 4.300404071807861, 4.481121063232422, 4.661838054656982, 4.842555046081543, 5.023272514343262, 5.203989505767822, 5.384706497192383, 5.565423488616943, 5.746140480041504]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 9.0, 9.0, 10.0, 16.0, 29.0, 40.0, 48.0, 116.0, 703.0, 13273.0, 476633.0, 540746.0, 15820.0, 792.0, 133.0, 62.0, 45.0, 32.0, 26.0, 9.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.7734375, -12.3480224609375, -11.922607421875, -11.4971923828125, -11.07177734375, -10.6463623046875, -10.220947265625, -9.7955322265625, -9.3701171875, -8.9447021484375, -8.519287109375, -8.0938720703125, -7.66845703125, -7.2430419921875, -6.817626953125, -6.3922119140625, -5.966796875, -5.5413818359375, -5.115966796875, -4.6905517578125, -4.26513671875, -3.8397216796875, -3.414306640625, -2.9888916015625, -2.5634765625, -2.1380615234375, -1.712646484375, -1.2872314453125, -0.86181640625, -0.4364013671875, -0.010986328125, 0.4144287109375, 0.83984375, 1.2652587890625, 1.690673828125, 2.1160888671875, 2.54150390625, 2.9669189453125, 3.392333984375, 3.8177490234375, 4.2431640625, 4.6685791015625, 5.093994140625, 5.5194091796875, 5.94482421875, 6.3702392578125, 6.795654296875, 7.2210693359375, 7.646484375, 8.0718994140625, 8.497314453125, 8.9227294921875, 9.34814453125, 9.7735595703125, 10.198974609375, 10.6243896484375, 11.0498046875, 11.4752197265625, 11.900634765625, 12.3260498046875, 12.75146484375, 13.1768798828125, 13.602294921875, 14.0277099609375, 14.453125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 9.0, 9.0, 8.0, 9.0, 15.0, 16.0, 21.0, 38.0, 24.0, 53.0, 56.0, 53.0, 53.0, 56.0, 71.0, 68.0, 69.0, 56.0, 56.0, 58.0, 42.0, 45.0, 36.0, 20.0, 16.0, 18.0, 10.0, 6.0, 7.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.374267578125, -0.3565559387207031, -0.33884429931640625, -0.3211326599121094, -0.3034210205078125, -0.2857093811035156, -0.26799774169921875, -0.2502861022949219, -0.232574462890625, -0.21486282348632812, -0.19715118408203125, -0.17943954467773438, -0.1617279052734375, -0.14401626586914062, -0.12630462646484375, -0.10859298706054688, -0.09088134765625, -0.07316970825195312, -0.05545806884765625, -0.037746429443359375, -0.0200347900390625, -0.002323150634765625, 0.01538848876953125, 0.033100128173828125, 0.050811767578125, 0.06852340698242188, 0.08623504638671875, 0.10394668579101562, 0.1216583251953125, 0.13936996459960938, 0.15708160400390625, 0.17479324340820312, 0.1925048828125, 0.21021652221679688, 0.22792816162109375, 0.24563980102539062, 0.2633514404296875, 0.2810630798339844, 0.29877471923828125, 0.3164863586425781, 0.334197998046875, 0.3519096374511719, 0.36962127685546875, 0.3873329162597656, 0.4050445556640625, 0.4227561950683594, 0.44046783447265625, 0.4581794738769531, 0.47589111328125, 0.4936027526855469, 0.5113143920898438, 0.5290260314941406, 0.5467376708984375, 0.5644493103027344, 0.5821609497070312, 0.5998725891113281, 0.617584228515625, 0.6352958679199219, 0.6530075073242188, 0.6707191467285156, 0.6884307861328125, 0.7061424255371094, 0.7238540649414062, 0.7415657043457031, 0.75927734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 9.0, 2.0, 12.0, 13.0, 17.0, 30.0, 38.0, 60.0, 85.0, 124.0, 223.0, 348.0, 583.0, 1096.0, 2279.0, 5714.0, 18438.0, 71042.0, 274887.0, 442431.0, 169938.0, 41897.0, 11586.0, 3834.0, 1759.0, 783.0, 475.0, 292.0, 176.0, 116.0, 92.0, 58.0, 32.0, 14.0, 19.0, 11.0, 9.0, 6.0, 6.0, 6.0, 3.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.1640625, -5.009033203125, -4.85400390625, -4.698974609375, -4.5439453125, -4.388916015625, -4.23388671875, -4.078857421875, -3.923828125, -3.768798828125, -3.61376953125, -3.458740234375, -3.3037109375, -3.148681640625, -2.99365234375, -2.838623046875, -2.68359375, -2.528564453125, -2.37353515625, -2.218505859375, -2.0634765625, -1.908447265625, -1.75341796875, -1.598388671875, -1.443359375, -1.288330078125, -1.13330078125, -0.978271484375, -0.8232421875, -0.668212890625, -0.51318359375, -0.358154296875, -0.203125, -0.048095703125, 0.10693359375, 0.261962890625, 0.4169921875, 0.572021484375, 0.72705078125, 0.882080078125, 1.037109375, 1.192138671875, 1.34716796875, 1.502197265625, 1.6572265625, 1.812255859375, 1.96728515625, 2.122314453125, 2.27734375, 2.432373046875, 2.58740234375, 2.742431640625, 2.8974609375, 3.052490234375, 3.20751953125, 3.362548828125, 3.517578125, 3.672607421875, 3.82763671875, 3.982666015625, 4.1376953125, 4.292724609375, 4.44775390625, 4.602783203125, 4.7578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 6.0, 8.0, 6.0, 6.0, 7.0, 8.0, 11.0, 12.0, 17.0, 18.0, 22.0, 20.0, 21.0, 22.0, 19.0, 27.0, 37.0, 36.0, 27.0, 30.0, 40.0, 36.0, 33.0, 40.0, 42.0, 38.0, 38.0, 44.0, 36.0, 37.0, 30.0, 28.0, 27.0, 27.0, 23.0, 9.0, 16.0, 14.0, 14.0, 11.0, 6.0, 12.0, 12.0, 5.0, 3.0, 4.0, 4.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-2.072265625, -2.005859375, -1.939453125, -1.873046875, -1.806640625, -1.740234375, -1.673828125, -1.607421875, -1.541015625, -1.474609375, -1.408203125, -1.341796875, -1.275390625, -1.208984375, -1.142578125, -1.076171875, -1.009765625, -0.943359375, -0.876953125, -0.810546875, -0.744140625, -0.677734375, -0.611328125, -0.544921875, -0.478515625, -0.412109375, -0.345703125, -0.279296875, -0.212890625, -0.146484375, -0.080078125, -0.013671875, 0.052734375, 0.119140625, 0.185546875, 0.251953125, 0.318359375, 0.384765625, 0.451171875, 0.517578125, 0.583984375, 0.650390625, 0.716796875, 0.783203125, 0.849609375, 0.916015625, 0.982421875, 1.048828125, 1.115234375, 1.181640625, 1.248046875, 1.314453125, 1.380859375, 1.447265625, 1.513671875, 1.580078125, 1.646484375, 1.712890625, 1.779296875, 1.845703125, 1.912109375, 1.978515625, 2.044921875, 2.111328125, 2.177734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 12.0, 25.0, 22.0, 36.0, 57.0, 91.0, 153.0, 264.0, 406.0, 690.0, 1160.0, 2163.0, 4595.0, 10497.0, 27973.0, 85919.0, 292310.0, 409056.0, 141554.0, 42862.0, 15678.0, 6417.0, 2983.0, 1488.0, 850.0, 484.0, 290.0, 182.0, 107.0, 66.0, 51.0, 38.0, 15.0, 11.0, 15.0, 7.0, 6.0, 2.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.2933349609375, -2.205810546875, -2.1182861328125, -2.03076171875, -1.9432373046875, -1.855712890625, -1.7681884765625, -1.6806640625, -1.5931396484375, -1.505615234375, -1.4180908203125, -1.33056640625, -1.2430419921875, -1.155517578125, -1.0679931640625, -0.98046875, -0.8929443359375, -0.805419921875, -0.7178955078125, -0.63037109375, -0.5428466796875, -0.455322265625, -0.3677978515625, -0.2802734375, -0.1927490234375, -0.105224609375, -0.0177001953125, 0.06982421875, 0.1573486328125, 0.244873046875, 0.3323974609375, 0.419921875, 0.5074462890625, 0.594970703125, 0.6824951171875, 0.77001953125, 0.8575439453125, 0.945068359375, 1.0325927734375, 1.1201171875, 1.2076416015625, 1.295166015625, 1.3826904296875, 1.47021484375, 1.5577392578125, 1.645263671875, 1.7327880859375, 1.8203125, 1.9078369140625, 1.995361328125, 2.0828857421875, 2.17041015625, 2.2579345703125, 2.345458984375, 2.4329833984375, 2.5205078125, 2.6080322265625, 2.695556640625, 2.7830810546875, 2.87060546875, 2.9581298828125, 3.045654296875, 3.1331787109375, 3.220703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 6.0, 2.0, 5.0, 6.0, 8.0, 7.0, 17.0, 19.0, 21.0, 30.0, 38.0, 43.0, 40.0, 65.0, 87.0, 80.0, 100.0, 95.0, 52.0, 69.0, 44.0, 44.0, 23.0, 22.0, 20.0, 13.0, 13.0, 9.0, 14.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00041484832763671875, -0.0004010796546936035, -0.0003873109817504883, -0.00037354230880737305, -0.0003597736358642578, -0.0003460049629211426, -0.00033223628997802734, -0.0003184676170349121, -0.0003046989440917969, -0.00029093027114868164, -0.0002771615982055664, -0.00026339292526245117, -0.00024962425231933594, -0.0002358555793762207, -0.00022208690643310547, -0.00020831823348999023, -0.000194549560546875, -0.00018078088760375977, -0.00016701221466064453, -0.0001532435417175293, -0.00013947486877441406, -0.00012570619583129883, -0.0001119375228881836, -9.816884994506836e-05, -8.440017700195312e-05, -7.063150405883789e-05, -5.6862831115722656e-05, -4.309415817260742e-05, -2.9325485229492188e-05, -1.5556812286376953e-05, -1.7881393432617188e-06, 1.1980533599853516e-05, 2.574920654296875e-05, 3.9517879486083984e-05, 5.328655242919922e-05, 6.705522537231445e-05, 8.082389831542969e-05, 9.459257125854492e-05, 0.00010836124420166016, 0.0001221299171447754, 0.00013589859008789062, 0.00014966726303100586, 0.0001634359359741211, 0.00017720460891723633, 0.00019097328186035156, 0.0002047419548034668, 0.00021851062774658203, 0.00023227930068969727, 0.0002460479736328125, 0.00025981664657592773, 0.00027358531951904297, 0.0002873539924621582, 0.00030112266540527344, 0.00031489133834838867, 0.0003286600112915039, 0.00034242868423461914, 0.0003561973571777344, 0.0003699660301208496, 0.00038373470306396484, 0.0003975033760070801, 0.0004112720489501953, 0.00042504072189331055, 0.0004388093948364258, 0.000452578067779541, 0.00046634674072265625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 10.0, 15.0, 15.0, 34.0, 30.0, 56.0, 96.0, 113.0, 177.0, 289.0, 463.0, 720.0, 1396.0, 2859.0, 6480.0, 17331.0, 57241.0, 255268.0, 505944.0, 142465.0, 35827.0, 11734.0, 4897.0, 2260.0, 1158.0, 629.0, 390.0, 233.0, 117.0, 99.0, 62.0, 44.0, 31.0, 23.0, 16.0, 11.0, 3.0, 2.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.046875, -2.93927001953125, -2.8316650390625, -2.72406005859375, -2.616455078125, -2.50885009765625, -2.4012451171875, -2.29364013671875, -2.18603515625, -2.07843017578125, -1.9708251953125, -1.86322021484375, -1.755615234375, -1.64801025390625, -1.5404052734375, -1.43280029296875, -1.3251953125, -1.21759033203125, -1.1099853515625, -1.00238037109375, -0.894775390625, -0.78717041015625, -0.6795654296875, -0.57196044921875, -0.46435546875, -0.35675048828125, -0.2491455078125, -0.14154052734375, -0.033935546875, 0.07366943359375, 0.1812744140625, 0.28887939453125, 0.396484375, 0.50408935546875, 0.6116943359375, 0.71929931640625, 0.826904296875, 0.93450927734375, 1.0421142578125, 1.14971923828125, 1.25732421875, 1.36492919921875, 1.4725341796875, 1.58013916015625, 1.687744140625, 1.79534912109375, 1.9029541015625, 2.01055908203125, 2.1181640625, 2.22576904296875, 2.3333740234375, 2.44097900390625, 2.548583984375, 2.65618896484375, 2.7637939453125, 2.87139892578125, 2.97900390625, 3.08660888671875, 3.1942138671875, 3.30181884765625, 3.409423828125, 3.51702880859375, 3.6246337890625, 3.73223876953125, 3.83984375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 3.0, 6.0, 3.0, 6.0, 20.0, 14.0, 19.0, 22.0, 42.0, 37.0, 41.0, 47.0, 62.0, 84.0, 78.0, 76.0, 78.0, 69.0, 59.0, 52.0, 39.0, 31.0, 26.0, 18.0, 14.0, 8.0, 11.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.978515625, -1.91253662109375, -1.8465576171875, -1.78057861328125, -1.714599609375, -1.64862060546875, -1.5826416015625, -1.51666259765625, -1.45068359375, -1.38470458984375, -1.3187255859375, -1.25274658203125, -1.186767578125, -1.12078857421875, -1.0548095703125, -0.98883056640625, -0.9228515625, -0.85687255859375, -0.7908935546875, -0.72491455078125, -0.658935546875, -0.59295654296875, -0.5269775390625, -0.46099853515625, -0.39501953125, -0.32904052734375, -0.2630615234375, -0.19708251953125, -0.131103515625, -0.06512451171875, 0.0008544921875, 0.06683349609375, 0.1328125, 0.19879150390625, 0.2647705078125, 0.33074951171875, 0.396728515625, 0.46270751953125, 0.5286865234375, 0.59466552734375, 0.66064453125, 0.72662353515625, 0.7926025390625, 0.85858154296875, 0.924560546875, 0.99053955078125, 1.0565185546875, 1.12249755859375, 1.1884765625, 1.25445556640625, 1.3204345703125, 1.38641357421875, 1.452392578125, 1.51837158203125, 1.5843505859375, 1.65032958984375, 1.71630859375, 1.78228759765625, 1.8482666015625, 1.91424560546875, 1.980224609375, 2.04620361328125, 2.1121826171875, 2.17816162109375, 2.244140625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 17.0, 33.0, 62.0, 121.0, 177.0, 188.0, 170.0, 97.0, 52.0, 39.0, 15.0, 15.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.295928955078125, -26.82982635498047, -25.363725662231445, -23.897624969482422, -22.431522369384766, -20.96541976928711, -19.499319076538086, -18.033218383789062, -16.567115783691406, -15.101014137268066, -13.634912490844727, -12.168810844421387, -10.702709197998047, -9.236607551574707, -7.770505905151367, -6.304404258728027, -4.8383026123046875, -3.3722009658813477, -1.9060993194580078, -0.43999767303466797, 1.0261039733886719, 2.4922056198120117, 3.9583072662353516, 5.424408912658691, 6.890510559082031, 8.356612205505371, 9.822713851928711, 11.28881549835205, 12.75491714477539, 14.22101879119873, 15.68712043762207, 17.153221130371094, 18.61932373046875, 20.085426330566406, 21.55152702331543, 23.017627716064453, 24.48373031616211, 25.949832916259766, 27.41593360900879, 28.882034301757812, 30.34813690185547, 31.814239501953125, 33.28034210205078, 34.74644088745117, 36.21254348754883, 37.678646087646484, 39.144744873046875, 40.61084747314453, 42.07695007324219, 43.543052673339844, 45.0091552734375, 46.47525405883789, 47.94135665893555, 49.4074592590332, 50.873558044433594, 52.33966064453125, 53.805763244628906, 55.27186584472656, 56.73796844482422, 58.20406723022461, 59.670169830322266, 61.13627243041992, 62.60237121582031, 64.06847381591797, 65.53457641601562]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 7.0, 11.0, 8.0, 6.0, 9.0, 14.0, 23.0, 19.0, 29.0, 28.0, 36.0, 30.0, 31.0, 52.0, 53.0, 45.0, 50.0, 57.0, 48.0, 41.0, 40.0, 55.0, 36.0, 47.0, 39.0, 28.0, 20.0, 25.0, 28.0, 19.0, 15.0, 12.0, 8.0, 11.0, 4.0, 5.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.125003814697266, -18.578582763671875, -18.032161712646484, -17.485740661621094, -16.939319610595703, -16.392898559570312, -15.846477508544922, -15.300056457519531, -14.75363540649414, -14.20721435546875, -13.66079330444336, -13.114372253417969, -12.567951202392578, -12.021530151367188, -11.475109100341797, -10.928688049316406, -10.382266998291016, -9.835845947265625, -9.289424896240234, -8.743003845214844, -8.196582794189453, -7.6501617431640625, -7.103740692138672, -6.557319641113281, -6.010898590087891, -5.4644775390625, -4.918056488037109, -4.371635437011719, -3.825214385986328, -3.2787933349609375, -2.732372283935547, -2.1859512329101562, -1.639531135559082, -1.0931100845336914, -0.5466890335083008, -0.00026798248291015625, 0.5461530685424805, 1.092574119567871, 1.6389951705932617, 2.1854162216186523, 2.731837272644043, 3.2782583236694336, 3.824679374694824, 4.371100425720215, 4.9175214767456055, 5.463942527770996, 6.010363578796387, 6.556784629821777, 7.103205680847168, 7.649626731872559, 8.19604778289795, 8.74246883392334, 9.28888988494873, 9.835310935974121, 10.381731986999512, 10.928153038024902, 11.474574089050293, 12.020995140075684, 12.567416191101074, 13.113837242126465, 13.660258293151855, 14.206679344177246, 14.753100395202637, 15.299521446228027, 15.845942497253418]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 6.0, 6.0, 9.0, 6.0, 5.0, 9.0, 11.0, 14.0, 11.0, 12.0, 34.0, 62.0, 151.0, 434.0, 1911.0, 13018.0, 227946.0, 3845832.0, 95668.0, 7452.0, 1189.0, 281.0, 112.0, 51.0, 21.0, 20.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.6484375, -15.318115234375, -14.98779296875, -14.657470703125, -14.3271484375, -13.996826171875, -13.66650390625, -13.336181640625, -13.005859375, -12.675537109375, -12.34521484375, -12.014892578125, -11.6845703125, -11.354248046875, -11.02392578125, -10.693603515625, -10.36328125, -10.032958984375, -9.70263671875, -9.372314453125, -9.0419921875, -8.711669921875, -8.38134765625, -8.051025390625, -7.720703125, -7.390380859375, -7.06005859375, -6.729736328125, -6.3994140625, -6.069091796875, -5.73876953125, -5.408447265625, -5.078125, -4.747802734375, -4.41748046875, -4.087158203125, -3.7568359375, -3.426513671875, -3.09619140625, -2.765869140625, -2.435546875, -2.105224609375, -1.77490234375, -1.444580078125, -1.1142578125, -0.783935546875, -0.45361328125, -0.123291015625, 0.20703125, 0.537353515625, 0.86767578125, 1.197998046875, 1.5283203125, 1.858642578125, 2.18896484375, 2.519287109375, 2.849609375, 3.179931640625, 3.51025390625, 3.840576171875, 4.1708984375, 4.501220703125, 4.83154296875, 5.161865234375, 5.4921875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 4.0, 6.0, 5.0, 11.0, 14.0, 13.0, 15.0, 15.0, 24.0, 27.0, 31.0, 33.0, 29.0, 43.0, 48.0, 49.0, 49.0, 54.0, 39.0, 47.0, 50.0, 67.0, 49.0, 40.0, 34.0, 43.0, 28.0, 24.0, 20.0, 18.0, 25.0, 12.0, 12.0, 12.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.560546875, -0.5463600158691406, -0.5321731567382812, -0.5179862976074219, -0.5037994384765625, -0.4896125793457031, -0.47542572021484375, -0.4612388610839844, -0.447052001953125, -0.4328651428222656, -0.41867828369140625, -0.4044914245605469, -0.3903045654296875, -0.3761177062988281, -0.36193084716796875, -0.3477439880371094, -0.33355712890625, -0.3193702697753906, -0.30518341064453125, -0.2909965515136719, -0.2768096923828125, -0.2626228332519531, -0.24843597412109375, -0.23424911499023438, -0.220062255859375, -0.20587539672851562, -0.19168853759765625, -0.17750167846679688, -0.1633148193359375, -0.14912796020507812, -0.13494110107421875, -0.12075424194335938, -0.1065673828125, -0.09238052368164062, -0.07819366455078125, -0.06400680541992188, -0.0498199462890625, -0.035633087158203125, -0.02144622802734375, -0.007259368896484375, 0.006927490234375, 0.021114349365234375, 0.03530120849609375, 0.049488067626953125, 0.0636749267578125, 0.07786178588867188, 0.09204864501953125, 0.10623550415039062, 0.12042236328125, 0.13460922241210938, 0.14879608154296875, 0.16298294067382812, 0.1771697998046875, 0.19135665893554688, 0.20554351806640625, 0.21973037719726562, 0.233917236328125, 0.24810409545898438, 0.26229095458984375, 0.2764778137207031, 0.2906646728515625, 0.3048515319824219, 0.31903839111328125, 0.3332252502441406, 0.347412109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 7.0, 7.0, 9.0, 13.0, 10.0, 29.0, 31.0, 48.0, 87.0, 125.0, 255.0, 497.0, 1093.0, 2919.0, 10192.0, 58669.0, 1557416.0, 2474844.0, 71109.0, 11602.0, 3139.0, 1142.0, 425.0, 243.0, 131.0, 76.0, 53.0, 40.0, 22.0, 26.0, 12.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5, -10.1617431640625, -9.823486328125, -9.4852294921875, -9.14697265625, -8.8087158203125, -8.470458984375, -8.1322021484375, -7.7939453125, -7.4556884765625, -7.117431640625, -6.7791748046875, -6.44091796875, -6.1026611328125, -5.764404296875, -5.4261474609375, -5.087890625, -4.7496337890625, -4.411376953125, -4.0731201171875, -3.73486328125, -3.3966064453125, -3.058349609375, -2.7200927734375, -2.3818359375, -2.0435791015625, -1.705322265625, -1.3670654296875, -1.02880859375, -0.6905517578125, -0.352294921875, -0.0140380859375, 0.32421875, 0.6624755859375, 1.000732421875, 1.3389892578125, 1.67724609375, 2.0155029296875, 2.353759765625, 2.6920166015625, 3.0302734375, 3.3685302734375, 3.706787109375, 4.0450439453125, 4.38330078125, 4.7215576171875, 5.059814453125, 5.3980712890625, 5.736328125, 6.0745849609375, 6.412841796875, 6.7510986328125, 7.08935546875, 7.4276123046875, 7.765869140625, 8.1041259765625, 8.4423828125, 8.7806396484375, 9.118896484375, 9.4571533203125, 9.79541015625, 10.1336669921875, 10.471923828125, 10.8101806640625, 11.1484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 14.0, 16.0, 40.0, 56.0, 107.0, 188.0, 396.0, 1280.0, 1143.0, 429.0, 177.0, 103.0, 46.0, 42.0, 18.0, 9.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.265625, -2.14617919921875, -2.0267333984375, -1.90728759765625, -1.787841796875, -1.66839599609375, -1.5489501953125, -1.42950439453125, -1.31005859375, -1.19061279296875, -1.0711669921875, -0.95172119140625, -0.832275390625, -0.71282958984375, -0.5933837890625, -0.47393798828125, -0.3544921875, -0.23504638671875, -0.1156005859375, 0.00384521484375, 0.123291015625, 0.24273681640625, 0.3621826171875, 0.48162841796875, 0.60107421875, 0.72052001953125, 0.8399658203125, 0.95941162109375, 1.078857421875, 1.19830322265625, 1.3177490234375, 1.43719482421875, 1.556640625, 1.67608642578125, 1.7955322265625, 1.91497802734375, 2.034423828125, 2.15386962890625, 2.2733154296875, 2.39276123046875, 2.51220703125, 2.63165283203125, 2.7510986328125, 2.87054443359375, 2.989990234375, 3.10943603515625, 3.2288818359375, 3.34832763671875, 3.4677734375, 3.58721923828125, 3.7066650390625, 3.82611083984375, 3.945556640625, 4.06500244140625, 4.1844482421875, 4.30389404296875, 4.42333984375, 4.54278564453125, 4.6622314453125, 4.78167724609375, 4.901123046875, 5.02056884765625, 5.1400146484375, 5.25946044921875, 5.37890625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 5.0, 34.0, 87.0, 233.0, 330.0, 200.0, 74.0, 22.0, 7.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.905662536621094, -25.269758224487305, -23.633853912353516, -21.99795150756836, -20.362045288085938, -18.72614288330078, -17.090238571166992, -15.454334259033203, -13.818429946899414, -12.182525634765625, -10.546621322631836, -8.910717964172363, -7.274813652038574, -5.638909339904785, -4.0030059814453125, -2.3671016693115234, -0.7311973571777344, 0.9047067165374756, 2.5406107902526855, 4.176514625549316, 5.8124189376831055, 7.4483232498168945, 9.084226608276367, 10.720130920410156, 12.356035232543945, 13.991939544677734, 15.627843856811523, 17.263748168945312, 18.89965057373047, 20.53555679321289, 22.171459197998047, 23.807363510131836, 25.443267822265625, 27.079172134399414, 28.715076446533203, 30.35097885131836, 31.98688507080078, 33.62278747558594, 35.258689880371094, 36.894596099853516, 38.53050231933594, 40.166404724121094, 41.802310943603516, 43.43821334838867, 45.074119567871094, 46.71002197265625, 48.345924377441406, 49.98183059692383, 51.617733001708984, 53.25363540649414, 54.88954162597656, 56.52544403076172, 58.16135025024414, 59.7972526550293, 61.43315887451172, 63.069061279296875, 64.70496368408203, 66.34086608886719, 67.97676849365234, 69.61267852783203, 71.24858093261719, 72.88448333740234, 74.5203857421875, 76.15629577636719, 77.79219818115234]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 9.0, 11.0, 8.0, 13.0, 15.0, 23.0, 27.0, 33.0, 37.0, 36.0, 48.0, 39.0, 57.0, 50.0, 52.0, 56.0, 48.0, 38.0, 47.0, 45.0, 43.0, 42.0, 47.0, 39.0, 33.0, 23.0, 23.0, 14.0, 9.0, 9.0, 7.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.589573860168457, -11.28075885772705, -10.971942901611328, -10.663127899169922, -10.354312896728516, -10.045496940612793, -9.736681938171387, -9.427865982055664, -9.119050979614258, -8.810235977172852, -8.501420021057129, -8.192605018615723, -7.883789539337158, -7.574974060058594, -7.2661590576171875, -6.957343578338623, -6.648528099060059, -6.339712619781494, -6.03089714050293, -5.722082138061523, -5.413266658782959, -5.1044511795043945, -4.795636177062988, -4.486820697784424, -4.178005218505859, -3.869189739227295, -3.5603744983673096, -3.251559257507324, -2.9427437782287598, -2.6339282989501953, -2.32511305809021, -2.0162978172302246, -1.7074823379516602, -1.3986669778823853, -1.0898516178131104, -0.7810362577438354, -0.47222089767456055, -0.16340553760528564, 0.14540982246398926, 0.4542250633239746, 0.7630405426025391, 1.071855902671814, 1.3806712627410889, 1.6894866228103638, 1.9983019828796387, 2.307117462158203, 2.6159327030181885, 2.924747943878174, 3.2335634231567383, 3.5423789024353027, 3.851194143295288, 4.160009384155273, 4.468824863433838, 4.777640342712402, 5.086455345153809, 5.395270824432373, 5.7040863037109375, 6.012901782989502, 6.321717262268066, 6.630532264709473, 6.939347743988037, 7.248163223266602, 7.556978225708008, 7.865793704986572, 8.174609184265137]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 7.0, 12.0, 12.0, 15.0, 18.0, 22.0, 38.0, 52.0, 84.0, 126.0, 242.0, 445.0, 760.0, 1623.0, 3872.0, 10583.0, 33664.0, 112431.0, 325874.0, 362582.0, 134986.0, 40279.0, 12359.0, 4555.0, 1914.0, 858.0, 464.0, 237.0, 166.0, 84.0, 55.0, 41.0, 23.0, 22.0, 15.0, 8.0, 10.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.87109375, -3.73321533203125, -3.5953369140625, -3.45745849609375, -3.319580078125, -3.18170166015625, -3.0438232421875, -2.90594482421875, -2.76806640625, -2.63018798828125, -2.4923095703125, -2.35443115234375, -2.216552734375, -2.07867431640625, -1.9407958984375, -1.80291748046875, -1.6650390625, -1.52716064453125, -1.3892822265625, -1.25140380859375, -1.113525390625, -0.97564697265625, -0.8377685546875, -0.69989013671875, -0.56201171875, -0.42413330078125, -0.2862548828125, -0.14837646484375, -0.010498046875, 0.12738037109375, 0.2652587890625, 0.40313720703125, 0.541015625, 0.67889404296875, 0.8167724609375, 0.95465087890625, 1.092529296875, 1.23040771484375, 1.3682861328125, 1.50616455078125, 1.64404296875, 1.78192138671875, 1.9197998046875, 2.05767822265625, 2.195556640625, 2.33343505859375, 2.4713134765625, 2.60919189453125, 2.7470703125, 2.88494873046875, 3.0228271484375, 3.16070556640625, 3.298583984375, 3.43646240234375, 3.5743408203125, 3.71221923828125, 3.85009765625, 3.98797607421875, 4.1258544921875, 4.26373291015625, 4.401611328125, 4.53948974609375, 4.6773681640625, 4.81524658203125, 4.953125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 5.0, 2.0, 4.0, 13.0, 8.0, 12.0, 18.0, 15.0, 19.0, 23.0, 26.0, 33.0, 41.0, 45.0, 43.0, 59.0, 55.0, 55.0, 42.0, 61.0, 68.0, 46.0, 39.0, 39.0, 27.0, 46.0, 26.0, 29.0, 18.0, 23.0, 18.0, 21.0, 10.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.5570068359375, -0.539306640625, -0.5216064453125, -0.50390625, -0.4862060546875, -0.468505859375, -0.4508056640625, -0.43310546875, -0.4154052734375, -0.397705078125, -0.3800048828125, -0.3623046875, -0.3446044921875, -0.326904296875, -0.3092041015625, -0.29150390625, -0.2738037109375, -0.256103515625, -0.2384033203125, -0.220703125, -0.2030029296875, -0.185302734375, -0.1676025390625, -0.14990234375, -0.1322021484375, -0.114501953125, -0.0968017578125, -0.0791015625, -0.0614013671875, -0.043701171875, -0.0260009765625, -0.00830078125, 0.0093994140625, 0.027099609375, 0.0447998046875, 0.0625, 0.0802001953125, 0.097900390625, 0.1156005859375, 0.13330078125, 0.1510009765625, 0.168701171875, 0.1864013671875, 0.2041015625, 0.2218017578125, 0.239501953125, 0.2572021484375, 0.27490234375, 0.2926025390625, 0.310302734375, 0.3280029296875, 0.345703125, 0.3634033203125, 0.381103515625, 0.3988037109375, 0.41650390625, 0.4342041015625, 0.451904296875, 0.4696044921875, 0.4873046875, 0.5050048828125, 0.522705078125, 0.5404052734375, 0.55810546875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 8.0, 14.0, 18.0, 13.0, 31.0, 44.0, 56.0, 84.0, 121.0, 174.0, 297.0, 533.0, 1044.0, 2227.0, 5792.0, 16363.0, 51736.0, 159754.0, 372531.0, 286491.0, 101071.0, 31885.0, 10646.0, 3958.0, 1703.0, 770.0, 405.0, 260.0, 160.0, 103.0, 82.0, 50.0, 52.0, 24.0, 21.0, 8.0, 13.0, 8.0, 0.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03125, -3.9083251953125, -3.785400390625, -3.6624755859375, -3.53955078125, -3.4166259765625, -3.293701171875, -3.1707763671875, -3.0478515625, -2.9249267578125, -2.802001953125, -2.6790771484375, -2.55615234375, -2.4332275390625, -2.310302734375, -2.1873779296875, -2.064453125, -1.9415283203125, -1.818603515625, -1.6956787109375, -1.57275390625, -1.4498291015625, -1.326904296875, -1.2039794921875, -1.0810546875, -0.9581298828125, -0.835205078125, -0.7122802734375, -0.58935546875, -0.4664306640625, -0.343505859375, -0.2205810546875, -0.09765625, 0.0252685546875, 0.148193359375, 0.2711181640625, 0.39404296875, 0.5169677734375, 0.639892578125, 0.7628173828125, 0.8857421875, 1.0086669921875, 1.131591796875, 1.2545166015625, 1.37744140625, 1.5003662109375, 1.623291015625, 1.7462158203125, 1.869140625, 1.9920654296875, 2.114990234375, 2.2379150390625, 2.36083984375, 2.4837646484375, 2.606689453125, 2.7296142578125, 2.8525390625, 2.9754638671875, 3.098388671875, 3.2213134765625, 3.34423828125, 3.4671630859375, 3.590087890625, 3.7130126953125, 3.8359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 7.0, 6.0, 6.0, 5.0, 11.0, 8.0, 10.0, 17.0, 17.0, 18.0, 11.0, 27.0, 27.0, 33.0, 36.0, 25.0, 39.0, 38.0, 39.0, 47.0, 36.0, 62.0, 32.0, 40.0, 38.0, 25.0, 39.0, 36.0, 31.0, 33.0, 41.0, 18.0, 21.0, 18.0, 20.0, 19.0, 9.0, 11.0, 13.0, 8.0, 6.0, 2.0, 4.0, 8.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-2.646484375, -2.57318115234375, -2.4998779296875, -2.42657470703125, -2.353271484375, -2.27996826171875, -2.2066650390625, -2.13336181640625, -2.06005859375, -1.98675537109375, -1.9134521484375, -1.84014892578125, -1.766845703125, -1.69354248046875, -1.6202392578125, -1.54693603515625, -1.4736328125, -1.40032958984375, -1.3270263671875, -1.25372314453125, -1.180419921875, -1.10711669921875, -1.0338134765625, -0.96051025390625, -0.88720703125, -0.81390380859375, -0.7406005859375, -0.66729736328125, -0.593994140625, -0.52069091796875, -0.4473876953125, -0.37408447265625, -0.30078125, -0.22747802734375, -0.1541748046875, -0.08087158203125, -0.007568359375, 0.06573486328125, 0.1390380859375, 0.21234130859375, 0.28564453125, 0.35894775390625, 0.4322509765625, 0.50555419921875, 0.578857421875, 0.65216064453125, 0.7254638671875, 0.79876708984375, 0.8720703125, 0.94537353515625, 1.0186767578125, 1.09197998046875, 1.165283203125, 1.23858642578125, 1.3118896484375, 1.38519287109375, 1.45849609375, 1.53179931640625, 1.6051025390625, 1.67840576171875, 1.751708984375, 1.82501220703125, 1.8983154296875, 1.97161865234375, 2.044921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 9.0, 14.0, 19.0, 18.0, 31.0, 61.0, 108.0, 181.0, 317.0, 690.0, 1410.0, 3285.0, 9556.0, 45504.0, 478179.0, 450931.0, 43017.0, 9380.0, 3092.0, 1318.0, 662.0, 299.0, 176.0, 98.0, 45.0, 39.0, 37.0, 25.0, 9.0, 6.0, 7.0, 6.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.51953125, -4.3580322265625, -4.196533203125, -4.0350341796875, -3.87353515625, -3.7120361328125, -3.550537109375, -3.3890380859375, -3.2275390625, -3.0660400390625, -2.904541015625, -2.7430419921875, -2.58154296875, -2.4200439453125, -2.258544921875, -2.0970458984375, -1.935546875, -1.7740478515625, -1.612548828125, -1.4510498046875, -1.28955078125, -1.1280517578125, -0.966552734375, -0.8050537109375, -0.6435546875, -0.4820556640625, -0.320556640625, -0.1590576171875, 0.00244140625, 0.1639404296875, 0.325439453125, 0.4869384765625, 0.6484375, 0.8099365234375, 0.971435546875, 1.1329345703125, 1.29443359375, 1.4559326171875, 1.617431640625, 1.7789306640625, 1.9404296875, 2.1019287109375, 2.263427734375, 2.4249267578125, 2.58642578125, 2.7479248046875, 2.909423828125, 3.0709228515625, 3.232421875, 3.3939208984375, 3.555419921875, 3.7169189453125, 3.87841796875, 4.0399169921875, 4.201416015625, 4.3629150390625, 4.5244140625, 4.6859130859375, 4.847412109375, 5.0089111328125, 5.17041015625, 5.3319091796875, 5.493408203125, 5.6549072265625, 5.81640625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 8.0, 10.0, 9.0, 11.0, 19.0, 27.0, 32.0, 54.0, 85.0, 156.0, 199.0, 140.0, 78.0, 52.0, 31.0, 18.0, 21.0, 19.0, 11.0, 9.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006098747253417969, -0.0005884021520614624, -0.0005669295787811279, -0.0005454570055007935, -0.000523984432220459, -0.0005025118589401245, -0.00048103928565979004, -0.00045956671237945557, -0.0004380941390991211, -0.0004166215658187866, -0.00039514899253845215, -0.0003736764192581177, -0.0003522038459777832, -0.00033073127269744873, -0.00030925869941711426, -0.0002877861261367798, -0.0002663135528564453, -0.00024484097957611084, -0.00022336840629577637, -0.0002018958330154419, -0.00018042325973510742, -0.00015895068645477295, -0.00013747811317443848, -0.000116005539894104, -9.453296661376953e-05, -7.306039333343506e-05, -5.1587820053100586e-05, -3.0115246772766113e-05, -8.64267349243164e-06, 1.2829899787902832e-05, 3.4302473068237305e-05, 5.577504634857178e-05, 7.724761962890625e-05, 9.872019290924072e-05, 0.0001201927661895752, 0.00014166533946990967, 0.00016313791275024414, 0.0001846104860305786, 0.00020608305931091309, 0.00022755563259124756, 0.00024902820587158203, 0.0002705007791519165, 0.000291973352432251, 0.00031344592571258545, 0.0003349184989929199, 0.0003563910722732544, 0.00037786364555358887, 0.00039933621883392334, 0.0004208087921142578, 0.0004422813653945923, 0.00046375393867492676, 0.00048522651195526123, 0.0005066990852355957, 0.0005281716585159302, 0.0005496442317962646, 0.0005711168050765991, 0.0005925893783569336, 0.0006140619516372681, 0.0006355345249176025, 0.000657007098197937, 0.0006784796714782715, 0.000699952244758606, 0.0007214248180389404, 0.0007428973913192749, 0.0007643699645996094]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 9.0, 11.0, 26.0, 44.0, 63.0, 106.0, 209.0, 392.0, 724.0, 1659.0, 4141.0, 14596.0, 97438.0, 711587.0, 186125.0, 21978.0, 5590.0, 2019.0, 865.0, 419.0, 206.0, 139.0, 70.0, 40.0, 31.0, 20.0, 14.0, 2.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.41015625, -5.2335205078125, -5.056884765625, -4.8802490234375, -4.70361328125, -4.5269775390625, -4.350341796875, -4.1737060546875, -3.9970703125, -3.8204345703125, -3.643798828125, -3.4671630859375, -3.29052734375, -3.1138916015625, -2.937255859375, -2.7606201171875, -2.583984375, -2.4073486328125, -2.230712890625, -2.0540771484375, -1.87744140625, -1.7008056640625, -1.524169921875, -1.3475341796875, -1.1708984375, -0.9942626953125, -0.817626953125, -0.6409912109375, -0.46435546875, -0.2877197265625, -0.111083984375, 0.0655517578125, 0.2421875, 0.4188232421875, 0.595458984375, 0.7720947265625, 0.94873046875, 1.1253662109375, 1.302001953125, 1.4786376953125, 1.6552734375, 1.8319091796875, 2.008544921875, 2.1851806640625, 2.36181640625, 2.5384521484375, 2.715087890625, 2.8917236328125, 3.068359375, 3.2449951171875, 3.421630859375, 3.5982666015625, 3.77490234375, 3.9515380859375, 4.128173828125, 4.3048095703125, 4.4814453125, 4.6580810546875, 4.834716796875, 5.0113525390625, 5.18798828125, 5.3646240234375, 5.541259765625, 5.7178955078125, 5.89453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 4.0, 6.0, 13.0, 12.0, 20.0, 23.0, 30.0, 25.0, 52.0, 38.0, 82.0, 89.0, 100.0, 96.0, 95.0, 82.0, 42.0, 47.0, 43.0, 23.0, 23.0, 15.0, 15.0, 1.0, 6.0, 7.0, 2.0, 4.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.123046875, -2.052764892578125, -1.98248291015625, -1.912200927734375, -1.8419189453125, -1.771636962890625, -1.70135498046875, -1.631072998046875, -1.560791015625, -1.490509033203125, -1.42022705078125, -1.349945068359375, -1.2796630859375, -1.209381103515625, -1.13909912109375, -1.068817138671875, -0.99853515625, -0.928253173828125, -0.85797119140625, -0.787689208984375, -0.7174072265625, -0.647125244140625, -0.57684326171875, -0.506561279296875, -0.436279296875, -0.365997314453125, -0.29571533203125, -0.225433349609375, -0.1551513671875, -0.084869384765625, -0.01458740234375, 0.055694580078125, 0.1259765625, 0.196258544921875, 0.26654052734375, 0.336822509765625, 0.4071044921875, 0.477386474609375, 0.54766845703125, 0.617950439453125, 0.688232421875, 0.758514404296875, 0.82879638671875, 0.899078369140625, 0.9693603515625, 1.039642333984375, 1.10992431640625, 1.180206298828125, 1.25048828125, 1.320770263671875, 1.39105224609375, 1.461334228515625, 1.5316162109375, 1.601898193359375, 1.67218017578125, 1.742462158203125, 1.812744140625, 1.883026123046875, 1.95330810546875, 2.023590087890625, 2.0938720703125, 2.164154052734375, 2.23443603515625, 2.304718017578125, 2.375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 8.0, 6.0, 15.0, 19.0, 27.0, 57.0, 81.0, 97.0, 118.0, 119.0, 121.0, 88.0, 72.0, 57.0, 42.0, 29.0, 13.0, 11.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.882911682128906, -28.897640228271484, -27.912370681762695, -26.927099227905273, -25.941829681396484, -24.956558227539062, -23.971288681030273, -22.98601722717285, -22.000747680664062, -21.01547622680664, -20.03020668029785, -19.04493522644043, -18.05966567993164, -17.07439422607422, -16.08912467956543, -15.103853225708008, -14.118582725524902, -13.133312225341797, -12.148041725158691, -11.162771224975586, -10.17750072479248, -9.192230224609375, -8.206958770751953, -7.221688747406006, -6.2364182472229, -5.251147747039795, -4.2658772468566895, -3.280606508255005, -2.2953360080718994, -1.3100652694702148, -0.3247947692871094, 0.6604757308959961, 1.6457462310791016, 2.631016731262207, 3.6162872314453125, 4.601557731628418, 5.586828231811523, 6.572099208831787, 7.557369709014893, 8.542640686035156, 9.527910232543945, 10.51318073272705, 11.498451232910156, 12.483721733093262, 13.468992233276367, 14.454263687133789, 15.439533233642578, 16.4248046875, 17.410076141357422, 18.395347595214844, 19.380617141723633, 20.365888595581055, 21.351158142089844, 22.336429595947266, 23.321699142456055, 24.306970596313477, 25.292240142822266, 26.277511596679688, 27.262781143188477, 28.2480525970459, 29.233322143554688, 30.21859359741211, 31.2038631439209, 32.18913269042969, 33.17440414428711]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 1.0, 5.0, 5.0, 9.0, 13.0, 16.0, 14.0, 25.0, 23.0, 21.0, 25.0, 24.0, 25.0, 13.0, 21.0, 39.0, 35.0, 48.0, 30.0, 42.0, 37.0, 49.0, 41.0, 42.0, 32.0, 34.0, 31.0, 33.0, 32.0, 24.0, 29.0, 18.0, 33.0, 16.0, 13.0, 13.0, 17.0, 11.0, 7.0, 7.0, 15.0, 9.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.785497665405273, -12.39074993133545, -11.996002197265625, -11.6012544631958, -11.206506729125977, -10.811758995056152, -10.417011260986328, -10.022263526916504, -9.62751579284668, -9.232768058776855, -8.838020324707031, -8.443272590637207, -8.048524856567383, -7.653777122497559, -7.259029388427734, -6.86428165435791, -6.469534397125244, -6.07478666305542, -5.680038928985596, -5.2852911949157715, -4.890543460845947, -4.495795726776123, -4.101048469543457, -3.7063004970550537, -3.3115527629852295, -2.9168050289154053, -2.522057294845581, -2.127309799194336, -1.7325619459152222, -1.337814211845398, -0.9430665969848633, -0.5483188629150391, -0.15357112884521484, 0.241176575422287, 0.6359242796897888, 1.0306719541549683, 1.4254196882247925, 1.8201674222946167, 2.2149150371551514, 2.6096627712249756, 3.0044105052948, 3.399158239364624, 3.7939059734344482, 4.188653469085693, 4.583401203155518, 4.978148937225342, 5.372896671295166, 5.76764440536499, 6.1623921394348145, 6.557139873504639, 6.951887607574463, 7.346635341644287, 7.741383075714111, 8.136130332946777, 8.530878067016602, 8.925625801086426, 9.32037353515625, 9.715121269226074, 10.109869003295898, 10.504616737365723, 10.899364471435547, 11.294112205505371, 11.688859939575195, 12.08360767364502, 12.478355407714844]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 4.0, 7.0, 18.0, 13.0, 13.0, 27.0, 50.0, 60.0, 64.0, 120.0, 223.0, 420.0, 773.0, 1726.0, 4191.0, 13908.0, 62632.0, 843975.0, 3122270.0, 112611.0, 21208.0, 5868.0, 2169.0, 873.0, 440.0, 239.0, 135.0, 85.0, 53.0, 33.0, 15.0, 16.0, 10.0, 8.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.54296875, -7.35028076171875, -7.1575927734375, -6.96490478515625, -6.772216796875, -6.57952880859375, -6.3868408203125, -6.19415283203125, -6.00146484375, -5.80877685546875, -5.6160888671875, -5.42340087890625, -5.230712890625, -5.03802490234375, -4.8453369140625, -4.65264892578125, -4.4599609375, -4.26727294921875, -4.0745849609375, -3.88189697265625, -3.689208984375, -3.49652099609375, -3.3038330078125, -3.11114501953125, -2.91845703125, -2.72576904296875, -2.5330810546875, -2.34039306640625, -2.147705078125, -1.95501708984375, -1.7623291015625, -1.56964111328125, -1.376953125, -1.18426513671875, -0.9915771484375, -0.79888916015625, -0.606201171875, -0.41351318359375, -0.2208251953125, -0.02813720703125, 0.16455078125, 0.35723876953125, 0.5499267578125, 0.74261474609375, 0.935302734375, 1.12799072265625, 1.3206787109375, 1.51336669921875, 1.7060546875, 1.89874267578125, 2.0914306640625, 2.28411865234375, 2.476806640625, 2.66949462890625, 2.8621826171875, 3.05487060546875, 3.24755859375, 3.44024658203125, 3.6329345703125, 3.82562255859375, 4.018310546875, 4.21099853515625, 4.4036865234375, 4.59637451171875, 4.7890625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 5.0, 8.0, 13.0, 16.0, 20.0, 22.0, 41.0, 41.0, 42.0, 71.0, 56.0, 88.0, 91.0, 71.0, 74.0, 59.0, 52.0, 46.0, 55.0, 38.0, 31.0, 16.0, 14.0, 15.0, 4.0, 7.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6455078125, -0.6195526123046875, -0.593597412109375, -0.5676422119140625, -0.54168701171875, -0.5157318115234375, -0.489776611328125, -0.4638214111328125, -0.4378662109375, -0.4119110107421875, -0.385955810546875, -0.3600006103515625, -0.33404541015625, -0.3080902099609375, -0.282135009765625, -0.2561798095703125, -0.230224609375, -0.2042694091796875, -0.178314208984375, -0.1523590087890625, -0.12640380859375, -0.1004486083984375, -0.074493408203125, -0.0485382080078125, -0.0225830078125, 0.0033721923828125, 0.029327392578125, 0.0552825927734375, 0.08123779296875, 0.1071929931640625, 0.133148193359375, 0.1591033935546875, 0.18505859375, 0.2110137939453125, 0.236968994140625, 0.2629241943359375, 0.28887939453125, 0.3148345947265625, 0.340789794921875, 0.3667449951171875, 0.3927001953125, 0.4186553955078125, 0.444610595703125, 0.4705657958984375, 0.49652099609375, 0.5224761962890625, 0.548431396484375, 0.5743865966796875, 0.600341796875, 0.6262969970703125, 0.652252197265625, 0.6782073974609375, 0.70416259765625, 0.7301177978515625, 0.756072998046875, 0.7820281982421875, 0.8079833984375, 0.8339385986328125, 0.859893798828125, 0.8858489990234375, 0.91180419921875, 0.9377593994140625, 0.963714599609375, 0.9896697998046875, 1.015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 8.0, 6.0, 13.0, 13.0, 14.0, 22.0, 36.0, 26.0, 32.0, 34.0, 58.0, 90.0, 163.0, 599.0, 2243.0, 11901.0, 108523.0, 3518747.0, 515520.0, 29724.0, 4665.0, 1129.0, 313.0, 113.0, 52.0, 52.0, 33.0, 23.0, 20.0, 18.0, 16.0, 12.0, 10.0, 10.0, 6.0, 6.0, 5.0, 8.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.546875, -9.20263671875, -8.8583984375, -8.51416015625, -8.169921875, -7.82568359375, -7.4814453125, -7.13720703125, -6.79296875, -6.44873046875, -6.1044921875, -5.76025390625, -5.416015625, -5.07177734375, -4.7275390625, -4.38330078125, -4.0390625, -3.69482421875, -3.3505859375, -3.00634765625, -2.662109375, -2.31787109375, -1.9736328125, -1.62939453125, -1.28515625, -0.94091796875, -0.5966796875, -0.25244140625, 0.091796875, 0.43603515625, 0.7802734375, 1.12451171875, 1.46875, 1.81298828125, 2.1572265625, 2.50146484375, 2.845703125, 3.18994140625, 3.5341796875, 3.87841796875, 4.22265625, 4.56689453125, 4.9111328125, 5.25537109375, 5.599609375, 5.94384765625, 6.2880859375, 6.63232421875, 6.9765625, 7.32080078125, 7.6650390625, 8.00927734375, 8.353515625, 8.69775390625, 9.0419921875, 9.38623046875, 9.73046875, 10.07470703125, 10.4189453125, 10.76318359375, 11.107421875, 11.45166015625, 11.7958984375, 12.14013671875, 12.484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 4.0, 5.0, 6.0, 5.0, 5.0, 16.0, 14.0, 20.0, 11.0, 32.0, 23.0, 46.0, 74.0, 73.0, 118.0, 161.0, 209.0, 414.0, 647.0, 766.0, 491.0, 276.0, 191.0, 103.0, 97.0, 67.0, 48.0, 39.0, 20.0, 15.0, 19.0, 14.0, 8.0, 6.0, 3.0, 3.0, 6.0, 4.0, 2.0, 3.0, 0.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6376953125, -1.5881805419921875, -1.538665771484375, -1.4891510009765625, -1.43963623046875, -1.3901214599609375, -1.340606689453125, -1.2910919189453125, -1.2415771484375, -1.1920623779296875, -1.142547607421875, -1.0930328369140625, -1.04351806640625, -0.9940032958984375, -0.944488525390625, -0.8949737548828125, -0.845458984375, -0.7959442138671875, -0.746429443359375, -0.6969146728515625, -0.64739990234375, -0.5978851318359375, -0.548370361328125, -0.4988555908203125, -0.4493408203125, -0.3998260498046875, -0.350311279296875, -0.3007965087890625, -0.25128173828125, -0.2017669677734375, -0.152252197265625, -0.1027374267578125, -0.05322265625, -0.0037078857421875, 0.045806884765625, 0.0953216552734375, 0.14483642578125, 0.1943511962890625, 0.243865966796875, 0.2933807373046875, 0.3428955078125, 0.3924102783203125, 0.441925048828125, 0.4914398193359375, 0.54095458984375, 0.5904693603515625, 0.639984130859375, 0.6894989013671875, 0.739013671875, 0.7885284423828125, 0.838043212890625, 0.8875579833984375, 0.93707275390625, 0.9865875244140625, 1.036102294921875, 1.0856170654296875, 1.1351318359375, 1.1846466064453125, 1.234161376953125, 1.2836761474609375, 1.33319091796875, 1.3827056884765625, 1.432220458984375, 1.4817352294921875, 1.53125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 25.0, 83.0, 248.0, 379.0, 180.0, 59.0, 18.0, 8.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.76914978027344, -69.20992279052734, -67.65070343017578, -66.09147644042969, -64.53225708007812, -62.97303009033203, -61.4138069152832, -59.854583740234375, -58.29535675048828, -56.73613357543945, -55.176910400390625, -53.61768341064453, -52.0584602355957, -50.499237060546875, -48.94001388549805, -47.38079071044922, -45.821563720703125, -44.2623405456543, -42.70311737060547, -41.143890380859375, -39.58466720581055, -38.02544403076172, -36.46622085571289, -34.90699768066406, -33.347774505615234, -31.788551330566406, -30.229326248168945, -28.670103073120117, -27.110877990722656, -25.551654815673828, -23.992431640625, -22.43320655822754, -20.873981475830078, -19.31475830078125, -17.75553321838379, -16.19631004333496, -14.6370849609375, -13.077861785888672, -11.518637657165527, -9.959413528442383, -8.400189399719238, -6.840965270996094, -5.281741142272949, -3.722517490386963, -2.1632933616638184, -0.6040692329406738, 0.9551544189453125, 2.514378547668457, 4.073602676391602, 5.632826805114746, 7.192050933837891, 8.751274108886719, 10.31049919128418, 11.869722366333008, 13.428946495056152, 14.988170623779297, 16.547393798828125, 18.106616973876953, 19.665842056274414, 21.225065231323242, 22.784290313720703, 24.34351348876953, 25.90273666381836, 27.46196174621582, 29.02118682861328]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 7.0, 2.0, 8.0, 9.0, 14.0, 13.0, 12.0, 10.0, 22.0, 25.0, 27.0, 32.0, 28.0, 51.0, 43.0, 47.0, 39.0, 42.0, 52.0, 46.0, 48.0, 46.0, 47.0, 38.0, 31.0, 40.0, 31.0, 28.0, 20.0, 17.0, 32.0, 21.0, 14.0, 17.0, 10.0, 6.0, 9.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.7301154136657715, -7.482206344604492, -7.234297752380371, -6.98638916015625, -6.738480091094971, -6.490571022033691, -6.24266242980957, -5.994753837585449, -5.74684476852417, -5.498935699462891, -5.2510271072387695, -5.003118515014648, -4.755209445953369, -4.50730037689209, -4.259391784667969, -4.011483192443848, -3.7635741233825684, -3.515665292739868, -3.267756462097168, -3.0198476314544678, -2.7719388008117676, -2.5240299701690674, -2.276121139526367, -2.028212308883667, -1.7803034782409668, -1.5323946475982666, -1.2844858169555664, -1.0365769863128662, -0.788668155670166, -0.5407593250274658, -0.2928504943847656, -0.04494166374206543, 0.20296764373779297, 0.45087647438049316, 0.6987853050231934, 0.9466941356658936, 1.1946029663085938, 1.442511796951294, 1.6904206275939941, 1.9383294582366943, 2.1862382888793945, 2.4341471195220947, 2.682055950164795, 2.929964780807495, 3.1778736114501953, 3.4257824420928955, 3.6736912727355957, 3.921600103378296, 4.169508934020996, 4.417417526245117, 4.6653265953063965, 4.913235664367676, 5.161144256591797, 5.409052848815918, 5.656961917877197, 5.904870986938477, 6.152779579162598, 6.400688171386719, 6.648597240447998, 6.896506309509277, 7.144414901733398, 7.3923234939575195, 7.640232563018799, 7.888141632080078, 8.1360502243042]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 8.0, 8.0, 17.0, 17.0, 28.0, 28.0, 36.0, 63.0, 114.0, 156.0, 296.0, 499.0, 924.0, 1632.0, 3250.0, 6702.0, 13974.0, 30228.0, 66161.0, 142089.0, 255736.0, 257317.0, 144006.0, 66960.0, 30239.0, 14005.0, 6666.0, 3428.0, 1680.0, 963.0, 537.0, 292.0, 150.0, 120.0, 64.0, 39.0, 35.0, 20.0, 16.0, 14.0, 6.0, 8.0, 6.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.220703125, -3.113372802734375, -3.00604248046875, -2.898712158203125, -2.7913818359375, -2.684051513671875, -2.57672119140625, -2.469390869140625, -2.362060546875, -2.254730224609375, -2.14739990234375, -2.040069580078125, -1.9327392578125, -1.825408935546875, -1.71807861328125, -1.610748291015625, -1.50341796875, -1.396087646484375, -1.28875732421875, -1.181427001953125, -1.0740966796875, -0.966766357421875, -0.85943603515625, -0.752105712890625, -0.644775390625, -0.537445068359375, -0.43011474609375, -0.322784423828125, -0.2154541015625, -0.108123779296875, -0.00079345703125, 0.106536865234375, 0.2138671875, 0.321197509765625, 0.42852783203125, 0.535858154296875, 0.6431884765625, 0.750518798828125, 0.85784912109375, 0.965179443359375, 1.072509765625, 1.179840087890625, 1.28717041015625, 1.394500732421875, 1.5018310546875, 1.609161376953125, 1.71649169921875, 1.823822021484375, 1.93115234375, 2.038482666015625, 2.14581298828125, 2.253143310546875, 2.3604736328125, 2.467803955078125, 2.57513427734375, 2.682464599609375, 2.789794921875, 2.897125244140625, 3.00445556640625, 3.111785888671875, 3.2191162109375, 3.326446533203125, 3.43377685546875, 3.541107177734375, 3.6484375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 5.0, 4.0, 5.0, 9.0, 5.0, 12.0, 16.0, 15.0, 16.0, 22.0, 24.0, 27.0, 47.0, 38.0, 42.0, 44.0, 35.0, 47.0, 54.0, 51.0, 43.0, 54.0, 41.0, 36.0, 39.0, 45.0, 33.0, 39.0, 28.0, 21.0, 25.0, 15.0, 15.0, 17.0, 8.0, 8.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.63671875, -0.6178512573242188, -0.5989837646484375, -0.5801162719726562, -0.561248779296875, -0.5423812866210938, -0.5235137939453125, -0.5046463012695312, -0.48577880859375, -0.46691131591796875, -0.4480438232421875, -0.42917633056640625, -0.410308837890625, -0.39144134521484375, -0.3725738525390625, -0.35370635986328125, -0.3348388671875, -0.31597137451171875, -0.2971038818359375, -0.27823638916015625, -0.259368896484375, -0.24050140380859375, -0.2216339111328125, -0.20276641845703125, -0.18389892578125, -0.16503143310546875, -0.1461639404296875, -0.12729644775390625, -0.108428955078125, -0.08956146240234375, -0.0706939697265625, -0.05182647705078125, -0.032958984375, -0.01409149169921875, 0.0047760009765625, 0.02364349365234375, 0.042510986328125, 0.06137847900390625, 0.0802459716796875, 0.09911346435546875, 0.11798095703125, 0.13684844970703125, 0.1557159423828125, 0.17458343505859375, 0.193450927734375, 0.21231842041015625, 0.2311859130859375, 0.25005340576171875, 0.2689208984375, 0.28778839111328125, 0.3066558837890625, 0.32552337646484375, 0.344390869140625, 0.36325836181640625, 0.3821258544921875, 0.40099334716796875, 0.41986083984375, 0.43872833251953125, 0.4575958251953125, 0.47646331787109375, 0.495330810546875, 0.5141983032226562, 0.5330657958984375, 0.5519332885742188, 0.57080078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 5.0, 2.0, 3.0, 6.0, 8.0, 4.0, 10.0, 11.0, 11.0, 13.0, 26.0, 39.0, 58.0, 53.0, 86.0, 116.0, 148.0, 221.0, 288.0, 496.0, 853.0, 1654.0, 4420.0, 13610.0, 49063.0, 174502.0, 408801.0, 274610.0, 83955.0, 23179.0, 6875.0, 2402.0, 1084.0, 614.0, 385.0, 262.0, 179.0, 130.0, 103.0, 65.0, 50.0, 36.0, 40.0, 20.0, 15.0, 6.0, 14.0, 8.0, 4.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.50390625, -4.35723876953125, -4.2105712890625, -4.06390380859375, -3.917236328125, -3.77056884765625, -3.6239013671875, -3.47723388671875, -3.33056640625, -3.18389892578125, -3.0372314453125, -2.89056396484375, -2.743896484375, -2.59722900390625, -2.4505615234375, -2.30389404296875, -2.1572265625, -2.01055908203125, -1.8638916015625, -1.71722412109375, -1.570556640625, -1.42388916015625, -1.2772216796875, -1.13055419921875, -0.98388671875, -0.83721923828125, -0.6905517578125, -0.54388427734375, -0.397216796875, -0.25054931640625, -0.1038818359375, 0.04278564453125, 0.189453125, 0.33612060546875, 0.4827880859375, 0.62945556640625, 0.776123046875, 0.92279052734375, 1.0694580078125, 1.21612548828125, 1.36279296875, 1.50946044921875, 1.6561279296875, 1.80279541015625, 1.949462890625, 2.09613037109375, 2.2427978515625, 2.38946533203125, 2.5361328125, 2.68280029296875, 2.8294677734375, 2.97613525390625, 3.122802734375, 3.26947021484375, 3.4161376953125, 3.56280517578125, 3.70947265625, 3.85614013671875, 4.0028076171875, 4.14947509765625, 4.296142578125, 4.44281005859375, 4.5894775390625, 4.73614501953125, 4.8828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 9.0, 5.0, 6.0, 6.0, 5.0, 4.0, 12.0, 13.0, 14.0, 12.0, 15.0, 18.0, 20.0, 29.0, 24.0, 26.0, 38.0, 38.0, 35.0, 42.0, 34.0, 41.0, 51.0, 31.0, 40.0, 45.0, 37.0, 41.0, 36.0, 31.0, 28.0, 32.0, 17.0, 22.0, 21.0, 19.0, 14.0, 18.0, 15.0, 10.0, 14.0, 14.0, 5.0, 7.0, 5.0, 3.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.70703125, -2.622833251953125, -2.53863525390625, -2.454437255859375, -2.3702392578125, -2.286041259765625, -2.20184326171875, -2.117645263671875, -2.033447265625, -1.949249267578125, -1.86505126953125, -1.780853271484375, -1.6966552734375, -1.612457275390625, -1.52825927734375, -1.444061279296875, -1.35986328125, -1.275665283203125, -1.19146728515625, -1.107269287109375, -1.0230712890625, -0.938873291015625, -0.85467529296875, -0.770477294921875, -0.686279296875, -0.602081298828125, -0.51788330078125, -0.433685302734375, -0.3494873046875, -0.265289306640625, -0.18109130859375, -0.096893310546875, -0.0126953125, 0.071502685546875, 0.15570068359375, 0.239898681640625, 0.3240966796875, 0.408294677734375, 0.49249267578125, 0.576690673828125, 0.660888671875, 0.745086669921875, 0.82928466796875, 0.913482666015625, 0.9976806640625, 1.081878662109375, 1.16607666015625, 1.250274658203125, 1.33447265625, 1.418670654296875, 1.50286865234375, 1.587066650390625, 1.6712646484375, 1.755462646484375, 1.83966064453125, 1.923858642578125, 2.008056640625, 2.092254638671875, 2.17645263671875, 2.260650634765625, 2.3448486328125, 2.429046630859375, 2.51324462890625, 2.597442626953125, 2.681640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 11.0, 10.0, 13.0, 19.0, 17.0, 25.0, 49.0, 63.0, 100.0, 178.0, 317.0, 665.0, 1380.0, 3363.0, 9337.0, 30221.0, 121355.0, 469629.0, 311911.0, 69926.0, 19179.0, 6252.0, 2382.0, 1017.0, 466.0, 257.0, 149.0, 92.0, 59.0, 33.0, 28.0, 16.0, 16.0, 7.0, 6.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.193359375, -3.08624267578125, -2.9791259765625, -2.87200927734375, -2.764892578125, -2.65777587890625, -2.5506591796875, -2.44354248046875, -2.33642578125, -2.22930908203125, -2.1221923828125, -2.01507568359375, -1.907958984375, -1.80084228515625, -1.6937255859375, -1.58660888671875, -1.4794921875, -1.37237548828125, -1.2652587890625, -1.15814208984375, -1.051025390625, -0.94390869140625, -0.8367919921875, -0.72967529296875, -0.62255859375, -0.51544189453125, -0.4083251953125, -0.30120849609375, -0.194091796875, -0.08697509765625, 0.0201416015625, 0.12725830078125, 0.234375, 0.34149169921875, 0.4486083984375, 0.55572509765625, 0.662841796875, 0.76995849609375, 0.8770751953125, 0.98419189453125, 1.09130859375, 1.19842529296875, 1.3055419921875, 1.41265869140625, 1.519775390625, 1.62689208984375, 1.7340087890625, 1.84112548828125, 1.9482421875, 2.05535888671875, 2.1624755859375, 2.26959228515625, 2.376708984375, 2.48382568359375, 2.5909423828125, 2.69805908203125, 2.80517578125, 2.91229248046875, 3.0194091796875, 3.12652587890625, 3.233642578125, 3.34075927734375, 3.4478759765625, 3.55499267578125, 3.662109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 8.0, 4.0, 5.0, 12.0, 6.0, 14.0, 18.0, 17.0, 25.0, 36.0, 38.0, 60.0, 64.0, 89.0, 98.0, 121.0, 82.0, 72.0, 42.0, 39.0, 24.0, 38.0, 14.0, 14.0, 13.0, 6.0, 10.0, 10.0, 5.0, 6.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004730224609375, -0.0004596002399921417, -0.00044617801904678345, -0.00043275579810142517, -0.0004193335771560669, -0.0004059113562107086, -0.00039248913526535034, -0.00037906691431999207, -0.0003656446933746338, -0.0003522224724292755, -0.00033880025148391724, -0.00032537803053855896, -0.0003119558095932007, -0.0002985335886478424, -0.00028511136770248413, -0.00027168914675712585, -0.0002582669258117676, -0.0002448447048664093, -0.00023142248392105103, -0.00021800026297569275, -0.00020457804203033447, -0.0001911558210849762, -0.00017773360013961792, -0.00016431137919425964, -0.00015088915824890137, -0.0001374669373035431, -0.00012404471635818481, -0.00011062249541282654, -9.720027446746826e-05, -8.377805352210999e-05, -7.035583257675171e-05, -5.693361163139343e-05, -4.3511390686035156e-05, -3.008916974067688e-05, -1.6666948795318604e-05, -3.244727849960327e-06, 1.017749309539795e-05, 2.3599714040756226e-05, 3.70219349861145e-05, 5.044415593147278e-05, 6.386637687683105e-05, 7.728859782218933e-05, 9.071081876754761e-05, 0.00010413303971290588, 0.00011755526065826416, 0.00013097748160362244, 0.0001443997025489807, 0.000157821923494339, 0.00017124414443969727, 0.00018466636538505554, 0.00019808858633041382, 0.0002115108072757721, 0.00022493302822113037, 0.00023835524916648865, 0.0002517774701118469, 0.0002651996910572052, 0.0002786219120025635, 0.00029204413294792175, 0.00030546635389328003, 0.0003188885748386383, 0.0003323107957839966, 0.00034573301672935486, 0.00035915523767471313, 0.0003725774586200714, 0.0003859996795654297]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 1.0, 7.0, 5.0, 8.0, 16.0, 16.0, 14.0, 36.0, 59.0, 63.0, 108.0, 138.0, 273.0, 506.0, 954.0, 1882.0, 4452.0, 10850.0, 30669.0, 108624.0, 450121.0, 327292.0, 74214.0, 22640.0, 8485.0, 3640.0, 1610.0, 814.0, 413.0, 235.0, 144.0, 80.0, 55.0, 34.0, 25.0, 19.0, 15.0, 9.0, 8.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2890625, -3.17510986328125, -3.0611572265625, -2.94720458984375, -2.833251953125, -2.71929931640625, -2.6053466796875, -2.49139404296875, -2.37744140625, -2.26348876953125, -2.1495361328125, -2.03558349609375, -1.921630859375, -1.80767822265625, -1.6937255859375, -1.57977294921875, -1.4658203125, -1.35186767578125, -1.2379150390625, -1.12396240234375, -1.010009765625, -0.89605712890625, -0.7821044921875, -0.66815185546875, -0.55419921875, -0.44024658203125, -0.3262939453125, -0.21234130859375, -0.098388671875, 0.01556396484375, 0.1295166015625, 0.24346923828125, 0.357421875, 0.47137451171875, 0.5853271484375, 0.69927978515625, 0.813232421875, 0.92718505859375, 1.0411376953125, 1.15509033203125, 1.26904296875, 1.38299560546875, 1.4969482421875, 1.61090087890625, 1.724853515625, 1.83880615234375, 1.9527587890625, 2.06671142578125, 2.1806640625, 2.29461669921875, 2.4085693359375, 2.52252197265625, 2.636474609375, 2.75042724609375, 2.8643798828125, 2.97833251953125, 3.09228515625, 3.20623779296875, 3.3201904296875, 3.43414306640625, 3.548095703125, 3.66204833984375, 3.7760009765625, 3.88995361328125, 4.00390625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 8.0, 4.0, 9.0, 11.0, 7.0, 15.0, 30.0, 20.0, 42.0, 44.0, 61.0, 80.0, 80.0, 95.0, 93.0, 95.0, 61.0, 52.0, 35.0, 33.0, 21.0, 25.0, 15.0, 9.0, 10.0, 4.0, 5.0, 4.0, 3.0, 5.0, 0.0, 2.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.63671875, -2.553955078125, -2.47119140625, -2.388427734375, -2.3056640625, -2.222900390625, -2.14013671875, -2.057373046875, -1.974609375, -1.891845703125, -1.80908203125, -1.726318359375, -1.6435546875, -1.560791015625, -1.47802734375, -1.395263671875, -1.3125, -1.229736328125, -1.14697265625, -1.064208984375, -0.9814453125, -0.898681640625, -0.81591796875, -0.733154296875, -0.650390625, -0.567626953125, -0.48486328125, -0.402099609375, -0.3193359375, -0.236572265625, -0.15380859375, -0.071044921875, 0.01171875, 0.094482421875, 0.17724609375, 0.260009765625, 0.3427734375, 0.425537109375, 0.50830078125, 0.591064453125, 0.673828125, 0.756591796875, 0.83935546875, 0.922119140625, 1.0048828125, 1.087646484375, 1.17041015625, 1.253173828125, 1.3359375, 1.418701171875, 1.50146484375, 1.584228515625, 1.6669921875, 1.749755859375, 1.83251953125, 1.915283203125, 1.998046875, 2.080810546875, 2.16357421875, 2.246337890625, 2.3291015625, 2.411865234375, 2.49462890625, 2.577392578125, 2.66015625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 10.0, 12.0, 17.0, 53.0, 41.0, 90.0, 106.0, 143.0, 145.0, 137.0, 91.0, 56.0, 39.0, 29.0, 17.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.89221954345703, -40.624637603759766, -39.3570556640625, -38.08946990966797, -36.8218879699707, -35.55430603027344, -34.28672409057617, -33.019142150878906, -31.751556396484375, -30.48397445678711, -29.21639060974121, -27.948808670043945, -26.681224822998047, -25.41364288330078, -24.146060943603516, -22.878477096557617, -21.61089515686035, -20.343313217163086, -19.075729370117188, -17.808147430419922, -16.540563583374023, -15.272981643676758, -14.005398750305176, -12.737815856933594, -11.470232963562012, -10.20265007019043, -8.935067176818848, -7.667484760284424, -6.399901866912842, -5.13231897354126, -3.864736557006836, -2.597153663635254, -1.3295707702636719, -0.061987996101379395, 1.205594778060913, 2.473177433013916, 3.740760326385498, 5.00834321975708, 6.275925636291504, 7.543508529663086, 8.811091423034668, 10.07867431640625, 11.346257209777832, 12.613840103149414, 13.88142204284668, 15.149005889892578, 16.416587829589844, 17.68416976928711, 18.951753616333008, 20.219335556030273, 21.486919403076172, 22.754501342773438, 24.022085189819336, 25.2896671295166, 26.5572509765625, 27.824832916259766, 29.09241485595703, 30.359996795654297, 31.627580642700195, 32.895164489746094, 34.16274642944336, 35.430328369140625, 36.69791030883789, 37.965492248535156, 39.23307800292969]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 5.0, 7.0, 3.0, 12.0, 7.0, 19.0, 15.0, 22.0, 14.0, 19.0, 30.0, 34.0, 26.0, 32.0, 34.0, 44.0, 42.0, 39.0, 50.0, 49.0, 44.0, 45.0, 32.0, 42.0, 42.0, 34.0, 38.0, 34.0, 26.0, 20.0, 20.0, 18.0, 22.0, 15.0, 18.0, 9.0, 8.0, 6.0, 5.0, 6.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.89603042602539, -19.339414596557617, -18.782798767089844, -18.226184844970703, -17.66956901550293, -17.112953186035156, -16.556337356567383, -15.99972152709961, -15.443106651306152, -14.886490821838379, -14.329875946044922, -13.773260116577148, -13.216644287109375, -12.660029411315918, -12.103413581848145, -11.546798706054688, -10.990182876586914, -10.43356704711914, -9.876952171325684, -9.32033634185791, -8.763721466064453, -8.20710563659668, -7.650489807128906, -7.093874454498291, -6.537259101867676, -5.9806437492370605, -5.424028396606445, -4.867412567138672, -4.310797214508057, -3.7541818618774414, -3.197566270828247, -2.6409506797790527, -2.0843334197998047, -1.5277179479599, -0.9711024761199951, -0.41448700428009033, 0.14212846755981445, 0.6987438201904297, 1.255359411239624, 1.8119750022888184, 2.3685903549194336, 2.925205707550049, 3.481821298599243, 4.0384368896484375, 4.595052242279053, 5.151667594909668, 5.708283424377441, 6.264898777008057, 6.821514129638672, 7.378129482269287, 7.934744834899902, 8.491360664367676, 9.047975540161133, 9.604591369628906, 10.16120719909668, 10.717823028564453, 11.27443790435791, 11.831053733825684, 12.38766860961914, 12.944284439086914, 13.500900268554688, 14.057515144348145, 14.614130973815918, 15.170745849609375, 15.727361679077148]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 5.0, 6.0, 13.0, 11.0, 13.0, 22.0, 30.0, 59.0, 96.0, 141.0, 216.0, 389.0, 779.0, 1855.0, 5204.0, 19172.0, 108364.0, 2984521.0, 985132.0, 67624.0, 13785.0, 4102.0, 1480.0, 622.0, 282.0, 144.0, 71.0, 45.0, 33.0, 19.0, 11.0, 3.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.41015625, -7.20361328125, -6.9970703125, -6.79052734375, -6.583984375, -6.37744140625, -6.1708984375, -5.96435546875, -5.7578125, -5.55126953125, -5.3447265625, -5.13818359375, -4.931640625, -4.72509765625, -4.5185546875, -4.31201171875, -4.10546875, -3.89892578125, -3.6923828125, -3.48583984375, -3.279296875, -3.07275390625, -2.8662109375, -2.65966796875, -2.453125, -2.24658203125, -2.0400390625, -1.83349609375, -1.626953125, -1.42041015625, -1.2138671875, -1.00732421875, -0.80078125, -0.59423828125, -0.3876953125, -0.18115234375, 0.025390625, 0.23193359375, 0.4384765625, 0.64501953125, 0.8515625, 1.05810546875, 1.2646484375, 1.47119140625, 1.677734375, 1.88427734375, 2.0908203125, 2.29736328125, 2.50390625, 2.71044921875, 2.9169921875, 3.12353515625, 3.330078125, 3.53662109375, 3.7431640625, 3.94970703125, 4.15625, 4.36279296875, 4.5693359375, 4.77587890625, 4.982421875, 5.18896484375, 5.3955078125, 5.60205078125, 5.80859375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 13.0, 9.0, 19.0, 17.0, 19.0, 26.0, 20.0, 40.0, 44.0, 61.0, 53.0, 61.0, 66.0, 59.0, 73.0, 71.0, 57.0, 52.0, 47.0, 38.0, 34.0, 27.0, 22.0, 21.0, 12.0, 13.0, 8.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.013671875, -0.9874114990234375, -0.961151123046875, -0.9348907470703125, -0.90863037109375, -0.8823699951171875, -0.856109619140625, -0.8298492431640625, -0.8035888671875, -0.7773284912109375, -0.751068115234375, -0.7248077392578125, -0.69854736328125, -0.6722869873046875, -0.646026611328125, -0.6197662353515625, -0.593505859375, -0.5672454833984375, -0.540985107421875, -0.5147247314453125, -0.48846435546875, -0.4622039794921875, -0.435943603515625, -0.4096832275390625, -0.3834228515625, -0.3571624755859375, -0.330902099609375, -0.3046417236328125, -0.27838134765625, -0.2521209716796875, -0.225860595703125, -0.1996002197265625, -0.17333984375, -0.1470794677734375, -0.120819091796875, -0.0945587158203125, -0.06829833984375, -0.0420379638671875, -0.015777587890625, 0.0104827880859375, 0.0367431640625, 0.0630035400390625, 0.089263916015625, 0.1155242919921875, 0.14178466796875, 0.1680450439453125, 0.194305419921875, 0.2205657958984375, 0.246826171875, 0.2730865478515625, 0.299346923828125, 0.3256072998046875, 0.35186767578125, 0.3781280517578125, 0.404388427734375, 0.4306488037109375, 0.4569091796875, 0.4831695556640625, 0.509429931640625, 0.5356903076171875, 0.56195068359375, 0.5882110595703125, 0.614471435546875, 0.6407318115234375, 0.6669921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 6.0, 9.0, 7.0, 9.0, 15.0, 45.0, 62.0, 136.0, 200.0, 401.0, 949.0, 1999.0, 4858.0, 12957.0, 43082.0, 195465.0, 2072949.0, 1628819.0, 172960.0, 39399.0, 11961.0, 4456.0, 1767.0, 893.0, 409.0, 211.0, 104.0, 58.0, 22.0, 20.0, 18.0, 7.0, 5.0, 7.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.15625, -5.969482421875, -5.78271484375, -5.595947265625, -5.4091796875, -5.222412109375, -5.03564453125, -4.848876953125, -4.662109375, -4.475341796875, -4.28857421875, -4.101806640625, -3.9150390625, -3.728271484375, -3.54150390625, -3.354736328125, -3.16796875, -2.981201171875, -2.79443359375, -2.607666015625, -2.4208984375, -2.234130859375, -2.04736328125, -1.860595703125, -1.673828125, -1.487060546875, -1.30029296875, -1.113525390625, -0.9267578125, -0.739990234375, -0.55322265625, -0.366455078125, -0.1796875, 0.007080078125, 0.19384765625, 0.380615234375, 0.5673828125, 0.754150390625, 0.94091796875, 1.127685546875, 1.314453125, 1.501220703125, 1.68798828125, 1.874755859375, 2.0615234375, 2.248291015625, 2.43505859375, 2.621826171875, 2.80859375, 2.995361328125, 3.18212890625, 3.368896484375, 3.5556640625, 3.742431640625, 3.92919921875, 4.115966796875, 4.302734375, 4.489501953125, 4.67626953125, 4.863037109375, 5.0498046875, 5.236572265625, 5.42333984375, 5.610107421875, 5.796875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 8.0, 6.0, 15.0, 12.0, 27.0, 24.0, 33.0, 41.0, 62.0, 84.0, 120.0, 174.0, 264.0, 530.0, 920.0, 588.0, 362.0, 255.0, 155.0, 106.0, 70.0, 49.0, 36.0, 28.0, 19.0, 15.0, 17.0, 10.0, 12.0, 6.0, 1.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.294921875, -2.2247314453125, -2.154541015625, -2.0843505859375, -2.01416015625, -1.9439697265625, -1.873779296875, -1.8035888671875, -1.7333984375, -1.6632080078125, -1.593017578125, -1.5228271484375, -1.45263671875, -1.3824462890625, -1.312255859375, -1.2420654296875, -1.171875, -1.1016845703125, -1.031494140625, -0.9613037109375, -0.89111328125, -0.8209228515625, -0.750732421875, -0.6805419921875, -0.6103515625, -0.5401611328125, -0.469970703125, -0.3997802734375, -0.32958984375, -0.2593994140625, -0.189208984375, -0.1190185546875, -0.048828125, 0.0213623046875, 0.091552734375, 0.1617431640625, 0.23193359375, 0.3021240234375, 0.372314453125, 0.4425048828125, 0.5126953125, 0.5828857421875, 0.653076171875, 0.7232666015625, 0.79345703125, 0.8636474609375, 0.933837890625, 1.0040283203125, 1.07421875, 1.1444091796875, 1.214599609375, 1.2847900390625, 1.35498046875, 1.4251708984375, 1.495361328125, 1.5655517578125, 1.6357421875, 1.7059326171875, 1.776123046875, 1.8463134765625, 1.91650390625, 1.9866943359375, 2.056884765625, 2.1270751953125, 2.197265625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 17.0, 36.0, 82.0, 172.0, 219.0, 231.0, 129.0, 68.0, 26.0, 17.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.44394302368164, -36.18145751953125, -34.918968200683594, -33.6564826965332, -32.39399719238281, -31.131511688232422, -29.8690242767334, -28.606536865234375, -27.344051361083984, -26.081565856933594, -24.81907844543457, -23.556591033935547, -22.294105529785156, -21.031620025634766, -19.769132614135742, -18.50664520263672, -17.244159698486328, -15.981673240661621, -14.719186782836914, -13.456700325012207, -12.1942138671875, -10.931727409362793, -9.669240951538086, -8.406754493713379, -7.144268035888672, -5.881781578063965, -4.619295120239258, -3.356808662414551, -2.0943222045898438, -0.8318357467651367, 0.4306507110595703, 1.6931371688842773, 2.95562744140625, 4.218113899230957, 5.480600357055664, 6.743086814880371, 8.005573272705078, 9.268059730529785, 10.530546188354492, 11.7930326461792, 13.055519104003906, 14.318005561828613, 15.58049201965332, 16.842979431152344, 18.105464935302734, 19.367950439453125, 20.63043785095215, 21.892925262451172, 23.155410766601562, 24.417896270751953, 25.680383682250977, 26.94287109375, 28.20535659790039, 29.46784210205078, 30.730329513549805, 31.992816925048828, 33.25530242919922, 34.51778793334961, 35.7802734375, 37.042762756347656, 38.30524826049805, 39.56773376464844, 40.830223083496094, 42.092708587646484, 43.355194091796875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 5.0, 11.0, 10.0, 14.0, 13.0, 11.0, 24.0, 20.0, 25.0, 31.0, 28.0, 30.0, 31.0, 39.0, 29.0, 38.0, 41.0, 49.0, 44.0, 36.0, 51.0, 44.0, 40.0, 33.0, 32.0, 32.0, 29.0, 33.0, 30.0, 24.0, 14.0, 12.0, 19.0, 16.0, 16.0, 4.0, 8.0, 8.0, 6.0, 1.0, 9.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.835480690002441, -8.52309799194336, -8.210716247558594, -7.898333549499512, -7.585951328277588, -7.273569107055664, -6.96118688583374, -6.648804664611816, -6.336421966552734, -6.0240397453308105, -5.711657524108887, -5.399274826049805, -5.086892604827881, -4.774510383605957, -4.462128162384033, -4.149745941162109, -3.8373637199401855, -3.5249814987182617, -3.212599039077759, -2.900216817855835, -2.587834358215332, -2.275452136993408, -1.9630699157714844, -1.6506874561309814, -1.3383052349090576, -1.0259228944778442, -0.7135406136512756, -0.40115833282470703, -0.08877599239349365, 0.22360634803771973, 0.5359885692596436, 0.8483710289001465, 1.1607532501220703, 1.4731355905532837, 1.785517930984497, 2.097900152206421, 2.410282611846924, 2.7226648330688477, 3.0350470542907715, 3.3474295139312744, 3.6598117351531982, 3.972193956375122, 4.284576416015625, 4.596958637237549, 4.909340858459473, 5.221723556518555, 5.53410530090332, 5.846487998962402, 6.158870220184326, 6.47125244140625, 6.783634662628174, 7.096016883850098, 7.40839958190918, 7.7207818031311035, 8.033164024353027, 8.34554672241211, 8.657928466796875, 8.970311164855957, 9.282692909240723, 9.595075607299805, 9.90745735168457, 10.219840049743652, 10.532222747802734, 10.8446044921875, 11.156987190246582]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 4.0, 9.0, 10.0, 12.0, 19.0, 30.0, 45.0, 39.0, 92.0, 125.0, 183.0, 272.0, 409.0, 756.0, 1313.0, 2325.0, 4623.0, 9689.0, 21972.0, 53947.0, 141164.0, 331327.0, 287482.0, 113399.0, 43822.0, 18314.0, 8228.0, 3978.0, 2097.0, 1087.0, 654.0, 386.0, 241.0, 151.0, 122.0, 71.0, 40.0, 31.0, 20.0, 19.0, 16.0, 5.0, 11.0, 1.0, 3.0, 5.0, 0.0, 1.0, 5.0, 3.0, 1.0], "bins": [-4.1640625, -4.044708251953125, -3.92535400390625, -3.805999755859375, -3.6866455078125, -3.567291259765625, -3.44793701171875, -3.328582763671875, -3.209228515625, -3.089874267578125, -2.97052001953125, -2.851165771484375, -2.7318115234375, -2.612457275390625, -2.49310302734375, -2.373748779296875, -2.25439453125, -2.135040283203125, -2.01568603515625, -1.896331787109375, -1.7769775390625, -1.657623291015625, -1.53826904296875, -1.418914794921875, -1.299560546875, -1.180206298828125, -1.06085205078125, -0.941497802734375, -0.8221435546875, -0.702789306640625, -0.58343505859375, -0.464080810546875, -0.3447265625, -0.225372314453125, -0.10601806640625, 0.013336181640625, 0.1326904296875, 0.252044677734375, 0.37139892578125, 0.490753173828125, 0.610107421875, 0.729461669921875, 0.84881591796875, 0.968170166015625, 1.0875244140625, 1.206878662109375, 1.32623291015625, 1.445587158203125, 1.56494140625, 1.684295654296875, 1.80364990234375, 1.923004150390625, 2.0423583984375, 2.161712646484375, 2.28106689453125, 2.400421142578125, 2.519775390625, 2.639129638671875, 2.75848388671875, 2.877838134765625, 2.9971923828125, 3.116546630859375, 3.23590087890625, 3.355255126953125, 3.474609375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 5.0, 5.0, 9.0, 2.0, 4.0, 16.0, 20.0, 10.0, 13.0, 11.0, 15.0, 21.0, 33.0, 18.0, 28.0, 28.0, 38.0, 25.0, 49.0, 42.0, 54.0, 44.0, 43.0, 46.0, 45.0, 44.0, 29.0, 37.0, 24.0, 37.0, 19.0, 35.0, 18.0, 20.0, 17.0, 13.0, 13.0, 13.0, 14.0, 11.0, 6.0, 6.0, 11.0, 6.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.65625, -0.6365203857421875, -0.616790771484375, -0.5970611572265625, -0.57733154296875, -0.5576019287109375, -0.537872314453125, -0.5181427001953125, -0.4984130859375, -0.4786834716796875, -0.458953857421875, -0.4392242431640625, -0.41949462890625, -0.3997650146484375, -0.380035400390625, -0.3603057861328125, -0.340576171875, -0.3208465576171875, -0.301116943359375, -0.2813873291015625, -0.26165771484375, -0.2419281005859375, -0.222198486328125, -0.2024688720703125, -0.1827392578125, -0.1630096435546875, -0.143280029296875, -0.1235504150390625, -0.10382080078125, -0.0840911865234375, -0.064361572265625, -0.0446319580078125, -0.02490234375, -0.0051727294921875, 0.014556884765625, 0.0342864990234375, 0.05401611328125, 0.0737457275390625, 0.093475341796875, 0.1132049560546875, 0.1329345703125, 0.1526641845703125, 0.172393798828125, 0.1921234130859375, 0.21185302734375, 0.2315826416015625, 0.251312255859375, 0.2710418701171875, 0.290771484375, 0.3105010986328125, 0.330230712890625, 0.3499603271484375, 0.36968994140625, 0.3894195556640625, 0.409149169921875, 0.4288787841796875, 0.4486083984375, 0.4683380126953125, 0.488067626953125, 0.5077972412109375, 0.52752685546875, 0.5472564697265625, 0.566986083984375, 0.5867156982421875, 0.6064453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 2.0, 10.0, 7.0, 10.0, 14.0, 20.0, 23.0, 43.0, 58.0, 76.0, 125.0, 210.0, 316.0, 566.0, 1259.0, 3110.0, 10287.0, 42306.0, 215531.0, 564235.0, 163456.0, 33486.0, 8279.0, 2593.0, 1095.0, 554.0, 293.0, 220.0, 125.0, 76.0, 41.0, 36.0, 27.0, 11.0, 16.0, 10.0, 12.0, 8.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.55560302734375, -6.3533935546875, -6.15118408203125, -5.948974609375, -5.74676513671875, -5.5445556640625, -5.34234619140625, -5.14013671875, -4.93792724609375, -4.7357177734375, -4.53350830078125, -4.331298828125, -4.12908935546875, -3.9268798828125, -3.72467041015625, -3.5224609375, -3.32025146484375, -3.1180419921875, -2.91583251953125, -2.713623046875, -2.51141357421875, -2.3092041015625, -2.10699462890625, -1.90478515625, -1.70257568359375, -1.5003662109375, -1.29815673828125, -1.095947265625, -0.89373779296875, -0.6915283203125, -0.48931884765625, -0.287109375, -0.08489990234375, 0.1173095703125, 0.31951904296875, 0.521728515625, 0.72393798828125, 0.9261474609375, 1.12835693359375, 1.33056640625, 1.53277587890625, 1.7349853515625, 1.93719482421875, 2.139404296875, 2.34161376953125, 2.5438232421875, 2.74603271484375, 2.9482421875, 3.15045166015625, 3.3526611328125, 3.55487060546875, 3.757080078125, 3.95928955078125, 4.1614990234375, 4.36370849609375, 4.56591796875, 4.76812744140625, 4.9703369140625, 5.17254638671875, 5.374755859375, 5.57696533203125, 5.7791748046875, 5.98138427734375, 6.18359375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 1.0, 2.0, 3.0, 2.0, 7.0, 8.0, 6.0, 10.0, 13.0, 17.0, 21.0, 13.0, 19.0, 25.0, 20.0, 20.0, 25.0, 38.0, 38.0, 45.0, 36.0, 52.0, 44.0, 64.0, 39.0, 47.0, 46.0, 46.0, 44.0, 20.0, 30.0, 33.0, 25.0, 17.0, 16.0, 20.0, 21.0, 12.0, 7.0, 10.0, 9.0, 8.0, 6.0, 7.0, 2.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.908203125, -2.799468994140625, -2.69073486328125, -2.582000732421875, -2.4732666015625, -2.364532470703125, -2.25579833984375, -2.147064208984375, -2.038330078125, -1.929595947265625, -1.82086181640625, -1.712127685546875, -1.6033935546875, -1.494659423828125, -1.38592529296875, -1.277191162109375, -1.16845703125, -1.059722900390625, -0.95098876953125, -0.842254638671875, -0.7335205078125, -0.624786376953125, -0.51605224609375, -0.407318115234375, -0.298583984375, -0.189849853515625, -0.08111572265625, 0.027618408203125, 0.1363525390625, 0.245086669921875, 0.35382080078125, 0.462554931640625, 0.5712890625, 0.680023193359375, 0.78875732421875, 0.897491455078125, 1.0062255859375, 1.114959716796875, 1.22369384765625, 1.332427978515625, 1.441162109375, 1.549896240234375, 1.65863037109375, 1.767364501953125, 1.8760986328125, 1.984832763671875, 2.09356689453125, 2.202301025390625, 2.31103515625, 2.419769287109375, 2.52850341796875, 2.637237548828125, 2.7459716796875, 2.854705810546875, 2.96343994140625, 3.072174072265625, 3.180908203125, 3.289642333984375, 3.39837646484375, 3.507110595703125, 3.6158447265625, 3.724578857421875, 3.83331298828125, 3.942047119140625, 4.05078125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 7.0, 7.0, 4.0, 6.0, 8.0, 15.0, 13.0, 33.0, 44.0, 68.0, 83.0, 140.0, 243.0, 432.0, 881.0, 1812.0, 4287.0, 12327.0, 42072.0, 196247.0, 581157.0, 155854.0, 35144.0, 10551.0, 3746.0, 1555.0, 772.0, 400.0, 234.0, 137.0, 75.0, 66.0, 39.0, 28.0, 20.0, 19.0, 12.0, 2.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.517578125, -3.418304443359375, -3.31903076171875, -3.219757080078125, -3.1204833984375, -3.021209716796875, -2.92193603515625, -2.822662353515625, -2.723388671875, -2.624114990234375, -2.52484130859375, -2.425567626953125, -2.3262939453125, -2.227020263671875, -2.12774658203125, -2.028472900390625, -1.92919921875, -1.829925537109375, -1.73065185546875, -1.631378173828125, -1.5321044921875, -1.432830810546875, -1.33355712890625, -1.234283447265625, -1.135009765625, -1.035736083984375, -0.93646240234375, -0.837188720703125, -0.7379150390625, -0.638641357421875, -0.53936767578125, -0.440093994140625, -0.3408203125, -0.241546630859375, -0.14227294921875, -0.042999267578125, 0.0562744140625, 0.155548095703125, 0.25482177734375, 0.354095458984375, 0.453369140625, 0.552642822265625, 0.65191650390625, 0.751190185546875, 0.8504638671875, 0.949737548828125, 1.04901123046875, 1.148284912109375, 1.24755859375, 1.346832275390625, 1.44610595703125, 1.545379638671875, 1.6446533203125, 1.743927001953125, 1.84320068359375, 1.942474365234375, 2.041748046875, 2.141021728515625, 2.24029541015625, 2.339569091796875, 2.4388427734375, 2.538116455078125, 2.63739013671875, 2.736663818359375, 2.8359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 10.0, 10.0, 13.0, 8.0, 22.0, 27.0, 24.0, 63.0, 167.0, 259.0, 179.0, 60.0, 43.0, 26.0, 21.0, 15.0, 11.0, 7.0, 4.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005092620849609375, -0.0004892870783805847, -0.00046931207180023193, -0.00044933706521987915, -0.00042936205863952637, -0.0004093870520591736, -0.0003894120454788208, -0.000369437038898468, -0.00034946203231811523, -0.00032948702573776245, -0.00030951201915740967, -0.0002895370125770569, -0.0002695620059967041, -0.0002495869994163513, -0.00022961199283599854, -0.00020963698625564575, -0.00018966197967529297, -0.00016968697309494019, -0.0001497119665145874, -0.00012973695993423462, -0.00010976195335388184, -8.978694677352905e-05, -6.981194019317627e-05, -4.9836933612823486e-05, -2.9861927032470703e-05, -9.88692045211792e-06, 1.0088086128234863e-05, 3.0063092708587646e-05, 5.003809928894043e-05, 7.001310586929321e-05, 8.9988112449646e-05, 0.00010996311902999878, 0.00012993812561035156, 0.00014991313219070435, 0.00016988813877105713, 0.0001898631453514099, 0.0002098381519317627, 0.00022981315851211548, 0.00024978816509246826, 0.00026976317167282104, 0.00028973817825317383, 0.0003097131848335266, 0.0003296881914138794, 0.0003496631979942322, 0.00036963820457458496, 0.00038961321115493774, 0.00040958821773529053, 0.0004295632243156433, 0.0004495382308959961, 0.0004695132374763489, 0.0004894882440567017, 0.0005094632506370544, 0.0005294382572174072, 0.00054941326379776, 0.0005693882703781128, 0.0005893632769584656, 0.0006093382835388184, 0.0006293132901191711, 0.0006492882966995239, 0.0006692633032798767, 0.0006892383098602295, 0.0007092133164405823, 0.0007291883230209351, 0.0007491633296012878, 0.0007691383361816406]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 6.0, 5.0, 5.0, 14.0, 11.0, 24.0, 35.0, 42.0, 65.0, 93.0, 183.0, 350.0, 637.0, 1330.0, 3256.0, 9890.0, 34007.0, 188211.0, 663920.0, 110368.0, 24164.0, 7182.0, 2473.0, 1077.0, 486.0, 288.0, 159.0, 97.0, 54.0, 40.0, 26.0, 17.0, 18.0, 4.0, 12.0, 5.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.31976318359375, -4.1903076171875, -4.06085205078125, -3.931396484375, -3.80194091796875, -3.6724853515625, -3.54302978515625, -3.41357421875, -3.28411865234375, -3.1546630859375, -3.02520751953125, -2.895751953125, -2.76629638671875, -2.6368408203125, -2.50738525390625, -2.3779296875, -2.24847412109375, -2.1190185546875, -1.98956298828125, -1.860107421875, -1.73065185546875, -1.6011962890625, -1.47174072265625, -1.34228515625, -1.21282958984375, -1.0833740234375, -0.95391845703125, -0.824462890625, -0.69500732421875, -0.5655517578125, -0.43609619140625, -0.306640625, -0.17718505859375, -0.0477294921875, 0.08172607421875, 0.211181640625, 0.34063720703125, 0.4700927734375, 0.59954833984375, 0.72900390625, 0.85845947265625, 0.9879150390625, 1.11737060546875, 1.246826171875, 1.37628173828125, 1.5057373046875, 1.63519287109375, 1.7646484375, 1.89410400390625, 2.0235595703125, 2.15301513671875, 2.282470703125, 2.41192626953125, 2.5413818359375, 2.67083740234375, 2.80029296875, 2.92974853515625, 3.0592041015625, 3.18865966796875, 3.318115234375, 3.44757080078125, 3.5770263671875, 3.70648193359375, 3.8359375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 13.0, 3.0, 16.0, 18.0, 27.0, 44.0, 52.0, 79.0, 91.0, 144.0, 119.0, 129.0, 82.0, 62.0, 29.0, 19.0, 10.0, 9.0, 10.0, 9.0, 7.0, 7.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6640625, -2.583465576171875, -2.50286865234375, -2.422271728515625, -2.3416748046875, -2.261077880859375, -2.18048095703125, -2.099884033203125, -2.019287109375, -1.938690185546875, -1.85809326171875, -1.777496337890625, -1.6968994140625, -1.616302490234375, -1.53570556640625, -1.455108642578125, -1.37451171875, -1.293914794921875, -1.21331787109375, -1.132720947265625, -1.0521240234375, -0.971527099609375, -0.89093017578125, -0.810333251953125, -0.729736328125, -0.649139404296875, -0.56854248046875, -0.487945556640625, -0.4073486328125, -0.326751708984375, -0.24615478515625, -0.165557861328125, -0.0849609375, -0.004364013671875, 0.07623291015625, 0.156829833984375, 0.2374267578125, 0.318023681640625, 0.39862060546875, 0.479217529296875, 0.559814453125, 0.640411376953125, 0.72100830078125, 0.801605224609375, 0.8822021484375, 0.962799072265625, 1.04339599609375, 1.123992919921875, 1.20458984375, 1.285186767578125, 1.36578369140625, 1.446380615234375, 1.5269775390625, 1.607574462890625, 1.68817138671875, 1.768768310546875, 1.849365234375, 1.929962158203125, 2.01055908203125, 2.091156005859375, 2.1717529296875, 2.252349853515625, 2.33294677734375, 2.413543701171875, 2.494140625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 13.0, 12.0, 16.0, 38.0, 63.0, 97.0, 144.0, 146.0, 164.0, 135.0, 63.0, 52.0, 36.0, 11.0, 5.0, 5.0, 1.0, 0.0, 3.0], "bins": [-82.4835205078125, -80.91340637207031, -79.34329986572266, -77.77318572998047, -76.20307922363281, -74.63296508789062, -73.06285858154297, -71.49274444580078, -69.92263793945312, -68.35252380371094, -66.78241729736328, -65.2123031616211, -63.64219665527344, -62.07208251953125, -60.50197219848633, -58.931861877441406, -57.36174774169922, -55.7916374206543, -54.221527099609375, -52.65141677856445, -51.08130645751953, -49.511192321777344, -47.94108200073242, -46.3709716796875, -44.80086135864258, -43.230751037597656, -41.660640716552734, -40.09053039550781, -38.520416259765625, -36.9503059387207, -35.38019561767578, -33.81008529663086, -32.23997497558594, -30.669864654541016, -29.099754333496094, -27.52964210510254, -25.959531784057617, -24.389421463012695, -22.81930923461914, -21.24919891357422, -19.679088592529297, -18.108978271484375, -16.538867950439453, -14.968755722045898, -13.398645401000977, -11.828535079956055, -10.258423805236816, -8.688312530517578, -7.118202209472656, -5.548091411590576, -3.977980613708496, -2.407869815826416, -0.8377590179443359, 0.7323517799377441, 2.302462577819824, 3.8725738525390625, 5.442684173583984, 7.0127949714660645, 8.582905769348145, 10.153017044067383, 11.723127365112305, 13.293237686157227, 14.863348960876465, 16.433460235595703, 18.003570556640625]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 9.0, 4.0, 5.0, 12.0, 9.0, 11.0, 15.0, 11.0, 20.0, 30.0, 26.0, 34.0, 30.0, 35.0, 41.0, 33.0, 52.0, 35.0, 44.0, 36.0, 29.0, 45.0, 42.0, 36.0, 38.0, 33.0, 34.0, 38.0, 37.0, 20.0, 22.0, 19.0, 22.0, 14.0, 14.0, 10.0, 7.0, 5.0, 3.0, 6.0, 3.0, 6.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-17.517391204833984, -16.964078903198242, -16.4107666015625, -15.857453346252441, -15.304140090942383, -14.75082778930664, -14.197515487670898, -13.644203186035156, -13.090889930725098, -12.537577629089355, -11.984264373779297, -11.430952072143555, -10.877639770507812, -10.324326515197754, -9.771014213562012, -9.217700958251953, -8.664388656616211, -8.111076354980469, -7.55776309967041, -7.004450798034668, -6.451138019561768, -5.897825241088867, -5.344512939453125, -4.791200160980225, -4.237887382507324, -3.684574604034424, -3.1312620639801025, -2.5779495239257812, -2.024636745452881, -1.4713239669799805, -0.9180114269256592, -0.3646988868713379, 0.1886119842529297, 0.7419246435165405, 1.2952373027801514, 1.8485499620437622, 2.401862621307373, 2.9551753997802734, 3.5084879398345947, 4.061800479888916, 4.615113258361816, 5.168426036834717, 5.721738815307617, 6.275051116943359, 6.82836389541626, 7.38167667388916, 7.934988975524902, 8.488302230834961, 9.041614532470703, 9.594926834106445, 10.148240089416504, 10.701552391052246, 11.254865646362305, 11.808177947998047, 12.361490249633789, 12.914802551269531, 13.46811580657959, 14.021428108215332, 14.57474136352539, 15.128053665161133, 15.681365966796875, 16.23468017578125, 16.787992477416992, 17.341304779052734, 17.894617080688477]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 5.0, 2.0, 2.0, 4.0, 6.0, 12.0, 11.0, 12.0, 21.0, 21.0, 21.0, 43.0, 52.0, 87.0, 151.0, 228.0, 416.0, 822.0, 1481.0, 2920.0, 6003.0, 13597.0, 37989.0, 170444.0, 3155423.0, 678016.0, 83474.0, 24134.0, 9736.0, 4388.0, 2267.0, 1100.0, 614.0, 337.0, 202.0, 100.0, 57.0, 37.0, 25.0, 13.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-6.5859375, -6.424468994140625, -6.26300048828125, -6.101531982421875, -5.9400634765625, -5.778594970703125, -5.61712646484375, -5.455657958984375, -5.294189453125, -5.132720947265625, -4.97125244140625, -4.809783935546875, -4.6483154296875, -4.486846923828125, -4.32537841796875, -4.163909912109375, -4.00244140625, -3.840972900390625, -3.67950439453125, -3.518035888671875, -3.3565673828125, -3.195098876953125, -3.03363037109375, -2.872161865234375, -2.710693359375, -2.549224853515625, -2.38775634765625, -2.226287841796875, -2.0648193359375, -1.903350830078125, -1.74188232421875, -1.580413818359375, -1.4189453125, -1.257476806640625, -1.09600830078125, -0.934539794921875, -0.7730712890625, -0.611602783203125, -0.45013427734375, -0.288665771484375, -0.127197265625, 0.034271240234375, 0.19573974609375, 0.357208251953125, 0.5186767578125, 0.680145263671875, 0.84161376953125, 1.003082275390625, 1.16455078125, 1.326019287109375, 1.48748779296875, 1.648956298828125, 1.8104248046875, 1.971893310546875, 2.13336181640625, 2.294830322265625, 2.456298828125, 2.617767333984375, 2.77923583984375, 2.940704345703125, 3.1021728515625, 3.263641357421875, 3.42510986328125, 3.586578369140625, 3.748046875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 0.0, 5.0, 9.0, 7.0, 10.0, 13.0, 16.0, 19.0, 23.0, 30.0, 21.0, 39.0, 49.0, 31.0, 49.0, 41.0, 57.0, 43.0, 40.0, 46.0, 47.0, 46.0, 38.0, 52.0, 39.0, 32.0, 26.0, 26.0, 30.0, 17.0, 23.0, 12.0, 15.0, 6.0, 10.0, 8.0, 7.0, 9.0, 2.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0], "bins": [-0.93994140625, -0.9151153564453125, -0.890289306640625, -0.8654632568359375, -0.84063720703125, -0.8158111572265625, -0.790985107421875, -0.7661590576171875, -0.7413330078125, -0.7165069580078125, -0.691680908203125, -0.6668548583984375, -0.64202880859375, -0.6172027587890625, -0.592376708984375, -0.5675506591796875, -0.542724609375, -0.5178985595703125, -0.493072509765625, -0.4682464599609375, -0.44342041015625, -0.4185943603515625, -0.393768310546875, -0.3689422607421875, -0.3441162109375, -0.3192901611328125, -0.294464111328125, -0.2696380615234375, -0.24481201171875, -0.2199859619140625, -0.195159912109375, -0.1703338623046875, -0.1455078125, -0.1206817626953125, -0.095855712890625, -0.0710296630859375, -0.04620361328125, -0.0213775634765625, 0.003448486328125, 0.0282745361328125, 0.0531005859375, 0.0779266357421875, 0.102752685546875, 0.1275787353515625, 0.15240478515625, 0.1772308349609375, 0.202056884765625, 0.2268829345703125, 0.251708984375, 0.2765350341796875, 0.301361083984375, 0.3261871337890625, 0.35101318359375, 0.3758392333984375, 0.400665283203125, 0.4254913330078125, 0.4503173828125, 0.4751434326171875, 0.499969482421875, 0.5247955322265625, 0.54962158203125, 0.5744476318359375, 0.599273681640625, 0.6240997314453125, 0.64892578125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 6.0, 12.0, 11.0, 14.0, 36.0, 55.0, 95.0, 217.0, 489.0, 1315.0, 3749.0, 12229.0, 53719.0, 507310.0, 3393720.0, 180856.0, 28828.0, 7728.0, 2358.0, 862.0, 341.0, 140.0, 73.0, 49.0, 26.0, 13.0, 16.0, 5.0, 9.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.65625, -6.3824462890625, -6.108642578125, -5.8348388671875, -5.56103515625, -5.2872314453125, -5.013427734375, -4.7396240234375, -4.4658203125, -4.1920166015625, -3.918212890625, -3.6444091796875, -3.37060546875, -3.0968017578125, -2.822998046875, -2.5491943359375, -2.275390625, -2.0015869140625, -1.727783203125, -1.4539794921875, -1.18017578125, -0.9063720703125, -0.632568359375, -0.3587646484375, -0.0849609375, 0.1888427734375, 0.462646484375, 0.7364501953125, 1.01025390625, 1.2840576171875, 1.557861328125, 1.8316650390625, 2.10546875, 2.3792724609375, 2.653076171875, 2.9268798828125, 3.20068359375, 3.4744873046875, 3.748291015625, 4.0220947265625, 4.2958984375, 4.5697021484375, 4.843505859375, 5.1173095703125, 5.39111328125, 5.6649169921875, 5.938720703125, 6.2125244140625, 6.486328125, 6.7601318359375, 7.033935546875, 7.3077392578125, 7.58154296875, 7.8553466796875, 8.129150390625, 8.4029541015625, 8.6767578125, 8.9505615234375, 9.224365234375, 9.4981689453125, 9.77197265625, 10.0457763671875, 10.319580078125, 10.5933837890625, 10.8671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 6.0, 7.0, 7.0, 11.0, 19.0, 24.0, 22.0, 32.0, 48.0, 69.0, 107.0, 151.0, 267.0, 482.0, 1150.0, 774.0, 324.0, 193.0, 102.0, 81.0, 51.0, 39.0, 25.0, 16.0, 19.0, 7.0, 9.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.426177978515625, -2.35430908203125, -2.282440185546875, -2.2105712890625, -2.138702392578125, -2.06683349609375, -1.994964599609375, -1.923095703125, -1.851226806640625, -1.77935791015625, -1.707489013671875, -1.6356201171875, -1.563751220703125, -1.49188232421875, -1.420013427734375, -1.34814453125, -1.276275634765625, -1.20440673828125, -1.132537841796875, -1.0606689453125, -0.988800048828125, -0.91693115234375, -0.845062255859375, -0.773193359375, -0.701324462890625, -0.62945556640625, -0.557586669921875, -0.4857177734375, -0.413848876953125, -0.34197998046875, -0.270111083984375, -0.1982421875, -0.126373291015625, -0.05450439453125, 0.017364501953125, 0.0892333984375, 0.161102294921875, 0.23297119140625, 0.304840087890625, 0.376708984375, 0.448577880859375, 0.52044677734375, 0.592315673828125, 0.6641845703125, 0.736053466796875, 0.80792236328125, 0.879791259765625, 0.95166015625, 1.023529052734375, 1.09539794921875, 1.167266845703125, 1.2391357421875, 1.311004638671875, 1.38287353515625, 1.454742431640625, 1.526611328125, 1.598480224609375, 1.67034912109375, 1.742218017578125, 1.8140869140625, 1.885955810546875, 1.95782470703125, 2.029693603515625, 2.1015625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 5.0, 9.0, 17.0, 16.0, 27.0, 33.0, 65.0, 90.0, 100.0, 119.0, 118.0, 114.0, 101.0, 61.0, 46.0, 33.0, 18.0, 7.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.462539672851562, -13.897770881652832, -13.333002090454102, -12.768233299255371, -12.20346450805664, -11.63869571685791, -11.07392692565918, -10.509159088134766, -9.944389343261719, -9.379620552062988, -8.814851760864258, -8.250082969665527, -7.685314178466797, -7.120545387268066, -6.555777072906494, -5.991008281707764, -5.426239967346191, -4.861471176147461, -4.2967023849487305, -3.731933832168579, -3.1671650409698486, -2.602396249771118, -2.037627696990967, -1.4728589057922363, -0.9080901145935059, -0.34332138299942017, 0.22144734859466553, 0.7862160205841064, 1.350984811782837, 1.9157536029815674, 2.4805221557617188, 3.045290946960449, 3.6100597381591797, 4.17482852935791, 4.739597320556641, 5.304366111755371, 5.869134902954102, 6.433903694152832, 6.998672008514404, 7.563440799713135, 8.128210067749023, 8.692978858947754, 9.257747650146484, 9.822516441345215, 10.387285232543945, 10.952054023742676, 11.516822814941406, 12.08159065246582, 12.64635944366455, 13.211128234863281, 13.775897026062012, 14.340665817260742, 14.905434608459473, 15.470203399658203, 16.034971237182617, 16.599740982055664, 17.164508819580078, 17.729276657104492, 18.29404640197754, 18.858814239501953, 19.423583984375, 19.988351821899414, 20.55312156677246, 21.117889404296875, 21.682659149169922]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 7.0, 9.0, 7.0, 11.0, 11.0, 9.0, 18.0, 18.0, 16.0, 18.0, 21.0, 26.0, 30.0, 35.0, 35.0, 50.0, 41.0, 31.0, 31.0, 27.0, 45.0, 36.0, 31.0, 34.0, 39.0, 35.0, 31.0, 32.0, 20.0, 38.0, 26.0, 30.0, 22.0, 25.0, 20.0, 14.0, 11.0, 7.0, 10.0, 7.0, 8.0, 5.0, 7.0, 4.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-8.524248123168945, -8.264900207519531, -8.0055513381958, -7.7462029457092285, -7.486854553222656, -7.227506160736084, -6.968157768249512, -6.708809852600098, -6.449460983276367, -6.190112590789795, -5.930764198303223, -5.67141580581665, -5.412067413330078, -5.152719020843506, -4.893370628356934, -4.6340227127075195, -4.374674320220947, -4.115325927734375, -3.8559775352478027, -3.5966291427612305, -3.337280750274658, -3.077932357788086, -2.8185842037200928, -2.5592358112335205, -2.2998874187469482, -2.040539026260376, -1.7811906337738037, -1.521842360496521, -1.2624939680099487, -1.0031455755233765, -0.7437973022460938, -0.4844489097595215, -0.22510051727294922, 0.03424784541130066, 0.29359620809555054, 0.552944540977478, 0.8122929334640503, 1.0716413259506226, 1.3309895992279053, 1.5903379917144775, 1.8496863842010498, 2.109034776687622, 2.3683831691741943, 2.6277313232421875, 2.8870797157287598, 3.146428108215332, 3.4057765007019043, 3.6651248931884766, 3.924473285675049, 4.183821678161621, 4.443170070648193, 4.702518463134766, 4.961866855621338, 5.22121524810791, 5.480563163757324, 5.739912033081055, 5.999259948730469, 6.258608341217041, 6.517956733703613, 6.7773051261901855, 7.036653518676758, 7.29600191116333, 7.555350303649902, 7.814698219299316, 8.074047088623047]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 6.0, 12.0, 12.0, 11.0, 23.0, 30.0, 28.0, 57.0, 99.0, 175.0, 278.0, 481.0, 831.0, 1511.0, 2842.0, 5904.0, 11860.0, 25250.0, 56953.0, 135944.0, 281688.0, 281691.0, 136610.0, 57225.0, 24809.0, 11858.0, 5753.0, 2972.0, 1527.0, 868.0, 471.0, 278.0, 181.0, 113.0, 76.0, 43.0, 31.0, 22.0, 13.0, 9.0, 6.0, 1.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.423828125, -3.31683349609375, -3.2098388671875, -3.10284423828125, -2.995849609375, -2.88885498046875, -2.7818603515625, -2.67486572265625, -2.56787109375, -2.46087646484375, -2.3538818359375, -2.24688720703125, -2.139892578125, -2.03289794921875, -1.9259033203125, -1.81890869140625, -1.7119140625, -1.60491943359375, -1.4979248046875, -1.39093017578125, -1.283935546875, -1.17694091796875, -1.0699462890625, -0.96295166015625, -0.85595703125, -0.74896240234375, -0.6419677734375, -0.53497314453125, -0.427978515625, -0.32098388671875, -0.2139892578125, -0.10699462890625, 0.0, 0.10699462890625, 0.2139892578125, 0.32098388671875, 0.427978515625, 0.53497314453125, 0.6419677734375, 0.74896240234375, 0.85595703125, 0.96295166015625, 1.0699462890625, 1.17694091796875, 1.283935546875, 1.39093017578125, 1.4979248046875, 1.60491943359375, 1.7119140625, 1.81890869140625, 1.9259033203125, 2.03289794921875, 2.139892578125, 2.24688720703125, 2.3538818359375, 2.46087646484375, 2.56787109375, 2.67486572265625, 2.7818603515625, 2.88885498046875, 2.995849609375, 3.10284423828125, 3.2098388671875, 3.31683349609375, 3.423828125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 14.0, 11.0, 10.0, 11.0, 6.0, 19.0, 11.0, 20.0, 20.0, 27.0, 34.0, 33.0, 42.0, 40.0, 46.0, 47.0, 54.0, 42.0, 39.0, 41.0, 45.0, 35.0, 44.0, 33.0, 36.0, 38.0, 30.0, 34.0, 14.0, 13.0, 14.0, 16.0, 15.0, 18.0, 7.0, 7.0, 9.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.9755859375, -0.9499053955078125, -0.924224853515625, -0.8985443115234375, -0.87286376953125, -0.8471832275390625, -0.821502685546875, -0.7958221435546875, -0.7701416015625, -0.7444610595703125, -0.718780517578125, -0.6930999755859375, -0.66741943359375, -0.6417388916015625, -0.616058349609375, -0.5903778076171875, -0.564697265625, -0.5390167236328125, -0.513336181640625, -0.4876556396484375, -0.46197509765625, -0.4362945556640625, -0.410614013671875, -0.3849334716796875, -0.3592529296875, -0.3335723876953125, -0.307891845703125, -0.2822113037109375, -0.25653076171875, -0.2308502197265625, -0.205169677734375, -0.1794891357421875, -0.15380859375, -0.1281280517578125, -0.102447509765625, -0.0767669677734375, -0.05108642578125, -0.0254058837890625, 0.000274658203125, 0.0259552001953125, 0.0516357421875, 0.0773162841796875, 0.102996826171875, 0.1286773681640625, 0.15435791015625, 0.1800384521484375, 0.205718994140625, 0.2313995361328125, 0.257080078125, 0.2827606201171875, 0.308441162109375, 0.3341217041015625, 0.35980224609375, 0.3854827880859375, 0.411163330078125, 0.4368438720703125, 0.4625244140625, 0.4882049560546875, 0.513885498046875, 0.5395660400390625, 0.56524658203125, 0.5909271240234375, 0.616607666015625, 0.6422882080078125, 0.66796875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 4.0, 9.0, 14.0, 13.0, 28.0, 45.0, 37.0, 54.0, 103.0, 181.0, 380.0, 806.0, 1906.0, 5597.0, 17524.0, 63735.0, 257805.0, 485297.0, 157264.0, 39778.0, 11549.0, 3705.0, 1417.0, 576.0, 264.0, 155.0, 98.0, 53.0, 40.0, 30.0, 23.0, 21.0, 9.0, 7.0, 6.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.265625, -5.09197998046875, -4.9183349609375, -4.74468994140625, -4.571044921875, -4.39739990234375, -4.2237548828125, -4.05010986328125, -3.87646484375, -3.70281982421875, -3.5291748046875, -3.35552978515625, -3.181884765625, -3.00823974609375, -2.8345947265625, -2.66094970703125, -2.4873046875, -2.31365966796875, -2.1400146484375, -1.96636962890625, -1.792724609375, -1.61907958984375, -1.4454345703125, -1.27178955078125, -1.09814453125, -0.92449951171875, -0.7508544921875, -0.57720947265625, -0.403564453125, -0.22991943359375, -0.0562744140625, 0.11737060546875, 0.291015625, 0.46466064453125, 0.6383056640625, 0.81195068359375, 0.985595703125, 1.15924072265625, 1.3328857421875, 1.50653076171875, 1.68017578125, 1.85382080078125, 2.0274658203125, 2.20111083984375, 2.374755859375, 2.54840087890625, 2.7220458984375, 2.89569091796875, 3.0693359375, 3.24298095703125, 3.4166259765625, 3.59027099609375, 3.763916015625, 3.93756103515625, 4.1112060546875, 4.28485107421875, 4.45849609375, 4.63214111328125, 4.8057861328125, 4.97943115234375, 5.153076171875, 5.32672119140625, 5.5003662109375, 5.67401123046875, 5.84765625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 5.0, 13.0, 11.0, 8.0, 10.0, 21.0, 17.0, 20.0, 19.0, 19.0, 27.0, 32.0, 25.0, 48.0, 35.0, 50.0, 45.0, 35.0, 49.0, 62.0, 52.0, 46.0, 49.0, 47.0, 33.0, 33.0, 35.0, 24.0, 22.0, 14.0, 11.0, 15.0, 15.0, 11.0, 7.0, 5.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.51171875, -4.384796142578125, -4.25787353515625, -4.130950927734375, -4.0040283203125, -3.877105712890625, -3.75018310546875, -3.623260498046875, -3.496337890625, -3.369415283203125, -3.24249267578125, -3.115570068359375, -2.9886474609375, -2.861724853515625, -2.73480224609375, -2.607879638671875, -2.48095703125, -2.354034423828125, -2.22711181640625, -2.100189208984375, -1.9732666015625, -1.846343994140625, -1.71942138671875, -1.592498779296875, -1.465576171875, -1.338653564453125, -1.21173095703125, -1.084808349609375, -0.9578857421875, -0.830963134765625, -0.70404052734375, -0.577117919921875, -0.4501953125, -0.323272705078125, -0.19635009765625, -0.069427490234375, 0.0574951171875, 0.184417724609375, 0.31134033203125, 0.438262939453125, 0.565185546875, 0.692108154296875, 0.81903076171875, 0.945953369140625, 1.0728759765625, 1.199798583984375, 1.32672119140625, 1.453643798828125, 1.58056640625, 1.707489013671875, 1.83441162109375, 1.961334228515625, 2.0882568359375, 2.215179443359375, 2.34210205078125, 2.469024658203125, 2.595947265625, 2.722869873046875, 2.84979248046875, 2.976715087890625, 3.1036376953125, 3.230560302734375, 3.35748291015625, 3.484405517578125, 3.611328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 4.0, 5.0, 7.0, 13.0, 15.0, 19.0, 20.0, 48.0, 69.0, 95.0, 146.0, 307.0, 509.0, 1007.0, 2188.0, 5253.0, 12856.0, 35409.0, 114803.0, 417417.0, 326533.0, 85189.0, 27952.0, 10706.0, 4228.0, 1831.0, 871.0, 418.0, 223.0, 115.0, 92.0, 53.0, 49.0, 34.0, 19.0, 14.0, 13.0, 9.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.974609375, -1.910675048828125, -1.84674072265625, -1.782806396484375, -1.7188720703125, -1.654937744140625, -1.59100341796875, -1.527069091796875, -1.463134765625, -1.399200439453125, -1.33526611328125, -1.271331787109375, -1.2073974609375, -1.143463134765625, -1.07952880859375, -1.015594482421875, -0.95166015625, -0.887725830078125, -0.82379150390625, -0.759857177734375, -0.6959228515625, -0.631988525390625, -0.56805419921875, -0.504119873046875, -0.440185546875, -0.376251220703125, -0.31231689453125, -0.248382568359375, -0.1844482421875, -0.120513916015625, -0.05657958984375, 0.007354736328125, 0.0712890625, 0.135223388671875, 0.19915771484375, 0.263092041015625, 0.3270263671875, 0.390960693359375, 0.45489501953125, 0.518829345703125, 0.582763671875, 0.646697998046875, 0.71063232421875, 0.774566650390625, 0.8385009765625, 0.902435302734375, 0.96636962890625, 1.030303955078125, 1.09423828125, 1.158172607421875, 1.22210693359375, 1.286041259765625, 1.3499755859375, 1.413909912109375, 1.47784423828125, 1.541778564453125, 1.605712890625, 1.669647216796875, 1.73358154296875, 1.797515869140625, 1.8614501953125, 1.925384521484375, 1.98931884765625, 2.053253173828125, 2.1171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 6.0, 3.0, 1.0, 8.0, 4.0, 8.0, 7.0, 17.0, 22.0, 30.0, 58.0, 134.0, 299.0, 191.0, 80.0, 43.0, 25.0, 17.0, 12.0, 9.0, 6.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007677078247070312, -0.0007467716932296753, -0.0007258355617523193, -0.0007048994302749634, -0.0006839632987976074, -0.0006630271673202515, -0.0006420910358428955, -0.0006211549043655396, -0.0006002187728881836, -0.0005792826414108276, -0.0005583465099334717, -0.0005374103784561157, -0.0005164742469787598, -0.0004955381155014038, -0.00047460198402404785, -0.0004536658525466919, -0.00043272972106933594, -0.00041179358959198, -0.000390857458114624, -0.00036992132663726807, -0.0003489851951599121, -0.00032804906368255615, -0.0003071129322052002, -0.00028617680072784424, -0.0002652406692504883, -0.0002443045377731323, -0.00022336840629577637, -0.0002024322748184204, -0.00018149614334106445, -0.0001605600118637085, -0.00013962388038635254, -0.00011868774890899658, -9.775161743164062e-05, -7.681548595428467e-05, -5.587935447692871e-05, -3.4943222999572754e-05, -1.4007091522216797e-05, 6.92903995513916e-06, 2.7865171432495117e-05, 4.8801302909851074e-05, 6.973743438720703e-05, 9.067356586456299e-05, 0.00011160969734191895, 0.0001325458288192749, 0.00015348196029663086, 0.00017441809177398682, 0.00019535422325134277, 0.00021629035472869873, 0.0002372264862060547, 0.00025816261768341064, 0.0002790987491607666, 0.00030003488063812256, 0.0003209710121154785, 0.00034190714359283447, 0.00036284327507019043, 0.0003837794065475464, 0.00040471553802490234, 0.0004256516695022583, 0.00044658780097961426, 0.0004675239324569702, 0.0004884600639343262, 0.0005093961954116821, 0.0005303323268890381, 0.000551268458366394, 0.00057220458984375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 7.0, 9.0, 29.0, 21.0, 30.0, 42.0, 61.0, 114.0, 155.0, 259.0, 445.0, 773.0, 1716.0, 4004.0, 11217.0, 32954.0, 115929.0, 482032.0, 296849.0, 67843.0, 21086.0, 7316.0, 2837.0, 1256.0, 614.0, 330.0, 212.0, 127.0, 96.0, 59.0, 38.0, 30.0, 16.0, 13.0, 9.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.501953125, -2.43206787109375, -2.3621826171875, -2.29229736328125, -2.222412109375, -2.15252685546875, -2.0826416015625, -2.01275634765625, -1.94287109375, -1.87298583984375, -1.8031005859375, -1.73321533203125, -1.663330078125, -1.59344482421875, -1.5235595703125, -1.45367431640625, -1.3837890625, -1.31390380859375, -1.2440185546875, -1.17413330078125, -1.104248046875, -1.03436279296875, -0.9644775390625, -0.89459228515625, -0.82470703125, -0.75482177734375, -0.6849365234375, -0.61505126953125, -0.545166015625, -0.47528076171875, -0.4053955078125, -0.33551025390625, -0.265625, -0.19573974609375, -0.1258544921875, -0.05596923828125, 0.013916015625, 0.08380126953125, 0.1536865234375, 0.22357177734375, 0.29345703125, 0.36334228515625, 0.4332275390625, 0.50311279296875, 0.572998046875, 0.64288330078125, 0.7127685546875, 0.78265380859375, 0.8525390625, 0.92242431640625, 0.9923095703125, 1.06219482421875, 1.132080078125, 1.20196533203125, 1.2718505859375, 1.34173583984375, 1.41162109375, 1.48150634765625, 1.5513916015625, 1.62127685546875, 1.691162109375, 1.76104736328125, 1.8309326171875, 1.90081787109375, 1.970703125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 1.0, 3.0, 10.0, 6.0, 13.0, 18.0, 10.0, 20.0, 30.0, 25.0, 38.0, 56.0, 52.0, 95.0, 93.0, 108.0, 90.0, 72.0, 65.0, 46.0, 35.0, 24.0, 18.0, 12.0, 9.0, 9.0, 6.0, 6.0, 8.0, 8.0, 10.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8994140625, -1.8451080322265625, -1.790802001953125, -1.7364959716796875, -1.68218994140625, -1.6278839111328125, -1.573577880859375, -1.5192718505859375, -1.4649658203125, -1.4106597900390625, -1.356353759765625, -1.3020477294921875, -1.24774169921875, -1.1934356689453125, -1.139129638671875, -1.0848236083984375, -1.030517578125, -0.9762115478515625, -0.921905517578125, -0.8675994873046875, -0.81329345703125, -0.7589874267578125, -0.704681396484375, -0.6503753662109375, -0.5960693359375, -0.5417633056640625, -0.487457275390625, -0.4331512451171875, -0.37884521484375, -0.3245391845703125, -0.270233154296875, -0.2159271240234375, -0.16162109375, -0.1073150634765625, -0.053009033203125, 0.0012969970703125, 0.05560302734375, 0.1099090576171875, 0.164215087890625, 0.2185211181640625, 0.2728271484375, 0.3271331787109375, 0.381439208984375, 0.4357452392578125, 0.49005126953125, 0.5443572998046875, 0.598663330078125, 0.6529693603515625, 0.707275390625, 0.7615814208984375, 0.815887451171875, 0.8701934814453125, 0.92449951171875, 0.9788055419921875, 1.033111572265625, 1.0874176025390625, 1.1417236328125, 1.1960296630859375, 1.250335693359375, 1.3046417236328125, 1.35894775390625, 1.4132537841796875, 1.467559814453125, 1.5218658447265625, 1.576171875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 5.0, 16.0, 44.0, 47.0, 83.0, 123.0, 162.0, 143.0, 130.0, 100.0, 63.0, 30.0, 25.0, 14.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-56.93492889404297, -55.58319091796875, -54.23145294189453, -52.87971496582031, -51.527976989746094, -50.176239013671875, -48.824501037597656, -47.47275924682617, -46.12102127075195, -44.769283294677734, -43.417545318603516, -42.0658073425293, -40.71406936645508, -39.362327575683594, -38.010589599609375, -36.658851623535156, -35.30711364746094, -33.95537567138672, -32.6036376953125, -31.25189971923828, -29.90015983581543, -28.54842185974121, -27.196683883666992, -25.84494400024414, -24.493209838867188, -23.14147186279297, -21.78973388671875, -20.43799591064453, -19.08625602722168, -17.73451805114746, -16.382780075073242, -15.031041145324707, -13.679300308227539, -12.32756233215332, -10.975823402404785, -9.624085426330566, -8.272346496582031, -6.9206085205078125, -5.568870544433594, -4.217131614685059, -2.86539363861084, -1.5136553049087524, -0.16191697120666504, 1.1898212432861328, 2.5415596961975098, 3.8932981491088867, 5.2450361251831055, 6.596775054931641, 7.948513031005859, 9.300251007080078, 10.651989936828613, 12.003727912902832, 13.355466842651367, 14.707204818725586, 16.058942794799805, 17.410682678222656, 18.762420654296875, 20.114158630371094, 21.465896606445312, 22.81763458251953, 24.169374465942383, 25.5211124420166, 26.87285041809082, 28.224590301513672, 29.576326370239258]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 3.0, 2.0, 7.0, 7.0, 7.0, 8.0, 17.0, 20.0, 14.0, 11.0, 19.0, 11.0, 14.0, 24.0, 26.0, 19.0, 27.0, 41.0, 39.0, 31.0, 41.0, 43.0, 41.0, 26.0, 50.0, 47.0, 38.0, 34.0, 38.0, 33.0, 31.0, 23.0, 33.0, 11.0, 14.0, 30.0, 24.0, 17.0, 13.0, 11.0, 15.0, 6.0, 10.0, 5.0, 4.0, 3.0, 7.0, 3.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-15.0833158493042, -14.593104362487793, -14.102892875671387, -13.61268138885498, -13.122468948364258, -12.632257461547852, -12.142045974731445, -11.651834487915039, -11.161623001098633, -10.671411514282227, -10.18120002746582, -9.690988540649414, -9.200777053833008, -8.710565567016602, -8.220353126525879, -7.730141639709473, -7.239930152893066, -6.74971866607666, -6.259507179260254, -5.7692952156066895, -5.279083728790283, -4.788872241973877, -4.2986602783203125, -3.8084487915039062, -3.3182373046875, -2.8280258178710938, -2.3378140926361084, -1.8476024866104126, -1.3573908805847168, -0.8671793937683105, -0.3769676685333252, 0.11324405670166016, 0.6034564971923828, 1.0936681032180786, 1.5838797092437744, 2.0740914344787598, 2.564302921295166, 3.0545144081115723, 3.5447261333465576, 4.034937858581543, 4.525149345397949, 5.0153608322143555, 5.505572319030762, 5.995784282684326, 6.485995769500732, 6.976207256317139, 7.466419219970703, 7.956630706787109, 8.446842193603516, 8.937053680419922, 9.427265167236328, 9.917476654052734, 10.40768814086914, 10.897899627685547, 11.38811206817627, 11.878323554992676, 12.368535041809082, 12.858746528625488, 13.348958015441895, 13.8391695022583, 14.329381942749023, 14.81959342956543, 15.309804916381836, 15.800016403198242, 16.29022789001465]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 11.0, 5.0, 12.0, 8.0, 7.0, 19.0, 22.0, 48.0, 76.0, 90.0, 125.0, 203.0, 311.0, 527.0, 780.0, 1246.0, 2225.0, 4159.0, 8403.0, 22399.0, 88874.0, 3385975.0, 588255.0, 58204.0, 16955.0, 7157.0, 3438.0, 1906.0, 1041.0, 623.0, 412.0, 250.0, 177.0, 114.0, 72.0, 47.0, 46.0, 13.0, 19.0, 7.0, 5.0, 7.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.8203125, -8.5810546875, -8.341796875, -8.1025390625, -7.86328125, -7.6240234375, -7.384765625, -7.1455078125, -6.90625, -6.6669921875, -6.427734375, -6.1884765625, -5.94921875, -5.7099609375, -5.470703125, -5.2314453125, -4.9921875, -4.7529296875, -4.513671875, -4.2744140625, -4.03515625, -3.7958984375, -3.556640625, -3.3173828125, -3.078125, -2.8388671875, -2.599609375, -2.3603515625, -2.12109375, -1.8818359375, -1.642578125, -1.4033203125, -1.1640625, -0.9248046875, -0.685546875, -0.4462890625, -0.20703125, 0.0322265625, 0.271484375, 0.5107421875, 0.75, 0.9892578125, 1.228515625, 1.4677734375, 1.70703125, 1.9462890625, 2.185546875, 2.4248046875, 2.6640625, 2.9033203125, 3.142578125, 3.3818359375, 3.62109375, 3.8603515625, 4.099609375, 4.3388671875, 4.578125, 4.8173828125, 5.056640625, 5.2958984375, 5.53515625, 5.7744140625, 6.013671875, 6.2529296875, 6.4921875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 6.0, 10.0, 10.0, 11.0, 13.0, 15.0, 19.0, 12.0, 21.0, 26.0, 29.0, 33.0, 29.0, 34.0, 36.0, 42.0, 41.0, 50.0, 47.0, 52.0, 50.0, 43.0, 47.0, 42.0, 26.0, 27.0, 25.0, 29.0, 32.0, 20.0, 25.0, 16.0, 15.0, 14.0, 11.0, 10.0, 8.0, 5.0, 3.0, 5.0, 8.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.9892578125, -0.9626388549804688, -0.9360198974609375, -0.9094009399414062, -0.882781982421875, -0.8561630249023438, -0.8295440673828125, -0.8029251098632812, -0.77630615234375, -0.7496871948242188, -0.7230682373046875, -0.6964492797851562, -0.669830322265625, -0.6432113647460938, -0.6165924072265625, -0.5899734497070312, -0.5633544921875, -0.5367355346679688, -0.5101165771484375, -0.48349761962890625, -0.456878662109375, -0.43025970458984375, -0.4036407470703125, -0.37702178955078125, -0.35040283203125, -0.32378387451171875, -0.2971649169921875, -0.27054595947265625, -0.243927001953125, -0.21730804443359375, -0.1906890869140625, -0.16407012939453125, -0.137451171875, -0.11083221435546875, -0.0842132568359375, -0.05759429931640625, -0.030975341796875, -0.00435638427734375, 0.0222625732421875, 0.04888153076171875, 0.07550048828125, 0.10211944580078125, 0.1287384033203125, 0.15535736083984375, 0.181976318359375, 0.20859527587890625, 0.2352142333984375, 0.26183319091796875, 0.2884521484375, 0.31507110595703125, 0.3416900634765625, 0.36830902099609375, 0.394927978515625, 0.42154693603515625, 0.4481658935546875, 0.47478485107421875, 0.50140380859375, 0.5280227661132812, 0.5546417236328125, 0.5812606811523438, 0.607879638671875, 0.6344985961914062, 0.6611175537109375, 0.6877365112304688, 0.71435546875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 10.0, 7.0, 9.0, 20.0, 33.0, 50.0, 91.0, 130.0, 186.0, 319.0, 492.0, 795.0, 1516.0, 2780.0, 5584.0, 12080.0, 29563.0, 81433.0, 353829.0, 3291667.0, 291132.0, 73004.0, 27156.0, 11255.0, 5199.0, 2560.0, 1369.0, 787.0, 431.0, 286.0, 166.0, 108.0, 79.0, 46.0, 31.0, 23.0, 20.0, 10.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-5.859375, -5.694091796875, -5.52880859375, -5.363525390625, -5.1982421875, -5.032958984375, -4.86767578125, -4.702392578125, -4.537109375, -4.371826171875, -4.20654296875, -4.041259765625, -3.8759765625, -3.710693359375, -3.54541015625, -3.380126953125, -3.21484375, -3.049560546875, -2.88427734375, -2.718994140625, -2.5537109375, -2.388427734375, -2.22314453125, -2.057861328125, -1.892578125, -1.727294921875, -1.56201171875, -1.396728515625, -1.2314453125, -1.066162109375, -0.90087890625, -0.735595703125, -0.5703125, -0.405029296875, -0.23974609375, -0.074462890625, 0.0908203125, 0.256103515625, 0.42138671875, 0.586669921875, 0.751953125, 0.917236328125, 1.08251953125, 1.247802734375, 1.4130859375, 1.578369140625, 1.74365234375, 1.908935546875, 2.07421875, 2.239501953125, 2.40478515625, 2.570068359375, 2.7353515625, 2.900634765625, 3.06591796875, 3.231201171875, 3.396484375, 3.561767578125, 3.72705078125, 3.892333984375, 4.0576171875, 4.222900390625, 4.38818359375, 4.553466796875, 4.71875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 3.0, 11.0, 6.0, 8.0, 12.0, 13.0, 16.0, 25.0, 31.0, 28.0, 39.0, 68.0, 89.0, 160.0, 288.0, 891.0, 1506.0, 322.0, 154.0, 106.0, 76.0, 59.0, 35.0, 28.0, 23.0, 13.0, 12.0, 9.0, 6.0, 9.0, 9.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7734375, -1.7125244140625, -1.651611328125, -1.5906982421875, -1.52978515625, -1.4688720703125, -1.407958984375, -1.3470458984375, -1.2861328125, -1.2252197265625, -1.164306640625, -1.1033935546875, -1.04248046875, -0.9815673828125, -0.920654296875, -0.8597412109375, -0.798828125, -0.7379150390625, -0.677001953125, -0.6160888671875, -0.55517578125, -0.4942626953125, -0.433349609375, -0.3724365234375, -0.3115234375, -0.2506103515625, -0.189697265625, -0.1287841796875, -0.06787109375, -0.0069580078125, 0.053955078125, 0.1148681640625, 0.17578125, 0.2366943359375, 0.297607421875, 0.3585205078125, 0.41943359375, 0.4803466796875, 0.541259765625, 0.6021728515625, 0.6630859375, 0.7239990234375, 0.784912109375, 0.8458251953125, 0.90673828125, 0.9676513671875, 1.028564453125, 1.0894775390625, 1.150390625, 1.2113037109375, 1.272216796875, 1.3331298828125, 1.39404296875, 1.4549560546875, 1.515869140625, 1.5767822265625, 1.6376953125, 1.6986083984375, 1.759521484375, 1.8204345703125, 1.88134765625, 1.9422607421875, 2.003173828125, 2.0640869140625, 2.125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 10.0, 18.0, 40.0, 112.0, 220.0, 270.0, 188.0, 88.0, 41.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.471782684326172, -19.633644104003906, -18.795507431030273, -17.957368850708008, -17.119232177734375, -16.28109359741211, -15.442956924438477, -14.604818344116211, -13.766681671142578, -12.928544044494629, -12.09040641784668, -11.25226879119873, -10.414131164550781, -9.575992584228516, -8.737855911254883, -7.899717807769775, -7.061579704284668, -6.223442077636719, -5.3853044509887695, -4.54716682434082, -3.709028959274292, -2.8708910942077637, -2.0327534675598145, -1.1946158409118652, -0.356478214263916, 0.481659471988678, 1.319797158241272, 2.1579349040985107, 2.99607253074646, 3.8342103958129883, 4.6723480224609375, 5.510485649108887, 6.348623275756836, 7.186760902404785, 8.024898529052734, 8.863036155700684, 9.701173782348633, 10.539312362670898, 11.377449035644531, 12.215587615966797, 13.05372428894043, 13.891861915588379, 14.729999542236328, 15.568137168884277, 16.406274795532227, 17.244413375854492, 18.082550048828125, 18.92068862915039, 19.758827209472656, 20.596965789794922, 21.435102462768555, 22.27324104309082, 23.111377716064453, 23.94951629638672, 24.78765296936035, 25.625791549682617, 26.46392822265625, 27.302066802978516, 28.14020347595215, 28.978342056274414, 29.816478729248047, 30.654617309570312, 31.492753982543945, 32.33089065551758, 33.169029235839844]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 6.0, 8.0, 13.0, 13.0, 7.0, 27.0, 19.0, 23.0, 22.0, 20.0, 42.0, 16.0, 36.0, 42.0, 47.0, 23.0, 63.0, 42.0, 50.0, 42.0, 37.0, 44.0, 38.0, 42.0, 43.0, 30.0, 28.0, 22.0, 29.0, 20.0, 15.0, 16.0, 15.0, 5.0, 11.0, 11.0, 6.0, 5.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.043807506561279, -5.846083641052246, -5.648359775543213, -5.4506354331970215, -5.252911567687988, -5.055187702178955, -4.857463836669922, -4.6597394943237305, -4.462015628814697, -4.264291763305664, -4.066567897796631, -3.8688437938690186, -3.6711196899414062, -3.473395824432373, -3.27567195892334, -3.0779478549957275, -2.8802239894866943, -2.682500123977661, -2.484776020050049, -2.2870521545410156, -2.0893280506134033, -1.8916041851043701, -1.6938802003860474, -1.4961562156677246, -1.2984322309494019, -1.100708246231079, -0.9029842615127563, -0.7052603363990784, -0.5075363516807556, -0.30981236696243286, -0.11208844184875488, 0.08563554286956787, 0.2833595275878906, 0.4810835123062134, 0.6788074970245361, 0.8765314221382141, 1.0742554664611816, 1.2719793319702148, 1.4697033166885376, 1.6674273014068604, 1.865151286125183, 2.062875270843506, 2.260599136352539, 2.4583232402801514, 2.6560471057891846, 2.853771209716797, 3.05149507522583, 3.2492189407348633, 3.4469430446624756, 3.644666910171509, 3.842391014099121, 4.040114879608154, 4.2378387451171875, 4.435563087463379, 4.633286952972412, 4.831010818481445, 5.0287346839904785, 5.226458549499512, 5.424182415008545, 5.621906757354736, 5.8196306228637695, 6.017354488372803, 6.215078353881836, 6.412802696228027, 6.6105265617370605]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 4.0, 12.0, 8.0, 16.0, 28.0, 26.0, 39.0, 63.0, 78.0, 102.0, 140.0, 212.0, 325.0, 521.0, 892.0, 1517.0, 2593.0, 4513.0, 8580.0, 17152.0, 36239.0, 80347.0, 179032.0, 315048.0, 216163.0, 97421.0, 43918.0, 20539.0, 10172.0, 5399.0, 2959.0, 1620.0, 1072.0, 602.0, 384.0, 243.0, 168.0, 120.0, 75.0, 67.0, 43.0, 31.0, 27.0, 9.0, 9.0, 6.0, 5.0, 2.0, 5.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.578125, -4.433349609375, -4.28857421875, -4.143798828125, -3.9990234375, -3.854248046875, -3.70947265625, -3.564697265625, -3.419921875, -3.275146484375, -3.13037109375, -2.985595703125, -2.8408203125, -2.696044921875, -2.55126953125, -2.406494140625, -2.26171875, -2.116943359375, -1.97216796875, -1.827392578125, -1.6826171875, -1.537841796875, -1.39306640625, -1.248291015625, -1.103515625, -0.958740234375, -0.81396484375, -0.669189453125, -0.5244140625, -0.379638671875, -0.23486328125, -0.090087890625, 0.0546875, 0.199462890625, 0.34423828125, 0.489013671875, 0.6337890625, 0.778564453125, 0.92333984375, 1.068115234375, 1.212890625, 1.357666015625, 1.50244140625, 1.647216796875, 1.7919921875, 1.936767578125, 2.08154296875, 2.226318359375, 2.37109375, 2.515869140625, 2.66064453125, 2.805419921875, 2.9501953125, 3.094970703125, 3.23974609375, 3.384521484375, 3.529296875, 3.674072265625, 3.81884765625, 3.963623046875, 4.1083984375, 4.253173828125, 4.39794921875, 4.542724609375, 4.6875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 9.0, 12.0, 14.0, 10.0, 12.0, 19.0, 14.0, 27.0, 24.0, 18.0, 34.0, 38.0, 31.0, 45.0, 43.0, 49.0, 46.0, 44.0, 45.0, 50.0, 35.0, 34.0, 36.0, 37.0, 32.0, 30.0, 28.0, 27.0, 32.0, 15.0, 17.0, 10.0, 15.0, 12.0, 6.0, 13.0, 6.0, 3.0, 7.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.95751953125, -0.9309234619140625, -0.904327392578125, -0.8777313232421875, -0.85113525390625, -0.8245391845703125, -0.797943115234375, -0.7713470458984375, -0.7447509765625, -0.7181549072265625, -0.691558837890625, -0.6649627685546875, -0.63836669921875, -0.6117706298828125, -0.585174560546875, -0.5585784912109375, -0.531982421875, -0.5053863525390625, -0.478790283203125, -0.4521942138671875, -0.42559814453125, -0.3990020751953125, -0.372406005859375, -0.3458099365234375, -0.3192138671875, -0.2926177978515625, -0.266021728515625, -0.2394256591796875, -0.21282958984375, -0.1862335205078125, -0.159637451171875, -0.1330413818359375, -0.1064453125, -0.0798492431640625, -0.053253173828125, -0.0266571044921875, -6.103515625e-05, 0.0265350341796875, 0.053131103515625, 0.0797271728515625, 0.1063232421875, 0.1329193115234375, 0.159515380859375, 0.1861114501953125, 0.21270751953125, 0.2393035888671875, 0.265899658203125, 0.2924957275390625, 0.319091796875, 0.3456878662109375, 0.372283935546875, 0.3988800048828125, 0.42547607421875, 0.4520721435546875, 0.478668212890625, 0.5052642822265625, 0.5318603515625, 0.5584564208984375, 0.585052490234375, 0.6116485595703125, 0.63824462890625, 0.6648406982421875, 0.691436767578125, 0.7180328369140625, 0.74462890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 9.0, 11.0, 17.0, 25.0, 34.0, 51.0, 83.0, 156.0, 222.0, 452.0, 974.0, 3029.0, 11818.0, 61242.0, 338395.0, 498514.0, 106772.0, 19705.0, 4408.0, 1324.0, 593.0, 281.0, 150.0, 92.0, 58.0, 49.0, 30.0, 10.0, 15.0, 16.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.73046875, -7.504150390625, -7.27783203125, -7.051513671875, -6.8251953125, -6.598876953125, -6.37255859375, -6.146240234375, -5.919921875, -5.693603515625, -5.46728515625, -5.240966796875, -5.0146484375, -4.788330078125, -4.56201171875, -4.335693359375, -4.109375, -3.883056640625, -3.65673828125, -3.430419921875, -3.2041015625, -2.977783203125, -2.75146484375, -2.525146484375, -2.298828125, -2.072509765625, -1.84619140625, -1.619873046875, -1.3935546875, -1.167236328125, -0.94091796875, -0.714599609375, -0.48828125, -0.261962890625, -0.03564453125, 0.190673828125, 0.4169921875, 0.643310546875, 0.86962890625, 1.095947265625, 1.322265625, 1.548583984375, 1.77490234375, 2.001220703125, 2.2275390625, 2.453857421875, 2.68017578125, 2.906494140625, 3.1328125, 3.359130859375, 3.58544921875, 3.811767578125, 4.0380859375, 4.264404296875, 4.49072265625, 4.717041015625, 4.943359375, 5.169677734375, 5.39599609375, 5.622314453125, 5.8486328125, 6.074951171875, 6.30126953125, 6.527587890625, 6.75390625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 9.0, 4.0, 11.0, 12.0, 12.0, 9.0, 14.0, 9.0, 27.0, 29.0, 42.0, 44.0, 39.0, 43.0, 50.0, 36.0, 40.0, 50.0, 53.0, 45.0, 45.0, 45.0, 34.0, 35.0, 47.0, 33.0, 26.0, 23.0, 25.0, 25.0, 20.0, 16.0, 14.0, 9.0, 7.0, 8.0, 3.0, 6.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.1015625, -4.95599365234375, -4.8104248046875, -4.66485595703125, -4.519287109375, -4.37371826171875, -4.2281494140625, -4.08258056640625, -3.93701171875, -3.79144287109375, -3.6458740234375, -3.50030517578125, -3.354736328125, -3.20916748046875, -3.0635986328125, -2.91802978515625, -2.7724609375, -2.62689208984375, -2.4813232421875, -2.33575439453125, -2.190185546875, -2.04461669921875, -1.8990478515625, -1.75347900390625, -1.60791015625, -1.46234130859375, -1.3167724609375, -1.17120361328125, -1.025634765625, -0.88006591796875, -0.7344970703125, -0.58892822265625, -0.443359375, -0.29779052734375, -0.1522216796875, -0.00665283203125, 0.138916015625, 0.28448486328125, 0.4300537109375, 0.57562255859375, 0.72119140625, 0.86676025390625, 1.0123291015625, 1.15789794921875, 1.303466796875, 1.44903564453125, 1.5946044921875, 1.74017333984375, 1.8857421875, 2.03131103515625, 2.1768798828125, 2.32244873046875, 2.468017578125, 2.61358642578125, 2.7591552734375, 2.90472412109375, 3.05029296875, 3.19586181640625, 3.3414306640625, 3.48699951171875, 3.632568359375, 3.77813720703125, 3.9237060546875, 4.06927490234375, 4.21484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 5.0, 12.0, 7.0, 11.0, 19.0, 27.0, 46.0, 70.0, 115.0, 234.0, 599.0, 1273.0, 3047.0, 8803.0, 30007.0, 121299.0, 485366.0, 300243.0, 69718.0, 17996.0, 5802.0, 2071.0, 865.0, 413.0, 226.0, 109.0, 52.0, 34.0, 22.0, 18.0, 9.0, 7.0, 12.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326171875, -3.21820068359375, -3.1102294921875, -3.00225830078125, -2.894287109375, -2.78631591796875, -2.6783447265625, -2.57037353515625, -2.46240234375, -2.35443115234375, -2.2464599609375, -2.13848876953125, -2.030517578125, -1.92254638671875, -1.8145751953125, -1.70660400390625, -1.5986328125, -1.49066162109375, -1.3826904296875, -1.27471923828125, -1.166748046875, -1.05877685546875, -0.9508056640625, -0.84283447265625, -0.73486328125, -0.62689208984375, -0.5189208984375, -0.41094970703125, -0.302978515625, -0.19500732421875, -0.0870361328125, 0.02093505859375, 0.12890625, 0.23687744140625, 0.3448486328125, 0.45281982421875, 0.560791015625, 0.66876220703125, 0.7767333984375, 0.88470458984375, 0.99267578125, 1.10064697265625, 1.2086181640625, 1.31658935546875, 1.424560546875, 1.53253173828125, 1.6405029296875, 1.74847412109375, 1.8564453125, 1.96441650390625, 2.0723876953125, 2.18035888671875, 2.288330078125, 2.39630126953125, 2.5042724609375, 2.61224365234375, 2.72021484375, 2.82818603515625, 2.9361572265625, 3.04412841796875, 3.152099609375, 3.26007080078125, 3.3680419921875, 3.47601318359375, 3.583984375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 12.0, 17.0, 11.0, 21.0, 24.0, 30.0, 25.0, 56.0, 37.0, 61.0, 79.0, 130.0, 131.0, 86.0, 60.0, 50.0, 29.0, 30.0, 26.0, 17.0, 18.0, 5.0, 7.0, 7.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004696846008300781, -0.0004558674991130829, -0.00044205039739608765, -0.0004282332956790924, -0.00041441619396209717, -0.00040059909224510193, -0.0003867819905281067, -0.00037296488881111145, -0.0003591477870941162, -0.00034533068537712097, -0.00033151358366012573, -0.0003176964819431305, -0.00030387938022613525, -0.00029006227850914, -0.0002762451767921448, -0.00026242807507514954, -0.0002486109733581543, -0.00023479387164115906, -0.00022097676992416382, -0.00020715966820716858, -0.00019334256649017334, -0.0001795254647731781, -0.00016570836305618286, -0.00015189126133918762, -0.00013807415962219238, -0.00012425705790519714, -0.0001104399561882019, -9.662285447120667e-05, -8.280575275421143e-05, -6.898865103721619e-05, -5.517154932022095e-05, -4.135444760322571e-05, -2.753734588623047e-05, -1.372024416923523e-05, 9.685754776000977e-08, 1.3913959264755249e-05, 2.7731060981750488e-05, 4.154816269874573e-05, 5.536526441574097e-05, 6.91823661327362e-05, 8.299946784973145e-05, 9.681656956672668e-05, 0.00011063367128372192, 0.00012445077300071716, 0.0001382678747177124, 0.00015208497643470764, 0.00016590207815170288, 0.00017971917986869812, 0.00019353628158569336, 0.0002073533833026886, 0.00022117048501968384, 0.00023498758673667908, 0.0002488046884536743, 0.00026262179017066956, 0.0002764388918876648, 0.00029025599360466003, 0.0003040730953216553, 0.0003178901970386505, 0.00033170729875564575, 0.000345524400472641, 0.00035934150218963623, 0.00037315860390663147, 0.0003869757056236267, 0.00040079280734062195, 0.0004146099090576172]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 1.0, 9.0, 7.0, 12.0, 21.0, 30.0, 54.0, 72.0, 120.0, 164.0, 248.0, 413.0, 775.0, 1547.0, 3523.0, 9247.0, 30542.0, 122326.0, 484019.0, 297583.0, 68180.0, 18259.0, 6054.0, 2528.0, 1235.0, 590.0, 380.0, 212.0, 131.0, 86.0, 48.0, 49.0, 22.0, 19.0, 15.0, 6.0, 10.0, 2.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.82421875, -3.703948974609375, -3.58367919921875, -3.463409423828125, -3.3431396484375, -3.222869873046875, -3.10260009765625, -2.982330322265625, -2.862060546875, -2.741790771484375, -2.62152099609375, -2.501251220703125, -2.3809814453125, -2.260711669921875, -2.14044189453125, -2.020172119140625, -1.89990234375, -1.779632568359375, -1.65936279296875, -1.539093017578125, -1.4188232421875, -1.298553466796875, -1.17828369140625, -1.058013916015625, -0.937744140625, -0.817474365234375, -0.69720458984375, -0.576934814453125, -0.4566650390625, -0.336395263671875, -0.21612548828125, -0.095855712890625, 0.0244140625, 0.144683837890625, 0.26495361328125, 0.385223388671875, 0.5054931640625, 0.625762939453125, 0.74603271484375, 0.866302490234375, 0.986572265625, 1.106842041015625, 1.22711181640625, 1.347381591796875, 1.4676513671875, 1.587921142578125, 1.70819091796875, 1.828460693359375, 1.94873046875, 2.069000244140625, 2.18927001953125, 2.309539794921875, 2.4298095703125, 2.550079345703125, 2.67034912109375, 2.790618896484375, 2.910888671875, 3.031158447265625, 3.15142822265625, 3.271697998046875, 3.3919677734375, 3.512237548828125, 3.63250732421875, 3.752777099609375, 3.873046875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 2.0, 13.0, 17.0, 14.0, 20.0, 26.0, 27.0, 30.0, 57.0, 58.0, 76.0, 96.0, 86.0, 88.0, 78.0, 67.0, 46.0, 43.0, 29.0, 29.0, 28.0, 18.0, 6.0, 7.0, 9.0, 7.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.677734375, -3.5751953125, -3.47265625, -3.3701171875, -3.267578125, -3.1650390625, -3.0625, -2.9599609375, -2.857421875, -2.7548828125, -2.65234375, -2.5498046875, -2.447265625, -2.3447265625, -2.2421875, -2.1396484375, -2.037109375, -1.9345703125, -1.83203125, -1.7294921875, -1.626953125, -1.5244140625, -1.421875, -1.3193359375, -1.216796875, -1.1142578125, -1.01171875, -0.9091796875, -0.806640625, -0.7041015625, -0.6015625, -0.4990234375, -0.396484375, -0.2939453125, -0.19140625, -0.0888671875, 0.013671875, 0.1162109375, 0.21875, 0.3212890625, 0.423828125, 0.5263671875, 0.62890625, 0.7314453125, 0.833984375, 0.9365234375, 1.0390625, 1.1416015625, 1.244140625, 1.3466796875, 1.44921875, 1.5517578125, 1.654296875, 1.7568359375, 1.859375, 1.9619140625, 2.064453125, 2.1669921875, 2.26953125, 2.3720703125, 2.474609375, 2.5771484375, 2.6796875, 2.7822265625, 2.884765625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 13.0, 16.0, 30.0, 61.0, 94.0, 141.0, 180.0, 158.0, 127.0, 83.0, 42.0, 21.0, 18.0, 13.0, 5.0, 6.0, 1.0], "bins": [-101.78441619873047, -99.88369750976562, -97.98297119140625, -96.0822525024414, -94.18152618408203, -92.28080749511719, -90.38008117675781, -88.47936248779297, -86.5786361694336, -84.67791748046875, -82.77719116210938, -80.87647247314453, -78.97574615478516, -77.07502746582031, -75.17430114746094, -73.2735824584961, -71.37286376953125, -69.4721450805664, -67.57141876220703, -65.67070007324219, -63.76997375488281, -61.8692512512207, -59.968528747558594, -58.06781005859375, -56.167083740234375, -54.266361236572266, -52.365638732910156, -50.46491622924805, -48.56419372558594, -46.66347122192383, -44.76274871826172, -42.862030029296875, -40.961299896240234, -39.060577392578125, -37.159854888916016, -35.259132385253906, -33.3584098815918, -31.457687377929688, -29.55696678161621, -27.6562442779541, -25.755521774291992, -23.854799270629883, -21.954076766967773, -20.053356170654297, -18.152633666992188, -16.251911163330078, -14.351188659667969, -12.45046615600586, -10.54974365234375, -8.64902114868164, -6.7482991218566895, -4.847577095031738, -2.946854591369629, -1.0461320877075195, 0.8545894622802734, 2.755311965942383, 4.656034469604492, 6.556756973266602, 8.457479476928711, 10.358201026916504, 12.258923530578613, 14.159646034240723, 16.060367584228516, 17.961090087890625, 19.861812591552734]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 9.0, 11.0, 8.0, 7.0, 8.0, 20.0, 18.0, 19.0, 25.0, 32.0, 43.0, 34.0, 40.0, 44.0, 48.0, 35.0, 38.0, 60.0, 43.0, 66.0, 36.0, 49.0, 43.0, 40.0, 34.0, 32.0, 28.0, 26.0, 18.0, 21.0, 18.0, 11.0, 14.0, 3.0, 6.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.79796600341797, -26.89493751525879, -25.991907119750977, -25.088878631591797, -24.185850143432617, -23.282819747924805, -22.379791259765625, -21.476760864257812, -20.573732376098633, -19.670703887939453, -18.76767349243164, -17.86464500427246, -16.96161651611328, -16.05858612060547, -15.155557632446289, -14.252528190612793, -13.349499702453613, -12.446470260620117, -11.543441772460938, -10.640412330627441, -9.737382888793945, -8.834354400634766, -7.9313249588012695, -7.028295516967773, -6.1252665519714355, -5.222237586975098, -4.319208145141602, -3.4161791801452637, -2.5131499767303467, -1.6101207733154297, -0.7070918083190918, 0.1959376335144043, 1.0989665985107422, 2.001995801925659, 2.905025005340576, 3.808053970336914, 4.71108341217041, 5.614112377166748, 6.517141342163086, 7.420170783996582, 8.323200225830078, 9.226229667663574, 10.129258155822754, 11.03228759765625, 11.935317039489746, 12.838346481323242, 13.741374969482422, 14.644404411315918, 15.547432899475098, 16.450462341308594, 17.353490829467773, 18.256519317626953, 19.159549713134766, 20.062578201293945, 20.965606689453125, 21.868637084960938, 22.771665573120117, 23.674694061279297, 24.57772445678711, 25.48075294494629, 26.38378143310547, 27.28681182861328, 28.18984031677246, 29.09286880493164, 29.995899200439453]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 5.0, 5.0, 9.0, 17.0, 22.0, 28.0, 30.0, 61.0, 101.0, 136.0, 217.0, 297.0, 526.0, 832.0, 1620.0, 3177.0, 6836.0, 16970.0, 50837.0, 209373.0, 2746136.0, 968984.0, 127942.0, 36125.0, 12895.0, 5432.0, 2535.0, 1326.0, 718.0, 427.0, 287.0, 119.0, 112.0, 50.0, 36.0, 23.0, 11.0, 11.0, 8.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.296875, -8.07763671875, -7.8583984375, -7.63916015625, -7.419921875, -7.20068359375, -6.9814453125, -6.76220703125, -6.54296875, -6.32373046875, -6.1044921875, -5.88525390625, -5.666015625, -5.44677734375, -5.2275390625, -5.00830078125, -4.7890625, -4.56982421875, -4.3505859375, -4.13134765625, -3.912109375, -3.69287109375, -3.4736328125, -3.25439453125, -3.03515625, -2.81591796875, -2.5966796875, -2.37744140625, -2.158203125, -1.93896484375, -1.7197265625, -1.50048828125, -1.28125, -1.06201171875, -0.8427734375, -0.62353515625, -0.404296875, -0.18505859375, 0.0341796875, 0.25341796875, 0.47265625, 0.69189453125, 0.9111328125, 1.13037109375, 1.349609375, 1.56884765625, 1.7880859375, 2.00732421875, 2.2265625, 2.44580078125, 2.6650390625, 2.88427734375, 3.103515625, 3.32275390625, 3.5419921875, 3.76123046875, 3.98046875, 4.19970703125, 4.4189453125, 4.63818359375, 4.857421875, 5.07666015625, 5.2958984375, 5.51513671875, 5.734375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 10.0, 10.0, 8.0, 17.0, 32.0, 24.0, 35.0, 22.0, 44.0, 37.0, 76.0, 55.0, 51.0, 44.0, 62.0, 63.0, 57.0, 42.0, 57.0, 37.0, 38.0, 25.0, 35.0, 21.0, 20.0, 20.0, 15.0, 14.0, 3.0, 7.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.607421875, -1.56658935546875, -1.5257568359375, -1.48492431640625, -1.444091796875, -1.40325927734375, -1.3624267578125, -1.32159423828125, -1.28076171875, -1.23992919921875, -1.1990966796875, -1.15826416015625, -1.117431640625, -1.07659912109375, -1.0357666015625, -0.99493408203125, -0.9541015625, -0.91326904296875, -0.8724365234375, -0.83160400390625, -0.790771484375, -0.74993896484375, -0.7091064453125, -0.66827392578125, -0.62744140625, -0.58660888671875, -0.5457763671875, -0.50494384765625, -0.464111328125, -0.42327880859375, -0.3824462890625, -0.34161376953125, -0.30078125, -0.25994873046875, -0.2191162109375, -0.17828369140625, -0.137451171875, -0.09661865234375, -0.0557861328125, -0.01495361328125, 0.02587890625, 0.06671142578125, 0.1075439453125, 0.14837646484375, 0.189208984375, 0.23004150390625, 0.2708740234375, 0.31170654296875, 0.3525390625, 0.39337158203125, 0.4342041015625, 0.47503662109375, 0.515869140625, 0.55670166015625, 0.5975341796875, 0.63836669921875, 0.67919921875, 0.72003173828125, 0.7608642578125, 0.80169677734375, 0.842529296875, 0.88336181640625, 0.9241943359375, 0.96502685546875, 1.005859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 6.0, 12.0, 6.0, 24.0, 38.0, 61.0, 123.0, 185.0, 436.0, 869.0, 2018.0, 4922.0, 13539.0, 44638.0, 199302.0, 2233195.0, 1477225.0, 160278.0, 37823.0, 11914.0, 4261.0, 1774.0, 782.0, 395.0, 204.0, 107.0, 46.0, 33.0, 20.0, 18.0, 6.0, 5.0, 3.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.73046875, -6.49786376953125, -6.2652587890625, -6.03265380859375, -5.800048828125, -5.56744384765625, -5.3348388671875, -5.10223388671875, -4.86962890625, -4.63702392578125, -4.4044189453125, -4.17181396484375, -3.939208984375, -3.70660400390625, -3.4739990234375, -3.24139404296875, -3.0087890625, -2.77618408203125, -2.5435791015625, -2.31097412109375, -2.078369140625, -1.84576416015625, -1.6131591796875, -1.38055419921875, -1.14794921875, -0.91534423828125, -0.6827392578125, -0.45013427734375, -0.217529296875, 0.01507568359375, 0.2476806640625, 0.48028564453125, 0.712890625, 0.94549560546875, 1.1781005859375, 1.41070556640625, 1.643310546875, 1.87591552734375, 2.1085205078125, 2.34112548828125, 2.57373046875, 2.80633544921875, 3.0389404296875, 3.27154541015625, 3.504150390625, 3.73675537109375, 3.9693603515625, 4.20196533203125, 4.4345703125, 4.66717529296875, 4.8997802734375, 5.13238525390625, 5.364990234375, 5.59759521484375, 5.8302001953125, 6.06280517578125, 6.29541015625, 6.52801513671875, 6.7606201171875, 6.99322509765625, 7.225830078125, 7.45843505859375, 7.6910400390625, 7.92364501953125, 8.15625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 2.0, 1.0, 4.0, 3.0, 7.0, 7.0, 12.0, 21.0, 14.0, 38.0, 42.0, 53.0, 83.0, 131.0, 204.0, 396.0, 810.0, 987.0, 504.0, 245.0, 168.0, 103.0, 59.0, 56.0, 41.0, 26.0, 12.0, 15.0, 7.0, 7.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.455078125, -3.336517333984375, -3.21795654296875, -3.099395751953125, -2.9808349609375, -2.862274169921875, -2.74371337890625, -2.625152587890625, -2.506591796875, -2.388031005859375, -2.26947021484375, -2.150909423828125, -2.0323486328125, -1.913787841796875, -1.79522705078125, -1.676666259765625, -1.55810546875, -1.439544677734375, -1.32098388671875, -1.202423095703125, -1.0838623046875, -0.965301513671875, -0.84674072265625, -0.728179931640625, -0.609619140625, -0.491058349609375, -0.37249755859375, -0.253936767578125, -0.1353759765625, -0.016815185546875, 0.10174560546875, 0.220306396484375, 0.3388671875, 0.457427978515625, 0.57598876953125, 0.694549560546875, 0.8131103515625, 0.931671142578125, 1.05023193359375, 1.168792724609375, 1.287353515625, 1.405914306640625, 1.52447509765625, 1.643035888671875, 1.7615966796875, 1.880157470703125, 1.99871826171875, 2.117279052734375, 2.23583984375, 2.354400634765625, 2.47296142578125, 2.591522216796875, 2.7100830078125, 2.828643798828125, 2.94720458984375, 3.065765380859375, 3.184326171875, 3.302886962890625, 3.42144775390625, 3.540008544921875, 3.6585693359375, 3.777130126953125, 3.89569091796875, 4.014251708984375, 4.1328125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 34.0, 79.0, 159.0, 248.0, 213.0, 146.0, 60.0, 22.0, 19.0, 10.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.01478958129883, -57.13423156738281, -55.25366973876953, -53.373111724853516, -51.4925537109375, -49.611995697021484, -47.73143768310547, -45.85087585449219, -43.97031784057617, -42.089759826660156, -40.209197998046875, -38.32863998413086, -36.448081970214844, -34.56752395629883, -32.68696594238281, -30.80640411376953, -28.925846099853516, -27.0452880859375, -25.16472816467285, -23.284168243408203, -21.403610229492188, -19.523052215576172, -17.642492294311523, -15.761933326721191, -13.88137435913086, -12.000815391540527, -10.120256423950195, -8.239697456359863, -6.359138488769531, -4.478579521179199, -2.598020553588867, -0.7174615859985352, 1.1631011962890625, 3.0436601638793945, 4.924219131469727, 6.804778099060059, 8.68533706665039, 10.565896034240723, 12.446455001831055, 14.327013969421387, 16.20757293701172, 18.088130950927734, 19.968690872192383, 21.84925079345703, 23.729808807373047, 25.610366821289062, 27.49092674255371, 29.37148666381836, 31.252044677734375, 33.13260269165039, 35.013160705566406, 36.89372253417969, 38.7742805480957, 40.65483856201172, 42.535400390625, 44.415958404541016, 46.29651641845703, 48.17707443237305, 50.05763244628906, 51.938194274902344, 53.81875228881836, 55.699310302734375, 57.579872131347656, 59.46043014526367, 61.34098815917969]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 5.0, 3.0, 11.0, 5.0, 13.0, 11.0, 17.0, 8.0, 11.0, 13.0, 17.0, 29.0, 19.0, 13.0, 31.0, 27.0, 23.0, 36.0, 30.0, 49.0, 36.0, 23.0, 29.0, 35.0, 28.0, 27.0, 32.0, 39.0, 38.0, 35.0, 28.0, 34.0, 30.0, 27.0, 23.0, 29.0, 17.0, 21.0, 24.0, 15.0, 9.0, 10.0, 5.0, 8.0, 5.0, 7.0, 7.0, 3.0, 2.0, 6.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.17978572845459, -14.717570304870605, -14.255355834960938, -13.793140411376953, -13.330924987792969, -12.868709564208984, -12.406495094299316, -11.944279670715332, -11.482065200805664, -11.01984977722168, -10.557635307312012, -10.095419883728027, -9.633204460144043, -9.170989990234375, -8.70877456665039, -8.246559143066406, -7.784343719482422, -7.322128772735596, -6.859913349151611, -6.397698402404785, -5.935482978820801, -5.473268032073975, -5.011053085327148, -4.548837661743164, -4.086622714996338, -3.6244075298309326, -3.1621923446655273, -2.699977397918701, -2.237762212753296, -1.7755470275878906, -1.3133320808410645, -0.8511168956756592, -0.3889026641845703, 0.07331246137619019, 0.5355275869369507, 0.9977426528930664, 1.4599578380584717, 1.922173023223877, 2.384387969970703, 2.8466031551361084, 3.3088183403015137, 3.771033525466919, 4.233248710632324, 4.69546365737915, 5.157678604125977, 5.619894027709961, 6.082108974456787, 6.544323921203613, 7.006539344787598, 7.468754291534424, 7.930969715118408, 8.393184661865234, 8.855400085449219, 9.317615509033203, 9.779829978942871, 10.242045402526855, 10.704259872436523, 11.166475296020508, 11.628689765930176, 12.09090518951416, 12.553120613098145, 13.015335083007812, 13.477550506591797, 13.939765930175781, 14.401981353759766]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 11.0, 8.0, 6.0, 16.0, 25.0, 31.0, 55.0, 71.0, 110.0, 169.0, 289.0, 514.0, 818.0, 1457.0, 2627.0, 4660.0, 8760.0, 16160.0, 31166.0, 58067.0, 101850.0, 159486.0, 198809.0, 179488.0, 124896.0, 73069.0, 40002.0, 21065.0, 11252.0, 5944.0, 3296.0, 1804.0, 1014.0, 614.0, 370.0, 189.0, 134.0, 82.0, 55.0, 35.0, 35.0, 12.0, 10.0, 10.0, 6.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.845703125, -3.73797607421875, -3.6302490234375, -3.52252197265625, -3.414794921875, -3.30706787109375, -3.1993408203125, -3.09161376953125, -2.98388671875, -2.87615966796875, -2.7684326171875, -2.66070556640625, -2.552978515625, -2.44525146484375, -2.3375244140625, -2.22979736328125, -2.1220703125, -2.01434326171875, -1.9066162109375, -1.79888916015625, -1.691162109375, -1.58343505859375, -1.4757080078125, -1.36798095703125, -1.26025390625, -1.15252685546875, -1.0447998046875, -0.93707275390625, -0.829345703125, -0.72161865234375, -0.6138916015625, -0.50616455078125, -0.3984375, -0.29071044921875, -0.1829833984375, -0.07525634765625, 0.032470703125, 0.14019775390625, 0.2479248046875, 0.35565185546875, 0.46337890625, 0.57110595703125, 0.6788330078125, 0.78656005859375, 0.894287109375, 1.00201416015625, 1.1097412109375, 1.21746826171875, 1.3251953125, 1.43292236328125, 1.5406494140625, 1.64837646484375, 1.756103515625, 1.86383056640625, 1.9715576171875, 2.07928466796875, 2.18701171875, 2.29473876953125, 2.4024658203125, 2.51019287109375, 2.617919921875, 2.72564697265625, 2.8333740234375, 2.94110107421875, 3.048828125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 3.0, 1.0, 2.0, 5.0, 4.0, 12.0, 18.0, 8.0, 9.0, 20.0, 12.0, 15.0, 26.0, 25.0, 18.0, 28.0, 41.0, 39.0, 37.0, 38.0, 39.0, 45.0, 48.0, 52.0, 29.0, 43.0, 42.0, 38.0, 39.0, 34.0, 32.0, 32.0, 42.0, 17.0, 23.0, 23.0, 14.0, 10.0, 9.0, 9.0, 9.0, 4.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.517578125, -1.4756011962890625, -1.433624267578125, -1.3916473388671875, -1.34967041015625, -1.3076934814453125, -1.265716552734375, -1.2237396240234375, -1.1817626953125, -1.1397857666015625, -1.097808837890625, -1.0558319091796875, -1.01385498046875, -0.9718780517578125, -0.929901123046875, -0.8879241943359375, -0.845947265625, -0.8039703369140625, -0.761993408203125, -0.7200164794921875, -0.67803955078125, -0.6360626220703125, -0.594085693359375, -0.5521087646484375, -0.5101318359375, -0.4681549072265625, -0.426177978515625, -0.3842010498046875, -0.34222412109375, -0.3002471923828125, -0.258270263671875, -0.2162933349609375, -0.17431640625, -0.1323394775390625, -0.090362548828125, -0.0483856201171875, -0.00640869140625, 0.0355682373046875, 0.077545166015625, 0.1195220947265625, 0.1614990234375, 0.2034759521484375, 0.245452880859375, 0.2874298095703125, 0.32940673828125, 0.3713836669921875, 0.413360595703125, 0.4553375244140625, 0.497314453125, 0.5392913818359375, 0.581268310546875, 0.6232452392578125, 0.66522216796875, 0.7071990966796875, 0.749176025390625, 0.7911529541015625, 0.8331298828125, 0.8751068115234375, 0.917083740234375, 0.9590606689453125, 1.00103759765625, 1.0430145263671875, 1.084991455078125, 1.1269683837890625, 1.1689453125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 3.0, 13.0, 17.0, 20.0, 19.0, 49.0, 36.0, 68.0, 111.0, 180.0, 260.0, 440.0, 876.0, 2039.0, 5646.0, 20214.0, 84827.0, 323734.0, 424961.0, 139068.0, 32181.0, 8447.0, 2790.0, 1152.0, 531.0, 299.0, 174.0, 126.0, 79.0, 51.0, 39.0, 31.0, 30.0, 12.0, 6.0, 6.0, 5.0, 9.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3203125, -8.0694580078125, -7.818603515625, -7.5677490234375, -7.31689453125, -7.0660400390625, -6.815185546875, -6.5643310546875, -6.3134765625, -6.0626220703125, -5.811767578125, -5.5609130859375, -5.31005859375, -5.0592041015625, -4.808349609375, -4.5574951171875, -4.306640625, -4.0557861328125, -3.804931640625, -3.5540771484375, -3.30322265625, -3.0523681640625, -2.801513671875, -2.5506591796875, -2.2998046875, -2.0489501953125, -1.798095703125, -1.5472412109375, -1.29638671875, -1.0455322265625, -0.794677734375, -0.5438232421875, -0.29296875, -0.0421142578125, 0.208740234375, 0.4595947265625, 0.71044921875, 0.9613037109375, 1.212158203125, 1.4630126953125, 1.7138671875, 1.9647216796875, 2.215576171875, 2.4664306640625, 2.71728515625, 2.9681396484375, 3.218994140625, 3.4698486328125, 3.720703125, 3.9715576171875, 4.222412109375, 4.4732666015625, 4.72412109375, 4.9749755859375, 5.225830078125, 5.4766845703125, 5.7275390625, 5.9783935546875, 6.229248046875, 6.4801025390625, 6.73095703125, 6.9818115234375, 7.232666015625, 7.4835205078125, 7.734375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 11.0, 12.0, 16.0, 17.0, 26.0, 28.0, 32.0, 31.0, 30.0, 42.0, 44.0, 46.0, 53.0, 53.0, 43.0, 42.0, 42.0, 55.0, 51.0, 35.0, 33.0, 38.0, 35.0, 25.0, 31.0, 21.0, 19.0, 18.0, 12.0, 11.0, 7.0, 6.0, 4.0, 4.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.20654296875, -8.9208984375, -8.63525390625, -8.349609375, -8.06396484375, -7.7783203125, -7.49267578125, -7.20703125, -6.92138671875, -6.6357421875, -6.35009765625, -6.064453125, -5.77880859375, -5.4931640625, -5.20751953125, -4.921875, -4.63623046875, -4.3505859375, -4.06494140625, -3.779296875, -3.49365234375, -3.2080078125, -2.92236328125, -2.63671875, -2.35107421875, -2.0654296875, -1.77978515625, -1.494140625, -1.20849609375, -0.9228515625, -0.63720703125, -0.3515625, -0.06591796875, 0.2197265625, 0.50537109375, 0.791015625, 1.07666015625, 1.3623046875, 1.64794921875, 1.93359375, 2.21923828125, 2.5048828125, 2.79052734375, 3.076171875, 3.36181640625, 3.6474609375, 3.93310546875, 4.21875, 4.50439453125, 4.7900390625, 5.07568359375, 5.361328125, 5.64697265625, 5.9326171875, 6.21826171875, 6.50390625, 6.78955078125, 7.0751953125, 7.36083984375, 7.646484375, 7.93212890625, 8.2177734375, 8.50341796875, 8.7890625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 10.0, 15.0, 17.0, 49.0, 64.0, 115.0, 209.0, 485.0, 1199.0, 3748.0, 15580.0, 90561.0, 491916.0, 369418.0, 59530.0, 11041.0, 2802.0, 948.0, 399.0, 179.0, 116.0, 62.0, 32.0, 19.0, 18.0, 6.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1796875, -5.98590087890625, -5.7921142578125, -5.59832763671875, -5.404541015625, -5.21075439453125, -5.0169677734375, -4.82318115234375, -4.62939453125, -4.43560791015625, -4.2418212890625, -4.04803466796875, -3.854248046875, -3.66046142578125, -3.4666748046875, -3.27288818359375, -3.0791015625, -2.88531494140625, -2.6915283203125, -2.49774169921875, -2.303955078125, -2.11016845703125, -1.9163818359375, -1.72259521484375, -1.52880859375, -1.33502197265625, -1.1412353515625, -0.94744873046875, -0.753662109375, -0.55987548828125, -0.3660888671875, -0.17230224609375, 0.021484375, 0.21527099609375, 0.4090576171875, 0.60284423828125, 0.796630859375, 0.99041748046875, 1.1842041015625, 1.37799072265625, 1.57177734375, 1.76556396484375, 1.9593505859375, 2.15313720703125, 2.346923828125, 2.54071044921875, 2.7344970703125, 2.92828369140625, 3.1220703125, 3.31585693359375, 3.5096435546875, 3.70343017578125, 3.897216796875, 4.09100341796875, 4.2847900390625, 4.47857666015625, 4.67236328125, 4.86614990234375, 5.0599365234375, 5.25372314453125, 5.447509765625, 5.64129638671875, 5.8350830078125, 6.02886962890625, 6.22265625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 6.0, 16.0, 18.0, 18.0, 22.0, 36.0, 40.0, 69.0, 70.0, 105.0, 102.0, 97.0, 100.0, 83.0, 60.0, 38.0, 28.0, 24.0, 20.0, 5.0, 6.0, 7.0, 8.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006837844848632812, -0.0006629824638366699, -0.0006421804428100586, -0.0006213784217834473, -0.0006005764007568359, -0.0005797743797302246, -0.0005589723587036133, -0.000538170337677002, -0.0005173683166503906, -0.0004965662956237793, -0.00047576427459716797, -0.00045496225357055664, -0.0004341602325439453, -0.000413358211517334, -0.00039255619049072266, -0.00037175416946411133, -0.0003509521484375, -0.00033015012741088867, -0.00030934810638427734, -0.000288546085357666, -0.0002677440643310547, -0.00024694204330444336, -0.00022614002227783203, -0.0002053380012512207, -0.00018453598022460938, -0.00016373395919799805, -0.00014293193817138672, -0.0001221299171447754, -0.00010132789611816406, -8.052587509155273e-05, -5.9723854064941406e-05, -3.892183303833008e-05, -1.811981201171875e-05, 2.682209014892578e-06, 2.3484230041503906e-05, 4.4286251068115234e-05, 6.508827209472656e-05, 8.589029312133789e-05, 0.00010669231414794922, 0.00012749433517456055, 0.00014829635620117188, 0.0001690983772277832, 0.00018990039825439453, 0.00021070241928100586, 0.0002315044403076172, 0.0002523064613342285, 0.00027310848236083984, 0.00029391050338745117, 0.0003147125244140625, 0.00033551454544067383, 0.00035631656646728516, 0.0003771185874938965, 0.0003979206085205078, 0.00041872262954711914, 0.00043952465057373047, 0.0004603266716003418, 0.0004811286926269531, 0.0005019307136535645, 0.0005227327346801758, 0.0005435347557067871, 0.0005643367767333984, 0.0005851387977600098, 0.0006059408187866211, 0.0006267428398132324, 0.0006475448608398438]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 10.0, 18.0, 11.0, 9.0, 39.0, 38.0, 66.0, 74.0, 140.0, 194.0, 372.0, 725.0, 1309.0, 3360.0, 9154.0, 34335.0, 162669.0, 506441.0, 253807.0, 54458.0, 13304.0, 4337.0, 1775.0, 781.0, 407.0, 246.0, 139.0, 99.0, 66.0, 55.0, 23.0, 24.0, 21.0, 12.0, 6.0, 5.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.73828125, -5.5677490234375, -5.397216796875, -5.2266845703125, -5.05615234375, -4.8856201171875, -4.715087890625, -4.5445556640625, -4.3740234375, -4.2034912109375, -4.032958984375, -3.8624267578125, -3.69189453125, -3.5213623046875, -3.350830078125, -3.1802978515625, -3.009765625, -2.8392333984375, -2.668701171875, -2.4981689453125, -2.32763671875, -2.1571044921875, -1.986572265625, -1.8160400390625, -1.6455078125, -1.4749755859375, -1.304443359375, -1.1339111328125, -0.96337890625, -0.7928466796875, -0.622314453125, -0.4517822265625, -0.28125, -0.1107177734375, 0.059814453125, 0.2303466796875, 0.40087890625, 0.5714111328125, 0.741943359375, 0.9124755859375, 1.0830078125, 1.2535400390625, 1.424072265625, 1.5946044921875, 1.76513671875, 1.9356689453125, 2.106201171875, 2.2767333984375, 2.447265625, 2.6177978515625, 2.788330078125, 2.9588623046875, 3.12939453125, 3.2999267578125, 3.470458984375, 3.6409912109375, 3.8115234375, 3.9820556640625, 4.152587890625, 4.3231201171875, 4.49365234375, 4.6641845703125, 4.834716796875, 5.0052490234375, 5.17578125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 8.0, 18.0, 22.0, 17.0, 25.0, 49.0, 52.0, 58.0, 76.0, 80.0, 96.0, 96.0, 74.0, 60.0, 62.0, 37.0, 37.0, 27.0, 21.0, 20.0, 11.0, 9.0, 13.0, 8.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5546875, -4.370361328125, -4.18603515625, -4.001708984375, -3.8173828125, -3.633056640625, -3.44873046875, -3.264404296875, -3.080078125, -2.895751953125, -2.71142578125, -2.527099609375, -2.3427734375, -2.158447265625, -1.97412109375, -1.789794921875, -1.60546875, -1.421142578125, -1.23681640625, -1.052490234375, -0.8681640625, -0.683837890625, -0.49951171875, -0.315185546875, -0.130859375, 0.053466796875, 0.23779296875, 0.422119140625, 0.6064453125, 0.790771484375, 0.97509765625, 1.159423828125, 1.34375, 1.528076171875, 1.71240234375, 1.896728515625, 2.0810546875, 2.265380859375, 2.44970703125, 2.634033203125, 2.818359375, 3.002685546875, 3.18701171875, 3.371337890625, 3.5556640625, 3.739990234375, 3.92431640625, 4.108642578125, 4.29296875, 4.477294921875, 4.66162109375, 4.845947265625, 5.0302734375, 5.214599609375, 5.39892578125, 5.583251953125, 5.767578125, 5.951904296875, 6.13623046875, 6.320556640625, 6.5048828125, 6.689208984375, 6.87353515625, 7.057861328125, 7.2421875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 14.0, 27.0, 111.0, 213.0, 311.0, 189.0, 93.0, 34.0, 13.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-225.731689453125, -220.9584503173828, -216.1852264404297, -211.4119873046875, -206.63876342773438, -201.8655242919922, -197.09230041503906, -192.31906127929688, -187.54583740234375, -182.77259826660156, -177.99937438964844, -173.22613525390625, -168.45291137695312, -163.67967224121094, -158.9064483642578, -154.13320922851562, -149.35997009277344, -144.58673095703125, -139.81350708007812, -135.04026794433594, -130.2670440673828, -125.49380493164062, -120.72057342529297, -115.94734191894531, -111.17411041259766, -106.40087890625, -101.62764739990234, -96.85441589355469, -92.0811767578125, -87.30795288085938, -82.53471374511719, -77.76148223876953, -72.98825073242188, -68.21501922607422, -63.44178771972656, -58.66855239868164, -53.895320892333984, -49.12208938598633, -44.348854064941406, -39.57562255859375, -34.802391052246094, -30.029159545898438, -25.25592613220215, -20.48269271850586, -15.709461212158203, -10.936229705810547, -6.162996292114258, -1.3897628784179688, 3.3834686279296875, 8.15670108795166, 12.929933547973633, 17.703166961669922, 22.476398468017578, 27.249629974365234, 32.022865295410156, 36.79609680175781, 41.56932830810547, 46.342559814453125, 51.11579132080078, 55.8890266418457, 60.66225814819336, 65.43548583984375, 70.20872497558594, 74.9819564819336, 79.75518798828125]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 2.0, 10.0, 8.0, 12.0, 13.0, 16.0, 16.0, 28.0, 19.0, 24.0, 31.0, 43.0, 36.0, 43.0, 39.0, 56.0, 51.0, 50.0, 46.0, 45.0, 44.0, 52.0, 33.0, 39.0, 38.0, 30.0, 26.0, 19.0, 22.0, 22.0, 13.0, 15.0, 13.0, 13.0, 6.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.506988525390625, -52.98828125, -51.469573974609375, -49.95086669921875, -48.43215560913086, -46.913448333740234, -45.39474105834961, -43.876033782958984, -42.357322692871094, -40.83861541748047, -39.319908142089844, -37.80120086669922, -36.28248977661133, -34.7637825012207, -33.24507522583008, -31.726367950439453, -30.207660675048828, -28.688953399658203, -27.170244216918945, -25.65153694152832, -24.132827758789062, -22.614120483398438, -21.095413208007812, -19.576705932617188, -18.05799674987793, -16.539289474487305, -15.020580291748047, -13.501873016357422, -11.98316478729248, -10.464456558227539, -8.945749282836914, -7.427041053771973, -5.908332824707031, -4.38962459564209, -2.8709168434143066, -1.3522090911865234, 0.16649913787841797, 1.6852073669433594, 3.2039146423339844, 4.722622871398926, 6.241331100463867, 7.760039329528809, 9.27874755859375, 10.797454833984375, 12.316163063049316, 13.834871292114258, 15.353578567504883, 16.87228775024414, 18.390995025634766, 19.90970230102539, 21.42841148376465, 22.947118759155273, 24.46582794189453, 25.984535217285156, 27.50324249267578, 29.021949768066406, 30.540658950805664, 32.05936813354492, 33.57807540893555, 35.09678268432617, 36.6154899597168, 38.13420104980469, 39.65290832519531, 41.17161560058594, 42.69032287597656]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 2.0, 3.0, 5.0, 9.0, 6.0, 9.0, 18.0, 16.0, 42.0, 38.0, 47.0, 80.0, 153.0, 215.0, 331.0, 547.0, 864.0, 1567.0, 3364.0, 8748.0, 33542.0, 408178.0, 3673188.0, 44449.0, 10695.0, 3822.0, 1781.0, 924.0, 599.0, 357.0, 236.0, 139.0, 107.0, 72.0, 39.0, 32.0, 24.0, 12.0, 8.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.796875, -7.5460205078125, -7.295166015625, -7.0443115234375, -6.79345703125, -6.5426025390625, -6.291748046875, -6.0408935546875, -5.7900390625, -5.5391845703125, -5.288330078125, -5.0374755859375, -4.78662109375, -4.5357666015625, -4.284912109375, -4.0340576171875, -3.783203125, -3.5323486328125, -3.281494140625, -3.0306396484375, -2.77978515625, -2.5289306640625, -2.278076171875, -2.0272216796875, -1.7763671875, -1.5255126953125, -1.274658203125, -1.0238037109375, -0.77294921875, -0.5220947265625, -0.271240234375, -0.0203857421875, 0.23046875, 0.4813232421875, 0.732177734375, 0.9830322265625, 1.23388671875, 1.4847412109375, 1.735595703125, 1.9864501953125, 2.2373046875, 2.4881591796875, 2.739013671875, 2.9898681640625, 3.24072265625, 3.4915771484375, 3.742431640625, 3.9932861328125, 4.244140625, 4.4949951171875, 4.745849609375, 4.9967041015625, 5.24755859375, 5.4984130859375, 5.749267578125, 6.0001220703125, 6.2509765625, 6.5018310546875, 6.752685546875, 7.0035400390625, 7.25439453125, 7.5052490234375, 7.756103515625, 8.0069580078125, 8.2578125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 3.0, 6.0, 10.0, 4.0, 19.0, 12.0, 20.0, 26.0, 35.0, 35.0, 49.0, 45.0, 66.0, 61.0, 74.0, 70.0, 69.0, 52.0, 53.0, 57.0, 46.0, 45.0, 40.0, 21.0, 23.0, 15.0, 13.0, 10.0, 7.0, 6.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.130859375, -3.049407958984375, -2.96795654296875, -2.886505126953125, -2.8050537109375, -2.723602294921875, -2.64215087890625, -2.560699462890625, -2.479248046875, -2.397796630859375, -2.31634521484375, -2.234893798828125, -2.1534423828125, -2.071990966796875, -1.99053955078125, -1.909088134765625, -1.82763671875, -1.746185302734375, -1.66473388671875, -1.583282470703125, -1.5018310546875, -1.420379638671875, -1.33892822265625, -1.257476806640625, -1.176025390625, -1.094573974609375, -1.01312255859375, -0.931671142578125, -0.8502197265625, -0.768768310546875, -0.68731689453125, -0.605865478515625, -0.5244140625, -0.442962646484375, -0.36151123046875, -0.280059814453125, -0.1986083984375, -0.117156982421875, -0.03570556640625, 0.045745849609375, 0.127197265625, 0.208648681640625, 0.29010009765625, 0.371551513671875, 0.4530029296875, 0.534454345703125, 0.61590576171875, 0.697357177734375, 0.77880859375, 0.860260009765625, 0.94171142578125, 1.023162841796875, 1.1046142578125, 1.186065673828125, 1.26751708984375, 1.348968505859375, 1.430419921875, 1.511871337890625, 1.59332275390625, 1.674774169921875, 1.7562255859375, 1.837677001953125, 1.91912841796875, 2.000579833984375, 2.08203125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 8.0, 8.0, 5.0, 6.0, 9.0, 16.0, 21.0, 27.0, 28.0, 54.0, 79.0, 126.0, 242.0, 347.0, 618.0, 1254.0, 2667.0, 7794.0, 39109.0, 3567029.0, 534863.0, 28520.0, 6544.0, 2244.0, 1101.0, 632.0, 330.0, 207.0, 129.0, 81.0, 48.0, 42.0, 25.0, 24.0, 14.0, 10.0, 4.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-12.2734375, -11.9317626953125, -11.590087890625, -11.2484130859375, -10.90673828125, -10.5650634765625, -10.223388671875, -9.8817138671875, -9.5400390625, -9.1983642578125, -8.856689453125, -8.5150146484375, -8.17333984375, -7.8316650390625, -7.489990234375, -7.1483154296875, -6.806640625, -6.4649658203125, -6.123291015625, -5.7816162109375, -5.43994140625, -5.0982666015625, -4.756591796875, -4.4149169921875, -4.0732421875, -3.7315673828125, -3.389892578125, -3.0482177734375, -2.70654296875, -2.3648681640625, -2.023193359375, -1.6815185546875, -1.33984375, -0.9981689453125, -0.656494140625, -0.3148193359375, 0.02685546875, 0.3685302734375, 0.710205078125, 1.0518798828125, 1.3935546875, 1.7352294921875, 2.076904296875, 2.4185791015625, 2.76025390625, 3.1019287109375, 3.443603515625, 3.7852783203125, 4.126953125, 4.4686279296875, 4.810302734375, 5.1519775390625, 5.49365234375, 5.8353271484375, 6.177001953125, 6.5186767578125, 6.8603515625, 7.2020263671875, 7.543701171875, 7.8853759765625, 8.22705078125, 8.5687255859375, 8.910400390625, 9.2520751953125, 9.59375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 6.0, 12.0, 17.0, 25.0, 51.0, 128.0, 410.0, 3052.0, 227.0, 67.0, 29.0, 15.0, 13.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05859375, -1.98028564453125, -1.9019775390625, -1.82366943359375, -1.745361328125, -1.66705322265625, -1.5887451171875, -1.51043701171875, -1.43212890625, -1.35382080078125, -1.2755126953125, -1.19720458984375, -1.118896484375, -1.04058837890625, -0.9622802734375, -0.88397216796875, -0.8056640625, -0.72735595703125, -0.6490478515625, -0.57073974609375, -0.492431640625, -0.41412353515625, -0.3358154296875, -0.25750732421875, -0.17919921875, -0.10089111328125, -0.0225830078125, 0.05572509765625, 0.134033203125, 0.21234130859375, 0.2906494140625, 0.36895751953125, 0.447265625, 0.52557373046875, 0.6038818359375, 0.68218994140625, 0.760498046875, 0.83880615234375, 0.9171142578125, 0.99542236328125, 1.07373046875, 1.15203857421875, 1.2303466796875, 1.30865478515625, 1.386962890625, 1.46527099609375, 1.5435791015625, 1.62188720703125, 1.7001953125, 1.77850341796875, 1.8568115234375, 1.93511962890625, 2.013427734375, 2.09173583984375, 2.1700439453125, 2.24835205078125, 2.32666015625, 2.40496826171875, 2.4832763671875, 2.56158447265625, 2.639892578125, 2.71820068359375, 2.7965087890625, 2.87481689453125, 2.953125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 8.0, 7.0, 17.0, 20.0, 61.0, 88.0, 125.0, 174.0, 159.0, 135.0, 84.0, 55.0, 32.0, 13.0, 18.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.694076538085938, -9.361105918884277, -9.028136253356934, -8.695165634155273, -8.36219596862793, -8.02922534942627, -7.696255207061768, -7.363285064697266, -7.030314922332764, -6.697344779968262, -6.36437463760376, -6.031404495239258, -5.698433876037598, -5.365464210510254, -5.032493591308594, -4.699523448944092, -4.36655330657959, -4.033583164215088, -3.700613021850586, -3.367642641067505, -3.034672498703003, -2.701702356338501, -2.36873197555542, -2.035761833190918, -1.702791690826416, -1.369821548461914, -1.0368512868881226, -0.7038810849189758, -0.3709108829498291, -0.03794074058532715, 0.29502952098846436, 0.6279997825622559, 0.9609689712524414, 1.2939391136169434, 1.6269093751907349, 1.9598796367645264, 2.2928497791290283, 2.6258199214935303, 2.9587903022766113, 3.2917604446411133, 3.6247305870056152, 3.957700729370117, 4.290670871734619, 4.623641014099121, 4.956611633300781, 5.289581298828125, 5.622551918029785, 5.955522060394287, 6.288492202758789, 6.621462345123291, 6.954432487487793, 7.287402629852295, 7.620372772216797, 7.953343391418457, 8.2863130569458, 8.619283676147461, 8.952253341674805, 9.285223960876465, 9.618193626403809, 9.951164245605469, 10.284133911132812, 10.617104530334473, 10.950074195861816, 11.283044815063477, 11.616015434265137]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 5.0, 8.0, 7.0, 9.0, 9.0, 8.0, 19.0, 14.0, 22.0, 22.0, 30.0, 29.0, 41.0, 39.0, 48.0, 38.0, 42.0, 49.0, 46.0, 51.0, 47.0, 48.0, 41.0, 34.0, 36.0, 31.0, 35.0, 26.0, 21.0, 16.0, 19.0, 15.0, 14.0, 22.0, 13.0, 14.0, 12.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5824785232543945, -3.458566665649414, -3.3346548080444336, -3.210742950439453, -3.0868310928344727, -2.962919235229492, -2.8390073776245117, -2.7150957584381104, -2.59118390083313, -2.4672720432281494, -2.343360185623169, -2.2194483280181885, -2.095536470413208, -1.971624732017517, -1.8477128744125366, -1.7238011360168457, -1.5998891592025757, -1.4759773015975952, -1.3520654439926147, -1.2281537055969238, -1.1042418479919434, -0.9803299903869629, -0.8564181327819824, -0.7325063347816467, -0.6085944771766663, -0.4846826493740082, -0.3607708215713501, -0.23685896396636963, -0.11294713616371155, 0.010964691638946533, 0.134876549243927, 0.2587883472442627, 0.38270020484924316, 0.5066120624542236, 0.6305238604545593, 0.7544357180595398, 0.8783475160598755, 1.002259373664856, 1.1261712312698364, 1.2500829696655273, 1.3739948272705078, 1.4979066848754883, 1.6218185424804688, 1.7457304000854492, 1.8696421384811401, 1.9935539960861206, 2.1174659729003906, 2.241377592086792, 2.3652896881103516, 2.489201545715332, 2.6131134033203125, 2.737025260925293, 2.8609371185302734, 2.984848976135254, 3.1087608337402344, 3.2326724529266357, 3.356584310531616, 3.4804961681365967, 3.604408025741577, 3.7283198833465576, 3.852231740951538, 3.9761433601379395, 4.10005521774292, 4.2239670753479, 4.347878932952881]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 10.0, 19.0, 21.0, 35.0, 74.0, 112.0, 202.0, 340.0, 693.0, 1845.0, 5281.0, 16161.0, 52278.0, 159825.0, 331581.0, 296573.0, 124585.0, 39760.0, 12207.0, 4058.0, 1540.0, 623.0, 286.0, 188.0, 105.0, 60.0, 32.0, 18.0, 10.0, 11.0, 6.0, 9.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.6484375, -7.446533203125, -7.24462890625, -7.042724609375, -6.8408203125, -6.638916015625, -6.43701171875, -6.235107421875, -6.033203125, -5.831298828125, -5.62939453125, -5.427490234375, -5.2255859375, -5.023681640625, -4.82177734375, -4.619873046875, -4.41796875, -4.216064453125, -4.01416015625, -3.812255859375, -3.6103515625, -3.408447265625, -3.20654296875, -3.004638671875, -2.802734375, -2.600830078125, -2.39892578125, -2.197021484375, -1.9951171875, -1.793212890625, -1.59130859375, -1.389404296875, -1.1875, -0.985595703125, -0.78369140625, -0.581787109375, -0.3798828125, -0.177978515625, 0.02392578125, 0.225830078125, 0.427734375, 0.629638671875, 0.83154296875, 1.033447265625, 1.2353515625, 1.437255859375, 1.63916015625, 1.841064453125, 2.04296875, 2.244873046875, 2.44677734375, 2.648681640625, 2.8505859375, 3.052490234375, 3.25439453125, 3.456298828125, 3.658203125, 3.860107421875, 4.06201171875, 4.263916015625, 4.4658203125, 4.667724609375, 4.86962890625, 5.071533203125, 5.2734375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 8.0, 8.0, 6.0, 11.0, 19.0, 21.0, 17.0, 31.0, 42.0, 35.0, 52.0, 57.0, 71.0, 58.0, 73.0, 59.0, 63.0, 47.0, 57.0, 47.0, 38.0, 41.0, 40.0, 25.0, 22.0, 11.0, 12.0, 10.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.27734375, -3.193023681640625, -3.10870361328125, -3.024383544921875, -2.9400634765625, -2.855743408203125, -2.77142333984375, -2.687103271484375, -2.602783203125, -2.518463134765625, -2.43414306640625, -2.349822998046875, -2.2655029296875, -2.181182861328125, -2.09686279296875, -2.012542724609375, -1.92822265625, -1.843902587890625, -1.75958251953125, -1.675262451171875, -1.5909423828125, -1.506622314453125, -1.42230224609375, -1.337982177734375, -1.253662109375, -1.169342041015625, -1.08502197265625, -1.000701904296875, -0.9163818359375, -0.832061767578125, -0.74774169921875, -0.663421630859375, -0.5791015625, -0.494781494140625, -0.41046142578125, -0.326141357421875, -0.2418212890625, -0.157501220703125, -0.07318115234375, 0.011138916015625, 0.095458984375, 0.179779052734375, 0.26409912109375, 0.348419189453125, 0.4327392578125, 0.517059326171875, 0.60137939453125, 0.685699462890625, 0.77001953125, 0.854339599609375, 0.93865966796875, 1.022979736328125, 1.1072998046875, 1.191619873046875, 1.27593994140625, 1.360260009765625, 1.444580078125, 1.528900146484375, 1.61322021484375, 1.697540283203125, 1.7818603515625, 1.866180419921875, 1.95050048828125, 2.034820556640625, 2.119140625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 11.0, 8.0, 17.0, 20.0, 44.0, 59.0, 77.0, 130.0, 200.0, 402.0, 828.0, 2409.0, 9130.0, 52266.0, 359281.0, 518995.0, 85819.0, 13551.0, 3019.0, 1105.0, 461.0, 261.0, 172.0, 102.0, 54.0, 43.0, 32.0, 22.0, 12.0, 5.0, 6.0, 5.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5390625, -11.200927734375, -10.86279296875, -10.524658203125, -10.1865234375, -9.848388671875, -9.51025390625, -9.172119140625, -8.833984375, -8.495849609375, -8.15771484375, -7.819580078125, -7.4814453125, -7.143310546875, -6.80517578125, -6.467041015625, -6.12890625, -5.790771484375, -5.45263671875, -5.114501953125, -4.7763671875, -4.438232421875, -4.10009765625, -3.761962890625, -3.423828125, -3.085693359375, -2.74755859375, -2.409423828125, -2.0712890625, -1.733154296875, -1.39501953125, -1.056884765625, -0.71875, -0.380615234375, -0.04248046875, 0.295654296875, 0.6337890625, 0.971923828125, 1.31005859375, 1.648193359375, 1.986328125, 2.324462890625, 2.66259765625, 3.000732421875, 3.3388671875, 3.677001953125, 4.01513671875, 4.353271484375, 4.69140625, 5.029541015625, 5.36767578125, 5.705810546875, 6.0439453125, 6.382080078125, 6.72021484375, 7.058349609375, 7.396484375, 7.734619140625, 8.07275390625, 8.410888671875, 8.7490234375, 9.087158203125, 9.42529296875, 9.763427734375, 10.1015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 1.0, 6.0, 10.0, 10.0, 8.0, 7.0, 14.0, 20.0, 18.0, 14.0, 13.0, 13.0, 29.0, 29.0, 38.0, 42.0, 37.0, 39.0, 48.0, 41.0, 44.0, 40.0, 40.0, 34.0, 43.0, 33.0, 45.0, 29.0, 36.0, 43.0, 18.0, 29.0, 25.0, 19.0, 15.0, 16.0, 12.0, 6.0, 10.0, 6.0, 7.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0], "bins": [-12.0625, -11.7242431640625, -11.385986328125, -11.0477294921875, -10.70947265625, -10.3712158203125, -10.032958984375, -9.6947021484375, -9.3564453125, -9.0181884765625, -8.679931640625, -8.3416748046875, -8.00341796875, -7.6651611328125, -7.326904296875, -6.9886474609375, -6.650390625, -6.3121337890625, -5.973876953125, -5.6356201171875, -5.29736328125, -4.9591064453125, -4.620849609375, -4.2825927734375, -3.9443359375, -3.6060791015625, -3.267822265625, -2.9295654296875, -2.59130859375, -2.2530517578125, -1.914794921875, -1.5765380859375, -1.23828125, -0.9000244140625, -0.561767578125, -0.2235107421875, 0.11474609375, 0.4530029296875, 0.791259765625, 1.1295166015625, 1.4677734375, 1.8060302734375, 2.144287109375, 2.4825439453125, 2.82080078125, 3.1590576171875, 3.497314453125, 3.8355712890625, 4.173828125, 4.5120849609375, 4.850341796875, 5.1885986328125, 5.52685546875, 5.8651123046875, 6.203369140625, 6.5416259765625, 6.8798828125, 7.2181396484375, 7.556396484375, 7.8946533203125, 8.23291015625, 8.5711669921875, 8.909423828125, 9.2476806640625, 9.5859375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 5.0, 7.0, 26.0, 24.0, 34.0, 64.0, 108.0, 185.0, 431.0, 1129.0, 3537.0, 14899.0, 92776.0, 585109.0, 298804.0, 40083.0, 7829.0, 2044.0, 757.0, 300.0, 190.0, 72.0, 35.0, 36.0, 22.0, 13.0, 10.0, 10.0, 2.0, 3.0, 4.0, 5.0, 2.0, 2.0], "bins": [-7.39453125, -7.22564697265625, -7.0567626953125, -6.88787841796875, -6.718994140625, -6.55010986328125, -6.3812255859375, -6.21234130859375, -6.04345703125, -5.87457275390625, -5.7056884765625, -5.53680419921875, -5.367919921875, -5.19903564453125, -5.0301513671875, -4.86126708984375, -4.6923828125, -4.52349853515625, -4.3546142578125, -4.18572998046875, -4.016845703125, -3.84796142578125, -3.6790771484375, -3.51019287109375, -3.34130859375, -3.17242431640625, -3.0035400390625, -2.83465576171875, -2.665771484375, -2.49688720703125, -2.3280029296875, -2.15911865234375, -1.990234375, -1.82135009765625, -1.6524658203125, -1.48358154296875, -1.314697265625, -1.14581298828125, -0.9769287109375, -0.80804443359375, -0.63916015625, -0.47027587890625, -0.3013916015625, -0.13250732421875, 0.036376953125, 0.20526123046875, 0.3741455078125, 0.54302978515625, 0.7119140625, 0.88079833984375, 1.0496826171875, 1.21856689453125, 1.387451171875, 1.55633544921875, 1.7252197265625, 1.89410400390625, 2.06298828125, 2.23187255859375, 2.4007568359375, 2.56964111328125, 2.738525390625, 2.90740966796875, 3.0762939453125, 3.24517822265625, 3.4140625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 18.0, 11.0, 19.0, 32.0, 34.0, 43.0, 53.0, 56.0, 79.0, 104.0, 93.0, 83.0, 70.0, 69.0, 47.0, 43.0, 33.0, 22.0, 30.0, 10.0, 10.0, 8.0, 11.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005908012390136719, -0.000573672354221344, -0.0005565434694290161, -0.0005394145846366882, -0.0005222856998443604, -0.0005051568150520325, -0.0004880279302597046, -0.0004708990454673767, -0.00045377016067504883, -0.00043664127588272095, -0.00041951239109039307, -0.0004023835062980652, -0.0003852546215057373, -0.0003681257367134094, -0.00035099685192108154, -0.00033386796712875366, -0.0003167390823364258, -0.0002996101975440979, -0.00028248131275177, -0.00026535242795944214, -0.00024822354316711426, -0.00023109465837478638, -0.0002139657735824585, -0.00019683688879013062, -0.00017970800399780273, -0.00016257911920547485, -0.00014545023441314697, -0.0001283213496208191, -0.00011119246482849121, -9.406358003616333e-05, -7.693469524383545e-05, -5.980581045150757e-05, -4.267692565917969e-05, -2.5548040866851807e-05, -8.419156074523926e-06, 8.709728717803955e-06, 2.5838613510131836e-05, 4.296749830245972e-05, 6.00963830947876e-05, 7.722526788711548e-05, 9.435415267944336e-05, 0.00011148303747177124, 0.00012861192226409912, 0.000145740807056427, 0.00016286969184875488, 0.00017999857664108276, 0.00019712746143341064, 0.00021425634622573853, 0.0002313852310180664, 0.0002485141158103943, 0.00026564300060272217, 0.00028277188539505005, 0.00029990077018737793, 0.0003170296549797058, 0.0003341585397720337, 0.00035128742456436157, 0.00036841630935668945, 0.00038554519414901733, 0.0004026740789413452, 0.0004198029637336731, 0.000436931848526001, 0.00045406073331832886, 0.00047118961811065674, 0.0004883185029029846, 0.0005054473876953125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 3.0, 6.0, 17.0, 29.0, 48.0, 87.0, 157.0, 335.0, 673.0, 1751.0, 5454.0, 24356.0, 188474.0, 655111.0, 144886.0, 19809.0, 4515.0, 1572.0, 645.0, 291.0, 141.0, 70.0, 34.0, 27.0, 18.0, 10.0, 6.0, 6.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.4921875, -6.31402587890625, -6.1358642578125, -5.95770263671875, -5.779541015625, -5.60137939453125, -5.4232177734375, -5.24505615234375, -5.06689453125, -4.88873291015625, -4.7105712890625, -4.53240966796875, -4.354248046875, -4.17608642578125, -3.9979248046875, -3.81976318359375, -3.6416015625, -3.46343994140625, -3.2852783203125, -3.10711669921875, -2.928955078125, -2.75079345703125, -2.5726318359375, -2.39447021484375, -2.21630859375, -2.03814697265625, -1.8599853515625, -1.68182373046875, -1.503662109375, -1.32550048828125, -1.1473388671875, -0.96917724609375, -0.791015625, -0.61285400390625, -0.4346923828125, -0.25653076171875, -0.078369140625, 0.09979248046875, 0.2779541015625, 0.45611572265625, 0.63427734375, 0.81243896484375, 0.9906005859375, 1.16876220703125, 1.346923828125, 1.52508544921875, 1.7032470703125, 1.88140869140625, 2.0595703125, 2.23773193359375, 2.4158935546875, 2.59405517578125, 2.772216796875, 2.95037841796875, 3.1285400390625, 3.30670166015625, 3.48486328125, 3.66302490234375, 3.8411865234375, 4.01934814453125, 4.197509765625, 4.37567138671875, 4.5538330078125, 4.73199462890625, 4.91015625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 21.0, 12.0, 18.0, 30.0, 35.0, 48.0, 52.0, 66.0, 74.0, 80.0, 74.0, 89.0, 84.0, 61.0, 64.0, 45.0, 31.0, 27.0, 17.0, 12.0, 11.0, 9.0, 5.0, 9.0, 4.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.65625, -5.50048828125, -5.3447265625, -5.18896484375, -5.033203125, -4.87744140625, -4.7216796875, -4.56591796875, -4.41015625, -4.25439453125, -4.0986328125, -3.94287109375, -3.787109375, -3.63134765625, -3.4755859375, -3.31982421875, -3.1640625, -3.00830078125, -2.8525390625, -2.69677734375, -2.541015625, -2.38525390625, -2.2294921875, -2.07373046875, -1.91796875, -1.76220703125, -1.6064453125, -1.45068359375, -1.294921875, -1.13916015625, -0.9833984375, -0.82763671875, -0.671875, -0.51611328125, -0.3603515625, -0.20458984375, -0.048828125, 0.10693359375, 0.2626953125, 0.41845703125, 0.57421875, 0.72998046875, 0.8857421875, 1.04150390625, 1.197265625, 1.35302734375, 1.5087890625, 1.66455078125, 1.8203125, 1.97607421875, 2.1318359375, 2.28759765625, 2.443359375, 2.59912109375, 2.7548828125, 2.91064453125, 3.06640625, 3.22216796875, 3.3779296875, 3.53369140625, 3.689453125, 3.84521484375, 4.0009765625, 4.15673828125, 4.3125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 9.0, 4.0, 9.0, 10.0, 12.0, 27.0, 37.0, 66.0, 69.0, 68.0, 69.0, 108.0, 118.0, 61.0, 71.0, 83.0, 55.0, 38.0, 26.0, 22.0, 9.0, 7.0, 5.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.66703796386719, -33.99700927734375, -32.32697677612305, -30.656946182250977, -28.986915588378906, -27.316884994506836, -25.646854400634766, -23.976823806762695, -22.306793212890625, -20.636762619018555, -18.966732025146484, -17.296701431274414, -15.626670837402344, -13.956640243530273, -12.286609649658203, -10.616579055786133, -8.946548461914062, -7.276517868041992, -5.606487274169922, -3.9364566802978516, -2.2664260864257812, -0.5963954925537109, 1.0736351013183594, 2.7436656951904297, 4.4136962890625, 6.08372688293457, 7.753757476806641, 9.423788070678711, 11.093818664550781, 12.763849258422852, 14.433879852294922, 16.103910446166992, 17.773941040039062, 19.443971633911133, 21.114002227783203, 22.784032821655273, 24.454063415527344, 26.124094009399414, 27.794124603271484, 29.464155197143555, 31.134185791015625, 32.80421447753906, 34.474246978759766, 36.14427947998047, 37.814308166503906, 39.484336853027344, 41.15436935424805, 42.82440185546875, 44.49443054199219, 46.164459228515625, 47.83449172973633, 49.50452423095703, 51.17455291748047, 52.844581604003906, 54.51461410522461, 56.18464660644531, 57.85467529296875, 59.52470397949219, 61.19473648071289, 62.864768981933594, 64.53479766845703, 66.20482635498047, 67.87486267089844, 69.54489135742188, 71.21492004394531]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 10.0, 10.0, 9.0, 18.0, 16.0, 22.0, 22.0, 36.0, 27.0, 42.0, 53.0, 49.0, 43.0, 44.0, 58.0, 52.0, 49.0, 54.0, 40.0, 48.0, 40.0, 37.0, 27.0, 22.0, 25.0, 20.0, 24.0, 19.0, 11.0, 11.0, 7.0, 7.0, 5.0, 5.0, 6.0, 10.0, 0.0, 5.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.57819747924805, -49.90336990356445, -48.22854232788086, -46.553714752197266, -44.87888717651367, -43.20405960083008, -41.52922821044922, -39.854400634765625, -38.17957305908203, -36.50474548339844, -34.829917907714844, -33.15509033203125, -31.480262756347656, -29.805435180664062, -28.130605697631836, -26.455778121948242, -24.78095245361328, -23.106124877929688, -21.431297302246094, -19.7564697265625, -18.081642150878906, -16.406814575195312, -14.731985092163086, -13.057157516479492, -11.382329940795898, -9.707502365112305, -8.032674789428711, -6.357846260070801, -4.683018684387207, -3.0081911087036133, -1.3333625793457031, 0.3414649963378906, 2.0162925720214844, 3.6911203861236572, 5.36594820022583, 7.040776252746582, 8.715603828430176, 10.39043140411377, 12.06525993347168, 13.740087509155273, 15.414915084838867, 17.08974266052246, 18.764570236206055, 20.43939971923828, 22.114227294921875, 23.78905487060547, 25.463882446289062, 27.138710021972656, 28.81353759765625, 30.488365173339844, 32.16319274902344, 33.83802032470703, 35.512847900390625, 37.18767547607422, 38.86250305175781, 40.537330627441406, 42.212158203125, 43.886985778808594, 45.56181335449219, 47.23664093017578, 48.911468505859375, 50.58629608154297, 52.26112365722656, 53.935951232910156, 55.610782623291016]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 6.0, 5.0, 13.0, 9.0, 20.0, 18.0, 38.0, 49.0, 82.0, 112.0, 188.0, 239.0, 354.0, 590.0, 870.0, 1729.0, 3922.0, 12503.0, 65150.0, 3872268.0, 201673.0, 22621.0, 6053.0, 2394.0, 1204.0, 707.0, 464.0, 339.0, 215.0, 144.0, 90.0, 68.0, 46.0, 38.0, 20.0, 17.0, 9.0, 5.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-10.7109375, -10.43426513671875, -10.1575927734375, -9.88092041015625, -9.604248046875, -9.32757568359375, -9.0509033203125, -8.77423095703125, -8.49755859375, -8.22088623046875, -7.9442138671875, -7.66754150390625, -7.390869140625, -7.11419677734375, -6.8375244140625, -6.56085205078125, -6.2841796875, -6.00750732421875, -5.7308349609375, -5.45416259765625, -5.177490234375, -4.90081787109375, -4.6241455078125, -4.34747314453125, -4.07080078125, -3.79412841796875, -3.5174560546875, -3.24078369140625, -2.964111328125, -2.68743896484375, -2.4107666015625, -2.13409423828125, -1.857421875, -1.58074951171875, -1.3040771484375, -1.02740478515625, -0.750732421875, -0.47406005859375, -0.1973876953125, 0.07928466796875, 0.35595703125, 0.63262939453125, 0.9093017578125, 1.18597412109375, 1.462646484375, 1.73931884765625, 2.0159912109375, 2.29266357421875, 2.5693359375, 2.84600830078125, 3.1226806640625, 3.39935302734375, 3.676025390625, 3.95269775390625, 4.2293701171875, 4.50604248046875, 4.78271484375, 5.05938720703125, 5.3360595703125, 5.61273193359375, 5.889404296875, 6.16607666015625, 6.4427490234375, 6.71942138671875, 6.99609375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 6.0, 5.0, 5.0, 7.0, 11.0, 15.0, 19.0, 17.0, 32.0, 27.0, 36.0, 34.0, 42.0, 42.0, 45.0, 60.0, 55.0, 58.0, 52.0, 42.0, 45.0, 52.0, 45.0, 43.0, 41.0, 28.0, 21.0, 21.0, 21.0, 13.0, 12.0, 10.0, 9.0, 7.0, 2.0, 8.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.220703125, -2.14837646484375, -2.0760498046875, -2.00372314453125, -1.931396484375, -1.85906982421875, -1.7867431640625, -1.71441650390625, -1.64208984375, -1.56976318359375, -1.4974365234375, -1.42510986328125, -1.352783203125, -1.28045654296875, -1.2081298828125, -1.13580322265625, -1.0634765625, -0.99114990234375, -0.9188232421875, -0.84649658203125, -0.774169921875, -0.70184326171875, -0.6295166015625, -0.55718994140625, -0.48486328125, -0.41253662109375, -0.3402099609375, -0.26788330078125, -0.195556640625, -0.12322998046875, -0.0509033203125, 0.02142333984375, 0.09375, 0.16607666015625, 0.2384033203125, 0.31072998046875, 0.383056640625, 0.45538330078125, 0.5277099609375, 0.60003662109375, 0.67236328125, 0.74468994140625, 0.8170166015625, 0.88934326171875, 0.961669921875, 1.03399658203125, 1.1063232421875, 1.17864990234375, 1.2509765625, 1.32330322265625, 1.3956298828125, 1.46795654296875, 1.540283203125, 1.61260986328125, 1.6849365234375, 1.75726318359375, 1.82958984375, 1.90191650390625, 1.9742431640625, 2.04656982421875, 2.118896484375, 2.19122314453125, 2.2635498046875, 2.33587646484375, 2.408203125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 5.0, 17.0, 19.0, 17.0, 24.0, 37.0, 63.0, 96.0, 169.0, 230.0, 378.0, 613.0, 984.0, 1862.0, 3583.0, 7691.0, 20534.0, 82242.0, 2666552.0, 1294609.0, 78691.0, 20056.0, 7545.0, 3570.0, 1869.0, 1027.0, 623.0, 384.0, 261.0, 183.0, 104.0, 81.0, 49.0, 35.0, 20.0, 23.0, 14.0, 8.0, 7.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.31640625, -7.11859130859375, -6.9207763671875, -6.72296142578125, -6.525146484375, -6.32733154296875, -6.1295166015625, -5.93170166015625, -5.73388671875, -5.53607177734375, -5.3382568359375, -5.14044189453125, -4.942626953125, -4.74481201171875, -4.5469970703125, -4.34918212890625, -4.1513671875, -3.95355224609375, -3.7557373046875, -3.55792236328125, -3.360107421875, -3.16229248046875, -2.9644775390625, -2.76666259765625, -2.56884765625, -2.37103271484375, -2.1732177734375, -1.97540283203125, -1.777587890625, -1.57977294921875, -1.3819580078125, -1.18414306640625, -0.986328125, -0.78851318359375, -0.5906982421875, -0.39288330078125, -0.195068359375, 0.00274658203125, 0.2005615234375, 0.39837646484375, 0.59619140625, 0.79400634765625, 0.9918212890625, 1.18963623046875, 1.387451171875, 1.58526611328125, 1.7830810546875, 1.98089599609375, 2.1787109375, 2.37652587890625, 2.5743408203125, 2.77215576171875, 2.969970703125, 3.16778564453125, 3.3656005859375, 3.56341552734375, 3.76123046875, 3.95904541015625, 4.1568603515625, 4.35467529296875, 4.552490234375, 4.75030517578125, 4.9481201171875, 5.14593505859375, 5.34375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 6.0, 6.0, 0.0, 5.0, 8.0, 7.0, 9.0, 16.0, 23.0, 46.0, 89.0, 223.0, 777.0, 2363.0, 273.0, 93.0, 44.0, 33.0, 13.0, 16.0, 7.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.044921875, -1.97216796875, -1.8994140625, -1.82666015625, -1.75390625, -1.68115234375, -1.6083984375, -1.53564453125, -1.462890625, -1.39013671875, -1.3173828125, -1.24462890625, -1.171875, -1.09912109375, -1.0263671875, -0.95361328125, -0.880859375, -0.80810546875, -0.7353515625, -0.66259765625, -0.58984375, -0.51708984375, -0.4443359375, -0.37158203125, -0.298828125, -0.22607421875, -0.1533203125, -0.08056640625, -0.0078125, 0.06494140625, 0.1376953125, 0.21044921875, 0.283203125, 0.35595703125, 0.4287109375, 0.50146484375, 0.57421875, 0.64697265625, 0.7197265625, 0.79248046875, 0.865234375, 0.93798828125, 1.0107421875, 1.08349609375, 1.15625, 1.22900390625, 1.3017578125, 1.37451171875, 1.447265625, 1.52001953125, 1.5927734375, 1.66552734375, 1.73828125, 1.81103515625, 1.8837890625, 1.95654296875, 2.029296875, 2.10205078125, 2.1748046875, 2.24755859375, 2.3203125, 2.39306640625, 2.4658203125, 2.53857421875, 2.611328125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 16.0, 44.0, 69.0, 124.0, 188.0, 216.0, 175.0, 93.0, 39.0, 13.0, 11.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.381927490234375, -25.828771591186523, -25.275615692138672, -24.72245979309082, -24.16930389404297, -23.61614990234375, -23.0629940032959, -22.509838104248047, -21.956682205200195, -21.403526306152344, -20.850370407104492, -20.29721450805664, -19.744060516357422, -19.19090461730957, -18.63774871826172, -18.084592819213867, -17.531436920166016, -16.978281021118164, -16.425125122070312, -15.871970176696777, -15.318814277648926, -14.765658378601074, -14.212503433227539, -13.659347534179688, -13.106191635131836, -12.553035736083984, -11.999879837036133, -11.446724891662598, -10.893568992614746, -10.340413093566895, -9.78725814819336, -9.234102249145508, -8.680944442749023, -8.127788543701172, -7.5746331214904785, -7.021477699279785, -6.468321800231934, -5.915165901184082, -5.362010478973389, -4.808855056762695, -4.255699157714844, -3.7025434970855713, -3.149387836456299, -2.5962321758270264, -2.043076515197754, -1.4899208545684814, -0.936765193939209, -0.3836095333099365, 0.16954612731933594, 0.7227017879486084, 1.2758574485778809, 1.8290131092071533, 2.382168769836426, 2.9353244304656982, 3.4884800910949707, 4.041635513305664, 4.594791412353516, 5.147947311401367, 5.7011027336120605, 6.254258155822754, 6.8074140548706055, 7.360569953918457, 7.91372537612915, 8.466880798339844, 9.020036697387695]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 9.0, 9.0, 8.0, 7.0, 11.0, 14.0, 19.0, 13.0, 20.0, 26.0, 19.0, 17.0, 22.0, 23.0, 31.0, 28.0, 33.0, 33.0, 33.0, 30.0, 35.0, 30.0, 34.0, 39.0, 28.0, 31.0, 31.0, 26.0, 39.0, 26.0, 30.0, 28.0, 16.0, 20.0, 20.0, 16.0, 24.0, 20.0, 13.0, 10.0, 10.0, 18.0, 8.0, 5.0, 8.0, 3.0, 5.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0], "bins": [-5.2497735023498535, -5.093287944793701, -4.936802864074707, -4.780317306518555, -4.623831748962402, -4.46734619140625, -4.310861110687256, -4.1543755531311035, -3.9978902339935303, -3.841404914855957, -3.6849193572998047, -3.5284340381622314, -3.371948719024658, -3.215463161468506, -3.0589778423309326, -2.9024925231933594, -2.746006965637207, -2.589521646499634, -2.4330360889434814, -2.276550769805908, -2.120065212249756, -1.9635798931121826, -1.8070945739746094, -1.6506091356277466, -1.4941236972808838, -1.337638258934021, -1.1811528205871582, -1.024667501449585, -0.8681820631027222, -0.7116966247558594, -0.5552112460136414, -0.39872586727142334, -0.24223995208740234, -0.08575454354286194, 0.07073086500167847, 0.22721627354621887, 0.3837016820907593, 0.5401871204376221, 0.6966724991798401, 0.8531578779220581, 1.009643316268921, 1.1661287546157837, 1.3226141929626465, 1.4790995121002197, 1.6355849504470825, 1.7920703887939453, 1.9485557079315186, 2.105041027069092, 2.261526584625244, 2.4180119037628174, 2.5744974613189697, 2.730982780456543, 2.8874683380126953, 3.0439536571502686, 3.200438976287842, 3.356924533843994, 3.5134098529815674, 3.6698951721191406, 3.826380729675293, 3.982866048812866, 4.1393513679504395, 4.295836925506592, 4.452322483062744, 4.608807563781738, 4.765293121337891]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 8.0, 2.0, 9.0, 15.0, 11.0, 22.0, 29.0, 39.0, 53.0, 75.0, 124.0, 184.0, 281.0, 417.0, 686.0, 1219.0, 2095.0, 4075.0, 7840.0, 16055.0, 33056.0, 69722.0, 137739.0, 223200.0, 234663.0, 157308.0, 82048.0, 39028.0, 18662.0, 9015.0, 4689.0, 2620.0, 1349.0, 828.0, 496.0, 313.0, 173.0, 119.0, 65.0, 69.0, 37.0, 32.0, 16.0, 16.0, 12.0, 8.0, 7.0, 3.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-3.552734375, -3.4454345703125, -3.338134765625, -3.2308349609375, -3.12353515625, -3.0162353515625, -2.908935546875, -2.8016357421875, -2.6943359375, -2.5870361328125, -2.479736328125, -2.3724365234375, -2.26513671875, -2.1578369140625, -2.050537109375, -1.9432373046875, -1.8359375, -1.7286376953125, -1.621337890625, -1.5140380859375, -1.40673828125, -1.2994384765625, -1.192138671875, -1.0848388671875, -0.9775390625, -0.8702392578125, -0.762939453125, -0.6556396484375, -0.54833984375, -0.4410400390625, -0.333740234375, -0.2264404296875, -0.119140625, -0.0118408203125, 0.095458984375, 0.2027587890625, 0.31005859375, 0.4173583984375, 0.524658203125, 0.6319580078125, 0.7392578125, 0.8465576171875, 0.953857421875, 1.0611572265625, 1.16845703125, 1.2757568359375, 1.383056640625, 1.4903564453125, 1.59765625, 1.7049560546875, 1.812255859375, 1.9195556640625, 2.02685546875, 2.1341552734375, 2.241455078125, 2.3487548828125, 2.4560546875, 2.5633544921875, 2.670654296875, 2.7779541015625, 2.88525390625, 2.9925537109375, 3.099853515625, 3.2071533203125, 3.314453125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 10.0, 12.0, 12.0, 17.0, 26.0, 22.0, 34.0, 36.0, 35.0, 29.0, 59.0, 51.0, 48.0, 47.0, 52.0, 40.0, 52.0, 55.0, 46.0, 38.0, 36.0, 32.0, 28.0, 35.0, 20.0, 23.0, 14.0, 13.0, 12.0, 9.0, 10.0, 8.0, 4.0, 3.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.361328125, -2.287353515625, -2.21337890625, -2.139404296875, -2.0654296875, -1.991455078125, -1.91748046875, -1.843505859375, -1.76953125, -1.695556640625, -1.62158203125, -1.547607421875, -1.4736328125, -1.399658203125, -1.32568359375, -1.251708984375, -1.177734375, -1.103759765625, -1.02978515625, -0.955810546875, -0.8818359375, -0.807861328125, -0.73388671875, -0.659912109375, -0.5859375, -0.511962890625, -0.43798828125, -0.364013671875, -0.2900390625, -0.216064453125, -0.14208984375, -0.068115234375, 0.005859375, 0.079833984375, 0.15380859375, 0.227783203125, 0.3017578125, 0.375732421875, 0.44970703125, 0.523681640625, 0.59765625, 0.671630859375, 0.74560546875, 0.819580078125, 0.8935546875, 0.967529296875, 1.04150390625, 1.115478515625, 1.189453125, 1.263427734375, 1.33740234375, 1.411376953125, 1.4853515625, 1.559326171875, 1.63330078125, 1.707275390625, 1.78125, 1.855224609375, 1.92919921875, 2.003173828125, 2.0771484375, 2.151123046875, 2.22509765625, 2.299072265625, 2.373046875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 8.0, 16.0, 13.0, 17.0, 27.0, 57.0, 62.0, 84.0, 120.0, 193.0, 314.0, 457.0, 782.0, 1543.0, 4147.0, 18029.0, 134369.0, 646566.0, 206290.0, 25898.0, 5408.0, 1883.0, 874.0, 510.0, 297.0, 185.0, 118.0, 82.0, 57.0, 44.0, 21.0, 20.0, 17.0, 11.0, 11.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.046875, -8.7412109375, -8.435546875, -8.1298828125, -7.82421875, -7.5185546875, -7.212890625, -6.9072265625, -6.6015625, -6.2958984375, -5.990234375, -5.6845703125, -5.37890625, -5.0732421875, -4.767578125, -4.4619140625, -4.15625, -3.8505859375, -3.544921875, -3.2392578125, -2.93359375, -2.6279296875, -2.322265625, -2.0166015625, -1.7109375, -1.4052734375, -1.099609375, -0.7939453125, -0.48828125, -0.1826171875, 0.123046875, 0.4287109375, 0.734375, 1.0400390625, 1.345703125, 1.6513671875, 1.95703125, 2.2626953125, 2.568359375, 2.8740234375, 3.1796875, 3.4853515625, 3.791015625, 4.0966796875, 4.40234375, 4.7080078125, 5.013671875, 5.3193359375, 5.625, 5.9306640625, 6.236328125, 6.5419921875, 6.84765625, 7.1533203125, 7.458984375, 7.7646484375, 8.0703125, 8.3759765625, 8.681640625, 8.9873046875, 9.29296875, 9.5986328125, 9.904296875, 10.2099609375, 10.515625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 2.0, 4.0, 5.0, 6.0, 15.0, 7.0, 14.0, 17.0, 24.0, 26.0, 33.0, 49.0, 34.0, 64.0, 62.0, 51.0, 50.0, 80.0, 56.0, 51.0, 45.0, 58.0, 39.0, 47.0, 34.0, 23.0, 19.0, 17.0, 11.0, 16.0, 7.0, 9.0, 9.0, 7.0, 4.0, 5.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.046875, -15.580322265625, -15.11376953125, -14.647216796875, -14.1806640625, -13.714111328125, -13.24755859375, -12.781005859375, -12.314453125, -11.847900390625, -11.38134765625, -10.914794921875, -10.4482421875, -9.981689453125, -9.51513671875, -9.048583984375, -8.58203125, -8.115478515625, -7.64892578125, -7.182373046875, -6.7158203125, -6.249267578125, -5.78271484375, -5.316162109375, -4.849609375, -4.383056640625, -3.91650390625, -3.449951171875, -2.9833984375, -2.516845703125, -2.05029296875, -1.583740234375, -1.1171875, -0.650634765625, -0.18408203125, 0.282470703125, 0.7490234375, 1.215576171875, 1.68212890625, 2.148681640625, 2.615234375, 3.081787109375, 3.54833984375, 4.014892578125, 4.4814453125, 4.947998046875, 5.41455078125, 5.881103515625, 6.34765625, 6.814208984375, 7.28076171875, 7.747314453125, 8.2138671875, 8.680419921875, 9.14697265625, 9.613525390625, 10.080078125, 10.546630859375, 11.01318359375, 11.479736328125, 11.9462890625, 12.412841796875, 12.87939453125, 13.345947265625, 13.8125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 6.0, 6.0, 15.0, 13.0, 18.0, 18.0, 38.0, 49.0, 66.0, 68.0, 153.0, 206.0, 405.0, 774.0, 1860.0, 5560.0, 28657.0, 312214.0, 622707.0, 61498.0, 9218.0, 2662.0, 1035.0, 513.0, 293.0, 170.0, 113.0, 71.0, 51.0, 19.0, 21.0, 13.0, 13.0, 9.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.77734375, -4.6077880859375, -4.438232421875, -4.2686767578125, -4.09912109375, -3.9295654296875, -3.760009765625, -3.5904541015625, -3.4208984375, -3.2513427734375, -3.081787109375, -2.9122314453125, -2.74267578125, -2.5731201171875, -2.403564453125, -2.2340087890625, -2.064453125, -1.8948974609375, -1.725341796875, -1.5557861328125, -1.38623046875, -1.2166748046875, -1.047119140625, -0.8775634765625, -0.7080078125, -0.5384521484375, -0.368896484375, -0.1993408203125, -0.02978515625, 0.1397705078125, 0.309326171875, 0.4788818359375, 0.6484375, 0.8179931640625, 0.987548828125, 1.1571044921875, 1.32666015625, 1.4962158203125, 1.665771484375, 1.8353271484375, 2.0048828125, 2.1744384765625, 2.343994140625, 2.5135498046875, 2.68310546875, 2.8526611328125, 3.022216796875, 3.1917724609375, 3.361328125, 3.5308837890625, 3.700439453125, 3.8699951171875, 4.03955078125, 4.2091064453125, 4.378662109375, 4.5482177734375, 4.7177734375, 4.8873291015625, 5.056884765625, 5.2264404296875, 5.39599609375, 5.5655517578125, 5.735107421875, 5.9046630859375, 6.07421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 14.0, 8.0, 12.0, 19.0, 30.0, 36.0, 36.0, 53.0, 85.0, 68.0, 76.0, 86.0, 90.0, 76.0, 63.0, 49.0, 45.0, 34.0, 27.0, 21.0, 15.0, 9.0, 10.0, 5.0, 8.0, 1.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004684925079345703, -0.00045326724648475647, -0.0004380419850349426, -0.0004228167235851288, -0.00040759146213531494, -0.0003923662006855011, -0.00037714093923568726, -0.0003619156777858734, -0.00034669041633605957, -0.00033146515488624573, -0.0003162398934364319, -0.00030101463198661804, -0.0002857893705368042, -0.00027056410908699036, -0.0002553388476371765, -0.00024011358618736267, -0.00022488832473754883, -0.00020966306328773499, -0.00019443780183792114, -0.0001792125403881073, -0.00016398727893829346, -0.00014876201748847961, -0.00013353675603866577, -0.00011831149458885193, -0.00010308623313903809, -8.786097168922424e-05, -7.26357102394104e-05, -5.741044878959656e-05, -4.2185187339782715e-05, -2.6959925889968872e-05, -1.173466444015503e-05, 3.4905970096588135e-06, 1.8715858459472656e-05, 3.39411199092865e-05, 4.916638135910034e-05, 6.439164280891418e-05, 7.961690425872803e-05, 9.484216570854187e-05, 0.00011006742715835571, 0.00012529268860816956, 0.0001405179500579834, 0.00015574321150779724, 0.00017096847295761108, 0.00018619373440742493, 0.00020141899585723877, 0.0002166442573070526, 0.00023186951875686646, 0.0002470947802066803, 0.00026232004165649414, 0.000277545303106308, 0.0002927705645561218, 0.00030799582600593567, 0.0003232210874557495, 0.00033844634890556335, 0.0003536716103553772, 0.00036889687180519104, 0.0003841221332550049, 0.0003993473947048187, 0.00041457265615463257, 0.0004297979176044464, 0.00044502317905426025, 0.0004602484405040741, 0.00047547370195388794, 0.0004906989634037018, 0.0005059242248535156]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 4.0, 6.0, 9.0, 6.0, 15.0, 32.0, 39.0, 62.0, 143.0, 306.0, 711.0, 2384.0, 16077.0, 380260.0, 617595.0, 26136.0, 3288.0, 831.0, 317.0, 136.0, 72.0, 48.0, 26.0, 13.0, 15.0, 9.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.43359375, -6.19610595703125, -5.9586181640625, -5.72113037109375, -5.483642578125, -5.24615478515625, -5.0086669921875, -4.77117919921875, -4.53369140625, -4.29620361328125, -4.0587158203125, -3.82122802734375, -3.583740234375, -3.34625244140625, -3.1087646484375, -2.87127685546875, -2.6337890625, -2.39630126953125, -2.1588134765625, -1.92132568359375, -1.683837890625, -1.44635009765625, -1.2088623046875, -0.97137451171875, -0.73388671875, -0.49639892578125, -0.2589111328125, -0.02142333984375, 0.216064453125, 0.45355224609375, 0.6910400390625, 0.92852783203125, 1.166015625, 1.40350341796875, 1.6409912109375, 1.87847900390625, 2.115966796875, 2.35345458984375, 2.5909423828125, 2.82843017578125, 3.06591796875, 3.30340576171875, 3.5408935546875, 3.77838134765625, 4.015869140625, 4.25335693359375, 4.4908447265625, 4.72833251953125, 4.9658203125, 5.20330810546875, 5.4407958984375, 5.67828369140625, 5.915771484375, 6.15325927734375, 6.3907470703125, 6.62823486328125, 6.86572265625, 7.10321044921875, 7.3406982421875, 7.57818603515625, 7.815673828125, 8.05316162109375, 8.2906494140625, 8.52813720703125, 8.765625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 11.0, 28.0, 54.0, 88.0, 180.0, 226.0, 197.0, 112.0, 56.0, 27.0, 7.0, 6.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.34765625, -4.98236083984375, -4.6170654296875, -4.25177001953125, -3.886474609375, -3.52117919921875, -3.1558837890625, -2.79058837890625, -2.42529296875, -2.05999755859375, -1.6947021484375, -1.32940673828125, -0.964111328125, -0.59881591796875, -0.2335205078125, 0.13177490234375, 0.4970703125, 0.86236572265625, 1.2276611328125, 1.59295654296875, 1.958251953125, 2.32354736328125, 2.6888427734375, 3.05413818359375, 3.41943359375, 3.78472900390625, 4.1500244140625, 4.51531982421875, 4.880615234375, 5.24591064453125, 5.6112060546875, 5.97650146484375, 6.341796875, 6.70709228515625, 7.0723876953125, 7.43768310546875, 7.802978515625, 8.16827392578125, 8.5335693359375, 8.89886474609375, 9.26416015625, 9.62945556640625, 9.9947509765625, 10.36004638671875, 10.725341796875, 11.09063720703125, 11.4559326171875, 11.82122802734375, 12.1865234375, 12.55181884765625, 12.9171142578125, 13.28240966796875, 13.647705078125, 14.01300048828125, 14.3782958984375, 14.74359130859375, 15.10888671875, 15.47418212890625, 15.8394775390625, 16.20477294921875, 16.570068359375, 16.93536376953125, 17.3006591796875, 17.66595458984375, 18.03125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 9.0, 30.0, 63.0, 129.0, 208.0, 254.0, 167.0, 88.0, 33.0, 16.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.628143310546875, -42.76857376098633, -38.90900421142578, -35.04943084716797, -31.189863204956055, -27.330293655395508, -23.470722198486328, -19.61115264892578, -15.751583099365234, -11.892013549804688, -8.032443046569824, -4.172872543334961, -0.31330299377441406, 3.546266555786133, 7.4058380126953125, 11.26540756225586, 15.124977111816406, 18.984546661376953, 22.8441162109375, 26.70368766784668, 30.563257217407227, 34.422828674316406, 38.28239822387695, 42.1419677734375, 46.00153732299805, 49.861106872558594, 53.72067642211914, 57.58024597167969, 61.4398193359375, 65.29938507080078, 69.1589584350586, 73.01852416992188, 76.87809753417969, 80.7376708984375, 84.59723663330078, 88.4568099975586, 92.31637573242188, 96.17594909667969, 100.0355224609375, 103.89508819580078, 107.75465393066406, 111.61422729492188, 115.47379302978516, 119.33336639404297, 123.19293212890625, 127.05250549316406, 130.91207885742188, 134.77163696289062, 138.6312255859375, 142.4907989501953, 146.35037231445312, 150.20993041992188, 154.0695037841797, 157.9290771484375, 161.7886505126953, 165.64822387695312, 169.50778198242188, 173.3673553466797, 177.2269287109375, 181.08648681640625, 184.94606018066406, 188.80563354492188, 192.6652069091797, 196.5247802734375, 200.38433837890625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 0.0, 5.0, 5.0, 4.0, 2.0, 8.0, 6.0, 11.0, 13.0, 17.0, 18.0, 25.0, 29.0, 27.0, 22.0, 38.0, 38.0, 40.0, 55.0, 39.0, 55.0, 36.0, 52.0, 45.0, 42.0, 62.0, 49.0, 36.0, 31.0, 25.0, 28.0, 24.0, 15.0, 16.0, 15.0, 15.0, 5.0, 7.0, 12.0, 11.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.16802215576172, -44.405155181884766, -42.64228820800781, -40.879425048828125, -39.11655807495117, -37.35369110107422, -35.590824127197266, -33.82795715332031, -32.06509017944336, -30.302223205566406, -28.539358139038086, -26.776491165161133, -25.01362419128418, -23.25075912475586, -21.487892150878906, -19.725025177001953, -17.962160110473633, -16.19929313659668, -14.436427116394043, -12.673561096191406, -10.910694122314453, -9.147828102111816, -7.38496208190918, -5.622095108032227, -3.85922908782959, -2.096362590789795, -0.3334963321685791, 1.4293699264526367, 3.1922364234924316, 4.955102920532227, 6.717968940734863, 8.480835914611816, 10.243701934814453, 12.00656795501709, 13.769434928894043, 15.53230094909668, 17.295167922973633, 19.058032989501953, 20.820899963378906, 22.58376693725586, 24.346633911132812, 26.109500885009766, 27.872365951538086, 29.63523292541504, 31.398099899291992, 33.16096496582031, 34.923831939697266, 36.68669891357422, 38.449562072753906, 40.21242904663086, 41.97529602050781, 43.7381591796875, 45.50102615356445, 47.263893127441406, 49.02676010131836, 50.78962707519531, 52.552494049072266, 54.31536102294922, 56.07822799682617, 57.841094970703125, 59.60395812988281, 61.366825103759766, 63.12969207763672, 64.89256286621094, 66.65542602539062]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 14.0, 26.0, 28.0, 44.0, 93.0, 142.0, 252.0, 480.0, 788.0, 1609.0, 3875.0, 12027.0, 58492.0, 3979652.0, 109536.0, 17722.0, 5166.0, 2076.0, 961.0, 520.0, 285.0, 198.0, 111.0, 60.0, 36.0, 23.0, 17.0, 10.0, 7.0, 4.0, 6.0, 2.0, 0.0, 0.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.88671875, -6.62823486328125, -6.3697509765625, -6.11126708984375, -5.852783203125, -5.59429931640625, -5.3358154296875, -5.07733154296875, -4.81884765625, -4.56036376953125, -4.3018798828125, -4.04339599609375, -3.784912109375, -3.52642822265625, -3.2679443359375, -3.00946044921875, -2.7509765625, -2.49249267578125, -2.2340087890625, -1.97552490234375, -1.717041015625, -1.45855712890625, -1.2000732421875, -0.94158935546875, -0.68310546875, -0.42462158203125, -0.1661376953125, 0.09234619140625, 0.350830078125, 0.60931396484375, 0.8677978515625, 1.12628173828125, 1.384765625, 1.64324951171875, 1.9017333984375, 2.16021728515625, 2.418701171875, 2.67718505859375, 2.9356689453125, 3.19415283203125, 3.45263671875, 3.71112060546875, 3.9696044921875, 4.22808837890625, 4.486572265625, 4.74505615234375, 5.0035400390625, 5.26202392578125, 5.5205078125, 5.77899169921875, 6.0374755859375, 6.29595947265625, 6.554443359375, 6.81292724609375, 7.0714111328125, 7.32989501953125, 7.58837890625, 7.84686279296875, 8.1053466796875, 8.36383056640625, 8.622314453125, 8.88079833984375, 9.1392822265625, 9.39776611328125, 9.65625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 6.0, 9.0, 6.0, 5.0, 15.0, 17.0, 26.0, 24.0, 31.0, 52.0, 40.0, 50.0, 60.0, 68.0, 82.0, 61.0, 68.0, 67.0, 51.0, 50.0, 33.0, 28.0, 23.0, 22.0, 18.0, 30.0, 14.0, 9.0, 10.0, 4.0, 5.0, 1.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.46875, -2.367767333984375, -2.26678466796875, -2.165802001953125, -2.0648193359375, -1.963836669921875, -1.86285400390625, -1.761871337890625, -1.660888671875, -1.559906005859375, -1.45892333984375, -1.357940673828125, -1.2569580078125, -1.155975341796875, -1.05499267578125, -0.954010009765625, -0.85302734375, -0.752044677734375, -0.65106201171875, -0.550079345703125, -0.4490966796875, -0.348114013671875, -0.24713134765625, -0.146148681640625, -0.045166015625, 0.055816650390625, 0.15679931640625, 0.257781982421875, 0.3587646484375, 0.459747314453125, 0.56072998046875, 0.661712646484375, 0.7626953125, 0.863677978515625, 0.96466064453125, 1.065643310546875, 1.1666259765625, 1.267608642578125, 1.36859130859375, 1.469573974609375, 1.570556640625, 1.671539306640625, 1.77252197265625, 1.873504638671875, 1.9744873046875, 2.075469970703125, 2.17645263671875, 2.277435302734375, 2.37841796875, 2.479400634765625, 2.58038330078125, 2.681365966796875, 2.7823486328125, 2.883331298828125, 2.98431396484375, 3.085296630859375, 3.186279296875, 3.287261962890625, 3.38824462890625, 3.489227294921875, 3.5902099609375, 3.691192626953125, 3.79217529296875, 3.893157958984375, 3.994140625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 0.0, 3.0, 8.0, 3.0, 19.0, 18.0, 26.0, 26.0, 33.0, 43.0, 67.0, 98.0, 146.0, 225.0, 400.0, 672.0, 1283.0, 2612.0, 5979.0, 15580.0, 58535.0, 3499236.0, 537313.0, 47826.0, 13527.0, 5316.0, 2445.0, 1149.0, 658.0, 341.0, 239.0, 141.0, 98.0, 49.0, 49.0, 27.0, 28.0, 22.0, 12.0, 9.0, 6.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.96875, -5.76934814453125, -5.5699462890625, -5.37054443359375, -5.171142578125, -4.97174072265625, -4.7723388671875, -4.57293701171875, -4.37353515625, -4.17413330078125, -3.9747314453125, -3.77532958984375, -3.575927734375, -3.37652587890625, -3.1771240234375, -2.97772216796875, -2.7783203125, -2.57891845703125, -2.3795166015625, -2.18011474609375, -1.980712890625, -1.78131103515625, -1.5819091796875, -1.38250732421875, -1.18310546875, -0.98370361328125, -0.7843017578125, -0.58489990234375, -0.385498046875, -0.18609619140625, 0.0133056640625, 0.21270751953125, 0.412109375, 0.61151123046875, 0.8109130859375, 1.01031494140625, 1.209716796875, 1.40911865234375, 1.6085205078125, 1.80792236328125, 2.00732421875, 2.20672607421875, 2.4061279296875, 2.60552978515625, 2.804931640625, 3.00433349609375, 3.2037353515625, 3.40313720703125, 3.6025390625, 3.80194091796875, 4.0013427734375, 4.20074462890625, 4.400146484375, 4.59954833984375, 4.7989501953125, 4.99835205078125, 5.19775390625, 5.39715576171875, 5.5965576171875, 5.79595947265625, 5.995361328125, 6.19476318359375, 6.3941650390625, 6.59356689453125, 6.79296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 5.0, 12.0, 15.0, 29.0, 44.0, 57.0, 135.0, 383.0, 2967.0, 202.0, 81.0, 38.0, 27.0, 18.0, 13.0, 9.0, 9.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.9658203125, -1.91156005859375, -1.8572998046875, -1.80303955078125, -1.748779296875, -1.69451904296875, -1.6402587890625, -1.58599853515625, -1.53173828125, -1.47747802734375, -1.4232177734375, -1.36895751953125, -1.314697265625, -1.26043701171875, -1.2061767578125, -1.15191650390625, -1.09765625, -1.04339599609375, -0.9891357421875, -0.93487548828125, -0.880615234375, -0.82635498046875, -0.7720947265625, -0.71783447265625, -0.66357421875, -0.60931396484375, -0.5550537109375, -0.50079345703125, -0.446533203125, -0.39227294921875, -0.3380126953125, -0.28375244140625, -0.2294921875, -0.17523193359375, -0.1209716796875, -0.06671142578125, -0.012451171875, 0.04180908203125, 0.0960693359375, 0.15032958984375, 0.20458984375, 0.25885009765625, 0.3131103515625, 0.36737060546875, 0.421630859375, 0.47589111328125, 0.5301513671875, 0.58441162109375, 0.638671875, 0.69293212890625, 0.7471923828125, 0.80145263671875, 0.855712890625, 0.90997314453125, 0.9642333984375, 1.01849365234375, 1.07275390625, 1.12701416015625, 1.1812744140625, 1.23553466796875, 1.289794921875, 1.34405517578125, 1.3983154296875, 1.45257568359375, 1.5068359375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 11.0, 15.0, 40.0, 81.0, 123.0, 151.0, 202.0, 161.0, 96.0, 59.0, 38.0, 8.0, 8.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.50107192993164, -16.143199920654297, -15.785329818725586, -15.427458763122559, -15.069587707519531, -14.711715698242188, -14.35384464263916, -13.995973587036133, -13.638102531433105, -13.280231475830078, -12.92236042022705, -12.564489364624023, -12.20661735534668, -11.848746299743652, -11.490875244140625, -11.133004188537598, -10.77513313293457, -10.417262077331543, -10.059391021728516, -9.701519966125488, -9.343648910522461, -8.985776901245117, -8.62790584564209, -8.270034790039062, -7.912163734436035, -7.554292678833008, -7.1964216232299805, -6.838550090789795, -6.480679035186768, -6.12280797958374, -5.764936447143555, -5.407065391540527, -5.0491943359375, -4.691323280334473, -4.333452224731445, -3.9755806922912598, -3.6177096366882324, -3.259838581085205, -2.9019672870635986, -2.544095993041992, -2.186224937438965, -1.828353762626648, -1.470482587814331, -1.1126114130020142, -0.7547402381896973, -0.39686906337738037, -0.03899788856506348, 0.31887340545654297, 0.6767444610595703, 1.0346156358718872, 1.392486810684204, 1.750357985496521, 2.108229160308838, 2.4661002159118652, 2.8239715099334717, 3.181842803955078, 3.5397138595581055, 3.897584915161133, 4.25545597076416, 4.613327503204346, 4.971198558807373, 5.3290696144104, 5.686941146850586, 6.044812202453613, 6.402683258056641]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 7.0, 9.0, 8.0, 7.0, 10.0, 11.0, 19.0, 10.0, 22.0, 22.0, 24.0, 25.0, 27.0, 36.0, 29.0, 35.0, 47.0, 38.0, 37.0, 44.0, 46.0, 39.0, 55.0, 37.0, 39.0, 35.0, 27.0, 35.0, 31.0, 26.0, 25.0, 18.0, 19.0, 23.0, 19.0, 10.0, 11.0, 8.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7666194438934326, -3.6550705432891846, -3.5435218811035156, -3.4319729804992676, -3.3204240798950195, -3.2088751792907715, -3.0973265171051025, -2.9857776165008545, -2.8742289543151855, -2.7626800537109375, -2.6511313915252686, -2.5395824909210205, -2.4280335903167725, -2.3164849281311035, -2.2049360275268555, -2.0933871269226074, -1.9818382263183594, -1.8702894449234009, -1.7587405443191528, -1.6471917629241943, -1.5356428623199463, -1.4240940809249878, -1.3125452995300293, -1.2009963989257812, -1.0894476175308228, -0.9778987765312195, -0.8663499355316162, -0.7548011541366577, -0.6432523131370544, -0.5317034721374512, -0.4201546907424927, -0.3086058497428894, -0.19705724716186523, -0.08550842106342316, 0.02604040503501892, 0.1375892162322998, 0.24913805723190308, 0.36068689823150635, 0.47223567962646484, 0.5837845206260681, 0.6953333616256714, 0.8068822026252747, 0.9184310436248779, 1.0299798250198364, 1.141528606414795, 1.253077507019043, 1.3646262884140015, 1.47617506980896, 1.587723970413208, 1.6992727518081665, 1.8108216524124146, 1.922370433807373, 2.033919334411621, 2.145468235015869, 2.257016897201538, 2.368565797805786, 2.480114459991455, 2.591663360595703, 2.703212022781372, 2.81476092338562, 2.926309823989868, 3.037858486175537, 3.149407386779785, 3.260956287384033, 3.3725051879882812]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 21.0, 20.0, 39.0, 53.0, 66.0, 103.0, 151.0, 207.0, 405.0, 537.0, 840.0, 1278.0, 2111.0, 3528.0, 6176.0, 10732.0, 19413.0, 35917.0, 67055.0, 120388.0, 187857.0, 213212.0, 162665.0, 97247.0, 53205.0, 28228.0, 15501.0, 8715.0, 4980.0, 2888.0, 1846.0, 1058.0, 681.0, 446.0, 297.0, 184.0, 141.0, 99.0, 74.0, 59.0, 36.0, 22.0, 15.0, 14.0, 8.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0], "bins": [-2.638671875, -2.5570068359375, -2.475341796875, -2.3936767578125, -2.31201171875, -2.2303466796875, -2.148681640625, -2.0670166015625, -1.9853515625, -1.9036865234375, -1.822021484375, -1.7403564453125, -1.65869140625, -1.5770263671875, -1.495361328125, -1.4136962890625, -1.33203125, -1.2503662109375, -1.168701171875, -1.0870361328125, -1.00537109375, -0.9237060546875, -0.842041015625, -0.7603759765625, -0.6787109375, -0.5970458984375, -0.515380859375, -0.4337158203125, -0.35205078125, -0.2703857421875, -0.188720703125, -0.1070556640625, -0.025390625, 0.0562744140625, 0.137939453125, 0.2196044921875, 0.30126953125, 0.3829345703125, 0.464599609375, 0.5462646484375, 0.6279296875, 0.7095947265625, 0.791259765625, 0.8729248046875, 0.95458984375, 1.0362548828125, 1.117919921875, 1.1995849609375, 1.28125, 1.3629150390625, 1.444580078125, 1.5262451171875, 1.60791015625, 1.6895751953125, 1.771240234375, 1.8529052734375, 1.9345703125, 2.0162353515625, 2.097900390625, 2.1795654296875, 2.26123046875, 2.3428955078125, 2.424560546875, 2.5062255859375, 2.587890625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 8.0, 5.0, 11.0, 9.0, 15.0, 13.0, 19.0, 14.0, 26.0, 30.0, 38.0, 34.0, 39.0, 55.0, 64.0, 60.0, 57.0, 63.0, 54.0, 49.0, 55.0, 57.0, 41.0, 28.0, 26.0, 26.0, 17.0, 15.0, 11.0, 13.0, 13.0, 7.0, 7.0, 2.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.396484375, -2.304840087890625, -2.21319580078125, -2.121551513671875, -2.0299072265625, -1.938262939453125, -1.84661865234375, -1.754974365234375, -1.663330078125, -1.571685791015625, -1.48004150390625, -1.388397216796875, -1.2967529296875, -1.205108642578125, -1.11346435546875, -1.021820068359375, -0.93017578125, -0.838531494140625, -0.74688720703125, -0.655242919921875, -0.5635986328125, -0.471954345703125, -0.38031005859375, -0.288665771484375, -0.197021484375, -0.105377197265625, -0.01373291015625, 0.077911376953125, 0.1695556640625, 0.261199951171875, 0.35284423828125, 0.444488525390625, 0.5361328125, 0.627777099609375, 0.71942138671875, 0.811065673828125, 0.9027099609375, 0.994354248046875, 1.08599853515625, 1.177642822265625, 1.269287109375, 1.360931396484375, 1.45257568359375, 1.544219970703125, 1.6358642578125, 1.727508544921875, 1.81915283203125, 1.910797119140625, 2.00244140625, 2.094085693359375, 2.18572998046875, 2.277374267578125, 2.3690185546875, 2.460662841796875, 2.55230712890625, 2.643951416015625, 2.735595703125, 2.827239990234375, 2.91888427734375, 3.010528564453125, 3.1021728515625, 3.193817138671875, 3.28546142578125, 3.377105712890625, 3.46875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 11.0, 22.0, 39.0, 47.0, 113.0, 158.0, 372.0, 711.0, 1927.0, 8999.0, 120073.0, 819021.0, 86624.0, 7338.0, 1744.0, 622.0, 314.0, 169.0, 104.0, 50.0, 34.0, 22.0, 11.0, 10.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.90625, -12.495849609375, -12.08544921875, -11.675048828125, -11.2646484375, -10.854248046875, -10.44384765625, -10.033447265625, -9.623046875, -9.212646484375, -8.80224609375, -8.391845703125, -7.9814453125, -7.571044921875, -7.16064453125, -6.750244140625, -6.33984375, -5.929443359375, -5.51904296875, -5.108642578125, -4.6982421875, -4.287841796875, -3.87744140625, -3.467041015625, -3.056640625, -2.646240234375, -2.23583984375, -1.825439453125, -1.4150390625, -1.004638671875, -0.59423828125, -0.183837890625, 0.2265625, 0.636962890625, 1.04736328125, 1.457763671875, 1.8681640625, 2.278564453125, 2.68896484375, 3.099365234375, 3.509765625, 3.920166015625, 4.33056640625, 4.740966796875, 5.1513671875, 5.561767578125, 5.97216796875, 6.382568359375, 6.79296875, 7.203369140625, 7.61376953125, 8.024169921875, 8.4345703125, 8.844970703125, 9.25537109375, 9.665771484375, 10.076171875, 10.486572265625, 10.89697265625, 11.307373046875, 11.7177734375, 12.128173828125, 12.53857421875, 12.948974609375, 13.359375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 11.0, 9.0, 7.0, 7.0, 20.0, 21.0, 19.0, 28.0, 32.0, 38.0, 33.0, 36.0, 45.0, 47.0, 57.0, 64.0, 62.0, 58.0, 40.0, 53.0, 48.0, 33.0, 27.0, 35.0, 26.0, 27.0, 19.0, 23.0, 14.0, 17.0, 8.0, 4.0, 8.0, 5.0, 6.0, 1.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-16.046875, -15.597412109375, -15.14794921875, -14.698486328125, -14.2490234375, -13.799560546875, -13.35009765625, -12.900634765625, -12.451171875, -12.001708984375, -11.55224609375, -11.102783203125, -10.6533203125, -10.203857421875, -9.75439453125, -9.304931640625, -8.85546875, -8.406005859375, -7.95654296875, -7.507080078125, -7.0576171875, -6.608154296875, -6.15869140625, -5.709228515625, -5.259765625, -4.810302734375, -4.36083984375, -3.911376953125, -3.4619140625, -3.012451171875, -2.56298828125, -2.113525390625, -1.6640625, -1.214599609375, -0.76513671875, -0.315673828125, 0.1337890625, 0.583251953125, 1.03271484375, 1.482177734375, 1.931640625, 2.381103515625, 2.83056640625, 3.280029296875, 3.7294921875, 4.178955078125, 4.62841796875, 5.077880859375, 5.52734375, 5.976806640625, 6.42626953125, 6.875732421875, 7.3251953125, 7.774658203125, 8.22412109375, 8.673583984375, 9.123046875, 9.572509765625, 10.02197265625, 10.471435546875, 10.9208984375, 11.370361328125, 11.81982421875, 12.269287109375, 12.71875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 9.0, 13.0, 20.0, 32.0, 43.0, 58.0, 85.0, 108.0, 204.0, 362.0, 834.0, 2993.0, 23448.0, 671209.0, 332619.0, 12908.0, 2100.0, 687.0, 325.0, 165.0, 111.0, 62.0, 43.0, 29.0, 25.0, 16.0, 6.0, 11.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.44921875, -7.24163818359375, -7.0340576171875, -6.82647705078125, -6.618896484375, -6.41131591796875, -6.2037353515625, -5.99615478515625, -5.78857421875, -5.58099365234375, -5.3734130859375, -5.16583251953125, -4.958251953125, -4.75067138671875, -4.5430908203125, -4.33551025390625, -4.1279296875, -3.92034912109375, -3.7127685546875, -3.50518798828125, -3.297607421875, -3.09002685546875, -2.8824462890625, -2.67486572265625, -2.46728515625, -2.25970458984375, -2.0521240234375, -1.84454345703125, -1.636962890625, -1.42938232421875, -1.2218017578125, -1.01422119140625, -0.806640625, -0.59906005859375, -0.3914794921875, -0.18389892578125, 0.023681640625, 0.23126220703125, 0.4388427734375, 0.64642333984375, 0.85400390625, 1.06158447265625, 1.2691650390625, 1.47674560546875, 1.684326171875, 1.89190673828125, 2.0994873046875, 2.30706787109375, 2.5146484375, 2.72222900390625, 2.9298095703125, 3.13739013671875, 3.344970703125, 3.55255126953125, 3.7601318359375, 3.96771240234375, 4.17529296875, 4.38287353515625, 4.5904541015625, 4.79803466796875, 5.005615234375, 5.21319580078125, 5.4207763671875, 5.62835693359375, 5.8359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 7.0, 10.0, 18.0, 27.0, 36.0, 59.0, 105.0, 128.0, 157.0, 135.0, 121.0, 78.0, 46.0, 34.0, 17.0, 8.0, 12.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00070953369140625, -0.0006847977638244629, -0.0006600618362426758, -0.0006353259086608887, -0.0006105899810791016, -0.0005858540534973145, -0.0005611181259155273, -0.0005363821983337402, -0.0005116462707519531, -0.000486910343170166, -0.0004621744155883789, -0.0004374384880065918, -0.0004127025604248047, -0.0003879666328430176, -0.00036323070526123047, -0.00033849477767944336, -0.00031375885009765625, -0.00028902292251586914, -0.00026428699493408203, -0.00023955106735229492, -0.0002148151397705078, -0.0001900792121887207, -0.0001653432846069336, -0.00014060735702514648, -0.00011587142944335938, -9.113550186157227e-05, -6.639957427978516e-05, -4.166364669799805e-05, -1.6927719116210938e-05, 7.808208465576172e-06, 3.254413604736328e-05, 5.728006362915039e-05, 8.20159912109375e-05, 0.00010675191879272461, 0.00013148784637451172, 0.00015622377395629883, 0.00018095970153808594, 0.00020569562911987305, 0.00023043155670166016, 0.00025516748428344727, 0.0002799034118652344, 0.0003046393394470215, 0.0003293752670288086, 0.0003541111946105957, 0.0003788471221923828, 0.0004035830497741699, 0.00042831897735595703, 0.00045305490493774414, 0.00047779083251953125, 0.0005025267601013184, 0.0005272626876831055, 0.0005519986152648926, 0.0005767345428466797, 0.0006014704704284668, 0.0006262063980102539, 0.000650942325592041, 0.0006756782531738281, 0.0007004141807556152, 0.0007251501083374023, 0.0007498860359191895, 0.0007746219635009766, 0.0007993578910827637, 0.0008240938186645508, 0.0008488297462463379, 0.000873565673828125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 10.0, 7.0, 14.0, 24.0, 34.0, 44.0, 92.0, 141.0, 205.0, 396.0, 848.0, 2165.0, 7979.0, 59432.0, 666418.0, 280261.0, 23316.0, 4374.0, 1349.0, 625.0, 330.0, 188.0, 98.0, 63.0, 39.0, 27.0, 20.0, 13.0, 7.0, 7.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3046875, -5.147705078125, -4.99072265625, -4.833740234375, -4.6767578125, -4.519775390625, -4.36279296875, -4.205810546875, -4.048828125, -3.891845703125, -3.73486328125, -3.577880859375, -3.4208984375, -3.263916015625, -3.10693359375, -2.949951171875, -2.79296875, -2.635986328125, -2.47900390625, -2.322021484375, -2.1650390625, -2.008056640625, -1.85107421875, -1.694091796875, -1.537109375, -1.380126953125, -1.22314453125, -1.066162109375, -0.9091796875, -0.752197265625, -0.59521484375, -0.438232421875, -0.28125, -0.124267578125, 0.03271484375, 0.189697265625, 0.3466796875, 0.503662109375, 0.66064453125, 0.817626953125, 0.974609375, 1.131591796875, 1.28857421875, 1.445556640625, 1.6025390625, 1.759521484375, 1.91650390625, 2.073486328125, 2.23046875, 2.387451171875, 2.54443359375, 2.701416015625, 2.8583984375, 3.015380859375, 3.17236328125, 3.329345703125, 3.486328125, 3.643310546875, 3.80029296875, 3.957275390625, 4.1142578125, 4.271240234375, 4.42822265625, 4.585205078125, 4.7421875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 3.0, 9.0, 12.0, 13.0, 25.0, 23.0, 28.0, 48.0, 55.0, 54.0, 70.0, 80.0, 91.0, 86.0, 98.0, 75.0, 44.0, 42.0, 31.0, 20.0, 15.0, 15.0, 10.0, 6.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.60546875, -4.4644775390625, -4.323486328125, -4.1824951171875, -4.04150390625, -3.9005126953125, -3.759521484375, -3.6185302734375, -3.4775390625, -3.3365478515625, -3.195556640625, -3.0545654296875, -2.91357421875, -2.7725830078125, -2.631591796875, -2.4906005859375, -2.349609375, -2.2086181640625, -2.067626953125, -1.9266357421875, -1.78564453125, -1.6446533203125, -1.503662109375, -1.3626708984375, -1.2216796875, -1.0806884765625, -0.939697265625, -0.7987060546875, -0.65771484375, -0.5167236328125, -0.375732421875, -0.2347412109375, -0.09375, 0.0472412109375, 0.188232421875, 0.3292236328125, 0.47021484375, 0.6112060546875, 0.752197265625, 0.8931884765625, 1.0341796875, 1.1751708984375, 1.316162109375, 1.4571533203125, 1.59814453125, 1.7391357421875, 1.880126953125, 2.0211181640625, 2.162109375, 2.3031005859375, 2.444091796875, 2.5850830078125, 2.72607421875, 2.8670654296875, 3.008056640625, 3.1490478515625, 3.2900390625, 3.4310302734375, 3.572021484375, 3.7130126953125, 3.85400390625, 3.9949951171875, 4.135986328125, 4.2769775390625, 4.41796875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 10.0, 32.0, 71.0, 105.0, 158.0, 216.0, 194.0, 110.0, 57.0, 24.0, 11.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.5589599609375, -87.68548583984375, -84.81201171875, -81.93853759765625, -79.0650634765625, -76.19158935546875, -73.318115234375, -70.44463348388672, -67.57115936279297, -64.69768524169922, -61.82421112060547, -58.95073699951172, -56.0772590637207, -53.20378494262695, -50.3303108215332, -47.45683288574219, -44.5833625793457, -41.70988845825195, -38.8364143371582, -35.96293640136719, -33.08946228027344, -30.215988159179688, -27.342514038085938, -24.469038009643555, -21.595563888549805, -18.722089767456055, -15.848613739013672, -12.975139617919922, -10.101664543151855, -7.228189468383789, -4.354715347290039, -1.4812393188476562, 1.3922348022460938, 4.26570987701416, 7.139184474945068, 10.012659072875977, 12.886134147644043, 15.75960922241211, 18.63308334350586, 21.506559371948242, 24.380033493041992, 27.253507614135742, 30.126983642578125, 33.000457763671875, 35.873931884765625, 38.747406005859375, 41.620880126953125, 44.49435806274414, 47.36783218383789, 50.24130630493164, 53.11478042602539, 55.988258361816406, 58.861732482910156, 61.735206604003906, 64.60868072509766, 67.4821548461914, 70.35562896728516, 73.2291030883789, 76.10257720947266, 78.9760513305664, 81.84952545166016, 84.72300720214844, 87.59648132324219, 90.46995544433594, 93.34342956542969]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 8.0, 7.0, 14.0, 16.0, 14.0, 22.0, 22.0, 18.0, 33.0, 31.0, 44.0, 47.0, 46.0, 69.0, 53.0, 70.0, 66.0, 62.0, 55.0, 42.0, 45.0, 27.0, 37.0, 34.0, 18.0, 28.0, 6.0, 21.0, 13.0, 3.0, 4.0, 4.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.25326538085938, -63.185848236083984, -61.11842727661133, -59.05101013183594, -56.98359298706055, -54.916175842285156, -52.8487548828125, -50.78133773803711, -48.71392059326172, -46.64650344848633, -44.57908248901367, -42.51166534423828, -40.44424819946289, -38.3768310546875, -36.309410095214844, -34.24199295043945, -32.1745719909668, -30.107152938842773, -28.039735794067383, -25.97231674194336, -23.90489959716797, -21.837480545043945, -19.770061492919922, -17.70264434814453, -15.635225296020508, -13.5678071975708, -11.500389099121094, -9.43297004699707, -7.365551948547363, -5.298133850097656, -3.230714797973633, -1.1632966995239258, 0.9041213989257812, 2.9715397357940674, 5.0389580726623535, 7.106376647949219, 9.173794746398926, 11.241212844848633, 13.308631896972656, 15.376049995422363, 17.44346809387207, 19.510887145996094, 21.578304290771484, 23.645723342895508, 25.71314239501953, 27.780559539794922, 29.847978591918945, 31.91539764404297, 33.98281478881836, 36.05023193359375, 38.117652893066406, 40.1850700378418, 42.25248718261719, 44.319908142089844, 46.387325286865234, 48.454742431640625, 50.52216339111328, 52.58958053588867, 54.65700149536133, 56.72441864013672, 58.79183578491211, 60.8592529296875, 62.926673889160156, 64.99409484863281, 67.06150817871094]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 9.0, 19.0, 18.0, 17.0, 20.0, 42.0, 69.0, 94.0, 154.0, 230.0, 402.0, 681.0, 1268.0, 2371.0, 5147.0, 13269.0, 48918.0, 479102.0, 3544351.0, 68633.0, 16842.0, 6113.0, 2951.0, 1451.0, 817.0, 474.0, 274.0, 164.0, 101.0, 81.0, 54.0, 40.0, 31.0, 11.0, 16.0, 8.0, 3.0, 3.0, 6.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.44140625, -5.2818603515625, -5.122314453125, -4.9627685546875, -4.80322265625, -4.6436767578125, -4.484130859375, -4.3245849609375, -4.1650390625, -4.0054931640625, -3.845947265625, -3.6864013671875, -3.52685546875, -3.3673095703125, -3.207763671875, -3.0482177734375, -2.888671875, -2.7291259765625, -2.569580078125, -2.4100341796875, -2.25048828125, -2.0909423828125, -1.931396484375, -1.7718505859375, -1.6123046875, -1.4527587890625, -1.293212890625, -1.1336669921875, -0.97412109375, -0.8145751953125, -0.655029296875, -0.4954833984375, -0.3359375, -0.1763916015625, -0.016845703125, 0.1427001953125, 0.30224609375, 0.4617919921875, 0.621337890625, 0.7808837890625, 0.9404296875, 1.0999755859375, 1.259521484375, 1.4190673828125, 1.57861328125, 1.7381591796875, 1.897705078125, 2.0572509765625, 2.216796875, 2.3763427734375, 2.535888671875, 2.6954345703125, 2.85498046875, 3.0145263671875, 3.174072265625, 3.3336181640625, 3.4931640625, 3.6527099609375, 3.812255859375, 3.9718017578125, 4.13134765625, 4.2908935546875, 4.450439453125, 4.6099853515625, 4.76953125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 8.0, 7.0, 7.0, 6.0, 14.0, 21.0, 19.0, 30.0, 41.0, 43.0, 64.0, 69.0, 81.0, 81.0, 71.0, 82.0, 80.0, 59.0, 45.0, 43.0, 29.0, 29.0, 19.0, 14.0, 17.0, 6.0, 6.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.69921875, -4.58184814453125, -4.4644775390625, -4.34710693359375, -4.229736328125, -4.11236572265625, -3.9949951171875, -3.87762451171875, -3.76025390625, -3.64288330078125, -3.5255126953125, -3.40814208984375, -3.290771484375, -3.17340087890625, -3.0560302734375, -2.93865966796875, -2.8212890625, -2.70391845703125, -2.5865478515625, -2.46917724609375, -2.351806640625, -2.23443603515625, -2.1170654296875, -1.99969482421875, -1.88232421875, -1.76495361328125, -1.6475830078125, -1.53021240234375, -1.412841796875, -1.29547119140625, -1.1781005859375, -1.06072998046875, -0.943359375, -0.82598876953125, -0.7086181640625, -0.59124755859375, -0.473876953125, -0.35650634765625, -0.2391357421875, -0.12176513671875, -0.00439453125, 0.11297607421875, 0.2303466796875, 0.34771728515625, 0.465087890625, 0.58245849609375, 0.6998291015625, 0.81719970703125, 0.9345703125, 1.05194091796875, 1.1693115234375, 1.28668212890625, 1.404052734375, 1.52142333984375, 1.6387939453125, 1.75616455078125, 1.87353515625, 1.99090576171875, 2.1082763671875, 2.22564697265625, 2.343017578125, 2.46038818359375, 2.5777587890625, 2.69512939453125, 2.8125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 5.0, 6.0, 7.0, 10.0, 19.0, 30.0, 20.0, 25.0, 38.0, 66.0, 86.0, 103.0, 183.0, 261.0, 452.0, 783.0, 1661.0, 3948.0, 11717.0, 51400.0, 594119.0, 3422025.0, 81574.0, 16350.0, 5039.0, 1962.0, 925.0, 498.0, 321.0, 214.0, 114.0, 92.0, 64.0, 39.0, 30.0, 26.0, 17.0, 16.0, 15.0, 8.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.20703125, -6.0196533203125, -5.832275390625, -5.6448974609375, -5.45751953125, -5.2701416015625, -5.082763671875, -4.8953857421875, -4.7080078125, -4.5206298828125, -4.333251953125, -4.1458740234375, -3.95849609375, -3.7711181640625, -3.583740234375, -3.3963623046875, -3.208984375, -3.0216064453125, -2.834228515625, -2.6468505859375, -2.45947265625, -2.2720947265625, -2.084716796875, -1.8973388671875, -1.7099609375, -1.5225830078125, -1.335205078125, -1.1478271484375, -0.96044921875, -0.7730712890625, -0.585693359375, -0.3983154296875, -0.2109375, -0.0235595703125, 0.163818359375, 0.3511962890625, 0.53857421875, 0.7259521484375, 0.913330078125, 1.1007080078125, 1.2880859375, 1.4754638671875, 1.662841796875, 1.8502197265625, 2.03759765625, 2.2249755859375, 2.412353515625, 2.5997314453125, 2.787109375, 2.9744873046875, 3.161865234375, 3.3492431640625, 3.53662109375, 3.7239990234375, 3.911376953125, 4.0987548828125, 4.2861328125, 4.4735107421875, 4.660888671875, 4.8482666015625, 5.03564453125, 5.2230224609375, 5.410400390625, 5.5977783203125, 5.78515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 9.0, 11.0, 12.0, 32.0, 42.0, 47.0, 112.0, 215.0, 1938.0, 1050.0, 272.0, 131.0, 76.0, 39.0, 20.0, 19.0, 24.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.26953125, -3.18341064453125, -3.0972900390625, -3.01116943359375, -2.925048828125, -2.83892822265625, -2.7528076171875, -2.66668701171875, -2.58056640625, -2.49444580078125, -2.4083251953125, -2.32220458984375, -2.236083984375, -2.14996337890625, -2.0638427734375, -1.97772216796875, -1.8916015625, -1.80548095703125, -1.7193603515625, -1.63323974609375, -1.547119140625, -1.46099853515625, -1.3748779296875, -1.28875732421875, -1.20263671875, -1.11651611328125, -1.0303955078125, -0.94427490234375, -0.858154296875, -0.77203369140625, -0.6859130859375, -0.59979248046875, -0.513671875, -0.42755126953125, -0.3414306640625, -0.25531005859375, -0.169189453125, -0.08306884765625, 0.0030517578125, 0.08917236328125, 0.17529296875, 0.26141357421875, 0.3475341796875, 0.43365478515625, 0.519775390625, 0.60589599609375, 0.6920166015625, 0.77813720703125, 0.8642578125, 0.95037841796875, 1.0364990234375, 1.12261962890625, 1.208740234375, 1.29486083984375, 1.3809814453125, 1.46710205078125, 1.55322265625, 1.63934326171875, 1.7254638671875, 1.81158447265625, 1.897705078125, 1.98382568359375, 2.0699462890625, 2.15606689453125, 2.2421875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 4.0, 6.0, 7.0, 9.0, 18.0, 18.0, 19.0, 29.0, 60.0, 73.0, 64.0, 102.0, 108.0, 84.0, 74.0, 76.0, 60.0, 49.0, 36.0, 24.0, 21.0, 11.0, 6.0, 8.0, 10.0, 2.0, 2.0, 6.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.339654922485352, -7.031867980957031, -6.724080562591553, -6.416293144226074, -6.108506202697754, -5.800719261169434, -5.492931842803955, -5.185144424438477, -4.877357482910156, -4.569570541381836, -4.261783123016357, -3.953995943069458, -3.6462087631225586, -3.338421583175659, -3.0306344032287598, -2.7228472232818604, -2.415060043334961, -2.1072728633880615, -1.799485683441162, -1.4916985034942627, -1.1839113235473633, -0.8761241436004639, -0.5683369636535645, -0.26054978370666504, 0.047237396240234375, 0.3550245761871338, 0.6628117561340332, 0.9705989360809326, 1.278386116027832, 1.5861732959747314, 1.8939604759216309, 2.2017476558685303, 2.5095348358154297, 2.817322015762329, 3.1251091957092285, 3.432896375656128, 3.7406835556030273, 4.048470497131348, 4.356257915496826, 4.664045333862305, 4.971832275390625, 5.279619216918945, 5.587406635284424, 5.895194053649902, 6.202980995178223, 6.510767936706543, 6.8185553550720215, 7.1263427734375, 7.43412971496582, 7.741916656494141, 8.049703598022461, 8.357491493225098, 8.665278434753418, 8.973065376281738, 9.280853271484375, 9.588640213012695, 9.896427154541016, 10.204214096069336, 10.512001037597656, 10.819788932800293, 11.127575874328613, 11.435362815856934, 11.74315071105957, 12.05093765258789, 12.358724594116211]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 8.0, 10.0, 4.0, 14.0, 21.0, 22.0, 23.0, 19.0, 20.0, 30.0, 39.0, 42.0, 41.0, 55.0, 42.0, 51.0, 48.0, 51.0, 58.0, 49.0, 41.0, 52.0, 39.0, 35.0, 28.0, 27.0, 26.0, 10.0, 20.0, 12.0, 9.0, 14.0, 8.0, 8.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.787613868713379, -8.54937744140625, -8.311141967773438, -8.072905540466309, -7.834670066833496, -7.596434116363525, -7.358198165893555, -7.119962215423584, -6.881726264953613, -6.643490314483643, -6.405254364013672, -6.167018413543701, -5.9287824630737305, -5.69054651260376, -5.452310562133789, -5.214074611663818, -4.975838661193848, -4.737602710723877, -4.499366760253906, -4.2611308097839355, -4.022894859313965, -3.784658908843994, -3.5464229583740234, -3.3081870079040527, -3.069950580596924, -2.831714630126953, -2.5934786796569824, -2.3552427291870117, -2.117006778717041, -1.8787707090377808, -1.64053475856781, -1.4022988080978394, -1.1640629768371582, -0.9258270263671875, -0.6875910758972168, -0.4493550658226013, -0.21111911535263062, 0.027116894721984863, 0.26535284519195557, 0.5035887956619263, 0.741824746131897, 0.9800606966018677, 1.2182966470718384, 1.4565327167510986, 1.6947686672210693, 1.93300461769104, 2.1712405681610107, 2.4094765186309814, 2.647712469100952, 2.885948419570923, 3.1241843700408936, 3.3624203205108643, 3.600656270980835, 3.8388924598693848, 4.0771284103393555, 4.315364360809326, 4.553600311279297, 4.791836261749268, 5.030072212219238, 5.268308162689209, 5.50654411315918, 5.74478006362915, 5.983016014099121, 6.221251964569092, 6.4594879150390625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 8.0, 4.0, 9.0, 11.0, 20.0, 42.0, 51.0, 109.0, 192.0, 364.0, 772.0, 2013.0, 5997.0, 22300.0, 110224.0, 468676.0, 347012.0, 68689.0, 14991.0, 4245.0, 1529.0, 638.0, 276.0, 169.0, 86.0, 42.0, 30.0, 22.0, 14.0, 5.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5, -7.26458740234375, -7.0291748046875, -6.79376220703125, -6.558349609375, -6.32293701171875, -6.0875244140625, -5.85211181640625, -5.61669921875, -5.38128662109375, -5.1458740234375, -4.91046142578125, -4.675048828125, -4.43963623046875, -4.2042236328125, -3.96881103515625, -3.7333984375, -3.49798583984375, -3.2625732421875, -3.02716064453125, -2.791748046875, -2.55633544921875, -2.3209228515625, -2.08551025390625, -1.85009765625, -1.61468505859375, -1.3792724609375, -1.14385986328125, -0.908447265625, -0.67303466796875, -0.4376220703125, -0.20220947265625, 0.033203125, 0.26861572265625, 0.5040283203125, 0.73944091796875, 0.974853515625, 1.21026611328125, 1.4456787109375, 1.68109130859375, 1.91650390625, 2.15191650390625, 2.3873291015625, 2.62274169921875, 2.858154296875, 3.09356689453125, 3.3289794921875, 3.56439208984375, 3.7998046875, 4.03521728515625, 4.2706298828125, 4.50604248046875, 4.741455078125, 4.97686767578125, 5.2122802734375, 5.44769287109375, 5.68310546875, 5.91851806640625, 6.1539306640625, 6.38934326171875, 6.624755859375, 6.86016845703125, 7.0955810546875, 7.33099365234375, 7.56640625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 5.0, 12.0, 16.0, 15.0, 20.0, 20.0, 30.0, 38.0, 38.0, 41.0, 63.0, 65.0, 52.0, 64.0, 71.0, 62.0, 59.0, 66.0, 30.0, 36.0, 37.0, 26.0, 33.0, 17.0, 15.0, 14.0, 11.0, 9.0, 6.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.552734375, -3.45361328125, -3.3544921875, -3.25537109375, -3.15625, -3.05712890625, -2.9580078125, -2.85888671875, -2.759765625, -2.66064453125, -2.5615234375, -2.46240234375, -2.36328125, -2.26416015625, -2.1650390625, -2.06591796875, -1.966796875, -1.86767578125, -1.7685546875, -1.66943359375, -1.5703125, -1.47119140625, -1.3720703125, -1.27294921875, -1.173828125, -1.07470703125, -0.9755859375, -0.87646484375, -0.77734375, -0.67822265625, -0.5791015625, -0.47998046875, -0.380859375, -0.28173828125, -0.1826171875, -0.08349609375, 0.015625, 0.11474609375, 0.2138671875, 0.31298828125, 0.412109375, 0.51123046875, 0.6103515625, 0.70947265625, 0.80859375, 0.90771484375, 1.0068359375, 1.10595703125, 1.205078125, 1.30419921875, 1.4033203125, 1.50244140625, 1.6015625, 1.70068359375, 1.7998046875, 1.89892578125, 1.998046875, 2.09716796875, 2.1962890625, 2.29541015625, 2.39453125, 2.49365234375, 2.5927734375, 2.69189453125, 2.791015625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 5.0, 4.0, 9.0, 9.0, 12.0, 19.0, 20.0, 40.0, 70.0, 94.0, 171.0, 230.0, 435.0, 804.0, 1703.0, 4273.0, 18339.0, 154602.0, 701810.0, 141084.0, 17262.0, 4113.0, 1571.0, 767.0, 403.0, 258.0, 159.0, 92.0, 65.0, 38.0, 23.0, 16.0, 15.0, 15.0, 9.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.2265625, -10.9188232421875, -10.611083984375, -10.3033447265625, -9.99560546875, -9.6878662109375, -9.380126953125, -9.0723876953125, -8.7646484375, -8.4569091796875, -8.149169921875, -7.8414306640625, -7.53369140625, -7.2259521484375, -6.918212890625, -6.6104736328125, -6.302734375, -5.9949951171875, -5.687255859375, -5.3795166015625, -5.07177734375, -4.7640380859375, -4.456298828125, -4.1485595703125, -3.8408203125, -3.5330810546875, -3.225341796875, -2.9176025390625, -2.60986328125, -2.3021240234375, -1.994384765625, -1.6866455078125, -1.37890625, -1.0711669921875, -0.763427734375, -0.4556884765625, -0.14794921875, 0.1597900390625, 0.467529296875, 0.7752685546875, 1.0830078125, 1.3907470703125, 1.698486328125, 2.0062255859375, 2.31396484375, 2.6217041015625, 2.929443359375, 3.2371826171875, 3.544921875, 3.8526611328125, 4.160400390625, 4.4681396484375, 4.77587890625, 5.0836181640625, 5.391357421875, 5.6990966796875, 6.0068359375, 6.3145751953125, 6.622314453125, 6.9300537109375, 7.23779296875, 7.5455322265625, 7.853271484375, 8.1610107421875, 8.46875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 5.0, 1.0, 6.0, 6.0, 8.0, 9.0, 11.0, 18.0, 17.0, 21.0, 26.0, 37.0, 40.0, 38.0, 40.0, 51.0, 43.0, 55.0, 61.0, 63.0, 62.0, 49.0, 45.0, 49.0, 41.0, 28.0, 29.0, 33.0, 21.0, 21.0, 17.0, 17.0, 11.0, 8.0, 7.0, 3.0, 0.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.328125, -10.939453125, -10.55078125, -10.162109375, -9.7734375, -9.384765625, -8.99609375, -8.607421875, -8.21875, -7.830078125, -7.44140625, -7.052734375, -6.6640625, -6.275390625, -5.88671875, -5.498046875, -5.109375, -4.720703125, -4.33203125, -3.943359375, -3.5546875, -3.166015625, -2.77734375, -2.388671875, -2.0, -1.611328125, -1.22265625, -0.833984375, -0.4453125, -0.056640625, 0.33203125, 0.720703125, 1.109375, 1.498046875, 1.88671875, 2.275390625, 2.6640625, 3.052734375, 3.44140625, 3.830078125, 4.21875, 4.607421875, 4.99609375, 5.384765625, 5.7734375, 6.162109375, 6.55078125, 6.939453125, 7.328125, 7.716796875, 8.10546875, 8.494140625, 8.8828125, 9.271484375, 9.66015625, 10.048828125, 10.4375, 10.826171875, 11.21484375, 11.603515625, 11.9921875, 12.380859375, 12.76953125, 13.158203125, 13.546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 4.0, 4.0, 6.0, 9.0, 7.0, 13.0, 16.0, 30.0, 39.0, 57.0, 92.0, 172.0, 314.0, 657.0, 1598.0, 5225.0, 27516.0, 249985.0, 663177.0, 82903.0, 11849.0, 2840.0, 1022.0, 417.0, 226.0, 124.0, 91.0, 49.0, 34.0, 17.0, 18.0, 8.0, 10.0, 6.0, 6.0, 7.0, 0.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.591796875, -3.48046875, -3.369140625, -3.2578125, -3.146484375, -3.03515625, -2.923828125, -2.8125, -2.701171875, -2.58984375, -2.478515625, -2.3671875, -2.255859375, -2.14453125, -2.033203125, -1.921875, -1.810546875, -1.69921875, -1.587890625, -1.4765625, -1.365234375, -1.25390625, -1.142578125, -1.03125, -0.919921875, -0.80859375, -0.697265625, -0.5859375, -0.474609375, -0.36328125, -0.251953125, -0.140625, -0.029296875, 0.08203125, 0.193359375, 0.3046875, 0.416015625, 0.52734375, 0.638671875, 0.75, 0.861328125, 0.97265625, 1.083984375, 1.1953125, 1.306640625, 1.41796875, 1.529296875, 1.640625, 1.751953125, 1.86328125, 1.974609375, 2.0859375, 2.197265625, 2.30859375, 2.419921875, 2.53125, 2.642578125, 2.75390625, 2.865234375, 2.9765625, 3.087890625, 3.19921875, 3.310546875, 3.421875, 3.533203125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 2.0, 8.0, 7.0, 9.0, 20.0, 9.0, 27.0, 33.0, 48.0, 47.0, 69.0, 111.0, 97.0, 130.0, 85.0, 56.0, 55.0, 47.0, 33.0, 31.0, 19.0, 13.0, 12.0, 8.0, 3.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005121231079101562, -0.0004954710602760315, -0.00047881901264190674, -0.000462166965007782, -0.0004455149173736572, -0.00042886286973953247, -0.0004122108221054077, -0.00039555877447128296, -0.0003789067268371582, -0.00036225467920303345, -0.0003456026315689087, -0.00032895058393478394, -0.0003122985363006592, -0.0002956464886665344, -0.00027899444103240967, -0.0002623423933982849, -0.00024569034576416016, -0.0002290382981300354, -0.00021238625049591064, -0.0001957342028617859, -0.00017908215522766113, -0.00016243010759353638, -0.00014577805995941162, -0.00012912601232528687, -0.00011247396469116211, -9.582191705703735e-05, -7.91698694229126e-05, -6.251782178878784e-05, -4.5865774154663086e-05, -2.921372652053833e-05, -1.2561678886413574e-05, 4.090368747711182e-06, 2.0742416381835938e-05, 3.739446401596069e-05, 5.404651165008545e-05, 7.06985592842102e-05, 8.735060691833496e-05, 0.00010400265455245972, 0.00012065470218658447, 0.00013730674982070923, 0.00015395879745483398, 0.00017061084508895874, 0.0001872628927230835, 0.00020391494035720825, 0.000220566987991333, 0.00023721903562545776, 0.0002538710832595825, 0.0002705231308937073, 0.00028717517852783203, 0.0003038272261619568, 0.00032047927379608154, 0.0003371313214302063, 0.00035378336906433105, 0.0003704354166984558, 0.00038708746433258057, 0.0004037395119667053, 0.0004203915596008301, 0.00043704360723495483, 0.0004536956548690796, 0.00047034770250320435, 0.0004869997501373291, 0.0005036517977714539, 0.0005203038454055786, 0.0005369558930397034, 0.0005536079406738281]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 5.0, 11.0, 11.0, 21.0, 28.0, 34.0, 65.0, 90.0, 139.0, 259.0, 451.0, 866.0, 2024.0, 6038.0, 25260.0, 190112.0, 682769.0, 114898.0, 17449.0, 4555.0, 1707.0, 753.0, 403.0, 221.0, 133.0, 79.0, 54.0, 34.0, 22.0, 11.0, 14.0, 10.0, 5.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.133209228515625, -3.01446533203125, -2.895721435546875, -2.7769775390625, -2.658233642578125, -2.53948974609375, -2.420745849609375, -2.302001953125, -2.183258056640625, -2.06451416015625, -1.945770263671875, -1.8270263671875, -1.708282470703125, -1.58953857421875, -1.470794677734375, -1.35205078125, -1.233306884765625, -1.11456298828125, -0.995819091796875, -0.8770751953125, -0.758331298828125, -0.63958740234375, -0.520843505859375, -0.402099609375, -0.283355712890625, -0.16461181640625, -0.045867919921875, 0.0728759765625, 0.191619873046875, 0.31036376953125, 0.429107666015625, 0.5478515625, 0.666595458984375, 0.78533935546875, 0.904083251953125, 1.0228271484375, 1.141571044921875, 1.26031494140625, 1.379058837890625, 1.497802734375, 1.616546630859375, 1.73529052734375, 1.854034423828125, 1.9727783203125, 2.091522216796875, 2.21026611328125, 2.329010009765625, 2.44775390625, 2.566497802734375, 2.68524169921875, 2.803985595703125, 2.9227294921875, 3.041473388671875, 3.16021728515625, 3.278961181640625, 3.397705078125, 3.516448974609375, 3.63519287109375, 3.753936767578125, 3.8726806640625, 3.991424560546875, 4.11016845703125, 4.228912353515625, 4.34765625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 8.0, 11.0, 6.0, 12.0, 25.0, 24.0, 25.0, 38.0, 51.0, 66.0, 97.0, 100.0, 97.0, 104.0, 66.0, 67.0, 52.0, 35.0, 22.0, 17.0, 14.0, 14.0, 13.0, 7.0, 7.0, 1.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-5.00390625, -4.884796142578125, -4.76568603515625, -4.646575927734375, -4.5274658203125, -4.408355712890625, -4.28924560546875, -4.170135498046875, -4.051025390625, -3.931915283203125, -3.81280517578125, -3.693695068359375, -3.5745849609375, -3.455474853515625, -3.33636474609375, -3.217254638671875, -3.09814453125, -2.979034423828125, -2.85992431640625, -2.740814208984375, -2.6217041015625, -2.502593994140625, -2.38348388671875, -2.264373779296875, -2.145263671875, -2.026153564453125, -1.90704345703125, -1.787933349609375, -1.6688232421875, -1.549713134765625, -1.43060302734375, -1.311492919921875, -1.1923828125, -1.073272705078125, -0.95416259765625, -0.835052490234375, -0.7159423828125, -0.596832275390625, -0.47772216796875, -0.358612060546875, -0.239501953125, -0.120391845703125, -0.00128173828125, 0.117828369140625, 0.2369384765625, 0.356048583984375, 0.47515869140625, 0.594268798828125, 0.71337890625, 0.832489013671875, 0.95159912109375, 1.070709228515625, 1.1898193359375, 1.308929443359375, 1.42803955078125, 1.547149658203125, 1.666259765625, 1.785369873046875, 1.90447998046875, 2.023590087890625, 2.1427001953125, 2.261810302734375, 2.38092041015625, 2.500030517578125, 2.619140625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 5.0, 17.0, 35.0, 77.0, 143.0, 171.0, 172.0, 159.0, 94.0, 56.0, 25.0, 18.0, 7.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.88885498046875, -90.41629028320312, -87.9437255859375, -85.47115325927734, -82.99858856201172, -80.5260238647461, -78.05345916748047, -75.58088684082031, -73.10832214355469, -70.63575744628906, -68.16319274902344, -65.69062042236328, -63.218055725097656, -60.74549102783203, -58.272926330566406, -55.800357818603516, -53.32779312133789, -50.855228424072266, -48.382659912109375, -45.91009521484375, -43.43752670288086, -40.964962005615234, -38.492393493652344, -36.01982879638672, -33.547264099121094, -31.074697494506836, -28.602130889892578, -26.129566192626953, -23.656997680664062, -21.184432983398438, -18.71186637878418, -16.239299774169922, -13.766731262207031, -11.294164657592773, -8.821598052978516, -6.349032402038574, -3.8764657974243164, -1.4038991928100586, 1.0686664581298828, 3.5412330627441406, 6.013799667358398, 8.486366271972656, 10.958932876586914, 13.431498527526855, 15.904065132141113, 18.376632690429688, 20.849197387695312, 23.32176399230957, 25.794330596923828, 28.266897201538086, 30.739463806152344, 33.21202850341797, 35.68459701538086, 38.157161712646484, 40.629730224609375, 43.102294921875, 45.574859619140625, 48.04742431640625, 50.51999282836914, 52.992557525634766, 55.465126037597656, 57.93769073486328, 60.410255432128906, 62.8828239440918, 65.35539245605469]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 1.0, 3.0, 3.0, 7.0, 7.0, 5.0, 11.0, 12.0, 17.0, 23.0, 23.0, 28.0, 27.0, 53.0, 52.0, 38.0, 41.0, 52.0, 41.0, 55.0, 46.0, 55.0, 46.0, 45.0, 50.0, 41.0, 41.0, 26.0, 25.0, 21.0, 27.0, 18.0, 11.0, 9.0, 7.0, 4.0, 8.0, 5.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-50.47792053222656, -48.893672943115234, -47.309425354003906, -45.725181579589844, -44.140933990478516, -42.55668640136719, -40.97243881225586, -39.38819122314453, -37.80394744873047, -36.21969985961914, -34.63545227050781, -33.05120849609375, -31.466960906982422, -29.882713317871094, -28.298465728759766, -26.714218139648438, -25.12997055053711, -23.54572296142578, -21.961477279663086, -20.377229690551758, -18.792984008789062, -17.208736419677734, -15.624488830566406, -14.040242195129395, -12.455995559692383, -10.871748924255371, -9.28750228881836, -7.703254699707031, -6.1190080642700195, -4.534761428833008, -2.9505138397216797, -1.366267204284668, 0.21797943115234375, 1.8022263050079346, 3.3864731788635254, 4.970720291137695, 6.554966926574707, 8.139213562011719, 9.723461151123047, 11.307707786560059, 12.89195442199707, 14.476201057434082, 16.060447692871094, 17.644695281982422, 19.22894287109375, 20.813188552856445, 22.397436141967773, 23.98168182373047, 25.565929412841797, 27.150177001953125, 28.73442268371582, 30.31867027282715, 31.902915954589844, 33.48716354370117, 35.0714111328125, 36.65565872192383, 38.239906311035156, 39.824153900146484, 41.40840148925781, 42.992645263671875, 44.5768928527832, 46.16114044189453, 47.74538803100586, 49.32963562011719, 50.91387939453125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 4.0, 4.0, 2.0, 5.0, 4.0, 10.0, 11.0, 14.0, 20.0, 32.0, 47.0, 74.0, 142.0, 329.0, 753.0, 2347.0, 8279.0, 53345.0, 3156785.0, 931987.0, 31613.0, 5834.0, 1598.0, 515.0, 208.0, 116.0, 76.0, 39.0, 35.0, 14.0, 12.0, 8.0, 12.0, 1.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.9453125, -9.6517333984375, -9.358154296875, -9.0645751953125, -8.77099609375, -8.4774169921875, -8.183837890625, -7.8902587890625, -7.5966796875, -7.3031005859375, -7.009521484375, -6.7159423828125, -6.42236328125, -6.1287841796875, -5.835205078125, -5.5416259765625, -5.248046875, -4.9544677734375, -4.660888671875, -4.3673095703125, -4.07373046875, -3.7801513671875, -3.486572265625, -3.1929931640625, -2.8994140625, -2.6058349609375, -2.312255859375, -2.0186767578125, -1.72509765625, -1.4315185546875, -1.137939453125, -0.8443603515625, -0.55078125, -0.2572021484375, 0.036376953125, 0.3299560546875, 0.62353515625, 0.9171142578125, 1.210693359375, 1.5042724609375, 1.7978515625, 2.0914306640625, 2.385009765625, 2.6785888671875, 2.97216796875, 3.2657470703125, 3.559326171875, 3.8529052734375, 4.146484375, 4.4400634765625, 4.733642578125, 5.0272216796875, 5.32080078125, 5.6143798828125, 5.907958984375, 6.2015380859375, 6.4951171875, 6.7886962890625, 7.082275390625, 7.3758544921875, 7.66943359375, 7.9630126953125, 8.256591796875, 8.5501708984375, 8.84375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 9.0, 7.0, 19.0, 13.0, 22.0, 28.0, 40.0, 32.0, 45.0, 58.0, 70.0, 85.0, 77.0, 76.0, 70.0, 72.0, 74.0, 45.0, 42.0, 30.0, 23.0, 20.0, 18.0, 9.0, 9.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.0859375, -3.97796630859375, -3.8699951171875, -3.76202392578125, -3.654052734375, -3.54608154296875, -3.4381103515625, -3.33013916015625, -3.22216796875, -3.11419677734375, -3.0062255859375, -2.89825439453125, -2.790283203125, -2.68231201171875, -2.5743408203125, -2.46636962890625, -2.3583984375, -2.25042724609375, -2.1424560546875, -2.03448486328125, -1.926513671875, -1.81854248046875, -1.7105712890625, -1.60260009765625, -1.49462890625, -1.38665771484375, -1.2786865234375, -1.17071533203125, -1.062744140625, -0.95477294921875, -0.8468017578125, -0.73883056640625, -0.630859375, -0.52288818359375, -0.4149169921875, -0.30694580078125, -0.198974609375, -0.09100341796875, 0.0169677734375, 0.12493896484375, 0.23291015625, 0.34088134765625, 0.4488525390625, 0.55682373046875, 0.664794921875, 0.77276611328125, 0.8807373046875, 0.98870849609375, 1.0966796875, 1.20465087890625, 1.3126220703125, 1.42059326171875, 1.528564453125, 1.63653564453125, 1.7445068359375, 1.85247802734375, 1.96044921875, 2.06842041015625, 2.1763916015625, 2.28436279296875, 2.392333984375, 2.50030517578125, 2.6082763671875, 2.71624755859375, 2.82421875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 8.0, 14.0, 28.0, 35.0, 40.0, 83.0, 201.0, 613.0, 2436.0, 13385.0, 118333.0, 3823996.0, 212635.0, 18092.0, 3143.0, 785.0, 203.0, 92.0, 44.0, 21.0, 14.0, 11.0, 11.0, 9.0, 9.0, 11.0, 4.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.265625, -8.9298095703125, -8.593994140625, -8.2581787109375, -7.92236328125, -7.5865478515625, -7.250732421875, -6.9149169921875, -6.5791015625, -6.2432861328125, -5.907470703125, -5.5716552734375, -5.23583984375, -4.9000244140625, -4.564208984375, -4.2283935546875, -3.892578125, -3.5567626953125, -3.220947265625, -2.8851318359375, -2.54931640625, -2.2135009765625, -1.877685546875, -1.5418701171875, -1.2060546875, -0.8702392578125, -0.534423828125, -0.1986083984375, 0.13720703125, 0.4730224609375, 0.808837890625, 1.1446533203125, 1.48046875, 1.8162841796875, 2.152099609375, 2.4879150390625, 2.82373046875, 3.1595458984375, 3.495361328125, 3.8311767578125, 4.1669921875, 4.5028076171875, 4.838623046875, 5.1744384765625, 5.51025390625, 5.8460693359375, 6.181884765625, 6.5177001953125, 6.853515625, 7.1893310546875, 7.525146484375, 7.8609619140625, 8.19677734375, 8.5325927734375, 8.868408203125, 9.2042236328125, 9.5400390625, 9.8758544921875, 10.211669921875, 10.5474853515625, 10.88330078125, 11.2191162109375, 11.554931640625, 11.8907470703125, 12.2265625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 2.0, 8.0, 5.0, 8.0, 5.0, 11.0, 16.0, 12.0, 25.0, 36.0, 29.0, 44.0, 79.0, 152.0, 286.0, 486.0, 827.0, 882.0, 524.0, 271.0, 144.0, 59.0, 38.0, 26.0, 25.0, 17.0, 10.0, 12.0, 6.0, 3.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-7.18359375, -6.994384765625, -6.80517578125, -6.615966796875, -6.4267578125, -6.237548828125, -6.04833984375, -5.859130859375, -5.669921875, -5.480712890625, -5.29150390625, -5.102294921875, -4.9130859375, -4.723876953125, -4.53466796875, -4.345458984375, -4.15625, -3.967041015625, -3.77783203125, -3.588623046875, -3.3994140625, -3.210205078125, -3.02099609375, -2.831787109375, -2.642578125, -2.453369140625, -2.26416015625, -2.074951171875, -1.8857421875, -1.696533203125, -1.50732421875, -1.318115234375, -1.12890625, -0.939697265625, -0.75048828125, -0.561279296875, -0.3720703125, -0.182861328125, 0.00634765625, 0.195556640625, 0.384765625, 0.573974609375, 0.76318359375, 0.952392578125, 1.1416015625, 1.330810546875, 1.52001953125, 1.709228515625, 1.8984375, 2.087646484375, 2.27685546875, 2.466064453125, 2.6552734375, 2.844482421875, 3.03369140625, 3.222900390625, 3.412109375, 3.601318359375, 3.79052734375, 3.979736328125, 4.1689453125, 4.358154296875, 4.54736328125, 4.736572265625, 4.92578125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 2.0, 5.0, 14.0, 28.0, 55.0, 117.0, 221.0, 230.0, 156.0, 97.0, 41.0, 21.0, 6.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.56529235839844, -61.93910217285156, -59.31291198730469, -56.68672180175781, -54.06052780151367, -51.4343376159668, -48.80814743041992, -46.18195343017578, -43.555763244628906, -40.92957305908203, -38.303382873535156, -35.67719268798828, -33.05099868774414, -30.424808502197266, -27.79861831665039, -25.172426223754883, -22.54623794555664, -19.920047760009766, -17.293855667114258, -14.667665481567383, -12.041474342346191, -9.415283203125, -6.789093017578125, -4.162900924682617, -1.5367107391357422, 1.0894801616668701, 3.7156710624694824, 6.341861724853516, 8.968052864074707, 11.594244003295898, 14.220434188842773, 16.84662628173828, 19.472816467285156, 22.09900665283203, 24.72519874572754, 27.351388931274414, 29.977581024169922, 32.6037712097168, 35.22996139526367, 37.85615539550781, 40.48234558105469, 43.10853576660156, 45.73472595214844, 48.36091613769531, 50.98711013793945, 53.61330032348633, 56.2394905090332, 58.865684509277344, 61.49187088012695, 64.1180648803711, 66.74425506591797, 69.37044525146484, 71.99663543701172, 74.6228256225586, 77.24901580810547, 79.87520599365234, 82.50139617919922, 85.1275863647461, 87.75377655029297, 90.37996673583984, 93.00615692138672, 95.63235473632812, 98.258544921875, 100.88473510742188, 103.51092529296875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 7.0, 9.0, 3.0, 9.0, 15.0, 19.0, 8.0, 23.0, 28.0, 20.0, 26.0, 36.0, 27.0, 40.0, 40.0, 49.0, 41.0, 38.0, 39.0, 49.0, 49.0, 57.0, 46.0, 30.0, 36.0, 42.0, 36.0, 27.0, 25.0, 18.0, 21.0, 18.0, 14.0, 7.0, 10.0, 12.0, 6.0, 6.0, 3.0, 7.0, 3.0, 2.0, 1.0, 2.0], "bins": [-30.106956481933594, -29.327640533447266, -28.54832649230957, -27.769010543823242, -26.989696502685547, -26.21038055419922, -25.43106460571289, -24.651750564575195, -23.8724365234375, -23.093120574951172, -22.313806533813477, -21.53449058532715, -20.755176544189453, -19.975860595703125, -19.196544647216797, -18.4172306060791, -17.637914657592773, -16.858598709106445, -16.07928466796875, -15.299968719482422, -14.520654678344727, -13.741338729858398, -12.962023735046387, -12.182708740234375, -11.403393745422363, -10.624078750610352, -9.84476375579834, -9.065448760986328, -8.2861328125, -7.5068182945251465, -6.727502822875977, -5.948187828063965, -5.16887092590332, -4.389555931091309, -3.6102406978607178, -2.830925464630127, -2.0516104698181152, -1.2722954750061035, -0.4929800033569336, 0.2863349914550781, 1.0656499862670898, 1.8449651002883911, 2.6242802143096924, 3.403595447540283, 4.182910442352295, 4.962225437164307, 5.741540908813477, 6.520855903625488, 7.3001708984375, 8.079485893249512, 8.858800888061523, 9.638116836547852, 10.417430877685547, 11.196746826171875, 11.976061820983887, 12.755376815795898, 13.53469181060791, 14.314006805419922, 15.093321800231934, 15.872636795043945, 16.651952743530273, 17.43126678466797, 18.210582733154297, 18.989898681640625, 19.76921272277832]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 12.0, 12.0, 12.0, 27.0, 33.0, 35.0, 58.0, 79.0, 140.0, 191.0, 353.0, 479.0, 735.0, 1315.0, 2163.0, 3791.0, 6902.0, 12616.0, 23313.0, 44461.0, 85909.0, 166175.0, 258528.0, 207317.0, 110759.0, 57235.0, 29669.0, 15763.0, 8666.0, 4757.0, 2753.0, 1633.0, 911.0, 618.0, 359.0, 236.0, 164.0, 109.0, 81.0, 65.0, 40.0, 26.0, 16.0, 15.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.28515625, -3.190460205078125, -3.09576416015625, -3.001068115234375, -2.9063720703125, -2.811676025390625, -2.71697998046875, -2.622283935546875, -2.527587890625, -2.432891845703125, -2.33819580078125, -2.243499755859375, -2.1488037109375, -2.054107666015625, -1.95941162109375, -1.864715576171875, -1.77001953125, -1.675323486328125, -1.58062744140625, -1.485931396484375, -1.3912353515625, -1.296539306640625, -1.20184326171875, -1.107147216796875, -1.012451171875, -0.917755126953125, -0.82305908203125, -0.728363037109375, -0.6336669921875, -0.538970947265625, -0.44427490234375, -0.349578857421875, -0.2548828125, -0.160186767578125, -0.06549072265625, 0.029205322265625, 0.1239013671875, 0.218597412109375, 0.31329345703125, 0.407989501953125, 0.502685546875, 0.597381591796875, 0.69207763671875, 0.786773681640625, 0.8814697265625, 0.976165771484375, 1.07086181640625, 1.165557861328125, 1.26025390625, 1.354949951171875, 1.44964599609375, 1.544342041015625, 1.6390380859375, 1.733734130859375, 1.82843017578125, 1.923126220703125, 2.017822265625, 2.112518310546875, 2.20721435546875, 2.301910400390625, 2.3966064453125, 2.491302490234375, 2.58599853515625, 2.680694580078125, 2.775390625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 1.0, 6.0, 5.0, 6.0, 9.0, 6.0, 15.0, 13.0, 17.0, 21.0, 22.0, 34.0, 34.0, 31.0, 45.0, 61.0, 63.0, 49.0, 45.0, 53.0, 55.0, 42.0, 56.0, 41.0, 41.0, 40.0, 33.0, 30.0, 16.0, 21.0, 12.0, 14.0, 18.0, 10.0, 14.0, 5.0, 8.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.8125, -2.7389678955078125, -2.665435791015625, -2.5919036865234375, -2.51837158203125, -2.4448394775390625, -2.371307373046875, -2.2977752685546875, -2.2242431640625, -2.1507110595703125, -2.077178955078125, -2.0036468505859375, -1.93011474609375, -1.8565826416015625, -1.783050537109375, -1.7095184326171875, -1.635986328125, -1.5624542236328125, -1.488922119140625, -1.4153900146484375, -1.34185791015625, -1.2683258056640625, -1.194793701171875, -1.1212615966796875, -1.0477294921875, -0.9741973876953125, -0.900665283203125, -0.8271331787109375, -0.75360107421875, -0.6800689697265625, -0.606536865234375, -0.5330047607421875, -0.45947265625, -0.3859405517578125, -0.312408447265625, -0.2388763427734375, -0.16534423828125, -0.0918121337890625, -0.018280029296875, 0.0552520751953125, 0.1287841796875, 0.2023162841796875, 0.275848388671875, 0.3493804931640625, 0.42291259765625, 0.4964447021484375, 0.569976806640625, 0.6435089111328125, 0.717041015625, 0.7905731201171875, 0.864105224609375, 0.9376373291015625, 1.01116943359375, 1.0847015380859375, 1.158233642578125, 1.2317657470703125, 1.3052978515625, 1.3788299560546875, 1.452362060546875, 1.5258941650390625, 1.59942626953125, 1.6729583740234375, 1.746490478515625, 1.8200225830078125, 1.8935546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 6.0, 4.0, 6.0, 12.0, 21.0, 19.0, 35.0, 49.0, 67.0, 149.0, 218.0, 382.0, 685.0, 1342.0, 4029.0, 21451.0, 306748.0, 663016.0, 40602.0, 5931.0, 1879.0, 812.0, 412.0, 270.0, 150.0, 98.0, 69.0, 31.0, 24.0, 17.0, 13.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.703125, -11.3272705078125, -10.951416015625, -10.5755615234375, -10.19970703125, -9.8238525390625, -9.447998046875, -9.0721435546875, -8.6962890625, -8.3204345703125, -7.944580078125, -7.5687255859375, -7.19287109375, -6.8170166015625, -6.441162109375, -6.0653076171875, -5.689453125, -5.3135986328125, -4.937744140625, -4.5618896484375, -4.18603515625, -3.8101806640625, -3.434326171875, -3.0584716796875, -2.6826171875, -2.3067626953125, -1.930908203125, -1.5550537109375, -1.17919921875, -0.8033447265625, -0.427490234375, -0.0516357421875, 0.32421875, 0.7000732421875, 1.075927734375, 1.4517822265625, 1.82763671875, 2.2034912109375, 2.579345703125, 2.9552001953125, 3.3310546875, 3.7069091796875, 4.082763671875, 4.4586181640625, 4.83447265625, 5.2103271484375, 5.586181640625, 5.9620361328125, 6.337890625, 6.7137451171875, 7.089599609375, 7.4654541015625, 7.84130859375, 8.2171630859375, 8.593017578125, 8.9688720703125, 9.3447265625, 9.7205810546875, 10.096435546875, 10.4722900390625, 10.84814453125, 11.2239990234375, 11.599853515625, 11.9757080078125, 12.3515625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 10.0, 5.0, 4.0, 8.0, 11.0, 9.0, 12.0, 14.0, 14.0, 18.0, 28.0, 29.0, 43.0, 41.0, 43.0, 49.0, 36.0, 42.0, 46.0, 48.0, 45.0, 41.0, 49.0, 47.0, 46.0, 37.0, 45.0, 37.0, 32.0, 16.0, 22.0, 13.0, 11.0, 11.0, 5.0, 6.0, 7.0, 2.0, 9.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.671875, -10.3460693359375, -10.020263671875, -9.6944580078125, -9.36865234375, -9.0428466796875, -8.717041015625, -8.3912353515625, -8.0654296875, -7.7396240234375, -7.413818359375, -7.0880126953125, -6.76220703125, -6.4364013671875, -6.110595703125, -5.7847900390625, -5.458984375, -5.1331787109375, -4.807373046875, -4.4815673828125, -4.15576171875, -3.8299560546875, -3.504150390625, -3.1783447265625, -2.8525390625, -2.5267333984375, -2.200927734375, -1.8751220703125, -1.54931640625, -1.2235107421875, -0.897705078125, -0.5718994140625, -0.24609375, 0.0797119140625, 0.405517578125, 0.7313232421875, 1.05712890625, 1.3829345703125, 1.708740234375, 2.0345458984375, 2.3603515625, 2.6861572265625, 3.011962890625, 3.3377685546875, 3.66357421875, 3.9893798828125, 4.315185546875, 4.6409912109375, 4.966796875, 5.2926025390625, 5.618408203125, 5.9442138671875, 6.27001953125, 6.5958251953125, 6.921630859375, 7.2474365234375, 7.5732421875, 7.8990478515625, 8.224853515625, 8.5506591796875, 8.87646484375, 9.2022705078125, 9.528076171875, 9.8538818359375, 10.1796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 4.0, 13.0, 10.0, 26.0, 38.0, 72.0, 119.0, 308.0, 1132.0, 8423.0, 261979.0, 758516.0, 15486.0, 1721.0, 398.0, 138.0, 60.0, 37.0, 24.0, 12.0, 10.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.3828125, -10.11041259765625, -9.8380126953125, -9.56561279296875, -9.293212890625, -9.02081298828125, -8.7484130859375, -8.47601318359375, -8.20361328125, -7.93121337890625, -7.6588134765625, -7.38641357421875, -7.114013671875, -6.84161376953125, -6.5692138671875, -6.29681396484375, -6.0244140625, -5.75201416015625, -5.4796142578125, -5.20721435546875, -4.934814453125, -4.66241455078125, -4.3900146484375, -4.11761474609375, -3.84521484375, -3.57281494140625, -3.3004150390625, -3.02801513671875, -2.755615234375, -2.48321533203125, -2.2108154296875, -1.93841552734375, -1.666015625, -1.39361572265625, -1.1212158203125, -0.84881591796875, -0.576416015625, -0.30401611328125, -0.0316162109375, 0.24078369140625, 0.51318359375, 0.78558349609375, 1.0579833984375, 1.33038330078125, 1.602783203125, 1.87518310546875, 2.1475830078125, 2.41998291015625, 2.6923828125, 2.96478271484375, 3.2371826171875, 3.50958251953125, 3.781982421875, 4.05438232421875, 4.3267822265625, 4.59918212890625, 4.87158203125, 5.14398193359375, 5.4163818359375, 5.68878173828125, 5.961181640625, 6.23358154296875, 6.5059814453125, 6.77838134765625, 7.05078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 10.0, 11.0, 4.0, 12.0, 11.0, 8.0, 22.0, 22.0, 35.0, 58.0, 79.0, 117.0, 124.0, 145.0, 99.0, 56.0, 52.0, 34.0, 20.0, 17.0, 17.0, 7.0, 11.0, 5.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000881195068359375, -0.0008565932512283325, -0.00083199143409729, -0.0008073896169662476, -0.0007827877998352051, -0.0007581859827041626, -0.0007335841655731201, -0.0007089823484420776, -0.0006843805313110352, -0.0006597787141799927, -0.0006351768970489502, -0.0006105750799179077, -0.0005859732627868652, -0.0005613714456558228, -0.0005367696285247803, -0.0005121678113937378, -0.0004875659942626953, -0.00046296417713165283, -0.00043836236000061035, -0.00041376054286956787, -0.0003891587257385254, -0.0003645569086074829, -0.00033995509147644043, -0.00031535327434539795, -0.00029075145721435547, -0.000266149640083313, -0.0002415478229522705, -0.00021694600582122803, -0.00019234418869018555, -0.00016774237155914307, -0.00014314055442810059, -0.0001185387372970581, -9.393692016601562e-05, -6.933510303497314e-05, -4.4733285903930664e-05, -2.0131468772888184e-05, 4.470348358154297e-06, 2.9072165489196777e-05, 5.367398262023926e-05, 7.827579975128174e-05, 0.00010287761688232422, 0.0001274794340133667, 0.00015208125114440918, 0.00017668306827545166, 0.00020128488540649414, 0.00022588670253753662, 0.0002504885196685791, 0.0002750903367996216, 0.00029969215393066406, 0.00032429397106170654, 0.000348895788192749, 0.0003734976053237915, 0.000398099422454834, 0.00042270123958587646, 0.00044730305671691895, 0.0004719048738479614, 0.0004965066909790039, 0.0005211085081100464, 0.0005457103252410889, 0.0005703121423721313, 0.0005949139595031738, 0.0006195157766342163, 0.0006441175937652588, 0.0006687194108963013, 0.0006933212280273438]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 3.0, 4.0, 9.0, 12.0, 15.0, 20.0, 34.0, 39.0, 55.0, 100.0, 163.0, 266.0, 461.0, 796.0, 1771.0, 4292.0, 14196.0, 69589.0, 587714.0, 310183.0, 42518.0, 9934.0, 3276.0, 1376.0, 666.0, 373.0, 236.0, 134.0, 85.0, 61.0, 48.0, 24.0, 31.0, 22.0, 14.0, 10.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5234375, -3.39697265625, -3.2705078125, -3.14404296875, -3.017578125, -2.89111328125, -2.7646484375, -2.63818359375, -2.51171875, -2.38525390625, -2.2587890625, -2.13232421875, -2.005859375, -1.87939453125, -1.7529296875, -1.62646484375, -1.5, -1.37353515625, -1.2470703125, -1.12060546875, -0.994140625, -0.86767578125, -0.7412109375, -0.61474609375, -0.48828125, -0.36181640625, -0.2353515625, -0.10888671875, 0.017578125, 0.14404296875, 0.2705078125, 0.39697265625, 0.5234375, 0.64990234375, 0.7763671875, 0.90283203125, 1.029296875, 1.15576171875, 1.2822265625, 1.40869140625, 1.53515625, 1.66162109375, 1.7880859375, 1.91455078125, 2.041015625, 2.16748046875, 2.2939453125, 2.42041015625, 2.546875, 2.67333984375, 2.7998046875, 2.92626953125, 3.052734375, 3.17919921875, 3.3056640625, 3.43212890625, 3.55859375, 3.68505859375, 3.8115234375, 3.93798828125, 4.064453125, 4.19091796875, 4.3173828125, 4.44384765625, 4.5703125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 14.0, 14.0, 17.0, 21.0, 29.0, 30.0, 39.0, 67.0, 71.0, 97.0, 111.0, 104.0, 103.0, 64.0, 57.0, 47.0, 34.0, 19.0, 12.0, 16.0, 5.0, 6.0, 8.0, 4.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.67578125, -4.5455322265625, -4.415283203125, -4.2850341796875, -4.15478515625, -4.0245361328125, -3.894287109375, -3.7640380859375, -3.6337890625, -3.5035400390625, -3.373291015625, -3.2430419921875, -3.11279296875, -2.9825439453125, -2.852294921875, -2.7220458984375, -2.591796875, -2.4615478515625, -2.331298828125, -2.2010498046875, -2.07080078125, -1.9405517578125, -1.810302734375, -1.6800537109375, -1.5498046875, -1.4195556640625, -1.289306640625, -1.1590576171875, -1.02880859375, -0.8985595703125, -0.768310546875, -0.6380615234375, -0.5078125, -0.3775634765625, -0.247314453125, -0.1170654296875, 0.01318359375, 0.1434326171875, 0.273681640625, 0.4039306640625, 0.5341796875, 0.6644287109375, 0.794677734375, 0.9249267578125, 1.05517578125, 1.1854248046875, 1.315673828125, 1.4459228515625, 1.576171875, 1.7064208984375, 1.836669921875, 1.9669189453125, 2.09716796875, 2.2274169921875, 2.357666015625, 2.4879150390625, 2.6181640625, 2.7484130859375, 2.878662109375, 3.0089111328125, 3.13916015625, 3.2694091796875, 3.399658203125, 3.5299072265625, 3.66015625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 9.0, 9.0, 23.0, 31.0, 87.0, 163.0, 248.0, 207.0, 109.0, 61.0, 34.0, 7.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-56.43703079223633, -53.697696685791016, -50.9583625793457, -48.219032287597656, -45.479698181152344, -42.74036407470703, -40.00102996826172, -37.261695861816406, -34.522361755371094, -31.78302764892578, -29.04369354248047, -26.30436134338379, -23.565027236938477, -20.825693130493164, -18.086360931396484, -15.347026824951172, -12.60769271850586, -9.868358612060547, -7.129025459289551, -4.389692306518555, -1.6503582000732422, 1.0889759063720703, 3.82830810546875, 6.5676422119140625, 9.306976318359375, 12.046310424804688, 14.785643577575684, 17.52497673034668, 20.264310836791992, 23.003644943237305, 25.742977142333984, 28.482311248779297, 31.221649169921875, 33.96098327636719, 36.7003173828125, 39.43965148925781, 42.178985595703125, 44.91831970214844, 47.657649993896484, 50.3969841003418, 53.13631820678711, 55.87565231323242, 58.614986419677734, 61.35431671142578, 64.0936508178711, 66.8329849243164, 69.57231903076172, 72.31165313720703, 75.05098724365234, 77.79032135009766, 80.52965545654297, 83.26898956298828, 86.0083236694336, 88.7476577758789, 91.48698425292969, 94.226318359375, 96.96565246582031, 99.70498657226562, 102.44432067871094, 105.18365478515625, 107.92298889160156, 110.66232299804688, 113.40165710449219, 116.1409912109375, 118.88032531738281]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 7.0, 5.0, 8.0, 12.0, 18.0, 17.0, 20.0, 34.0, 28.0, 25.0, 46.0, 29.0, 42.0, 52.0, 63.0, 69.0, 82.0, 57.0, 42.0, 54.0, 46.0, 28.0, 30.0, 28.0, 28.0, 19.0, 25.0, 13.0, 19.0, 15.0, 5.0, 5.0, 10.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.704566955566406, -44.30210876464844, -42.8996467590332, -41.497188568115234, -40.0947265625, -38.69226837158203, -37.28981018066406, -35.887351989746094, -34.48488998413086, -33.08243179321289, -31.679969787597656, -30.277511596679688, -28.875051498413086, -27.472591400146484, -26.070133209228516, -24.667673110961914, -23.265213012695312, -21.86275291442871, -20.46029281616211, -19.05783462524414, -17.65537452697754, -16.252914428710938, -14.850455284118652, -13.447996139526367, -12.045536041259766, -10.643075942993164, -9.240616798400879, -7.8381571769714355, -6.435697555541992, -5.033237934112549, -3.6307783126831055, -2.2283191680908203, -0.8258552551269531, 0.5766043663024902, 1.9790639877319336, 3.381523609161377, 4.78398323059082, 6.186442852020264, 7.588902473449707, 8.991361618041992, 10.393821716308594, 11.796281814575195, 13.19874095916748, 14.601200103759766, 16.003660202026367, 17.40612030029297, 18.808578491210938, 20.21103858947754, 21.61349868774414, 23.015958786010742, 24.418418884277344, 25.820877075195312, 27.223337173461914, 28.625797271728516, 30.028255462646484, 31.430715560913086, 32.83317565917969, 34.235633850097656, 35.63809585571289, 37.04055404663086, 38.443016052246094, 39.84547424316406, 41.24793243408203, 42.650390625, 44.052852630615234]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 8.0, 8.0, 8.0, 10.0, 14.0, 16.0, 20.0, 42.0, 49.0, 96.0, 123.0, 204.0, 305.0, 510.0, 880.0, 1570.0, 2932.0, 5738.0, 12793.0, 33104.0, 124595.0, 1012787.0, 2593085.0, 308657.0, 59527.0, 19453.0, 8465.0, 4027.0, 2235.0, 1230.0, 640.0, 420.0, 256.0, 150.0, 109.0, 75.0, 45.0, 30.0, 15.0, 10.0, 14.0, 10.0, 8.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.8046875, -3.69024658203125, -3.5758056640625, -3.46136474609375, -3.346923828125, -3.23248291015625, -3.1180419921875, -3.00360107421875, -2.88916015625, -2.77471923828125, -2.6602783203125, -2.54583740234375, -2.431396484375, -2.31695556640625, -2.2025146484375, -2.08807373046875, -1.9736328125, -1.85919189453125, -1.7447509765625, -1.63031005859375, -1.515869140625, -1.40142822265625, -1.2869873046875, -1.17254638671875, -1.05810546875, -0.94366455078125, -0.8292236328125, -0.71478271484375, -0.600341796875, -0.48590087890625, -0.3714599609375, -0.25701904296875, -0.142578125, -0.02813720703125, 0.0863037109375, 0.20074462890625, 0.315185546875, 0.42962646484375, 0.5440673828125, 0.65850830078125, 0.77294921875, 0.88739013671875, 1.0018310546875, 1.11627197265625, 1.230712890625, 1.34515380859375, 1.4595947265625, 1.57403564453125, 1.6884765625, 1.80291748046875, 1.9173583984375, 2.03179931640625, 2.146240234375, 2.26068115234375, 2.3751220703125, 2.48956298828125, 2.60400390625, 2.71844482421875, 2.8328857421875, 2.94732666015625, 3.061767578125, 3.17620849609375, 3.2906494140625, 3.40509033203125, 3.51953125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 11.0, 16.0, 9.0, 36.0, 34.0, 48.0, 63.0, 70.0, 103.0, 99.0, 102.0, 89.0, 73.0, 70.0, 50.0, 49.0, 24.0, 22.0, 18.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.679229736328125, -4.54986572265625, -4.420501708984375, -4.2911376953125, -4.161773681640625, -4.03240966796875, -3.903045654296875, -3.773681640625, -3.644317626953125, -3.51495361328125, -3.385589599609375, -3.2562255859375, -3.126861572265625, -2.99749755859375, -2.868133544921875, -2.73876953125, -2.609405517578125, -2.48004150390625, -2.350677490234375, -2.2213134765625, -2.091949462890625, -1.96258544921875, -1.833221435546875, -1.703857421875, -1.574493408203125, -1.44512939453125, -1.315765380859375, -1.1864013671875, -1.057037353515625, -0.92767333984375, -0.798309326171875, -0.6689453125, -0.539581298828125, -0.41021728515625, -0.280853271484375, -0.1514892578125, -0.022125244140625, 0.10723876953125, 0.236602783203125, 0.365966796875, 0.495330810546875, 0.62469482421875, 0.754058837890625, 0.8834228515625, 1.012786865234375, 1.14215087890625, 1.271514892578125, 1.40087890625, 1.530242919921875, 1.65960693359375, 1.788970947265625, 1.9183349609375, 2.047698974609375, 2.17706298828125, 2.306427001953125, 2.435791015625, 2.565155029296875, 2.69451904296875, 2.823883056640625, 2.9532470703125, 3.082611083984375, 3.21197509765625, 3.341339111328125, 3.470703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 6.0, 13.0, 19.0, 42.0, 57.0, 118.0, 245.0, 569.0, 1260.0, 3337.0, 9641.0, 35868.0, 265266.0, 3291076.0, 514707.0, 52359.0, 12670.0, 4203.0, 1577.0, 621.0, 307.0, 153.0, 64.0, 43.0, 23.0, 15.0, 2.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.0625, -6.86419677734375, -6.6658935546875, -6.46759033203125, -6.269287109375, -6.07098388671875, -5.8726806640625, -5.67437744140625, -5.47607421875, -5.27777099609375, -5.0794677734375, -4.88116455078125, -4.682861328125, -4.48455810546875, -4.2862548828125, -4.08795166015625, -3.8896484375, -3.69134521484375, -3.4930419921875, -3.29473876953125, -3.096435546875, -2.89813232421875, -2.6998291015625, -2.50152587890625, -2.30322265625, -2.10491943359375, -1.9066162109375, -1.70831298828125, -1.510009765625, -1.31170654296875, -1.1134033203125, -0.91510009765625, -0.716796875, -0.51849365234375, -0.3201904296875, -0.12188720703125, 0.076416015625, 0.27471923828125, 0.4730224609375, 0.67132568359375, 0.86962890625, 1.06793212890625, 1.2662353515625, 1.46453857421875, 1.662841796875, 1.86114501953125, 2.0594482421875, 2.25775146484375, 2.4560546875, 2.65435791015625, 2.8526611328125, 3.05096435546875, 3.249267578125, 3.44757080078125, 3.6458740234375, 3.84417724609375, 4.04248046875, 4.24078369140625, 4.4390869140625, 4.63739013671875, 4.835693359375, 5.03399658203125, 5.2322998046875, 5.43060302734375, 5.62890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 4.0, 12.0, 10.0, 11.0, 26.0, 49.0, 77.0, 153.0, 264.0, 550.0, 938.0, 890.0, 493.0, 241.0, 141.0, 72.0, 44.0, 28.0, 19.0, 11.0, 8.0, 6.0, 4.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.25, -7.0428466796875, -6.835693359375, -6.6285400390625, -6.42138671875, -6.2142333984375, -6.007080078125, -5.7999267578125, -5.5927734375, -5.3856201171875, -5.178466796875, -4.9713134765625, -4.76416015625, -4.5570068359375, -4.349853515625, -4.1427001953125, -3.935546875, -3.7283935546875, -3.521240234375, -3.3140869140625, -3.10693359375, -2.8997802734375, -2.692626953125, -2.4854736328125, -2.2783203125, -2.0711669921875, -1.864013671875, -1.6568603515625, -1.44970703125, -1.2425537109375, -1.035400390625, -0.8282470703125, -0.62109375, -0.4139404296875, -0.206787109375, 0.0003662109375, 0.20751953125, 0.4146728515625, 0.621826171875, 0.8289794921875, 1.0361328125, 1.2432861328125, 1.450439453125, 1.6575927734375, 1.86474609375, 2.0718994140625, 2.279052734375, 2.4862060546875, 2.693359375, 2.9005126953125, 3.107666015625, 3.3148193359375, 3.52197265625, 3.7291259765625, 3.936279296875, 4.1434326171875, 4.3505859375, 4.5577392578125, 4.764892578125, 4.9720458984375, 5.17919921875, 5.3863525390625, 5.593505859375, 5.8006591796875, 6.0078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 3.0, 2.0, 6.0, 1.0, 4.0, 17.0, 27.0, 49.0, 107.0, 124.0, 164.0, 167.0, 140.0, 86.0, 53.0, 17.0, 9.0, 7.0, 5.0, 0.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.944496154785156, -52.30963134765625, -50.674766540527344, -49.03990173339844, -47.405033111572266, -45.77016830444336, -44.13530349731445, -42.50043869018555, -40.865570068359375, -39.23070526123047, -37.59584045410156, -35.960975646972656, -34.326107025146484, -32.69124221801758, -31.056377410888672, -29.421512603759766, -27.78664779663086, -26.151782989501953, -24.516916275024414, -22.882051467895508, -21.24718475341797, -19.612319946289062, -17.977455139160156, -16.34259033203125, -14.707723617553711, -13.072857856750488, -11.437992095947266, -9.80312728881836, -8.168261528015137, -6.533395767211914, -4.898530960083008, -3.263665199279785, -1.6287994384765625, 0.006066083908081055, 1.6409316062927246, 3.275796890258789, 4.910662651062012, 6.545528411865234, 8.18039321899414, 9.815258979797363, 11.450124740600586, 13.084990501403809, 14.719856262207031, 16.354721069335938, 17.989585876464844, 19.624452590942383, 21.25931739807129, 22.894184112548828, 24.529048919677734, 26.16391372680664, 27.79878044128418, 29.433645248413086, 31.068511962890625, 32.70337677001953, 34.33824157714844, 35.973106384277344, 37.60797119140625, 39.242835998535156, 40.87770080566406, 42.51256561279297, 44.14743423461914, 45.78229904174805, 47.41716384887695, 49.05202865600586, 50.68689727783203]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 9.0, 11.0, 10.0, 21.0, 24.0, 25.0, 25.0, 33.0, 37.0, 41.0, 49.0, 65.0, 59.0, 58.0, 72.0, 58.0, 57.0, 56.0, 38.0, 41.0, 42.0, 38.0, 28.0, 30.0, 7.0, 16.0, 18.0, 8.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.646453857421875, -25.773265838623047, -24.90007781982422, -24.02688980102539, -23.153703689575195, -22.280515670776367, -21.40732765197754, -20.53413963317871, -19.660953521728516, -18.787765502929688, -17.91457748413086, -17.04138946533203, -16.168203353881836, -15.295015335083008, -14.42182731628418, -13.548639297485352, -12.675451278686523, -11.802263259887695, -10.929076194763184, -10.055888175964355, -9.182701110839844, -8.309513092041016, -7.4363250732421875, -6.563137531280518, -5.689949989318848, -4.816762447357178, -3.9435746669769287, -3.0703868865966797, -2.1971993446350098, -1.3240118026733398, -0.4508237838745117, 0.4223637580871582, 1.2955513000488281, 2.168738842010498, 3.041926622390747, 3.915114402770996, 4.788301944732666, 5.661489486694336, 6.534677505493164, 7.407865047454834, 8.281052589416504, 9.154240608215332, 10.027427673339844, 10.900615692138672, 11.7738037109375, 12.646990776062012, 13.52017879486084, 14.393365859985352, 15.26655387878418, 16.139741897583008, 17.012929916381836, 17.88611602783203, 18.75930404663086, 19.632492065429688, 20.505680084228516, 21.378868103027344, 22.252056121826172, 23.125244140625, 23.998432159423828, 24.871620178222656, 25.74480628967285, 26.61799430847168, 27.491182327270508, 28.364370346069336, 29.23755645751953]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 8.0, 8.0, 11.0, 21.0, 29.0, 43.0, 77.0, 150.0, 243.0, 427.0, 945.0, 2007.0, 4416.0, 10615.0, 26717.0, 71194.0, 194779.0, 388785.0, 218282.0, 79121.0, 29808.0, 11722.0, 4802.0, 2217.0, 982.0, 510.0, 270.0, 146.0, 73.0, 54.0, 34.0, 19.0, 11.0, 12.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.35546875, -4.20294189453125, -4.0504150390625, -3.89788818359375, -3.745361328125, -3.59283447265625, -3.4403076171875, -3.28778076171875, -3.13525390625, -2.98272705078125, -2.8302001953125, -2.67767333984375, -2.525146484375, -2.37261962890625, -2.2200927734375, -2.06756591796875, -1.9150390625, -1.76251220703125, -1.6099853515625, -1.45745849609375, -1.304931640625, -1.15240478515625, -0.9998779296875, -0.84735107421875, -0.69482421875, -0.54229736328125, -0.3897705078125, -0.23724365234375, -0.084716796875, 0.06781005859375, 0.2203369140625, 0.37286376953125, 0.525390625, 0.67791748046875, 0.8304443359375, 0.98297119140625, 1.135498046875, 1.28802490234375, 1.4405517578125, 1.59307861328125, 1.74560546875, 1.89813232421875, 2.0506591796875, 2.20318603515625, 2.355712890625, 2.50823974609375, 2.6607666015625, 2.81329345703125, 2.9658203125, 3.11834716796875, 3.2708740234375, 3.42340087890625, 3.575927734375, 3.72845458984375, 3.8809814453125, 4.03350830078125, 4.18603515625, 4.33856201171875, 4.4910888671875, 4.64361572265625, 4.796142578125, 4.94866943359375, 5.1011962890625, 5.25372314453125, 5.40625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 10.0, 7.0, 7.0, 11.0, 16.0, 22.0, 12.0, 23.0, 21.0, 33.0, 41.0, 51.0, 47.0, 60.0, 64.0, 53.0, 60.0, 54.0, 43.0, 58.0, 41.0, 47.0, 36.0, 26.0, 25.0, 31.0, 27.0, 12.0, 14.0, 12.0, 13.0, 11.0, 4.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.45703125, -2.379058837890625, -2.30108642578125, -2.223114013671875, -2.1451416015625, -2.067169189453125, -1.98919677734375, -1.911224365234375, -1.833251953125, -1.755279541015625, -1.67730712890625, -1.599334716796875, -1.5213623046875, -1.443389892578125, -1.36541748046875, -1.287445068359375, -1.20947265625, -1.131500244140625, -1.05352783203125, -0.975555419921875, -0.8975830078125, -0.819610595703125, -0.74163818359375, -0.663665771484375, -0.585693359375, -0.507720947265625, -0.42974853515625, -0.351776123046875, -0.2738037109375, -0.195831298828125, -0.11785888671875, -0.039886474609375, 0.0380859375, 0.116058349609375, 0.19403076171875, 0.272003173828125, 0.3499755859375, 0.427947998046875, 0.50592041015625, 0.583892822265625, 0.661865234375, 0.739837646484375, 0.81781005859375, 0.895782470703125, 0.9737548828125, 1.051727294921875, 1.12969970703125, 1.207672119140625, 1.28564453125, 1.363616943359375, 1.44158935546875, 1.519561767578125, 1.5975341796875, 1.675506591796875, 1.75347900390625, 1.831451416015625, 1.909423828125, 1.987396240234375, 2.06536865234375, 2.143341064453125, 2.2213134765625, 2.299285888671875, 2.37725830078125, 2.455230712890625, 2.533203125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 12.0, 12.0, 15.0, 27.0, 33.0, 47.0, 70.0, 92.0, 138.0, 202.0, 321.0, 618.0, 1161.0, 2845.0, 8132.0, 31970.0, 174554.0, 655118.0, 134868.0, 26409.0, 6905.0, 2337.0, 1115.0, 577.0, 327.0, 220.0, 155.0, 86.0, 54.0, 32.0, 26.0, 27.0, 15.0, 7.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.203125, -7.942138671875, -7.68115234375, -7.420166015625, -7.1591796875, -6.898193359375, -6.63720703125, -6.376220703125, -6.115234375, -5.854248046875, -5.59326171875, -5.332275390625, -5.0712890625, -4.810302734375, -4.54931640625, -4.288330078125, -4.02734375, -3.766357421875, -3.50537109375, -3.244384765625, -2.9833984375, -2.722412109375, -2.46142578125, -2.200439453125, -1.939453125, -1.678466796875, -1.41748046875, -1.156494140625, -0.8955078125, -0.634521484375, -0.37353515625, -0.112548828125, 0.1484375, 0.409423828125, 0.67041015625, 0.931396484375, 1.1923828125, 1.453369140625, 1.71435546875, 1.975341796875, 2.236328125, 2.497314453125, 2.75830078125, 3.019287109375, 3.2802734375, 3.541259765625, 3.80224609375, 4.063232421875, 4.32421875, 4.585205078125, 4.84619140625, 5.107177734375, 5.3681640625, 5.629150390625, 5.89013671875, 6.151123046875, 6.412109375, 6.673095703125, 6.93408203125, 7.195068359375, 7.4560546875, 7.717041015625, 7.97802734375, 8.239013671875, 8.5]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 9.0, 3.0, 6.0, 9.0, 7.0, 10.0, 14.0, 26.0, 19.0, 26.0, 34.0, 38.0, 34.0, 29.0, 52.0, 43.0, 48.0, 47.0, 48.0, 49.0, 38.0, 52.0, 40.0, 51.0, 29.0, 44.0, 34.0, 28.0, 29.0, 22.0, 15.0, 23.0, 7.0, 6.0, 10.0, 4.0, 2.0, 7.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.62890625, -7.35308837890625, -7.0772705078125, -6.80145263671875, -6.525634765625, -6.24981689453125, -5.9739990234375, -5.69818115234375, -5.42236328125, -5.14654541015625, -4.8707275390625, -4.59490966796875, -4.319091796875, -4.04327392578125, -3.7674560546875, -3.49163818359375, -3.2158203125, -2.94000244140625, -2.6641845703125, -2.38836669921875, -2.112548828125, -1.83673095703125, -1.5609130859375, -1.28509521484375, -1.00927734375, -0.73345947265625, -0.4576416015625, -0.18182373046875, 0.093994140625, 0.36981201171875, 0.6456298828125, 0.92144775390625, 1.197265625, 1.47308349609375, 1.7489013671875, 2.02471923828125, 2.300537109375, 2.57635498046875, 2.8521728515625, 3.12799072265625, 3.40380859375, 3.67962646484375, 3.9554443359375, 4.23126220703125, 4.507080078125, 4.78289794921875, 5.0587158203125, 5.33453369140625, 5.6103515625, 5.88616943359375, 6.1619873046875, 6.43780517578125, 6.713623046875, 6.98944091796875, 7.2652587890625, 7.54107666015625, 7.81689453125, 8.09271240234375, 8.3685302734375, 8.64434814453125, 8.920166015625, 9.19598388671875, 9.4718017578125, 9.74761962890625, 10.0234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 7.0, 5.0, 2.0, 10.0, 13.0, 24.0, 25.0, 56.0, 145.0, 380.0, 1955.0, 25659.0, 876425.0, 137717.0, 5000.0, 745.0, 209.0, 81.0, 30.0, 23.0, 16.0, 10.0, 4.0, 7.0, 6.0, 1.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.390625, -8.1341552734375, -7.877685546875, -7.6212158203125, -7.36474609375, -7.1082763671875, -6.851806640625, -6.5953369140625, -6.3388671875, -6.0823974609375, -5.825927734375, -5.5694580078125, -5.31298828125, -5.0565185546875, -4.800048828125, -4.5435791015625, -4.287109375, -4.0306396484375, -3.774169921875, -3.5177001953125, -3.26123046875, -3.0047607421875, -2.748291015625, -2.4918212890625, -2.2353515625, -1.9788818359375, -1.722412109375, -1.4659423828125, -1.20947265625, -0.9530029296875, -0.696533203125, -0.4400634765625, -0.18359375, 0.0728759765625, 0.329345703125, 0.5858154296875, 0.84228515625, 1.0987548828125, 1.355224609375, 1.6116943359375, 1.8681640625, 2.1246337890625, 2.381103515625, 2.6375732421875, 2.89404296875, 3.1505126953125, 3.406982421875, 3.6634521484375, 3.919921875, 4.1763916015625, 4.432861328125, 4.6893310546875, 4.94580078125, 5.2022705078125, 5.458740234375, 5.7152099609375, 5.9716796875, 6.2281494140625, 6.484619140625, 6.7410888671875, 6.99755859375, 7.2540283203125, 7.510498046875, 7.7669677734375, 8.0234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 7.0, 8.0, 7.0, 13.0, 17.0, 19.0, 25.0, 23.0, 31.0, 43.0, 72.0, 80.0, 95.0, 113.0, 103.0, 72.0, 52.0, 43.0, 35.0, 38.0, 24.0, 22.0, 8.0, 4.0, 9.0, 5.0, 9.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000560760498046875, -0.0005396828055381775, -0.00051860511302948, -0.0004975274205207825, -0.00047644972801208496, -0.00045537203550338745, -0.00043429434299468994, -0.00041321665048599243, -0.0003921389579772949, -0.0003710612654685974, -0.0003499835729598999, -0.0003289058804512024, -0.0003078281879425049, -0.0002867504954338074, -0.00026567280292510986, -0.00024459511041641235, -0.00022351741790771484, -0.00020243972539901733, -0.00018136203289031982, -0.00016028434038162231, -0.0001392066478729248, -0.0001181289553642273, -9.705126285552979e-05, -7.597357034683228e-05, -5.4895877838134766e-05, -3.3818185329437256e-05, -1.2740492820739746e-05, 8.337199687957764e-06, 2.9414892196655273e-05, 5.049258470535278e-05, 7.157027721405029e-05, 9.26479697227478e-05, 0.00011372566223144531, 0.00013480335474014282, 0.00015588104724884033, 0.00017695873975753784, 0.00019803643226623535, 0.00021911412477493286, 0.00024019181728363037, 0.0002612695097923279, 0.0002823472023010254, 0.0003034248948097229, 0.0003245025873184204, 0.0003455802798271179, 0.00036665797233581543, 0.00038773566484451294, 0.00040881335735321045, 0.00042989104986190796, 0.00045096874237060547, 0.000472046434879303, 0.0004931241273880005, 0.000514201819896698, 0.0005352795124053955, 0.000556357204914093, 0.0005774348974227905, 0.000598512589931488, 0.0006195902824401855, 0.0006406679749488831, 0.0006617456674575806, 0.0006828233599662781, 0.0007039010524749756, 0.0007249787449836731, 0.0007460564374923706, 0.0007671341300010681, 0.0007882118225097656]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 8.0, 7.0, 7.0, 9.0, 15.0, 39.0, 45.0, 75.0, 101.0, 194.0, 322.0, 536.0, 1166.0, 2796.0, 8488.0, 35211.0, 213917.0, 630226.0, 122641.0, 22503.0, 6041.0, 2135.0, 923.0, 473.0, 264.0, 147.0, 95.0, 50.0, 43.0, 24.0, 17.0, 4.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.17578125, -4.069671630859375, -3.96356201171875, -3.857452392578125, -3.7513427734375, -3.645233154296875, -3.53912353515625, -3.433013916015625, -3.326904296875, -3.220794677734375, -3.11468505859375, -3.008575439453125, -2.9024658203125, -2.796356201171875, -2.69024658203125, -2.584136962890625, -2.47802734375, -2.371917724609375, -2.26580810546875, -2.159698486328125, -2.0535888671875, -1.947479248046875, -1.84136962890625, -1.735260009765625, -1.629150390625, -1.523040771484375, -1.41693115234375, -1.310821533203125, -1.2047119140625, -1.098602294921875, -0.99249267578125, -0.886383056640625, -0.7802734375, -0.674163818359375, -0.56805419921875, -0.461944580078125, -0.3558349609375, -0.249725341796875, -0.14361572265625, -0.037506103515625, 0.068603515625, 0.174713134765625, 0.28082275390625, 0.386932373046875, 0.4930419921875, 0.599151611328125, 0.70526123046875, 0.811370849609375, 0.91748046875, 1.023590087890625, 1.12969970703125, 1.235809326171875, 1.3419189453125, 1.448028564453125, 1.55413818359375, 1.660247802734375, 1.766357421875, 1.872467041015625, 1.97857666015625, 2.084686279296875, 2.1907958984375, 2.296905517578125, 2.40301513671875, 2.509124755859375, 2.615234375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 6.0, 2.0, 4.0, 1.0, 4.0, 10.0, 16.0, 24.0, 14.0, 26.0, 40.0, 50.0, 62.0, 68.0, 71.0, 81.0, 90.0, 79.0, 84.0, 57.0, 60.0, 31.0, 34.0, 16.0, 13.0, 20.0, 14.0, 8.0, 6.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.798828125, -2.705963134765625, -2.61309814453125, -2.520233154296875, -2.4273681640625, -2.334503173828125, -2.24163818359375, -2.148773193359375, -2.055908203125, -1.963043212890625, -1.87017822265625, -1.777313232421875, -1.6844482421875, -1.591583251953125, -1.49871826171875, -1.405853271484375, -1.31298828125, -1.220123291015625, -1.12725830078125, -1.034393310546875, -0.9415283203125, -0.848663330078125, -0.75579833984375, -0.662933349609375, -0.570068359375, -0.477203369140625, -0.38433837890625, -0.291473388671875, -0.1986083984375, -0.105743408203125, -0.01287841796875, 0.079986572265625, 0.1728515625, 0.265716552734375, 0.35858154296875, 0.451446533203125, 0.5443115234375, 0.637176513671875, 0.73004150390625, 0.822906494140625, 0.915771484375, 1.008636474609375, 1.10150146484375, 1.194366455078125, 1.2872314453125, 1.380096435546875, 1.47296142578125, 1.565826416015625, 1.65869140625, 1.751556396484375, 1.84442138671875, 1.937286376953125, 2.0301513671875, 2.123016357421875, 2.21588134765625, 2.308746337890625, 2.401611328125, 2.494476318359375, 2.58734130859375, 2.680206298828125, 2.7730712890625, 2.865936279296875, 2.95880126953125, 3.051666259765625, 3.14453125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 9.0, 6.0, 18.0, 39.0, 70.0, 121.0, 165.0, 207.0, 145.0, 98.0, 50.0, 35.0, 15.0, 7.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.3342514038086, -64.2274398803711, -62.12063217163086, -60.013824462890625, -57.907012939453125, -55.80020523071289, -53.693397521972656, -51.586585998535156, -49.47977828979492, -47.37297058105469, -45.26615905761719, -43.15935134887695, -41.05254364013672, -38.94573211669922, -36.838924407958984, -34.73211669921875, -32.62530517578125, -30.518495559692383, -28.411685943603516, -26.30487823486328, -24.198068618774414, -22.091259002685547, -19.984451293945312, -17.877641677856445, -15.770832061767578, -13.664022445678711, -11.55721378326416, -9.45040512084961, -7.343595504760742, -5.236785888671875, -3.129977226257324, -1.0231685638427734, 1.083648681640625, 3.190457820892334, 5.297266960144043, 7.404076099395752, 9.510885238647461, 11.617694854736328, 13.724503517150879, 15.83131217956543, 17.938121795654297, 20.044931411743164, 22.15174102783203, 24.258548736572266, 26.365358352661133, 28.47216796875, 30.578975677490234, 32.68578338623047, 34.79259490966797, 36.8994026184082, 39.0062141418457, 41.11302185058594, 43.21983337402344, 45.32664108276367, 47.433448791503906, 49.540260314941406, 51.64706802368164, 53.753875732421875, 55.860687255859375, 57.96749496459961, 60.074302673339844, 62.181114196777344, 64.28792572021484, 66.39472961425781, 68.50154113769531]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 0.0, 4.0, 10.0, 13.0, 18.0, 16.0, 16.0, 21.0, 34.0, 28.0, 36.0, 41.0, 36.0, 56.0, 55.0, 70.0, 72.0, 66.0, 62.0, 43.0, 39.0, 39.0, 44.0, 30.0, 30.0, 28.0, 14.0, 18.0, 16.0, 11.0, 10.0, 5.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.135398864746094, -33.82848358154297, -32.52157211303711, -31.214656829833984, -29.90774154663086, -28.600828170776367, -27.293914794921875, -25.98699951171875, -24.680084228515625, -23.373170852661133, -22.066255569458008, -20.759342193603516, -19.45242691040039, -18.1455135345459, -16.838600158691406, -15.531684875488281, -14.224771499633789, -12.91785717010498, -11.610942840576172, -10.30402946472168, -8.997114181518555, -7.690200328826904, -6.383286476135254, -5.076372146606445, -3.7694578170776367, -2.462543487548828, -1.1556293964385986, 0.15128469467163086, 1.4581990242004395, 2.765113353729248, 4.072027206420898, 5.378941535949707, 6.685855865478516, 7.992770195007324, 9.299684524536133, 10.606597900390625, 11.91351318359375, 13.220426559448242, 14.52734088897705, 15.83425521850586, 17.141170501708984, 18.448083877563477, 19.7549991607666, 21.061912536621094, 22.36882781982422, 23.67574119567871, 24.982654571533203, 26.289569854736328, 27.59648323059082, 28.903396606445312, 30.210311889648438, 31.51722526550293, 32.82413864135742, 34.13105392456055, 35.43796920776367, 36.74488067626953, 38.051795959472656, 39.35871124267578, 40.66562271118164, 41.972537994384766, 43.27945327758789, 44.586368560791016, 45.893280029296875, 47.2001953125, 48.507110595703125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 8.0, 10.0, 14.0, 16.0, 31.0, 55.0, 86.0, 120.0, 184.0, 326.0, 616.0, 1106.0, 2161.0, 4417.0, 9517.0, 22769.0, 59949.0, 200745.0, 1010914.0, 2181179.0, 508356.0, 120829.0, 40789.0, 16097.0, 7071.0, 3360.0, 1622.0, 869.0, 411.0, 272.0, 151.0, 86.0, 67.0, 25.0, 20.0, 12.0, 10.0, 5.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.40234375, -3.308624267578125, -3.21490478515625, -3.121185302734375, -3.0274658203125, -2.933746337890625, -2.84002685546875, -2.746307373046875, -2.652587890625, -2.558868408203125, -2.46514892578125, -2.371429443359375, -2.2777099609375, -2.183990478515625, -2.09027099609375, -1.996551513671875, -1.90283203125, -1.809112548828125, -1.71539306640625, -1.621673583984375, -1.5279541015625, -1.434234619140625, -1.34051513671875, -1.246795654296875, -1.153076171875, -1.059356689453125, -0.96563720703125, -0.871917724609375, -0.7781982421875, -0.684478759765625, -0.59075927734375, -0.497039794921875, -0.4033203125, -0.309600830078125, -0.21588134765625, -0.122161865234375, -0.0284423828125, 0.065277099609375, 0.15899658203125, 0.252716064453125, 0.346435546875, 0.440155029296875, 0.53387451171875, 0.627593994140625, 0.7213134765625, 0.815032958984375, 0.90875244140625, 1.002471923828125, 1.09619140625, 1.189910888671875, 1.28363037109375, 1.377349853515625, 1.4710693359375, 1.564788818359375, 1.65850830078125, 1.752227783203125, 1.845947265625, 1.939666748046875, 2.03338623046875, 2.127105712890625, 2.2208251953125, 2.314544677734375, 2.40826416015625, 2.501983642578125, 2.595703125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 4.0, 11.0, 5.0, 5.0, 9.0, 10.0, 16.0, 26.0, 9.0, 21.0, 22.0, 28.0, 27.0, 21.0, 36.0, 29.0, 30.0, 39.0, 38.0, 44.0, 54.0, 47.0, 38.0, 53.0, 48.0, 40.0, 40.0, 34.0, 21.0, 22.0, 26.0, 26.0, 22.0, 17.0, 17.0, 13.0, 12.0, 11.0, 5.0, 3.0, 5.0, 6.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.677734375, -1.623626708984375, -1.56951904296875, -1.515411376953125, -1.4613037109375, -1.407196044921875, -1.35308837890625, -1.298980712890625, -1.244873046875, -1.190765380859375, -1.13665771484375, -1.082550048828125, -1.0284423828125, -0.974334716796875, -0.92022705078125, -0.866119384765625, -0.81201171875, -0.757904052734375, -0.70379638671875, -0.649688720703125, -0.5955810546875, -0.541473388671875, -0.48736572265625, -0.433258056640625, -0.379150390625, -0.325042724609375, -0.27093505859375, -0.216827392578125, -0.1627197265625, -0.108612060546875, -0.05450439453125, -0.000396728515625, 0.0537109375, 0.107818603515625, 0.16192626953125, 0.216033935546875, 0.2701416015625, 0.324249267578125, 0.37835693359375, 0.432464599609375, 0.486572265625, 0.540679931640625, 0.59478759765625, 0.648895263671875, 0.7030029296875, 0.757110595703125, 0.81121826171875, 0.865325927734375, 0.91943359375, 0.973541259765625, 1.02764892578125, 1.081756591796875, 1.1358642578125, 1.189971923828125, 1.24407958984375, 1.298187255859375, 1.352294921875, 1.406402587890625, 1.46051025390625, 1.514617919921875, 1.5687255859375, 1.622833251953125, 1.67694091796875, 1.731048583984375, 1.78515625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 3.0, 1.0, 6.0, 7.0, 7.0, 18.0, 16.0, 31.0, 52.0, 87.0, 148.0, 281.0, 608.0, 1477.0, 3913.0, 13500.0, 59269.0, 429321.0, 3122203.0, 473051.0, 66814.0, 15444.0, 4831.0, 1713.0, 706.0, 320.0, 177.0, 110.0, 57.0, 35.0, 23.0, 15.0, 16.0, 7.0, 6.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96875, -4.7813720703125, -4.593994140625, -4.4066162109375, -4.21923828125, -4.0318603515625, -3.844482421875, -3.6571044921875, -3.4697265625, -3.2823486328125, -3.094970703125, -2.9075927734375, -2.72021484375, -2.5328369140625, -2.345458984375, -2.1580810546875, -1.970703125, -1.7833251953125, -1.595947265625, -1.4085693359375, -1.22119140625, -1.0338134765625, -0.846435546875, -0.6590576171875, -0.4716796875, -0.2843017578125, -0.096923828125, 0.0904541015625, 0.27783203125, 0.4652099609375, 0.652587890625, 0.8399658203125, 1.02734375, 1.2147216796875, 1.402099609375, 1.5894775390625, 1.77685546875, 1.9642333984375, 2.151611328125, 2.3389892578125, 2.5263671875, 2.7137451171875, 2.901123046875, 3.0885009765625, 3.27587890625, 3.4632568359375, 3.650634765625, 3.8380126953125, 4.025390625, 4.2127685546875, 4.400146484375, 4.5875244140625, 4.77490234375, 4.9622802734375, 5.149658203125, 5.3370361328125, 5.5244140625, 5.7117919921875, 5.899169921875, 6.0865478515625, 6.27392578125, 6.4613037109375, 6.648681640625, 6.8360595703125, 7.0234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 12.0, 14.0, 16.0, 17.0, 35.0, 52.0, 59.0, 128.0, 198.0, 332.0, 587.0, 769.0, 660.0, 406.0, 251.0, 152.0, 122.0, 61.0, 60.0, 52.0, 26.0, 16.0, 6.0, 7.0, 7.0, 6.0, 6.0, 4.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.484375, -5.27996826171875, -5.0755615234375, -4.87115478515625, -4.666748046875, -4.46234130859375, -4.2579345703125, -4.05352783203125, -3.84912109375, -3.64471435546875, -3.4403076171875, -3.23590087890625, -3.031494140625, -2.82708740234375, -2.6226806640625, -2.41827392578125, -2.2138671875, -2.00946044921875, -1.8050537109375, -1.60064697265625, -1.396240234375, -1.19183349609375, -0.9874267578125, -0.78302001953125, -0.57861328125, -0.37420654296875, -0.1697998046875, 0.03460693359375, 0.239013671875, 0.44342041015625, 0.6478271484375, 0.85223388671875, 1.056640625, 1.26104736328125, 1.4654541015625, 1.66986083984375, 1.874267578125, 2.07867431640625, 2.2830810546875, 2.48748779296875, 2.69189453125, 2.89630126953125, 3.1007080078125, 3.30511474609375, 3.509521484375, 3.71392822265625, 3.9183349609375, 4.12274169921875, 4.3271484375, 4.53155517578125, 4.7359619140625, 4.94036865234375, 5.144775390625, 5.34918212890625, 5.5535888671875, 5.75799560546875, 5.96240234375, 6.16680908203125, 6.3712158203125, 6.57562255859375, 6.780029296875, 6.98443603515625, 7.1888427734375, 7.39324951171875, 7.59765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 13.0, 37.0, 62.0, 106.0, 157.0, 182.0, 173.0, 128.0, 73.0, 31.0, 9.0, 6.0, 6.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-72.82395935058594, -70.5685043334961, -68.31304931640625, -66.0575942993164, -63.80213928222656, -61.54668426513672, -59.291229248046875, -57.03577423095703, -54.78031921386719, -52.524864196777344, -50.2694091796875, -48.013954162597656, -45.75849914550781, -43.50304412841797, -41.247589111328125, -38.99213409423828, -36.73667907714844, -34.481224060058594, -32.22576904296875, -29.970314025878906, -27.714859008789062, -25.45940399169922, -23.203948974609375, -20.94849395751953, -18.693038940429688, -16.437583923339844, -14.18212890625, -11.926673889160156, -9.671218872070312, -7.415763854980469, -5.160308837890625, -2.9048538208007812, -0.6493988037109375, 1.6060562133789062, 3.86151123046875, 6.116966247558594, 8.372421264648438, 10.627876281738281, 12.883331298828125, 15.138786315917969, 17.394241333007812, 19.649696350097656, 21.9051513671875, 24.160606384277344, 26.416061401367188, 28.67151641845703, 30.926971435546875, 33.18242645263672, 35.43788146972656, 37.693336486816406, 39.94879150390625, 42.204246520996094, 44.45970153808594, 46.71515655517578, 48.970611572265625, 51.22606658935547, 53.48152160644531, 55.736976623535156, 57.992431640625, 60.247886657714844, 62.50334167480469, 64.75879669189453, 67.01425170898438, 69.26970672607422, 71.52516174316406]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 2.0, 5.0, 12.0, 8.0, 15.0, 12.0, 20.0, 18.0, 20.0, 26.0, 32.0, 44.0, 32.0, 41.0, 23.0, 51.0, 51.0, 57.0, 47.0, 41.0, 48.0, 59.0, 48.0, 36.0, 33.0, 29.0, 19.0, 33.0, 25.0, 23.0, 22.0, 18.0, 10.0, 13.0, 3.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-33.056922912597656, -32.14336395263672, -31.22980499267578, -30.316246032714844, -29.40268898010254, -28.4891300201416, -27.575571060180664, -26.662012100219727, -25.74845314025879, -24.83489418029785, -23.921335220336914, -23.00777816772461, -22.094219207763672, -21.180660247802734, -20.267101287841797, -19.35354232788086, -18.439983367919922, -17.526424407958984, -16.612865447998047, -15.699307441711426, -14.785748481750488, -13.872190475463867, -12.95863151550293, -12.045072555541992, -11.131515502929688, -10.21795654296875, -9.304398536682129, -8.390839576721191, -7.477280616760254, -6.563722133636475, -5.650163650512695, -4.736604690551758, -3.8230457305908203, -2.909487009048462, -1.995928406715393, -1.0823698043823242, -0.16881108283996582, 0.7447476387023926, 1.6583061218261719, 2.5718650817871094, 3.4854235649108887, 4.398982048034668, 5.3125410079956055, 6.226099491119385, 7.139657974243164, 8.053216934204102, 8.966775894165039, 9.880334854125977, 10.793892860412598, 11.707451820373535, 12.621009826660156, 13.534568786621094, 14.448127746582031, 15.361686706542969, 16.275245666503906, 17.188804626464844, 18.10236167907715, 19.015920639038086, 19.929479598999023, 20.843036651611328, 21.756595611572266, 22.670154571533203, 23.58371353149414, 24.497272491455078, 25.410831451416016]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 9.0, 10.0, 12.0, 21.0, 29.0, 46.0, 85.0, 142.0, 238.0, 392.0, 788.0, 1494.0, 3248.0, 7702.0, 18075.0, 43113.0, 100061.0, 225978.0, 325948.0, 182036.0, 79701.0, 33806.0, 14120.0, 6035.0, 2645.0, 1272.0, 664.0, 364.0, 221.0, 114.0, 71.0, 43.0, 22.0, 16.0, 14.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.37109375, -4.23602294921875, -4.1009521484375, -3.96588134765625, -3.830810546875, -3.69573974609375, -3.5606689453125, -3.42559814453125, -3.29052734375, -3.15545654296875, -3.0203857421875, -2.88531494140625, -2.750244140625, -2.61517333984375, -2.4801025390625, -2.34503173828125, -2.2099609375, -2.07489013671875, -1.9398193359375, -1.80474853515625, -1.669677734375, -1.53460693359375, -1.3995361328125, -1.26446533203125, -1.12939453125, -0.99432373046875, -0.8592529296875, -0.72418212890625, -0.589111328125, -0.45404052734375, -0.3189697265625, -0.18389892578125, -0.048828125, 0.08624267578125, 0.2213134765625, 0.35638427734375, 0.491455078125, 0.62652587890625, 0.7615966796875, 0.89666748046875, 1.03173828125, 1.16680908203125, 1.3018798828125, 1.43695068359375, 1.572021484375, 1.70709228515625, 1.8421630859375, 1.97723388671875, 2.1123046875, 2.24737548828125, 2.3824462890625, 2.51751708984375, 2.652587890625, 2.78765869140625, 2.9227294921875, 3.05780029296875, 3.19287109375, 3.32794189453125, 3.4630126953125, 3.59808349609375, 3.733154296875, 3.86822509765625, 4.0032958984375, 4.13836669921875, 4.2734375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 5.0, 7.0, 6.0, 8.0, 13.0, 6.0, 12.0, 16.0, 20.0, 19.0, 28.0, 21.0, 27.0, 40.0, 29.0, 44.0, 44.0, 43.0, 44.0, 46.0, 44.0, 53.0, 48.0, 50.0, 47.0, 29.0, 39.0, 29.0, 33.0, 31.0, 24.0, 19.0, 14.0, 11.0, 11.0, 9.0, 7.0, 10.0, 6.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.76953125, -1.7088623046875, -1.648193359375, -1.5875244140625, -1.52685546875, -1.4661865234375, -1.405517578125, -1.3448486328125, -1.2841796875, -1.2235107421875, -1.162841796875, -1.1021728515625, -1.04150390625, -0.9808349609375, -0.920166015625, -0.8594970703125, -0.798828125, -0.7381591796875, -0.677490234375, -0.6168212890625, -0.55615234375, -0.4954833984375, -0.434814453125, -0.3741455078125, -0.3134765625, -0.2528076171875, -0.192138671875, -0.1314697265625, -0.07080078125, -0.0101318359375, 0.050537109375, 0.1112060546875, 0.171875, 0.2325439453125, 0.293212890625, 0.3538818359375, 0.41455078125, 0.4752197265625, 0.535888671875, 0.5965576171875, 0.6572265625, 0.7178955078125, 0.778564453125, 0.8392333984375, 0.89990234375, 0.9605712890625, 1.021240234375, 1.0819091796875, 1.142578125, 1.2032470703125, 1.263916015625, 1.3245849609375, 1.38525390625, 1.4459228515625, 1.506591796875, 1.5672607421875, 1.6279296875, 1.6885986328125, 1.749267578125, 1.8099365234375, 1.87060546875, 1.9312744140625, 1.991943359375, 2.0526123046875, 2.11328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 4.0, 2.0, 8.0, 9.0, 19.0, 19.0, 37.0, 43.0, 74.0, 105.0, 143.0, 222.0, 322.0, 471.0, 735.0, 1184.0, 2094.0, 4887.0, 16324.0, 92000.0, 645067.0, 233749.0, 35466.0, 8196.0, 3129.0, 1535.0, 986.0, 577.0, 338.0, 266.0, 152.0, 117.0, 86.0, 69.0, 34.0, 21.0, 18.0, 7.0, 12.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.0, -8.72509765625, -8.4501953125, -8.17529296875, -7.900390625, -7.62548828125, -7.3505859375, -7.07568359375, -6.80078125, -6.52587890625, -6.2509765625, -5.97607421875, -5.701171875, -5.42626953125, -5.1513671875, -4.87646484375, -4.6015625, -4.32666015625, -4.0517578125, -3.77685546875, -3.501953125, -3.22705078125, -2.9521484375, -2.67724609375, -2.40234375, -2.12744140625, -1.8525390625, -1.57763671875, -1.302734375, -1.02783203125, -0.7529296875, -0.47802734375, -0.203125, 0.07177734375, 0.3466796875, 0.62158203125, 0.896484375, 1.17138671875, 1.4462890625, 1.72119140625, 1.99609375, 2.27099609375, 2.5458984375, 2.82080078125, 3.095703125, 3.37060546875, 3.6455078125, 3.92041015625, 4.1953125, 4.47021484375, 4.7451171875, 5.02001953125, 5.294921875, 5.56982421875, 5.8447265625, 6.11962890625, 6.39453125, 6.66943359375, 6.9443359375, 7.21923828125, 7.494140625, 7.76904296875, 8.0439453125, 8.31884765625, 8.59375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 7.0, 5.0, 6.0, 18.0, 15.0, 9.0, 28.0, 20.0, 23.0, 37.0, 51.0, 45.0, 40.0, 51.0, 62.0, 60.0, 55.0, 55.0, 51.0, 48.0, 48.0, 41.0, 37.0, 27.0, 26.0, 24.0, 20.0, 21.0, 17.0, 9.0, 16.0, 8.0, 7.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.4765625, -10.1541748046875, -9.831787109375, -9.5093994140625, -9.18701171875, -8.8646240234375, -8.542236328125, -8.2198486328125, -7.8974609375, -7.5750732421875, -7.252685546875, -6.9302978515625, -6.60791015625, -6.2855224609375, -5.963134765625, -5.6407470703125, -5.318359375, -4.9959716796875, -4.673583984375, -4.3511962890625, -4.02880859375, -3.7064208984375, -3.384033203125, -3.0616455078125, -2.7392578125, -2.4168701171875, -2.094482421875, -1.7720947265625, -1.44970703125, -1.1273193359375, -0.804931640625, -0.4825439453125, -0.16015625, 0.1622314453125, 0.484619140625, 0.8070068359375, 1.12939453125, 1.4517822265625, 1.774169921875, 2.0965576171875, 2.4189453125, 2.7413330078125, 3.063720703125, 3.3861083984375, 3.70849609375, 4.0308837890625, 4.353271484375, 4.6756591796875, 4.998046875, 5.3204345703125, 5.642822265625, 5.9652099609375, 6.28759765625, 6.6099853515625, 6.932373046875, 7.2547607421875, 7.5771484375, 7.8995361328125, 8.221923828125, 8.5443115234375, 8.86669921875, 9.1890869140625, 9.511474609375, 9.8338623046875, 10.15625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 11.0, 15.0, 13.0, 22.0, 23.0, 27.0, 42.0, 39.0, 79.0, 125.0, 238.0, 436.0, 865.0, 2475.0, 9218.0, 51362.0, 507107.0, 413700.0, 49471.0, 8962.0, 2452.0, 891.0, 399.0, 208.0, 115.0, 82.0, 35.0, 40.0, 28.0, 21.0, 5.0, 14.0, 8.0, 5.0, 4.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.966796875, -3.853424072265625, -3.74005126953125, -3.626678466796875, -3.5133056640625, -3.399932861328125, -3.28656005859375, -3.173187255859375, -3.059814453125, -2.946441650390625, -2.83306884765625, -2.719696044921875, -2.6063232421875, -2.492950439453125, -2.37957763671875, -2.266204833984375, -2.15283203125, -2.039459228515625, -1.92608642578125, -1.812713623046875, -1.6993408203125, -1.585968017578125, -1.47259521484375, -1.359222412109375, -1.245849609375, -1.132476806640625, -1.01910400390625, -0.905731201171875, -0.7923583984375, -0.678985595703125, -0.56561279296875, -0.452239990234375, -0.3388671875, -0.225494384765625, -0.11212158203125, 0.001251220703125, 0.1146240234375, 0.227996826171875, 0.34136962890625, 0.454742431640625, 0.568115234375, 0.681488037109375, 0.79486083984375, 0.908233642578125, 1.0216064453125, 1.134979248046875, 1.24835205078125, 1.361724853515625, 1.47509765625, 1.588470458984375, 1.70184326171875, 1.815216064453125, 1.9285888671875, 2.041961669921875, 2.15533447265625, 2.268707275390625, 2.382080078125, 2.495452880859375, 2.60882568359375, 2.722198486328125, 2.8355712890625, 2.948944091796875, 3.06231689453125, 3.175689697265625, 3.2890625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 4.0, 8.0, 10.0, 9.0, 14.0, 10.0, 24.0, 19.0, 32.0, 34.0, 44.0, 70.0, 99.0, 137.0, 154.0, 79.0, 53.0, 46.0, 36.0, 31.0, 17.0, 21.0, 7.0, 19.0, 9.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008678436279296875, -0.0008405372500419617, -0.0008132308721542358, -0.00078592449426651, -0.0007586181163787842, -0.0007313117384910583, -0.0007040053606033325, -0.0006766989827156067, -0.0006493926048278809, -0.000622086226940155, -0.0005947798490524292, -0.0005674734711647034, -0.0005401670932769775, -0.0005128607153892517, -0.0004855543375015259, -0.00045824795961380005, -0.0004309415817260742, -0.0004036352038383484, -0.00037632882595062256, -0.00034902244806289673, -0.0003217160701751709, -0.00029440969228744507, -0.00026710331439971924, -0.0002397969365119934, -0.00021249055862426758, -0.00018518418073654175, -0.00015787780284881592, -0.0001305714249610901, -0.00010326504707336426, -7.595866918563843e-05, -4.86522912979126e-05, -2.1345913410186768e-05, 5.9604644775390625e-06, 3.326684236526489e-05, 6.057322025299072e-05, 8.787959814071655e-05, 0.00011518597602844238, 0.0001424923539161682, 0.00016979873180389404, 0.00019710510969161987, 0.0002244114875793457, 0.00025171786546707153, 0.00027902424335479736, 0.0003063306212425232, 0.000333636999130249, 0.00036094337701797485, 0.0003882497549057007, 0.0004155561327934265, 0.00044286251068115234, 0.0004701688885688782, 0.000497475266456604, 0.0005247816443443298, 0.0005520880222320557, 0.0005793944001197815, 0.0006067007780075073, 0.0006340071558952332, 0.000661313533782959, 0.0006886199116706848, 0.0007159262895584106, 0.0007432326674461365, 0.0007705390453338623, 0.0007978454232215881, 0.000825151801109314, 0.0008524581789970398, 0.0008797645568847656]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 8.0, 5.0, 9.0, 13.0, 29.0, 29.0, 86.0, 164.0, 307.0, 680.0, 1680.0, 5837.0, 33257.0, 497700.0, 467030.0, 33176.0, 5619.0, 1649.0, 618.0, 314.0, 137.0, 74.0, 53.0, 30.0, 17.0, 14.0, 5.0, 7.0, 3.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.27734375, -5.13470458984375, -4.9920654296875, -4.84942626953125, -4.706787109375, -4.56414794921875, -4.4215087890625, -4.27886962890625, -4.13623046875, -3.99359130859375, -3.8509521484375, -3.70831298828125, -3.565673828125, -3.42303466796875, -3.2803955078125, -3.13775634765625, -2.9951171875, -2.85247802734375, -2.7098388671875, -2.56719970703125, -2.424560546875, -2.28192138671875, -2.1392822265625, -1.99664306640625, -1.85400390625, -1.71136474609375, -1.5687255859375, -1.42608642578125, -1.283447265625, -1.14080810546875, -0.9981689453125, -0.85552978515625, -0.712890625, -0.57025146484375, -0.4276123046875, -0.28497314453125, -0.142333984375, 0.00030517578125, 0.1429443359375, 0.28558349609375, 0.42822265625, 0.57086181640625, 0.7135009765625, 0.85614013671875, 0.998779296875, 1.14141845703125, 1.2840576171875, 1.42669677734375, 1.5693359375, 1.71197509765625, 1.8546142578125, 1.99725341796875, 2.139892578125, 2.28253173828125, 2.4251708984375, 2.56781005859375, 2.71044921875, 2.85308837890625, 2.9957275390625, 3.13836669921875, 3.281005859375, 3.42364501953125, 3.5662841796875, 3.70892333984375, 3.8515625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 9.0, 12.0, 11.0, 16.0, 16.0, 19.0, 38.0, 42.0, 37.0, 53.0, 62.0, 103.0, 98.0, 93.0, 82.0, 73.0, 50.0, 47.0, 28.0, 28.0, 21.0, 17.0, 12.0, 11.0, 8.0, 10.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.646484375, -2.544677734375, -2.44287109375, -2.341064453125, -2.2392578125, -2.137451171875, -2.03564453125, -1.933837890625, -1.83203125, -1.730224609375, -1.62841796875, -1.526611328125, -1.4248046875, -1.322998046875, -1.22119140625, -1.119384765625, -1.017578125, -0.915771484375, -0.81396484375, -0.712158203125, -0.6103515625, -0.508544921875, -0.40673828125, -0.304931640625, -0.203125, -0.101318359375, 0.00048828125, 0.102294921875, 0.2041015625, 0.305908203125, 0.40771484375, 0.509521484375, 0.611328125, 0.713134765625, 0.81494140625, 0.916748046875, 1.0185546875, 1.120361328125, 1.22216796875, 1.323974609375, 1.42578125, 1.527587890625, 1.62939453125, 1.731201171875, 1.8330078125, 1.934814453125, 2.03662109375, 2.138427734375, 2.240234375, 2.342041015625, 2.44384765625, 2.545654296875, 2.6474609375, 2.749267578125, 2.85107421875, 2.952880859375, 3.0546875, 3.156494140625, 3.25830078125, 3.360107421875, 3.4619140625, 3.563720703125, 3.66552734375, 3.767333984375, 3.869140625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 4.0, 18.0, 45.0, 64.0, 103.0, 172.0, 212.0, 144.0, 85.0, 56.0, 39.0, 11.0, 11.0, 5.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.531558990478516, -34.52313232421875, -32.51470947265625, -30.506282806396484, -28.49785614013672, -26.489431381225586, -24.481006622314453, -22.472579956054688, -20.464155197143555, -18.455730438232422, -16.447303771972656, -14.438879013061523, -12.430453300476074, -10.422027587890625, -8.413602828979492, -6.405177116394043, -4.396751403808594, -2.3883259296417236, -0.3799004554748535, 1.6285247802734375, 3.6369504928588867, 5.645376205444336, 7.653800964355469, 9.662226676940918, 11.670652389526367, 13.679078102111816, 15.687503814697266, 17.6959285736084, 19.70435333251953, 21.712779998779297, 23.72120475769043, 25.729629516601562, 27.738052368164062, 29.746477127075195, 31.75490379333496, 33.763328552246094, 35.77175521850586, 37.780181884765625, 39.788604736328125, 41.79703140258789, 43.805458068847656, 45.81388473510742, 47.82230758666992, 49.83073425292969, 51.83916091918945, 53.84758758544922, 55.85601043701172, 57.864437103271484, 59.872859954833984, 61.88128662109375, 63.88970947265625, 65.89813232421875, 67.90656280517578, 69.91498565673828, 71.92341613769531, 73.93183898925781, 75.94026184082031, 77.94868469238281, 79.95711517333984, 81.96553802490234, 83.97396087646484, 85.98239135742188, 87.99081420898438, 89.99923706054688, 92.0076675415039]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 9.0, 7.0, 5.0, 9.0, 14.0, 9.0, 16.0, 20.0, 17.0, 22.0, 26.0, 28.0, 30.0, 40.0, 29.0, 46.0, 60.0, 89.0, 77.0, 75.0, 49.0, 37.0, 48.0, 32.0, 23.0, 34.0, 33.0, 19.0, 21.0, 16.0, 12.0, 10.0, 13.0, 8.0, 3.0, 7.0, 2.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-45.06446075439453, -43.8564453125, -42.6484260559082, -41.44041061401367, -40.232391357421875, -39.024375915527344, -37.81636047363281, -36.60834503173828, -35.400325775146484, -34.19231033325195, -32.984291076660156, -31.776275634765625, -30.56825828552246, -29.360240936279297, -28.152225494384766, -26.9442081451416, -25.736190795898438, -24.528173446655273, -23.32015609741211, -22.112140655517578, -20.904123306274414, -19.69610595703125, -18.48809051513672, -17.280073165893555, -16.07205581665039, -14.864038467407227, -13.656022071838379, -12.448005676269531, -11.239988327026367, -10.031970977783203, -8.823954582214355, -7.615938186645508, -6.407920837402344, -5.199903964996338, -3.991887092590332, -2.783870220184326, -1.5758533477783203, -0.36783647537231445, 0.8401803970336914, 2.048196792602539, 3.256214141845703, 4.464231014251709, 5.672247886657715, 6.880264759063721, 8.088281631469727, 9.29629898071289, 10.504315376281738, 11.712331771850586, 12.92034912109375, 14.128366470336914, 15.336382865905762, 16.54439926147461, 17.752416610717773, 18.960433959960938, 20.16844940185547, 21.376466751098633, 22.584484100341797, 23.79250144958496, 25.000518798828125, 26.208534240722656, 27.41655158996582, 28.624568939208984, 29.832584381103516, 31.04060173034668, 32.248619079589844]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 8.0, 9.0, 8.0, 23.0, 25.0, 34.0, 51.0, 80.0, 114.0, 186.0, 349.0, 798.0, 2026.0, 6332.0, 23024.0, 118791.0, 1519012.0, 2303127.0, 177661.0, 30600.0, 7818.0, 2434.0, 865.0, 386.0, 188.0, 118.0, 63.0, 41.0, 34.0, 19.0, 13.0, 11.0, 7.0, 3.0, 12.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2421875, -4.0911865234375, -3.940185546875, -3.7891845703125, -3.63818359375, -3.4871826171875, -3.336181640625, -3.1851806640625, -3.0341796875, -2.8831787109375, -2.732177734375, -2.5811767578125, -2.43017578125, -2.2791748046875, -2.128173828125, -1.9771728515625, -1.826171875, -1.6751708984375, -1.524169921875, -1.3731689453125, -1.22216796875, -1.0711669921875, -0.920166015625, -0.7691650390625, -0.6181640625, -0.4671630859375, -0.316162109375, -0.1651611328125, -0.01416015625, 0.1368408203125, 0.287841796875, 0.4388427734375, 0.58984375, 0.7408447265625, 0.891845703125, 1.0428466796875, 1.19384765625, 1.3448486328125, 1.495849609375, 1.6468505859375, 1.7978515625, 1.9488525390625, 2.099853515625, 2.2508544921875, 2.40185546875, 2.5528564453125, 2.703857421875, 2.8548583984375, 3.005859375, 3.1568603515625, 3.307861328125, 3.4588623046875, 3.60986328125, 3.7608642578125, 3.911865234375, 4.0628662109375, 4.2138671875, 4.3648681640625, 4.515869140625, 4.6668701171875, 4.81787109375, 4.9688720703125, 5.119873046875, 5.2708740234375, 5.421875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 11.0, 9.0, 12.0, 18.0, 13.0, 23.0, 35.0, 30.0, 38.0, 50.0, 43.0, 54.0, 52.0, 75.0, 60.0, 77.0, 67.0, 78.0, 53.0, 46.0, 36.0, 35.0, 16.0, 21.0, 22.0, 8.0, 8.0, 4.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9921875, -1.90631103515625, -1.8204345703125, -1.73455810546875, -1.648681640625, -1.56280517578125, -1.4769287109375, -1.39105224609375, -1.30517578125, -1.21929931640625, -1.1334228515625, -1.04754638671875, -0.961669921875, -0.87579345703125, -0.7899169921875, -0.70404052734375, -0.6181640625, -0.53228759765625, -0.4464111328125, -0.36053466796875, -0.274658203125, -0.18878173828125, -0.1029052734375, -0.01702880859375, 0.06884765625, 0.15472412109375, 0.2406005859375, 0.32647705078125, 0.412353515625, 0.49822998046875, 0.5841064453125, 0.66998291015625, 0.755859375, 0.84173583984375, 0.9276123046875, 1.01348876953125, 1.099365234375, 1.18524169921875, 1.2711181640625, 1.35699462890625, 1.44287109375, 1.52874755859375, 1.6146240234375, 1.70050048828125, 1.786376953125, 1.87225341796875, 1.9581298828125, 2.04400634765625, 2.1298828125, 2.21575927734375, 2.3016357421875, 2.38751220703125, 2.473388671875, 2.55926513671875, 2.6451416015625, 2.73101806640625, 2.81689453125, 2.90277099609375, 2.9886474609375, 3.07452392578125, 3.160400390625, 3.24627685546875, 3.3321533203125, 3.41802978515625, 3.50390625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 8.0, 6.0, 7.0, 11.0, 32.0, 37.0, 45.0, 66.0, 144.0, 295.0, 628.0, 1420.0, 3573.0, 9922.0, 33330.0, 149430.0, 1490259.0, 2229614.0, 213644.0, 43183.0, 11980.0, 3980.0, 1466.0, 575.0, 267.0, 146.0, 66.0, 51.0, 30.0, 27.0, 16.0, 11.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.15625, -5.998779296875, -5.84130859375, -5.683837890625, -5.5263671875, -5.368896484375, -5.21142578125, -5.053955078125, -4.896484375, -4.739013671875, -4.58154296875, -4.424072265625, -4.2666015625, -4.109130859375, -3.95166015625, -3.794189453125, -3.63671875, -3.479248046875, -3.32177734375, -3.164306640625, -3.0068359375, -2.849365234375, -2.69189453125, -2.534423828125, -2.376953125, -2.219482421875, -2.06201171875, -1.904541015625, -1.7470703125, -1.589599609375, -1.43212890625, -1.274658203125, -1.1171875, -0.959716796875, -0.80224609375, -0.644775390625, -0.4873046875, -0.329833984375, -0.17236328125, -0.014892578125, 0.142578125, 0.300048828125, 0.45751953125, 0.614990234375, 0.7724609375, 0.929931640625, 1.08740234375, 1.244873046875, 1.40234375, 1.559814453125, 1.71728515625, 1.874755859375, 2.0322265625, 2.189697265625, 2.34716796875, 2.504638671875, 2.662109375, 2.819580078125, 2.97705078125, 3.134521484375, 3.2919921875, 3.449462890625, 3.60693359375, 3.764404296875, 3.921875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 4.0, 5.0, 6.0, 4.0, 13.0, 13.0, 23.0, 26.0, 25.0, 43.0, 75.0, 85.0, 107.0, 168.0, 244.0, 414.0, 585.0, 585.0, 525.0, 323.0, 229.0, 152.0, 109.0, 77.0, 55.0, 50.0, 32.0, 26.0, 18.0, 13.0, 9.0, 3.0, 9.0, 8.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.90234375, -4.74627685546875, -4.5902099609375, -4.43414306640625, -4.278076171875, -4.12200927734375, -3.9659423828125, -3.80987548828125, -3.65380859375, -3.49774169921875, -3.3416748046875, -3.18560791015625, -3.029541015625, -2.87347412109375, -2.7174072265625, -2.56134033203125, -2.4052734375, -2.24920654296875, -2.0931396484375, -1.93707275390625, -1.781005859375, -1.62493896484375, -1.4688720703125, -1.31280517578125, -1.15673828125, -1.00067138671875, -0.8446044921875, -0.68853759765625, -0.532470703125, -0.37640380859375, -0.2203369140625, -0.06427001953125, 0.091796875, 0.24786376953125, 0.4039306640625, 0.55999755859375, 0.716064453125, 0.87213134765625, 1.0281982421875, 1.18426513671875, 1.34033203125, 1.49639892578125, 1.6524658203125, 1.80853271484375, 1.964599609375, 2.12066650390625, 2.2767333984375, 2.43280029296875, 2.5888671875, 2.74493408203125, 2.9010009765625, 3.05706787109375, 3.213134765625, 3.36920166015625, 3.5252685546875, 3.68133544921875, 3.83740234375, 3.99346923828125, 4.1495361328125, 4.30560302734375, 4.461669921875, 4.61773681640625, 4.7738037109375, 4.92987060546875, 5.0859375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 3.0, 10.0, 14.0, 34.0, 111.0, 218.0, 292.0, 179.0, 94.0, 31.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-145.3556671142578, -142.28211975097656, -139.2085723876953, -136.135009765625, -133.06146240234375, -129.9879150390625, -126.91436767578125, -123.8408203125, -120.76727294921875, -117.6937255859375, -114.62017059326172, -111.54662322998047, -108.47307586669922, -105.39952087402344, -102.32597351074219, -99.25242614746094, -96.17887115478516, -93.1053237915039, -90.03176879882812, -86.95822143554688, -83.88467407226562, -80.81112670898438, -77.7375717163086, -74.66402435302734, -71.59046936035156, -68.51692199707031, -65.44336700439453, -62.36981964111328, -59.29627227783203, -56.222721099853516, -53.149169921875, -50.07562255859375, -47.002079010009766, -43.92852783203125, -40.85498046875, -37.781429290771484, -34.70787811279297, -31.63433074951172, -28.560779571533203, -25.48723030090332, -22.413681030273438, -19.340131759643555, -16.266582489013672, -13.193031311035156, -10.119482040405273, -7.045932769775391, -3.972381591796875, -0.8988323211669922, 2.1747169494628906, 5.248266696929932, 8.321816444396973, 11.395366668701172, 14.468915939331055, 17.542465209960938, 20.616016387939453, 23.689565658569336, 26.76311492919922, 29.8366641998291, 32.910213470458984, 35.9837646484375, 39.05731201171875, 42.130863189697266, 45.20441436767578, 48.27796173095703, 51.35151290893555]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 7.0, 4.0, 9.0, 10.0, 12.0, 8.0, 19.0, 12.0, 31.0, 38.0, 29.0, 36.0, 42.0, 49.0, 40.0, 58.0, 49.0, 58.0, 62.0, 45.0, 57.0, 41.0, 40.0, 35.0, 35.0, 37.0, 26.0, 24.0, 24.0, 18.0, 13.0, 11.0, 9.0, 4.0, 2.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.38002014160156, -31.456268310546875, -30.532514572143555, -29.608762741088867, -28.68501091003418, -27.76125717163086, -26.837505340576172, -25.913753509521484, -24.990001678466797, -24.06624984741211, -23.14249610900879, -22.2187442779541, -21.294992446899414, -20.371238708496094, -19.447486877441406, -18.52373504638672, -17.5999813079834, -16.67622947692871, -15.752476692199707, -14.828723907470703, -13.904972076416016, -12.981219291687012, -12.057466506958008, -11.13371467590332, -10.209961891174316, -9.286209106445312, -8.362457275390625, -7.438704490661621, -6.514952182769775, -5.59119987487793, -4.667447090148926, -3.74369478225708, -2.819944381713867, -1.896191954612732, -0.9724395275115967, -0.048686981201171875, 0.8750653266906738, 1.7988176345825195, 2.7225704193115234, 3.646322727203369, 4.570075035095215, 5.4938273429870605, 6.417579650878906, 7.34133243560791, 8.265085220336914, 9.188837051391602, 10.112589836120605, 11.03634262084961, 11.960094451904297, 12.8838472366333, 13.807599067687988, 14.731351852416992, 15.65510368347168, 16.578857421875, 17.502609252929688, 18.426361083984375, 19.350112915039062, 20.27386474609375, 21.19761848449707, 22.121370315551758, 23.045122146606445, 23.968875885009766, 24.892627716064453, 25.81637954711914, 26.74013328552246]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 8.0, 5.0, 8.0, 15.0, 12.0, 17.0, 26.0, 61.0, 68.0, 86.0, 150.0, 230.0, 326.0, 588.0, 867.0, 1442.0, 2656.0, 4582.0, 8236.0, 15412.0, 29235.0, 56497.0, 115931.0, 229697.0, 268058.0, 156813.0, 75224.0, 37754.0, 19891.0, 10717.0, 5851.0, 3254.0, 1912.0, 1126.0, 633.0, 401.0, 250.0, 157.0, 133.0, 81.0, 37.0, 34.0, 22.0, 14.0, 4.0, 8.0, 10.0, 14.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0], "bins": [-3.59375, -3.488677978515625, -3.38360595703125, -3.278533935546875, -3.1734619140625, -3.068389892578125, -2.96331787109375, -2.858245849609375, -2.753173828125, -2.648101806640625, -2.54302978515625, -2.437957763671875, -2.3328857421875, -2.227813720703125, -2.12274169921875, -2.017669677734375, -1.91259765625, -1.807525634765625, -1.70245361328125, -1.597381591796875, -1.4923095703125, -1.387237548828125, -1.28216552734375, -1.177093505859375, -1.072021484375, -0.966949462890625, -0.86187744140625, -0.756805419921875, -0.6517333984375, -0.546661376953125, -0.44158935546875, -0.336517333984375, -0.2314453125, -0.126373291015625, -0.02130126953125, 0.083770751953125, 0.1888427734375, 0.293914794921875, 0.39898681640625, 0.504058837890625, 0.609130859375, 0.714202880859375, 0.81927490234375, 0.924346923828125, 1.0294189453125, 1.134490966796875, 1.23956298828125, 1.344635009765625, 1.44970703125, 1.554779052734375, 1.65985107421875, 1.764923095703125, 1.8699951171875, 1.975067138671875, 2.08013916015625, 2.185211181640625, 2.290283203125, 2.395355224609375, 2.50042724609375, 2.605499267578125, 2.7105712890625, 2.815643310546875, 2.92071533203125, 3.025787353515625, 3.130859375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 6.0, 6.0, 7.0, 9.0, 7.0, 8.0, 17.0, 19.0, 24.0, 22.0, 19.0, 24.0, 18.0, 37.0, 29.0, 33.0, 51.0, 48.0, 46.0, 57.0, 41.0, 53.0, 45.0, 50.0, 43.0, 36.0, 42.0, 29.0, 23.0, 23.0, 23.0, 26.0, 14.0, 16.0, 14.0, 9.0, 8.0, 9.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.79296875, -1.729583740234375, -1.66619873046875, -1.602813720703125, -1.5394287109375, -1.476043701171875, -1.41265869140625, -1.349273681640625, -1.285888671875, -1.222503662109375, -1.15911865234375, -1.095733642578125, -1.0323486328125, -0.968963623046875, -0.90557861328125, -0.842193603515625, -0.77880859375, -0.715423583984375, -0.65203857421875, -0.588653564453125, -0.5252685546875, -0.461883544921875, -0.39849853515625, -0.335113525390625, -0.271728515625, -0.208343505859375, -0.14495849609375, -0.081573486328125, -0.0181884765625, 0.045196533203125, 0.10858154296875, 0.171966552734375, 0.2353515625, 0.298736572265625, 0.36212158203125, 0.425506591796875, 0.4888916015625, 0.552276611328125, 0.61566162109375, 0.679046630859375, 0.742431640625, 0.805816650390625, 0.86920166015625, 0.932586669921875, 0.9959716796875, 1.059356689453125, 1.12274169921875, 1.186126708984375, 1.24951171875, 1.312896728515625, 1.37628173828125, 1.439666748046875, 1.5030517578125, 1.566436767578125, 1.62982177734375, 1.693206787109375, 1.756591796875, 1.819976806640625, 1.88336181640625, 1.946746826171875, 2.0101318359375, 2.073516845703125, 2.13690185546875, 2.200286865234375, 2.263671875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 5.0, 11.0, 22.0, 15.0, 31.0, 33.0, 61.0, 67.0, 107.0, 150.0, 225.0, 375.0, 592.0, 956.0, 2026.0, 4977.0, 17360.0, 89345.0, 670871.0, 213710.0, 33343.0, 8063.0, 2781.0, 1268.0, 755.0, 456.0, 273.0, 200.0, 133.0, 88.0, 63.0, 63.0, 38.0, 21.0, 21.0, 10.0, 11.0, 8.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -8.055419921875, -7.77490234375, -7.494384765625, -7.2138671875, -6.933349609375, -6.65283203125, -6.372314453125, -6.091796875, -5.811279296875, -5.53076171875, -5.250244140625, -4.9697265625, -4.689208984375, -4.40869140625, -4.128173828125, -3.84765625, -3.567138671875, -3.28662109375, -3.006103515625, -2.7255859375, -2.445068359375, -2.16455078125, -1.884033203125, -1.603515625, -1.322998046875, -1.04248046875, -0.761962890625, -0.4814453125, -0.200927734375, 0.07958984375, 0.360107421875, 0.640625, 0.921142578125, 1.20166015625, 1.482177734375, 1.7626953125, 2.043212890625, 2.32373046875, 2.604248046875, 2.884765625, 3.165283203125, 3.44580078125, 3.726318359375, 4.0068359375, 4.287353515625, 4.56787109375, 4.848388671875, 5.12890625, 5.409423828125, 5.68994140625, 5.970458984375, 6.2509765625, 6.531494140625, 6.81201171875, 7.092529296875, 7.373046875, 7.653564453125, 7.93408203125, 8.214599609375, 8.4951171875, 8.775634765625, 9.05615234375, 9.336669921875, 9.6171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 7.0, 5.0, 7.0, 11.0, 12.0, 12.0, 17.0, 16.0, 10.0, 34.0, 40.0, 33.0, 46.0, 41.0, 69.0, 61.0, 76.0, 64.0, 61.0, 59.0, 38.0, 41.0, 45.0, 29.0, 31.0, 26.0, 31.0, 14.0, 21.0, 11.0, 8.0, 5.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8125, -10.5140380859375, -10.215576171875, -9.9171142578125, -9.61865234375, -9.3201904296875, -9.021728515625, -8.7232666015625, -8.4248046875, -8.1263427734375, -7.827880859375, -7.5294189453125, -7.23095703125, -6.9324951171875, -6.634033203125, -6.3355712890625, -6.037109375, -5.7386474609375, -5.440185546875, -5.1417236328125, -4.84326171875, -4.5447998046875, -4.246337890625, -3.9478759765625, -3.6494140625, -3.3509521484375, -3.052490234375, -2.7540283203125, -2.45556640625, -2.1571044921875, -1.858642578125, -1.5601806640625, -1.26171875, -0.9632568359375, -0.664794921875, -0.3663330078125, -0.06787109375, 0.2305908203125, 0.529052734375, 0.8275146484375, 1.1259765625, 1.4244384765625, 1.722900390625, 2.0213623046875, 2.31982421875, 2.6182861328125, 2.916748046875, 3.2152099609375, 3.513671875, 3.8121337890625, 4.110595703125, 4.4090576171875, 4.70751953125, 5.0059814453125, 5.304443359375, 5.6029052734375, 5.9013671875, 6.1998291015625, 6.498291015625, 6.7967529296875, 7.09521484375, 7.3936767578125, 7.692138671875, 7.9906005859375, 8.2890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 6.0, 4.0, 3.0, 13.0, 11.0, 13.0, 15.0, 24.0, 30.0, 39.0, 51.0, 90.0, 115.0, 218.0, 424.0, 857.0, 2324.0, 7976.0, 38356.0, 255690.0, 642471.0, 79112.0, 14409.0, 3694.0, 1313.0, 532.0, 271.0, 155.0, 91.0, 61.0, 47.0, 30.0, 22.0, 25.0, 19.0, 12.0, 7.0, 7.0, 2.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.85546875, -2.7576904296875, -2.659912109375, -2.5621337890625, -2.46435546875, -2.3665771484375, -2.268798828125, -2.1710205078125, -2.0732421875, -1.9754638671875, -1.877685546875, -1.7799072265625, -1.68212890625, -1.5843505859375, -1.486572265625, -1.3887939453125, -1.291015625, -1.1932373046875, -1.095458984375, -0.9976806640625, -0.89990234375, -0.8021240234375, -0.704345703125, -0.6065673828125, -0.5087890625, -0.4110107421875, -0.313232421875, -0.2154541015625, -0.11767578125, -0.0198974609375, 0.077880859375, 0.1756591796875, 0.2734375, 0.3712158203125, 0.468994140625, 0.5667724609375, 0.66455078125, 0.7623291015625, 0.860107421875, 0.9578857421875, 1.0556640625, 1.1534423828125, 1.251220703125, 1.3489990234375, 1.44677734375, 1.5445556640625, 1.642333984375, 1.7401123046875, 1.837890625, 1.9356689453125, 2.033447265625, 2.1312255859375, 2.22900390625, 2.3267822265625, 2.424560546875, 2.5223388671875, 2.6201171875, 2.7178955078125, 2.815673828125, 2.9134521484375, 3.01123046875, 3.1090087890625, 3.206787109375, 3.3045654296875, 3.40234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 9.0, 5.0, 7.0, 4.0, 5.0, 5.0, 12.0, 13.0, 16.0, 16.0, 15.0, 20.0, 20.0, 33.0, 45.0, 58.0, 61.0, 67.0, 81.0, 74.0, 66.0, 69.0, 55.0, 46.0, 42.0, 31.0, 10.0, 19.0, 13.0, 19.0, 10.0, 13.0, 7.0, 2.0, 8.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.0005130767822265625, -0.0004974678158760071, -0.00048185884952545166, -0.00046624988317489624, -0.0004506409168243408, -0.0004350319504737854, -0.00041942298412323, -0.00040381401777267456, -0.00038820505142211914, -0.0003725960850715637, -0.0003569871187210083, -0.0003413781523704529, -0.00032576918601989746, -0.00031016021966934204, -0.0002945512533187866, -0.0002789422869682312, -0.0002633333206176758, -0.00024772435426712036, -0.00023211538791656494, -0.00021650642156600952, -0.0002008974552154541, -0.00018528848886489868, -0.00016967952251434326, -0.00015407055616378784, -0.00013846158981323242, -0.000122852623462677, -0.00010724365711212158, -9.163469076156616e-05, -7.602572441101074e-05, -6.041675806045532e-05, -4.48077917098999e-05, -2.9198825359344482e-05, -1.3589859008789062e-05, 2.0191073417663574e-06, 1.7628073692321777e-05, 3.32370400428772e-05, 4.884600639343262e-05, 6.445497274398804e-05, 8.006393909454346e-05, 9.567290544509888e-05, 0.0001112818717956543, 0.00012689083814620972, 0.00014249980449676514, 0.00015810877084732056, 0.00017371773719787598, 0.0001893267035484314, 0.00020493566989898682, 0.00022054463624954224, 0.00023615360260009766, 0.0002517625689506531, 0.0002673715353012085, 0.0002829805016517639, 0.00029858946800231934, 0.00031419843435287476, 0.0003298074007034302, 0.0003454163670539856, 0.000361025333404541, 0.00037663429975509644, 0.00039224326610565186, 0.0004078522324562073, 0.0004234611988067627, 0.0004390701651573181, 0.00045467913150787354, 0.00047028809785842896, 0.0004858970642089844]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 6.0, 14.0, 20.0, 18.0, 43.0, 70.0, 97.0, 175.0, 199.0, 360.0, 710.0, 1375.0, 3154.0, 9349.0, 36609.0, 195404.0, 634151.0, 128880.0, 25625.0, 7024.0, 2652.0, 1142.0, 598.0, 333.0, 205.0, 113.0, 79.0, 44.0, 31.0, 25.0, 17.0, 4.0, 15.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9072265625, -1.8289947509765625, -1.750762939453125, -1.6725311279296875, -1.59429931640625, -1.5160675048828125, -1.437835693359375, -1.3596038818359375, -1.2813720703125, -1.2031402587890625, -1.124908447265625, -1.0466766357421875, -0.96844482421875, -0.8902130126953125, -0.811981201171875, -0.7337493896484375, -0.655517578125, -0.5772857666015625, -0.499053955078125, -0.4208221435546875, -0.34259033203125, -0.2643585205078125, -0.186126708984375, -0.1078948974609375, -0.0296630859375, 0.0485687255859375, 0.126800537109375, 0.2050323486328125, 0.28326416015625, 0.3614959716796875, 0.439727783203125, 0.5179595947265625, 0.59619140625, 0.6744232177734375, 0.752655029296875, 0.8308868408203125, 0.90911865234375, 0.9873504638671875, 1.065582275390625, 1.1438140869140625, 1.2220458984375, 1.3002777099609375, 1.378509521484375, 1.4567413330078125, 1.53497314453125, 1.6132049560546875, 1.691436767578125, 1.7696685791015625, 1.847900390625, 1.9261322021484375, 2.004364013671875, 2.0825958251953125, 2.16082763671875, 2.2390594482421875, 2.317291259765625, 2.3955230712890625, 2.4737548828125, 2.5519866943359375, 2.630218505859375, 2.7084503173828125, 2.78668212890625, 2.8649139404296875, 2.943145751953125, 3.0213775634765625, 3.099609375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 4.0, 9.0, 12.0, 9.0, 11.0, 9.0, 22.0, 31.0, 31.0, 33.0, 51.0, 59.0, 72.0, 82.0, 96.0, 78.0, 73.0, 57.0, 58.0, 46.0, 38.0, 17.0, 22.0, 20.0, 13.0, 8.0, 13.0, 6.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1953125, -2.121337890625, -2.04736328125, -1.973388671875, -1.8994140625, -1.825439453125, -1.75146484375, -1.677490234375, -1.603515625, -1.529541015625, -1.45556640625, -1.381591796875, -1.3076171875, -1.233642578125, -1.15966796875, -1.085693359375, -1.01171875, -0.937744140625, -0.86376953125, -0.789794921875, -0.7158203125, -0.641845703125, -0.56787109375, -0.493896484375, -0.419921875, -0.345947265625, -0.27197265625, -0.197998046875, -0.1240234375, -0.050048828125, 0.02392578125, 0.097900390625, 0.171875, 0.245849609375, 0.31982421875, 0.393798828125, 0.4677734375, 0.541748046875, 0.61572265625, 0.689697265625, 0.763671875, 0.837646484375, 0.91162109375, 0.985595703125, 1.0595703125, 1.133544921875, 1.20751953125, 1.281494140625, 1.35546875, 1.429443359375, 1.50341796875, 1.577392578125, 1.6513671875, 1.725341796875, 1.79931640625, 1.873291015625, 1.947265625, 2.021240234375, 2.09521484375, 2.169189453125, 2.2431640625, 2.317138671875, 2.39111328125, 2.465087890625, 2.5390625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 17.0, 22.0, 73.0, 149.0, 271.0, 239.0, 119.0, 49.0, 26.0, 13.0, 5.0, 4.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.43888854980469, -72.83250427246094, -70.22611999511719, -67.6197280883789, -65.01334381103516, -62.406959533691406, -59.800575256347656, -57.194190979003906, -54.58780288696289, -51.98141860961914, -49.375030517578125, -46.768646240234375, -44.162261962890625, -41.55587387084961, -38.94948959350586, -36.343101501464844, -33.736717224121094, -31.13033103942871, -28.523944854736328, -25.917560577392578, -23.311174392700195, -20.704788208007812, -18.098403930664062, -15.49201774597168, -12.885631561279297, -10.279245376586914, -7.672860145568848, -5.066474437713623, -2.4600887298583984, 0.14629745483398438, 2.752682685852051, 5.359067916870117, 7.965461730957031, 10.571847915649414, 13.17823314666748, 15.784618377685547, 18.39100456237793, 20.997390747070312, 23.603775024414062, 26.210161209106445, 28.816547393798828, 31.42293357849121, 34.029319763183594, 36.635704040527344, 39.242088317871094, 41.84847640991211, 44.45486068725586, 47.061248779296875, 49.667633056640625, 52.274017333984375, 54.88040542602539, 57.48678970336914, 60.093177795410156, 62.699562072753906, 65.30594635009766, 67.9123306274414, 70.51872253417969, 73.12510681152344, 75.73149108886719, 78.33788299560547, 80.94426727294922, 83.55065155029297, 86.15703582763672, 88.76342010498047, 91.36980438232422]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 4.0, 13.0, 9.0, 14.0, 8.0, 16.0, 13.0, 16.0, 21.0, 19.0, 27.0, 20.0, 29.0, 26.0, 24.0, 34.0, 45.0, 38.0, 48.0, 69.0, 58.0, 52.0, 25.0, 47.0, 23.0, 28.0, 29.0, 31.0, 22.0, 27.0, 12.0, 11.0, 21.0, 15.0, 11.0, 8.0, 11.0, 11.0, 9.0, 7.0, 6.0, 5.0, 7.0, 5.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-27.12267303466797, -26.319021224975586, -25.51536750793457, -24.711715698242188, -23.908061981201172, -23.10441017150879, -22.300758361816406, -21.49710464477539, -20.693450927734375, -19.889799118041992, -19.086145401000977, -18.282493591308594, -17.478839874267578, -16.675188064575195, -15.871535301208496, -15.067882537841797, -14.264230728149414, -13.460577964782715, -12.656925201416016, -11.853273391723633, -11.049619674682617, -10.245967864990234, -9.442315101623535, -8.638662338256836, -7.835009574890137, -7.0313568115234375, -6.227704048156738, -5.424051761627197, -4.620398998260498, -3.816746234893799, -3.013093948364258, -2.2094411849975586, -1.4057884216308594, -0.6021357774734497, 0.20151686668395996, 1.00516939163208, 1.8088221549987793, 2.6124749183654785, 3.4161272048950195, 4.219779968261719, 5.023432731628418, 5.827085494995117, 6.630738258361816, 7.434390544891357, 8.238042831420898, 9.041696548461914, 9.845348358154297, 10.649001121520996, 11.452653884887695, 12.256306648254395, 13.059959411621094, 13.863611221313477, 14.667264938354492, 15.470916748046875, 16.27457046508789, 17.078222274780273, 17.881874084472656, 18.68552589416504, 19.489179611206055, 20.292831420898438, 21.096485137939453, 21.900136947631836, 22.70378875732422, 23.507442474365234, 24.31109619140625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 0.0, 5.0, 7.0, 10.0, 13.0, 11.0, 18.0, 27.0, 45.0, 44.0, 75.0, 121.0, 175.0, 317.0, 484.0, 944.0, 1718.0, 3694.0, 9076.0, 25849.0, 106753.0, 918176.0, 2652372.0, 385332.0, 59819.0, 17038.0, 6307.0, 2704.0, 1286.0, 716.0, 406.0, 245.0, 167.0, 108.0, 87.0, 50.0, 25.0, 14.0, 18.0, 9.0, 12.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.65625, -3.5465087890625, -3.436767578125, -3.3270263671875, -3.21728515625, -3.1075439453125, -2.997802734375, -2.8880615234375, -2.7783203125, -2.6685791015625, -2.558837890625, -2.4490966796875, -2.33935546875, -2.2296142578125, -2.119873046875, -2.0101318359375, -1.900390625, -1.7906494140625, -1.680908203125, -1.5711669921875, -1.46142578125, -1.3516845703125, -1.241943359375, -1.1322021484375, -1.0224609375, -0.9127197265625, -0.802978515625, -0.6932373046875, -0.58349609375, -0.4737548828125, -0.364013671875, -0.2542724609375, -0.14453125, -0.0347900390625, 0.074951171875, 0.1846923828125, 0.29443359375, 0.4041748046875, 0.513916015625, 0.6236572265625, 0.7333984375, 0.8431396484375, 0.952880859375, 1.0626220703125, 1.17236328125, 1.2821044921875, 1.391845703125, 1.5015869140625, 1.611328125, 1.7210693359375, 1.830810546875, 1.9405517578125, 2.05029296875, 2.1600341796875, 2.269775390625, 2.3795166015625, 2.4892578125, 2.5989990234375, 2.708740234375, 2.8184814453125, 2.92822265625, 3.0379638671875, 3.147705078125, 3.2574462890625, 3.3671875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 8.0, 12.0, 17.0, 17.0, 20.0, 24.0, 27.0, 27.0, 43.0, 52.0, 49.0, 52.0, 65.0, 57.0, 45.0, 51.0, 62.0, 65.0, 56.0, 49.0, 41.0, 34.0, 28.0, 22.0, 15.0, 19.0, 16.0, 2.0, 9.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7568359375, -1.6812896728515625, -1.605743408203125, -1.5301971435546875, -1.45465087890625, -1.3791046142578125, -1.303558349609375, -1.2280120849609375, -1.1524658203125, -1.0769195556640625, -1.001373291015625, -0.9258270263671875, -0.85028076171875, -0.7747344970703125, -0.699188232421875, -0.6236419677734375, -0.548095703125, -0.4725494384765625, -0.397003173828125, -0.3214569091796875, -0.24591064453125, -0.1703643798828125, -0.094818115234375, -0.0192718505859375, 0.0562744140625, 0.1318206787109375, 0.207366943359375, 0.2829132080078125, 0.35845947265625, 0.4340057373046875, 0.509552001953125, 0.5850982666015625, 0.66064453125, 0.7361907958984375, 0.811737060546875, 0.8872833251953125, 0.96282958984375, 1.0383758544921875, 1.113922119140625, 1.1894683837890625, 1.2650146484375, 1.3405609130859375, 1.416107177734375, 1.4916534423828125, 1.56719970703125, 1.6427459716796875, 1.718292236328125, 1.7938385009765625, 1.869384765625, 1.9449310302734375, 2.020477294921875, 2.0960235595703125, 2.17156982421875, 2.2471160888671875, 2.322662353515625, 2.3982086181640625, 2.4737548828125, 2.5493011474609375, 2.624847412109375, 2.7003936767578125, 2.77593994140625, 2.8514862060546875, 2.927032470703125, 3.0025787353515625, 3.078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 11.0, 7.0, 11.0, 17.0, 23.0, 48.0, 79.0, 146.0, 307.0, 690.0, 1684.0, 6237.0, 30460.0, 314942.0, 3524254.0, 278832.0, 27990.0, 5698.0, 1650.0, 658.0, 262.0, 134.0, 55.0, 38.0, 20.0, 14.0, 6.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.12109375, -4.90301513671875, -4.6849365234375, -4.46685791015625, -4.248779296875, -4.03070068359375, -3.8126220703125, -3.59454345703125, -3.37646484375, -3.15838623046875, -2.9403076171875, -2.72222900390625, -2.504150390625, -2.28607177734375, -2.0679931640625, -1.84991455078125, -1.6318359375, -1.41375732421875, -1.1956787109375, -0.97760009765625, -0.759521484375, -0.54144287109375, -0.3233642578125, -0.10528564453125, 0.11279296875, 0.33087158203125, 0.5489501953125, 0.76702880859375, 0.985107421875, 1.20318603515625, 1.4212646484375, 1.63934326171875, 1.857421875, 2.07550048828125, 2.2935791015625, 2.51165771484375, 2.729736328125, 2.94781494140625, 3.1658935546875, 3.38397216796875, 3.60205078125, 3.82012939453125, 4.0382080078125, 4.25628662109375, 4.474365234375, 4.69244384765625, 4.9105224609375, 5.12860107421875, 5.3466796875, 5.56475830078125, 5.7828369140625, 6.00091552734375, 6.218994140625, 6.43707275390625, 6.6551513671875, 6.87322998046875, 7.09130859375, 7.30938720703125, 7.5274658203125, 7.74554443359375, 7.963623046875, 8.18170166015625, 8.3997802734375, 8.61785888671875, 8.8359375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 9.0, 3.0, 14.0, 17.0, 15.0, 35.0, 44.0, 54.0, 85.0, 136.0, 222.0, 331.0, 528.0, 761.0, 656.0, 436.0, 231.0, 145.0, 97.0, 79.0, 53.0, 38.0, 28.0, 12.0, 15.0, 7.0, 7.0, 6.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.73046875, -5.56585693359375, -5.4012451171875, -5.23663330078125, -5.072021484375, -4.90740966796875, -4.7427978515625, -4.57818603515625, -4.41357421875, -4.24896240234375, -4.0843505859375, -3.91973876953125, -3.755126953125, -3.59051513671875, -3.4259033203125, -3.26129150390625, -3.0966796875, -2.93206787109375, -2.7674560546875, -2.60284423828125, -2.438232421875, -2.27362060546875, -2.1090087890625, -1.94439697265625, -1.77978515625, -1.61517333984375, -1.4505615234375, -1.28594970703125, -1.121337890625, -0.95672607421875, -0.7921142578125, -0.62750244140625, -0.462890625, -0.29827880859375, -0.1336669921875, 0.03094482421875, 0.195556640625, 0.36016845703125, 0.5247802734375, 0.68939208984375, 0.85400390625, 1.01861572265625, 1.1832275390625, 1.34783935546875, 1.512451171875, 1.67706298828125, 1.8416748046875, 2.00628662109375, 2.1708984375, 2.33551025390625, 2.5001220703125, 2.66473388671875, 2.829345703125, 2.99395751953125, 3.1585693359375, 3.32318115234375, 3.48779296875, 3.65240478515625, 3.8170166015625, 3.98162841796875, 4.146240234375, 4.31085205078125, 4.4754638671875, 4.64007568359375, 4.8046875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 14.0, 9.0, 10.0, 42.0, 150.0, 367.0, 280.0, 97.0, 19.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-175.68365478515625, -172.0187225341797, -168.3538055419922, -164.68887329101562, -161.02394104003906, -157.3590087890625, -153.694091796875, -150.02915954589844, -146.36422729492188, -142.6992950439453, -139.0343780517578, -135.36944580078125, -131.7045135498047, -128.03958129882812, -124.37466430664062, -120.70973205566406, -117.04480743408203, -113.3798828125, -109.71495056152344, -106.0500259399414, -102.38509368896484, -98.72016906738281, -95.05523681640625, -91.39031219482422, -87.72538757324219, -84.06046295166016, -80.3955307006836, -76.73060607910156, -73.065673828125, -69.40074920654297, -65.73582458496094, -62.070892333984375, -58.40595245361328, -54.741024017333984, -51.07609558105469, -47.411170959472656, -43.746238708496094, -40.08131408691406, -36.416385650634766, -32.75145721435547, -29.086528778076172, -25.421600341796875, -21.756671905517578, -18.091745376586914, -14.426816940307617, -10.76188850402832, -7.096961975097656, -3.4320335388183594, 0.2328948974609375, 3.897822856903076, 7.562750816345215, 11.227678298950195, 14.892606735229492, 18.55753517150879, 22.222461700439453, 25.88739013671875, 29.552318572998047, 33.217247009277344, 36.88217544555664, 40.54710388183594, 44.21202850341797, 47.87696075439453, 51.54188537597656, 55.20681381225586, 58.871742248535156]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 12.0, 10.0, 9.0, 18.0, 24.0, 16.0, 34.0, 44.0, 50.0, 62.0, 57.0, 58.0, 75.0, 64.0, 64.0, 63.0, 56.0, 45.0, 50.0, 39.0, 41.0, 24.0, 30.0, 18.0, 11.0, 12.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-39.94268798828125, -38.983192443847656, -38.02369689941406, -37.06420135498047, -36.104705810546875, -35.14521026611328, -34.18571472167969, -33.226219177246094, -32.2667236328125, -31.307228088378906, -30.347732543945312, -29.38823699951172, -28.428741455078125, -27.46924591064453, -26.509748458862305, -25.55025291442871, -24.590755462646484, -23.63125991821289, -22.671764373779297, -21.712268829345703, -20.75277328491211, -19.793277740478516, -18.83378028869629, -17.874284744262695, -16.9147891998291, -15.955293655395508, -14.995798110961914, -14.036301612854004, -13.07680606842041, -12.117310523986816, -11.157814025878906, -10.198318481445312, -9.238822937011719, -8.279327392578125, -7.319831371307373, -6.360335350036621, -5.400839805603027, -4.441344261169434, -3.4818482398986816, -2.5223522186279297, -1.562856674194336, -0.6033608913421631, 0.35613489151000977, 1.3156306743621826, 2.2751264572143555, 3.234622001647949, 4.194118022918701, 5.153614044189453, 6.113109588623047, 7.072605133056641, 8.032100677490234, 8.991597175598145, 9.951092720031738, 10.910588264465332, 11.870084762573242, 12.829580307006836, 13.78907585144043, 14.748571395874023, 15.708066940307617, 16.66756248474121, 17.627059936523438, 18.58655548095703, 19.546051025390625, 20.50554656982422, 21.465042114257812]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 5.0, 15.0, 32.0, 31.0, 52.0, 95.0, 210.0, 456.0, 1055.0, 2459.0, 6957.0, 21649.0, 82314.0, 298745.0, 422390.0, 154490.0, 39580.0, 11215.0, 4044.0, 1509.0, 664.0, 280.0, 135.0, 72.0, 32.0, 25.0, 17.0, 9.0, 10.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.66796875, -5.50238037109375, -5.3367919921875, -5.17120361328125, -5.005615234375, -4.84002685546875, -4.6744384765625, -4.50885009765625, -4.34326171875, -4.17767333984375, -4.0120849609375, -3.84649658203125, -3.680908203125, -3.51531982421875, -3.3497314453125, -3.18414306640625, -3.0185546875, -2.85296630859375, -2.6873779296875, -2.52178955078125, -2.356201171875, -2.19061279296875, -2.0250244140625, -1.85943603515625, -1.69384765625, -1.52825927734375, -1.3626708984375, -1.19708251953125, -1.031494140625, -0.86590576171875, -0.7003173828125, -0.53472900390625, -0.369140625, -0.20355224609375, -0.0379638671875, 0.12762451171875, 0.293212890625, 0.45880126953125, 0.6243896484375, 0.78997802734375, 0.95556640625, 1.12115478515625, 1.2867431640625, 1.45233154296875, 1.617919921875, 1.78350830078125, 1.9490966796875, 2.11468505859375, 2.2802734375, 2.44586181640625, 2.6114501953125, 2.77703857421875, 2.942626953125, 3.10821533203125, 3.2738037109375, 3.43939208984375, 3.60498046875, 3.77056884765625, 3.9361572265625, 4.10174560546875, 4.267333984375, 4.43292236328125, 4.5985107421875, 4.76409912109375, 4.9296875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 6.0, 3.0, 8.0, 16.0, 12.0, 14.0, 15.0, 17.0, 19.0, 38.0, 30.0, 23.0, 40.0, 33.0, 27.0, 38.0, 40.0, 49.0, 49.0, 46.0, 40.0, 36.0, 58.0, 50.0, 36.0, 38.0, 34.0, 21.0, 28.0, 22.0, 16.0, 17.0, 14.0, 11.0, 15.0, 11.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.888671875, -1.827667236328125, -1.76666259765625, -1.705657958984375, -1.6446533203125, -1.583648681640625, -1.52264404296875, -1.461639404296875, -1.400634765625, -1.339630126953125, -1.27862548828125, -1.217620849609375, -1.1566162109375, -1.095611572265625, -1.03460693359375, -0.973602294921875, -0.91259765625, -0.851593017578125, -0.79058837890625, -0.729583740234375, -0.6685791015625, -0.607574462890625, -0.54656982421875, -0.485565185546875, -0.424560546875, -0.363555908203125, -0.30255126953125, -0.241546630859375, -0.1805419921875, -0.119537353515625, -0.05853271484375, 0.002471923828125, 0.0634765625, 0.124481201171875, 0.18548583984375, 0.246490478515625, 0.3074951171875, 0.368499755859375, 0.42950439453125, 0.490509033203125, 0.551513671875, 0.612518310546875, 0.67352294921875, 0.734527587890625, 0.7955322265625, 0.856536865234375, 0.91754150390625, 0.978546142578125, 1.03955078125, 1.100555419921875, 1.16156005859375, 1.222564697265625, 1.2835693359375, 1.344573974609375, 1.40557861328125, 1.466583251953125, 1.527587890625, 1.588592529296875, 1.64959716796875, 1.710601806640625, 1.7716064453125, 1.832611083984375, 1.89361572265625, 1.954620361328125, 2.015625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 11.0, 6.0, 9.0, 15.0, 28.0, 32.0, 29.0, 64.0, 103.0, 188.0, 353.0, 780.0, 2145.0, 6953.0, 32890.0, 202857.0, 646906.0, 126039.0, 21106.0, 5052.0, 1643.0, 628.0, 284.0, 152.0, 76.0, 65.0, 39.0, 27.0, 24.0, 9.0, 8.0, 7.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.51171875, -6.29730224609375, -6.0828857421875, -5.86846923828125, -5.654052734375, -5.43963623046875, -5.2252197265625, -5.01080322265625, -4.79638671875, -4.58197021484375, -4.3675537109375, -4.15313720703125, -3.938720703125, -3.72430419921875, -3.5098876953125, -3.29547119140625, -3.0810546875, -2.86663818359375, -2.6522216796875, -2.43780517578125, -2.223388671875, -2.00897216796875, -1.7945556640625, -1.58013916015625, -1.36572265625, -1.15130615234375, -0.9368896484375, -0.72247314453125, -0.508056640625, -0.29364013671875, -0.0792236328125, 0.13519287109375, 0.349609375, 0.56402587890625, 0.7784423828125, 0.99285888671875, 1.207275390625, 1.42169189453125, 1.6361083984375, 1.85052490234375, 2.06494140625, 2.27935791015625, 2.4937744140625, 2.70819091796875, 2.922607421875, 3.13702392578125, 3.3514404296875, 3.56585693359375, 3.7802734375, 3.99468994140625, 4.2091064453125, 4.42352294921875, 4.637939453125, 4.85235595703125, 5.0667724609375, 5.28118896484375, 5.49560546875, 5.71002197265625, 5.9244384765625, 6.13885498046875, 6.353271484375, 6.56768798828125, 6.7821044921875, 6.99652099609375, 7.2109375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 2.0, 3.0, 7.0, 12.0, 12.0, 16.0, 20.0, 22.0, 28.0, 26.0, 36.0, 45.0, 45.0, 46.0, 49.0, 45.0, 59.0, 51.0, 49.0, 53.0, 45.0, 56.0, 38.0, 38.0, 39.0, 33.0, 18.0, 22.0, 26.0, 11.0, 14.0, 7.0, 9.0, 3.0, 6.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.484375, -7.2296142578125, -6.974853515625, -6.7200927734375, -6.46533203125, -6.2105712890625, -5.955810546875, -5.7010498046875, -5.4462890625, -5.1915283203125, -4.936767578125, -4.6820068359375, -4.42724609375, -4.1724853515625, -3.917724609375, -3.6629638671875, -3.408203125, -3.1534423828125, -2.898681640625, -2.6439208984375, -2.38916015625, -2.1343994140625, -1.879638671875, -1.6248779296875, -1.3701171875, -1.1153564453125, -0.860595703125, -0.6058349609375, -0.35107421875, -0.0963134765625, 0.158447265625, 0.4132080078125, 0.66796875, 0.9227294921875, 1.177490234375, 1.4322509765625, 1.68701171875, 1.9417724609375, 2.196533203125, 2.4512939453125, 2.7060546875, 2.9608154296875, 3.215576171875, 3.4703369140625, 3.72509765625, 3.9798583984375, 4.234619140625, 4.4893798828125, 4.744140625, 4.9989013671875, 5.253662109375, 5.5084228515625, 5.76318359375, 6.0179443359375, 6.272705078125, 6.5274658203125, 6.7822265625, 7.0369873046875, 7.291748046875, 7.5465087890625, 7.80126953125, 8.0560302734375, 8.310791015625, 8.5655517578125, 8.8203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 4.0, 10.0, 11.0, 19.0, 22.0, 36.0, 51.0, 72.0, 120.0, 201.0, 343.0, 677.0, 1353.0, 2871.0, 6680.0, 17206.0, 49394.0, 154742.0, 543232.0, 180365.0, 57501.0, 19726.0, 7549.0, 3210.0, 1421.0, 760.0, 410.0, 206.0, 113.0, 68.0, 51.0, 40.0, 23.0, 14.0, 14.0, 5.0, 8.0, 8.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4892578125, -1.4388885498046875, -1.388519287109375, -1.3381500244140625, -1.28778076171875, -1.2374114990234375, -1.187042236328125, -1.1366729736328125, -1.0863037109375, -1.0359344482421875, -0.985565185546875, -0.9351959228515625, -0.88482666015625, -0.8344573974609375, -0.784088134765625, -0.7337188720703125, -0.683349609375, -0.6329803466796875, -0.582611083984375, -0.5322418212890625, -0.48187255859375, -0.4315032958984375, -0.381134033203125, -0.3307647705078125, -0.2803955078125, -0.2300262451171875, -0.179656982421875, -0.1292877197265625, -0.07891845703125, -0.0285491943359375, 0.021820068359375, 0.0721893310546875, 0.12255859375, 0.1729278564453125, 0.223297119140625, 0.2736663818359375, 0.32403564453125, 0.3744049072265625, 0.424774169921875, 0.4751434326171875, 0.5255126953125, 0.5758819580078125, 0.626251220703125, 0.6766204833984375, 0.72698974609375, 0.7773590087890625, 0.827728271484375, 0.8780975341796875, 0.928466796875, 0.9788360595703125, 1.029205322265625, 1.0795745849609375, 1.12994384765625, 1.1803131103515625, 1.230682373046875, 1.2810516357421875, 1.3314208984375, 1.3817901611328125, 1.432159423828125, 1.4825286865234375, 1.53289794921875, 1.5832672119140625, 1.633636474609375, 1.6840057373046875, 1.734375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 8.0, 12.0, 11.0, 21.0, 22.0, 34.0, 34.0, 45.0, 71.0, 88.0, 94.0, 115.0, 111.0, 82.0, 60.0, 55.0, 29.0, 25.0, 10.0, 20.0, 13.0, 8.0, 4.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005311965942382812, -0.0005116835236549377, -0.0004921704530715942, -0.00047265738248825073, -0.0004531443119049072, -0.0004336312413215637, -0.0004141181707382202, -0.0003946051001548767, -0.0003750920295715332, -0.0003555789589881897, -0.0003360658884048462, -0.0003165528178215027, -0.0002970397472381592, -0.0002775266766548157, -0.00025801360607147217, -0.00023850053548812866, -0.00021898746490478516, -0.00019947439432144165, -0.00017996132373809814, -0.00016044825315475464, -0.00014093518257141113, -0.00012142211198806763, -0.00010190904140472412, -8.239597082138062e-05, -6.288290023803711e-05, -4.3369829654693604e-05, -2.3856759071350098e-05, -4.343688488006592e-06, 1.5169382095336914e-05, 3.468245267868042e-05, 5.4195523262023926e-05, 7.370859384536743e-05, 9.322166442871094e-05, 0.00011273473501205444, 0.00013224780559539795, 0.00015176087617874146, 0.00017127394676208496, 0.00019078701734542847, 0.00021030008792877197, 0.00022981315851211548, 0.000249326229095459, 0.0002688392996788025, 0.000288352370262146, 0.0003078654408454895, 0.000327378511428833, 0.0003468915820121765, 0.00036640465259552, 0.0003859177231788635, 0.00040543079376220703, 0.00042494386434555054, 0.00044445693492889404, 0.00046397000551223755, 0.00048348307609558105, 0.0005029961466789246, 0.0005225092172622681, 0.0005420222878456116, 0.0005615353584289551, 0.0005810484290122986, 0.0006005614995956421, 0.0006200745701789856, 0.0006395876407623291, 0.0006591007113456726, 0.0006786137819290161, 0.0006981268525123596, 0.0007176399230957031]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 10.0, 8.0, 20.0, 12.0, 22.0, 28.0, 49.0, 72.0, 76.0, 149.0, 237.0, 387.0, 681.0, 1324.0, 2896.0, 6894.0, 18247.0, 56266.0, 186294.0, 543604.0, 156560.0, 47716.0, 15636.0, 5894.0, 2640.0, 1206.0, 638.0, 364.0, 201.0, 120.0, 86.0, 49.0, 42.0, 27.0, 22.0, 18.0, 19.0, 8.0, 8.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8349609375, -1.7816619873046875, -1.728363037109375, -1.6750640869140625, -1.62176513671875, -1.5684661865234375, -1.515167236328125, -1.4618682861328125, -1.4085693359375, -1.3552703857421875, -1.301971435546875, -1.2486724853515625, -1.19537353515625, -1.1420745849609375, -1.088775634765625, -1.0354766845703125, -0.982177734375, -0.9288787841796875, -0.875579833984375, -0.8222808837890625, -0.76898193359375, -0.7156829833984375, -0.662384033203125, -0.6090850830078125, -0.5557861328125, -0.5024871826171875, -0.449188232421875, -0.3958892822265625, -0.34259033203125, -0.2892913818359375, -0.235992431640625, -0.1826934814453125, -0.12939453125, -0.0760955810546875, -0.022796630859375, 0.0305023193359375, 0.08380126953125, 0.1371002197265625, 0.190399169921875, 0.2436981201171875, 0.2969970703125, 0.3502960205078125, 0.403594970703125, 0.4568939208984375, 0.51019287109375, 0.5634918212890625, 0.616790771484375, 0.6700897216796875, 0.723388671875, 0.7766876220703125, 0.829986572265625, 0.8832855224609375, 0.93658447265625, 0.9898834228515625, 1.043182373046875, 1.0964813232421875, 1.1497802734375, 1.2030792236328125, 1.256378173828125, 1.3096771240234375, 1.36297607421875, 1.4162750244140625, 1.469573974609375, 1.5228729248046875, 1.576171875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 7.0, 16.0, 12.0, 10.0, 24.0, 33.0, 46.0, 60.0, 78.0, 79.0, 104.0, 108.0, 108.0, 92.0, 53.0, 49.0, 39.0, 22.0, 19.0, 13.0, 10.0, 5.0, 5.0, 0.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.104583740234375, -2.01776123046875, -1.930938720703125, -1.8441162109375, -1.757293701171875, -1.67047119140625, -1.583648681640625, -1.496826171875, -1.410003662109375, -1.32318115234375, -1.236358642578125, -1.1495361328125, -1.062713623046875, -0.97589111328125, -0.889068603515625, -0.80224609375, -0.715423583984375, -0.62860107421875, -0.541778564453125, -0.4549560546875, -0.368133544921875, -0.28131103515625, -0.194488525390625, -0.107666015625, -0.020843505859375, 0.06597900390625, 0.152801513671875, 0.2396240234375, 0.326446533203125, 0.41326904296875, 0.500091552734375, 0.5869140625, 0.673736572265625, 0.76055908203125, 0.847381591796875, 0.9342041015625, 1.021026611328125, 1.10784912109375, 1.194671630859375, 1.281494140625, 1.368316650390625, 1.45513916015625, 1.541961669921875, 1.6287841796875, 1.715606689453125, 1.80242919921875, 1.889251708984375, 1.97607421875, 2.062896728515625, 2.14971923828125, 2.236541748046875, 2.3233642578125, 2.410186767578125, 2.49700927734375, 2.583831787109375, 2.670654296875, 2.757476806640625, 2.84429931640625, 2.931121826171875, 3.0179443359375, 3.104766845703125, 3.19158935546875, 3.278411865234375, 3.365234375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 11.0, 28.0, 34.0, 68.0, 116.0, 178.0, 254.0, 127.0, 74.0, 47.0, 21.0, 14.0, 7.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-68.25344848632812, -66.59359741210938, -64.93374633789062, -63.273895263671875, -61.614044189453125, -59.954193115234375, -58.294342041015625, -56.634490966796875, -54.974639892578125, -53.314788818359375, -51.654937744140625, -49.995086669921875, -48.335235595703125, -46.675384521484375, -45.015533447265625, -43.355682373046875, -41.695831298828125, -40.035980224609375, -38.376129150390625, -36.716278076171875, -35.056427001953125, -33.396575927734375, -31.736724853515625, -30.076873779296875, -28.417022705078125, -26.757171630859375, -25.097320556640625, -23.437469482421875, -21.777618408203125, -20.117767333984375, -18.457916259765625, -16.798065185546875, -15.13821029663086, -13.47835922241211, -11.81850814819336, -10.15865707397461, -8.49880599975586, -6.838954925537109, -5.179103851318359, -3.5192527770996094, -1.8594017028808594, -0.19955062866210938, 1.4603004455566406, 3.1201515197753906, 4.780002593994141, 6.439853668212891, 8.09970474243164, 9.75955581665039, 11.41940689086914, 13.07925796508789, 14.73910903930664, 16.39896011352539, 18.05881118774414, 19.71866226196289, 21.37851333618164, 23.03836441040039, 24.69821548461914, 26.35806655883789, 28.01791763305664, 29.67776870727539, 31.33761978149414, 32.99747085571289, 34.65732192993164, 36.31717300415039, 37.97702407836914]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 5.0, 5.0, 4.0, 6.0, 4.0, 4.0, 11.0, 4.0, 10.0, 15.0, 19.0, 26.0, 27.0, 28.0, 32.0, 34.0, 31.0, 35.0, 41.0, 59.0, 80.0, 76.0, 84.0, 62.0, 57.0, 27.0, 36.0, 23.0, 27.0, 24.0, 23.0, 19.0, 13.0, 13.0, 8.0, 4.0, 12.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.934917449951172, -25.953046798706055, -24.971176147460938, -23.989307403564453, -23.007436752319336, -22.02556610107422, -21.043697357177734, -20.061826705932617, -19.0799560546875, -18.098085403442383, -17.116214752197266, -16.13434600830078, -15.152475357055664, -14.170604705810547, -13.188735008239746, -12.206865310668945, -11.224994659423828, -10.243124008178711, -9.26125431060791, -8.27938461303711, -7.297513961791992, -6.315643787384033, -5.333773612976074, -4.351903438568115, -3.3700332641601562, -2.3881630897521973, -1.4062929153442383, -0.4244227409362793, 0.5574474334716797, 1.5393176078796387, 2.5211877822875977, 3.5030579566955566, 4.484928131103516, 5.466798305511475, 6.448668479919434, 7.430538654327393, 8.412408828735352, 9.394279479980469, 10.37614917755127, 11.35801887512207, 12.339889526367188, 13.321760177612305, 14.303629875183105, 15.285499572753906, 16.267370223999023, 17.24924087524414, 18.231109619140625, 19.212980270385742, 20.19485092163086, 21.176721572875977, 22.158592224121094, 23.140460968017578, 24.122331619262695, 25.104202270507812, 26.086071014404297, 27.067941665649414, 28.04981231689453, 29.03168296813965, 30.013553619384766, 30.99542236328125, 31.977293014526367, 32.959163665771484, 33.94103240966797, 34.92290496826172, 35.9047737121582]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 9.0, 8.0, 11.0, 23.0, 40.0, 58.0, 75.0, 123.0, 178.0, 321.0, 556.0, 1071.0, 2020.0, 4511.0, 12298.0, 44425.0, 260269.0, 2097313.0, 1539816.0, 179492.0, 33915.0, 10134.0, 3880.0, 1729.0, 861.0, 496.0, 266.0, 138.0, 84.0, 60.0, 33.0, 26.0, 12.0, 10.0, 5.0, 8.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.353515625, -3.2484130859375, -3.143310546875, -3.0382080078125, -2.93310546875, -2.8280029296875, -2.722900390625, -2.6177978515625, -2.5126953125, -2.4075927734375, -2.302490234375, -2.1973876953125, -2.09228515625, -1.9871826171875, -1.882080078125, -1.7769775390625, -1.671875, -1.5667724609375, -1.461669921875, -1.3565673828125, -1.25146484375, -1.1463623046875, -1.041259765625, -0.9361572265625, -0.8310546875, -0.7259521484375, -0.620849609375, -0.5157470703125, -0.41064453125, -0.3055419921875, -0.200439453125, -0.0953369140625, 0.009765625, 0.1148681640625, 0.219970703125, 0.3250732421875, 0.43017578125, 0.5352783203125, 0.640380859375, 0.7454833984375, 0.8505859375, 0.9556884765625, 1.060791015625, 1.1658935546875, 1.27099609375, 1.3760986328125, 1.481201171875, 1.5863037109375, 1.69140625, 1.7965087890625, 1.901611328125, 2.0067138671875, 2.11181640625, 2.2169189453125, 2.322021484375, 2.4271240234375, 2.5322265625, 2.6373291015625, 2.742431640625, 2.8475341796875, 2.95263671875, 3.0577392578125, 3.162841796875, 3.2679443359375, 3.373046875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 4.0, 9.0, 9.0, 11.0, 19.0, 15.0, 18.0, 27.0, 22.0, 24.0, 29.0, 33.0, 48.0, 37.0, 33.0, 49.0, 48.0, 51.0, 43.0, 41.0, 45.0, 39.0, 40.0, 31.0, 24.0, 30.0, 27.0, 28.0, 31.0, 24.0, 16.0, 15.0, 14.0, 15.0, 10.0, 8.0, 5.0, 4.0, 3.0, 7.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8583984375, -1.80072021484375, -1.7430419921875, -1.68536376953125, -1.627685546875, -1.57000732421875, -1.5123291015625, -1.45465087890625, -1.39697265625, -1.33929443359375, -1.2816162109375, -1.22393798828125, -1.166259765625, -1.10858154296875, -1.0509033203125, -0.99322509765625, -0.935546875, -0.87786865234375, -0.8201904296875, -0.76251220703125, -0.704833984375, -0.64715576171875, -0.5894775390625, -0.53179931640625, -0.47412109375, -0.41644287109375, -0.3587646484375, -0.30108642578125, -0.243408203125, -0.18572998046875, -0.1280517578125, -0.07037353515625, -0.0126953125, 0.04498291015625, 0.1026611328125, 0.16033935546875, 0.218017578125, 0.27569580078125, 0.3333740234375, 0.39105224609375, 0.44873046875, 0.50640869140625, 0.5640869140625, 0.62176513671875, 0.679443359375, 0.73712158203125, 0.7947998046875, 0.85247802734375, 0.91015625, 0.96783447265625, 1.0255126953125, 1.08319091796875, 1.140869140625, 1.19854736328125, 1.2562255859375, 1.31390380859375, 1.37158203125, 1.42926025390625, 1.4869384765625, 1.54461669921875, 1.602294921875, 1.65997314453125, 1.7176513671875, 1.77532958984375, 1.8330078125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 14.0, 7.0, 14.0, 26.0, 43.0, 51.0, 85.0, 174.0, 310.0, 685.0, 2003.0, 6305.0, 27974.0, 246337.0, 3161857.0, 678675.0, 54137.0, 10371.0, 3040.0, 1139.0, 467.0, 237.0, 123.0, 69.0, 42.0, 27.0, 20.0, 20.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9765625, -4.808837890625, -4.64111328125, -4.473388671875, -4.3056640625, -4.137939453125, -3.97021484375, -3.802490234375, -3.634765625, -3.467041015625, -3.29931640625, -3.131591796875, -2.9638671875, -2.796142578125, -2.62841796875, -2.460693359375, -2.29296875, -2.125244140625, -1.95751953125, -1.789794921875, -1.6220703125, -1.454345703125, -1.28662109375, -1.118896484375, -0.951171875, -0.783447265625, -0.61572265625, -0.447998046875, -0.2802734375, -0.112548828125, 0.05517578125, 0.222900390625, 0.390625, 0.558349609375, 0.72607421875, 0.893798828125, 1.0615234375, 1.229248046875, 1.39697265625, 1.564697265625, 1.732421875, 1.900146484375, 2.06787109375, 2.235595703125, 2.4033203125, 2.571044921875, 2.73876953125, 2.906494140625, 3.07421875, 3.241943359375, 3.40966796875, 3.577392578125, 3.7451171875, 3.912841796875, 4.08056640625, 4.248291015625, 4.416015625, 4.583740234375, 4.75146484375, 4.919189453125, 5.0869140625, 5.254638671875, 5.42236328125, 5.590087890625, 5.7578125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 15.0, 18.0, 29.0, 36.0, 50.0, 89.0, 93.0, 164.0, 196.0, 298.0, 435.0, 565.0, 560.0, 485.0, 303.0, 222.0, 135.0, 90.0, 70.0, 55.0, 35.0, 30.0, 17.0, 14.0, 12.0, 7.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.716796875, -3.588714599609375, -3.46063232421875, -3.332550048828125, -3.2044677734375, -3.076385498046875, -2.94830322265625, -2.820220947265625, -2.692138671875, -2.564056396484375, -2.43597412109375, -2.307891845703125, -2.1798095703125, -2.051727294921875, -1.92364501953125, -1.795562744140625, -1.66748046875, -1.539398193359375, -1.41131591796875, -1.283233642578125, -1.1551513671875, -1.027069091796875, -0.89898681640625, -0.770904541015625, -0.642822265625, -0.514739990234375, -0.38665771484375, -0.258575439453125, -0.1304931640625, -0.002410888671875, 0.12567138671875, 0.253753662109375, 0.3818359375, 0.509918212890625, 0.63800048828125, 0.766082763671875, 0.8941650390625, 1.022247314453125, 1.15032958984375, 1.278411865234375, 1.406494140625, 1.534576416015625, 1.66265869140625, 1.790740966796875, 1.9188232421875, 2.046905517578125, 2.17498779296875, 2.303070068359375, 2.43115234375, 2.559234619140625, 2.68731689453125, 2.815399169921875, 2.9434814453125, 3.071563720703125, 3.19964599609375, 3.327728271484375, 3.455810546875, 3.583892822265625, 3.71197509765625, 3.840057373046875, 3.9681396484375, 4.096221923828125, 4.22430419921875, 4.352386474609375, 4.48046875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 1.0, 15.0, 13.0, 28.0, 37.0, 53.0, 77.0, 94.0, 116.0, 115.0, 131.0, 94.0, 79.0, 42.0, 30.0, 17.0, 17.0, 12.0, 6.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.69839859008789, -21.64850616455078, -20.598613739013672, -19.548721313476562, -18.498828887939453, -17.448936462402344, -16.399044036865234, -15.349152565002441, -14.299260139465332, -13.249367713928223, -12.199475288391113, -11.14958381652832, -10.099691390991211, -9.049798965454102, -7.999906539916992, -6.950014114379883, -5.900121688842773, -4.850229263305664, -3.800337076187134, -2.7504448890686035, -1.7005524635314941, -0.6506600379943848, 0.3992319107055664, 1.4491243362426758, 2.499016761779785, 3.5489091873168945, 4.598801612854004, 5.648693561553955, 6.6985859870910645, 7.748478412628174, 8.798370361328125, 9.848262786865234, 10.898155212402344, 11.948047637939453, 12.997940063476562, 14.047832489013672, 15.097724914550781, 16.14761734008789, 17.197509765625, 18.24740219116211, 19.29729461669922, 20.347187042236328, 21.397079467773438, 22.446971893310547, 23.496864318847656, 24.546756744384766, 25.596649169921875, 26.646541595458984, 27.69643211364746, 28.74632453918457, 29.79621696472168, 30.84610939025879, 31.8960018157959, 32.945892333984375, 33.995784759521484, 35.045677185058594, 36.0955696105957, 37.14546203613281, 38.19535446166992, 39.24524688720703, 40.29513931274414, 41.34503173828125, 42.39492416381836, 43.44481658935547, 44.49470901489258]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 5.0, 3.0, 9.0, 7.0, 8.0, 12.0, 8.0, 6.0, 14.0, 26.0, 18.0, 19.0, 21.0, 25.0, 20.0, 28.0, 40.0, 32.0, 40.0, 42.0, 52.0, 43.0, 46.0, 45.0, 46.0, 43.0, 26.0, 35.0, 38.0, 30.0, 24.0, 26.0, 27.0, 20.0, 23.0, 20.0, 14.0, 12.0, 13.0, 10.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.247364044189453, -16.698402404785156, -16.14944076538086, -15.600480079650879, -15.051518440246582, -14.502557754516602, -13.953596115112305, -13.404634475708008, -12.855672836303711, -12.306711196899414, -11.757750511169434, -11.208788871765137, -10.65982723236084, -10.11086654663086, -9.561904907226562, -9.012943267822266, -8.463982582092285, -7.9150214195251465, -7.36605978012085, -6.817098617553711, -6.268136978149414, -5.719175815582275, -5.170214653015137, -4.62125301361084, -4.072291851043701, -3.5233304500579834, -2.9743690490722656, -2.425407886505127, -1.8764464855194092, -1.3274850845336914, -0.7785239219665527, -0.22956252098083496, 0.3193988800048828, 0.8683602213859558, 1.4173215627670288, 1.966282844543457, 2.515244245529175, 3.0642056465148926, 3.6131668090820312, 4.162128448486328, 4.711089611053467, 5.2600507736206055, 5.809012413024902, 6.357973575592041, 6.90693473815918, 7.455896377563477, 8.004858016967773, 8.553818702697754, 9.10278034210205, 9.651741981506348, 10.200702667236328, 10.749664306640625, 11.298625946044922, 11.847587585449219, 12.3965482711792, 12.945509910583496, 13.494470596313477, 14.043432235717773, 14.592392921447754, 15.14135456085205, 15.690316200256348, 16.239276885986328, 16.788238525390625, 17.337200164794922, 17.88616180419922]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 6.0, 10.0, 14.0, 22.0, 19.0, 37.0, 52.0, 73.0, 126.0, 159.0, 286.0, 438.0, 677.0, 1111.0, 2003.0, 3717.0, 7169.0, 14459.0, 30115.0, 63589.0, 136026.0, 250547.0, 259578.0, 144819.0, 68807.0, 32122.0, 15567.0, 7708.0, 3945.0, 2140.0, 1159.0, 724.0, 440.0, 286.0, 203.0, 117.0, 94.0, 62.0, 29.0, 31.0, 12.0, 12.0, 11.0, 7.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.646484375, -2.56390380859375, -2.4813232421875, -2.39874267578125, -2.316162109375, -2.23358154296875, -2.1510009765625, -2.06842041015625, -1.98583984375, -1.90325927734375, -1.8206787109375, -1.73809814453125, -1.655517578125, -1.57293701171875, -1.4903564453125, -1.40777587890625, -1.3251953125, -1.24261474609375, -1.1600341796875, -1.07745361328125, -0.994873046875, -0.91229248046875, -0.8297119140625, -0.74713134765625, -0.66455078125, -0.58197021484375, -0.4993896484375, -0.41680908203125, -0.334228515625, -0.25164794921875, -0.1690673828125, -0.08648681640625, -0.00390625, 0.07867431640625, 0.1612548828125, 0.24383544921875, 0.326416015625, 0.40899658203125, 0.4915771484375, 0.57415771484375, 0.65673828125, 0.73931884765625, 0.8218994140625, 0.90447998046875, 0.987060546875, 1.06964111328125, 1.1522216796875, 1.23480224609375, 1.3173828125, 1.39996337890625, 1.4825439453125, 1.56512451171875, 1.647705078125, 1.73028564453125, 1.8128662109375, 1.89544677734375, 1.97802734375, 2.06060791015625, 2.1431884765625, 2.22576904296875, 2.308349609375, 2.39093017578125, 2.4735107421875, 2.55609130859375, 2.638671875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 7.0, 3.0, 9.0, 18.0, 14.0, 24.0, 20.0, 27.0, 23.0, 39.0, 40.0, 44.0, 38.0, 50.0, 51.0, 59.0, 44.0, 47.0, 38.0, 58.0, 44.0, 33.0, 37.0, 38.0, 22.0, 37.0, 24.0, 22.0, 21.0, 15.0, 16.0, 11.0, 6.0, 5.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4765625, -2.405181884765625, -2.33380126953125, -2.262420654296875, -2.1910400390625, -2.119659423828125, -2.04827880859375, -1.976898193359375, -1.905517578125, -1.834136962890625, -1.76275634765625, -1.691375732421875, -1.6199951171875, -1.548614501953125, -1.47723388671875, -1.405853271484375, -1.33447265625, -1.263092041015625, -1.19171142578125, -1.120330810546875, -1.0489501953125, -0.977569580078125, -0.90618896484375, -0.834808349609375, -0.763427734375, -0.692047119140625, -0.62066650390625, -0.549285888671875, -0.4779052734375, -0.406524658203125, -0.33514404296875, -0.263763427734375, -0.1923828125, -0.121002197265625, -0.04962158203125, 0.021759033203125, 0.0931396484375, 0.164520263671875, 0.23590087890625, 0.307281494140625, 0.378662109375, 0.450042724609375, 0.52142333984375, 0.592803955078125, 0.6641845703125, 0.735565185546875, 0.80694580078125, 0.878326416015625, 0.94970703125, 1.021087646484375, 1.09246826171875, 1.163848876953125, 1.2352294921875, 1.306610107421875, 1.37799072265625, 1.449371337890625, 1.520751953125, 1.592132568359375, 1.66351318359375, 1.734893798828125, 1.8062744140625, 1.877655029296875, 1.94903564453125, 2.020416259765625, 2.091796875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 12.0, 9.0, 13.0, 16.0, 22.0, 34.0, 49.0, 64.0, 78.0, 144.0, 197.0, 297.0, 515.0, 911.0, 1991.0, 5882.0, 23187.0, 129336.0, 681792.0, 163658.0, 28710.0, 6951.0, 2198.0, 952.0, 523.0, 296.0, 207.0, 144.0, 99.0, 92.0, 46.0, 33.0, 29.0, 21.0, 14.0, 10.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44140625, -5.25091552734375, -5.0604248046875, -4.86993408203125, -4.679443359375, -4.48895263671875, -4.2984619140625, -4.10797119140625, -3.91748046875, -3.72698974609375, -3.5364990234375, -3.34600830078125, -3.155517578125, -2.96502685546875, -2.7745361328125, -2.58404541015625, -2.3935546875, -2.20306396484375, -2.0125732421875, -1.82208251953125, -1.631591796875, -1.44110107421875, -1.2506103515625, -1.06011962890625, -0.86962890625, -0.67913818359375, -0.4886474609375, -0.29815673828125, -0.107666015625, 0.08282470703125, 0.2733154296875, 0.46380615234375, 0.654296875, 0.84478759765625, 1.0352783203125, 1.22576904296875, 1.416259765625, 1.60675048828125, 1.7972412109375, 1.98773193359375, 2.17822265625, 2.36871337890625, 2.5592041015625, 2.74969482421875, 2.940185546875, 3.13067626953125, 3.3211669921875, 3.51165771484375, 3.7021484375, 3.89263916015625, 4.0831298828125, 4.27362060546875, 4.464111328125, 4.65460205078125, 4.8450927734375, 5.03558349609375, 5.22607421875, 5.41656494140625, 5.6070556640625, 5.79754638671875, 5.988037109375, 6.17852783203125, 6.3690185546875, 6.55950927734375, 6.75]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 2.0, 3.0, 2.0, 10.0, 10.0, 13.0, 23.0, 21.0, 17.0, 24.0, 26.0, 40.0, 36.0, 41.0, 47.0, 53.0, 69.0, 56.0, 68.0, 59.0, 52.0, 47.0, 43.0, 44.0, 32.0, 17.0, 27.0, 21.0, 16.0, 15.0, 9.0, 9.0, 5.0, 9.0, 7.0, 4.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5703125, -8.2994384765625, -8.028564453125, -7.7576904296875, -7.48681640625, -7.2159423828125, -6.945068359375, -6.6741943359375, -6.4033203125, -6.1324462890625, -5.861572265625, -5.5906982421875, -5.31982421875, -5.0489501953125, -4.778076171875, -4.5072021484375, -4.236328125, -3.9654541015625, -3.694580078125, -3.4237060546875, -3.15283203125, -2.8819580078125, -2.611083984375, -2.3402099609375, -2.0693359375, -1.7984619140625, -1.527587890625, -1.2567138671875, -0.98583984375, -0.7149658203125, -0.444091796875, -0.1732177734375, 0.09765625, 0.3685302734375, 0.639404296875, 0.9102783203125, 1.18115234375, 1.4520263671875, 1.722900390625, 1.9937744140625, 2.2646484375, 2.5355224609375, 2.806396484375, 3.0772705078125, 3.34814453125, 3.6190185546875, 3.889892578125, 4.1607666015625, 4.431640625, 4.7025146484375, 4.973388671875, 5.2442626953125, 5.51513671875, 5.7860107421875, 6.056884765625, 6.3277587890625, 6.5986328125, 6.8695068359375, 7.140380859375, 7.4112548828125, 7.68212890625, 7.9530029296875, 8.223876953125, 8.4947509765625, 8.765625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 14.0, 15.0, 27.0, 41.0, 44.0, 73.0, 131.0, 215.0, 417.0, 689.0, 1386.0, 3306.0, 8146.0, 23022.0, 75181.0, 575615.0, 270584.0, 58796.0, 18643.0, 6862.0, 2740.0, 1187.0, 600.0, 314.0, 178.0, 99.0, 78.0, 39.0, 32.0, 13.0, 19.0, 13.0, 2.0, 7.0, 5.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6796875, -1.625335693359375, -1.57098388671875, -1.516632080078125, -1.4622802734375, -1.407928466796875, -1.35357666015625, -1.299224853515625, -1.244873046875, -1.190521240234375, -1.13616943359375, -1.081817626953125, -1.0274658203125, -0.973114013671875, -0.91876220703125, -0.864410400390625, -0.81005859375, -0.755706787109375, -0.70135498046875, -0.647003173828125, -0.5926513671875, -0.538299560546875, -0.48394775390625, -0.429595947265625, -0.375244140625, -0.320892333984375, -0.26654052734375, -0.212188720703125, -0.1578369140625, -0.103485107421875, -0.04913330078125, 0.005218505859375, 0.0595703125, 0.113922119140625, 0.16827392578125, 0.222625732421875, 0.2769775390625, 0.331329345703125, 0.38568115234375, 0.440032958984375, 0.494384765625, 0.548736572265625, 0.60308837890625, 0.657440185546875, 0.7117919921875, 0.766143798828125, 0.82049560546875, 0.874847412109375, 0.92919921875, 0.983551025390625, 1.03790283203125, 1.092254638671875, 1.1466064453125, 1.200958251953125, 1.25531005859375, 1.309661865234375, 1.364013671875, 1.418365478515625, 1.47271728515625, 1.527069091796875, 1.5814208984375, 1.635772705078125, 1.69012451171875, 1.744476318359375, 1.798828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 4.0, 11.0, 11.0, 14.0, 14.0, 17.0, 30.0, 29.0, 38.0, 53.0, 73.0, 90.0, 115.0, 92.0, 85.0, 72.0, 41.0, 38.0, 31.0, 27.0, 24.0, 21.0, 8.0, 7.0, 7.0, 7.0, 3.0, 10.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0005044937133789062, -0.0004900023341178894, -0.00047551095485687256, -0.0004610195755958557, -0.00044652819633483887, -0.000432036817073822, -0.0004175454378128052, -0.00040305405855178833, -0.0003885626792907715, -0.00037407130002975464, -0.0003595799207687378, -0.00034508854150772095, -0.0003305971622467041, -0.00031610578298568726, -0.0003016144037246704, -0.00028712302446365356, -0.0002726316452026367, -0.0002581402659416199, -0.00024364888668060303, -0.00022915750741958618, -0.00021466612815856934, -0.0002001747488975525, -0.00018568336963653564, -0.0001711919903755188, -0.00015670061111450195, -0.0001422092318534851, -0.00012771785259246826, -0.00011322647333145142, -9.873509407043457e-05, -8.424371480941772e-05, -6.975233554840088e-05, -5.526095628738403e-05, -4.076957702636719e-05, -2.6278197765350342e-05, -1.1786818504333496e-05, 2.7045607566833496e-06, 1.7195940017700195e-05, 3.168731927871704e-05, 4.617869853973389e-05, 6.067007780075073e-05, 7.516145706176758e-05, 8.965283632278442e-05, 0.00010414421558380127, 0.00011863559484481812, 0.00013312697410583496, 0.0001476183533668518, 0.00016210973262786865, 0.0001766011118888855, 0.00019109249114990234, 0.0002055838704109192, 0.00022007524967193604, 0.00023456662893295288, 0.0002490580081939697, 0.00026354938745498657, 0.0002780407667160034, 0.00029253214597702026, 0.0003070235252380371, 0.00032151490449905396, 0.0003360062837600708, 0.00035049766302108765, 0.0003649890422821045, 0.00037948042154312134, 0.0003939718008041382, 0.00040846318006515503, 0.0004229545593261719]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 8.0, 15.0, 24.0, 30.0, 26.0, 51.0, 100.0, 160.0, 284.0, 467.0, 855.0, 1694.0, 4000.0, 10473.0, 31795.0, 113645.0, 632685.0, 181306.0, 46282.0, 14786.0, 5286.0, 2149.0, 1069.0, 547.0, 317.0, 187.0, 110.0, 63.0, 48.0, 21.0, 14.0, 19.0, 8.0, 8.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.9892578125, -1.936431884765625, -1.88360595703125, -1.830780029296875, -1.7779541015625, -1.725128173828125, -1.67230224609375, -1.619476318359375, -1.566650390625, -1.513824462890625, -1.46099853515625, -1.408172607421875, -1.3553466796875, -1.302520751953125, -1.24969482421875, -1.196868896484375, -1.14404296875, -1.091217041015625, -1.03839111328125, -0.985565185546875, -0.9327392578125, -0.879913330078125, -0.82708740234375, -0.774261474609375, -0.721435546875, -0.668609619140625, -0.61578369140625, -0.562957763671875, -0.5101318359375, -0.457305908203125, -0.40447998046875, -0.351654052734375, -0.298828125, -0.246002197265625, -0.19317626953125, -0.140350341796875, -0.0875244140625, -0.034698486328125, 0.01812744140625, 0.070953369140625, 0.123779296875, 0.176605224609375, 0.22943115234375, 0.282257080078125, 0.3350830078125, 0.387908935546875, 0.44073486328125, 0.493560791015625, 0.54638671875, 0.599212646484375, 0.65203857421875, 0.704864501953125, 0.7576904296875, 0.810516357421875, 0.86334228515625, 0.916168212890625, 0.968994140625, 1.021820068359375, 1.07464599609375, 1.127471923828125, 1.1802978515625, 1.233123779296875, 1.28594970703125, 1.338775634765625, 1.3916015625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 7.0, 13.0, 15.0, 11.0, 12.0, 23.0, 31.0, 32.0, 23.0, 37.0, 39.0, 64.0, 80.0, 109.0, 86.0, 94.0, 61.0, 44.0, 41.0, 28.0, 24.0, 18.0, 14.0, 14.0, 9.0, 5.0, 7.0, 3.0, 6.0, 4.0, 4.0, 6.0, 2.0, 3.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.41796875, -1.3690338134765625, -1.320098876953125, -1.2711639404296875, -1.22222900390625, -1.1732940673828125, -1.124359130859375, -1.0754241943359375, -1.0264892578125, -0.9775543212890625, -0.928619384765625, -0.8796844482421875, -0.83074951171875, -0.7818145751953125, -0.732879638671875, -0.6839447021484375, -0.635009765625, -0.5860748291015625, -0.537139892578125, -0.4882049560546875, -0.43927001953125, -0.3903350830078125, -0.341400146484375, -0.2924652099609375, -0.2435302734375, -0.1945953369140625, -0.145660400390625, -0.0967254638671875, -0.04779052734375, 0.0011444091796875, 0.050079345703125, 0.0990142822265625, 0.14794921875, 0.1968841552734375, 0.245819091796875, 0.2947540283203125, 0.34368896484375, 0.3926239013671875, 0.441558837890625, 0.4904937744140625, 0.5394287109375, 0.5883636474609375, 0.637298583984375, 0.6862335205078125, 0.73516845703125, 0.7841033935546875, 0.833038330078125, 0.8819732666015625, 0.930908203125, 0.9798431396484375, 1.028778076171875, 1.0777130126953125, 1.12664794921875, 1.1755828857421875, 1.224517822265625, 1.2734527587890625, 1.3223876953125, 1.3713226318359375, 1.420257568359375, 1.4691925048828125, 1.51812744140625, 1.5670623779296875, 1.615997314453125, 1.6649322509765625, 1.7138671875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 2.0, 10.0, 25.0, 53.0, 95.0, 198.0, 339.0, 133.0, 73.0, 36.0, 13.0, 13.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-77.03370666503906, -75.07115936279297, -73.10861206054688, -71.14607238769531, -69.18352508544922, -67.22097778320312, -65.25843048095703, -63.2958869934082, -61.333343505859375, -59.37079620361328, -57.40825271606445, -55.44570541381836, -53.48316192626953, -51.52061462402344, -49.55807113647461, -47.595523834228516, -45.63298034667969, -43.670433044433594, -41.707889556884766, -39.74534225463867, -37.782798767089844, -35.82025146484375, -33.85770797729492, -31.895160675048828, -29.932613372802734, -27.970067977905273, -26.007522583007812, -24.04497718811035, -22.08243179321289, -20.119884490966797, -18.15734100341797, -16.194793701171875, -14.232250213623047, -12.269704818725586, -10.307159423828125, -8.344614028930664, -6.382068157196045, -4.419522285461426, -2.456976890563965, -0.4944314956665039, 1.468113899230957, 3.430659294128418, 5.393204689025879, 7.355750560760498, 9.318296432495117, 11.280841827392578, 13.243387222290039, 15.2059326171875, 17.16847801208496, 19.131023406982422, 21.093568801879883, 23.056114196777344, 25.018659591674805, 26.981204986572266, 28.94375228881836, 30.906295776367188, 32.86884307861328, 34.831390380859375, 36.7939338684082, 38.7564811706543, 40.719024658203125, 42.68157196044922, 44.64411544799805, 46.60666275024414, 48.56920623779297]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 3.0, 4.0, 5.0, 3.0, 12.0, 11.0, 10.0, 22.0, 24.0, 24.0, 21.0, 29.0, 35.0, 43.0, 36.0, 52.0, 91.0, 124.0, 98.0, 55.0, 47.0, 41.0, 27.0, 28.0, 29.0, 21.0, 20.0, 20.0, 11.0, 6.0, 8.0, 9.0, 8.0, 3.0, 4.0, 8.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.486825942993164, -30.298593521118164, -29.110361099243164, -27.922128677368164, -26.733896255493164, -25.545663833618164, -24.35742950439453, -23.16919708251953, -21.98096466064453, -20.79273223876953, -19.60449981689453, -18.41626739501953, -17.22803497314453, -16.03980255126953, -14.851569175720215, -13.663336753845215, -12.475105285644531, -11.286872863769531, -10.098640441894531, -8.910408020019531, -7.722175121307373, -6.533942699432373, -5.345709800720215, -4.157477378845215, -2.969244956970215, -1.7810124158859253, -0.5927798748016357, 0.5954527854919434, 1.7836852073669434, 2.9719176292419434, 4.160150527954102, 5.348382949829102, 6.536613464355469, 7.724845886230469, 8.913078308105469, 10.101310729980469, 11.289543151855469, 12.477775573730469, 13.666008949279785, 14.854241371154785, 16.04247283935547, 17.23070526123047, 18.41893768310547, 19.60717010498047, 20.79540252685547, 21.98363494873047, 23.17186737060547, 24.36009979248047, 25.5483341217041, 26.7365665435791, 27.9247989654541, 29.1130313873291, 30.3012638092041, 31.4894962310791, 32.677730560302734, 33.865962982177734, 35.054195404052734, 36.242427825927734, 37.430660247802734, 38.618892669677734, 39.807125091552734, 40.995357513427734, 42.183589935302734, 43.371822357177734, 44.560054779052734]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 11.0, 11.0, 13.0, 27.0, 45.0, 39.0, 78.0, 101.0, 141.0, 231.0, 368.0, 622.0, 1056.0, 1948.0, 3846.0, 8459.0, 22595.0, 74775.0, 317183.0, 1440885.0, 1754645.0, 422304.0, 97451.0, 27889.0, 10154.0, 4408.0, 2143.0, 1118.0, 602.0, 408.0, 261.0, 153.0, 97.0, 66.0, 45.0, 28.0, 19.0, 19.0, 11.0, 9.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.671875, -2.5859375, -2.5, -2.4140625, -2.328125, -2.2421875, -2.15625, -2.0703125, -1.984375, -1.8984375, -1.8125, -1.7265625, -1.640625, -1.5546875, -1.46875, -1.3828125, -1.296875, -1.2109375, -1.125, -1.0390625, -0.953125, -0.8671875, -0.78125, -0.6953125, -0.609375, -0.5234375, -0.4375, -0.3515625, -0.265625, -0.1796875, -0.09375, -0.0078125, 0.078125, 0.1640625, 0.25, 0.3359375, 0.421875, 0.5078125, 0.59375, 0.6796875, 0.765625, 0.8515625, 0.9375, 1.0234375, 1.109375, 1.1953125, 1.28125, 1.3671875, 1.453125, 1.5390625, 1.625, 1.7109375, 1.796875, 1.8828125, 1.96875, 2.0546875, 2.140625, 2.2265625, 2.3125, 2.3984375, 2.484375, 2.5703125, 2.65625, 2.7421875, 2.828125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 10.0, 14.0, 15.0, 6.0, 13.0, 22.0, 23.0, 22.0, 42.0, 26.0, 24.0, 47.0, 36.0, 43.0, 50.0, 42.0, 54.0, 35.0, 46.0, 53.0, 52.0, 43.0, 33.0, 25.0, 37.0, 24.0, 30.0, 18.0, 21.0, 10.0, 12.0, 10.0, 11.0, 8.0, 12.0, 9.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-2.359375, -2.2938385009765625, -2.228302001953125, -2.1627655029296875, -2.09722900390625, -2.0316925048828125, -1.966156005859375, -1.9006195068359375, -1.8350830078125, -1.7695465087890625, -1.704010009765625, -1.6384735107421875, -1.57293701171875, -1.5074005126953125, -1.441864013671875, -1.3763275146484375, -1.310791015625, -1.2452545166015625, -1.179718017578125, -1.1141815185546875, -1.04864501953125, -0.9831085205078125, -0.917572021484375, -0.8520355224609375, -0.7864990234375, -0.7209625244140625, -0.655426025390625, -0.5898895263671875, -0.52435302734375, -0.4588165283203125, -0.393280029296875, -0.3277435302734375, -0.26220703125, -0.1966705322265625, -0.131134033203125, -0.0655975341796875, -6.103515625e-05, 0.0654754638671875, 0.131011962890625, 0.1965484619140625, 0.2620849609375, 0.3276214599609375, 0.393157958984375, 0.4586944580078125, 0.52423095703125, 0.5897674560546875, 0.655303955078125, 0.7208404541015625, 0.786376953125, 0.8519134521484375, 0.917449951171875, 0.9829864501953125, 1.04852294921875, 1.1140594482421875, 1.179595947265625, 1.2451324462890625, 1.3106689453125, 1.3762054443359375, 1.441741943359375, 1.5072784423828125, 1.57281494140625, 1.6383514404296875, 1.703887939453125, 1.7694244384765625, 1.8349609375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 13.0, 16.0, 23.0, 24.0, 37.0, 59.0, 92.0, 150.0, 353.0, 781.0, 2304.0, 10473.0, 70608.0, 1574733.0, 2418997.0, 98311.0, 12739.0, 2818.0, 912.0, 362.0, 175.0, 107.0, 58.0, 41.0, 28.0, 17.0, 12.0, 6.0, 9.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.46875, -6.27313232421875, -6.0775146484375, -5.88189697265625, -5.686279296875, -5.49066162109375, -5.2950439453125, -5.09942626953125, -4.90380859375, -4.70819091796875, -4.5125732421875, -4.31695556640625, -4.121337890625, -3.92572021484375, -3.7301025390625, -3.53448486328125, -3.3388671875, -3.14324951171875, -2.9476318359375, -2.75201416015625, -2.556396484375, -2.36077880859375, -2.1651611328125, -1.96954345703125, -1.77392578125, -1.57830810546875, -1.3826904296875, -1.18707275390625, -0.991455078125, -0.79583740234375, -0.6002197265625, -0.40460205078125, -0.208984375, -0.01336669921875, 0.1822509765625, 0.37786865234375, 0.573486328125, 0.76910400390625, 0.9647216796875, 1.16033935546875, 1.35595703125, 1.55157470703125, 1.7471923828125, 1.94281005859375, 2.138427734375, 2.33404541015625, 2.5296630859375, 2.72528076171875, 2.9208984375, 3.11651611328125, 3.3121337890625, 3.50775146484375, 3.703369140625, 3.89898681640625, 4.0946044921875, 4.29022216796875, 4.48583984375, 4.68145751953125, 4.8770751953125, 5.07269287109375, 5.268310546875, 5.46392822265625, 5.6595458984375, 5.85516357421875, 6.05078125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 8.0, 5.0, 8.0, 2.0, 12.0, 16.0, 19.0, 20.0, 36.0, 39.0, 56.0, 84.0, 138.0, 219.0, 321.0, 414.0, 548.0, 630.0, 483.0, 324.0, 239.0, 129.0, 106.0, 59.0, 49.0, 25.0, 22.0, 23.0, 9.0, 9.0, 8.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.822265625, -3.663665771484375, -3.50506591796875, -3.346466064453125, -3.1878662109375, -3.029266357421875, -2.87066650390625, -2.712066650390625, -2.553466796875, -2.394866943359375, -2.23626708984375, -2.077667236328125, -1.9190673828125, -1.760467529296875, -1.60186767578125, -1.443267822265625, -1.28466796875, -1.126068115234375, -0.96746826171875, -0.808868408203125, -0.6502685546875, -0.491668701171875, -0.33306884765625, -0.174468994140625, -0.015869140625, 0.142730712890625, 0.30133056640625, 0.459930419921875, 0.6185302734375, 0.777130126953125, 0.93572998046875, 1.094329833984375, 1.2529296875, 1.411529541015625, 1.57012939453125, 1.728729248046875, 1.8873291015625, 2.045928955078125, 2.20452880859375, 2.363128662109375, 2.521728515625, 2.680328369140625, 2.83892822265625, 2.997528076171875, 3.1561279296875, 3.314727783203125, 3.47332763671875, 3.631927490234375, 3.79052734375, 3.949127197265625, 4.10772705078125, 4.266326904296875, 4.4249267578125, 4.583526611328125, 4.74212646484375, 4.900726318359375, 5.059326171875, 5.217926025390625, 5.37652587890625, 5.535125732421875, 5.6937255859375, 5.852325439453125, 6.01092529296875, 6.169525146484375, 6.328125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 13.0, 12.0, 19.0, 18.0, 41.0, 72.0, 97.0, 136.0, 159.0, 119.0, 111.0, 71.0, 58.0, 28.0, 15.0, 6.0, 8.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.46173095703125, -45.16401290893555, -43.86629867553711, -42.568580627441406, -41.27086639404297, -39.973148345947266, -38.67543029785156, -37.377716064453125, -36.07999801635742, -34.78227996826172, -33.48456573486328, -32.18684768676758, -30.889131546020508, -29.591415405273438, -28.293697357177734, -26.995981216430664, -25.698265075683594, -24.400548934936523, -23.102832794189453, -21.80511474609375, -20.50739860534668, -19.20968246459961, -17.911964416503906, -16.614248275756836, -15.316532135009766, -14.018815994262695, -12.721098899841309, -11.423381805419922, -10.125665664672852, -8.827949523925781, -7.5302324295043945, -6.232515335083008, -4.934795379638672, -3.6370787620544434, -2.339362144470215, -1.0416455268859863, 0.2560710906982422, 1.5537877082824707, 2.851504325866699, 4.149221420288086, 5.446937561035156, 6.744654178619385, 8.042370796203613, 9.340087890625, 10.63780403137207, 11.93552017211914, 13.233237266540527, 14.530954360961914, 15.828670501708984, 17.126386642456055, 18.424102783203125, 19.721820831298828, 21.0195369720459, 22.31725311279297, 23.614971160888672, 24.912687301635742, 26.210403442382812, 27.508119583129883, 28.805835723876953, 30.103553771972656, 31.401269912719727, 32.6989860534668, 33.9967041015625, 35.29441833496094, 36.59213638305664]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 8.0, 10.0, 13.0, 13.0, 12.0, 14.0, 19.0, 25.0, 23.0, 19.0, 21.0, 26.0, 29.0, 25.0, 34.0, 40.0, 33.0, 50.0, 48.0, 50.0, 39.0, 48.0, 43.0, 37.0, 32.0, 23.0, 36.0, 32.0, 28.0, 20.0, 21.0, 25.0, 15.0, 15.0, 14.0, 12.0, 15.0, 3.0, 10.0, 7.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.419940948486328, -20.746919631958008, -20.073898315429688, -19.40087890625, -18.72785758972168, -18.05483627319336, -17.381816864013672, -16.70879554748535, -16.03577423095703, -15.362752914428711, -14.689732551574707, -14.016712188720703, -13.343690872192383, -12.670669555664062, -11.997649192810059, -11.324628829956055, -10.651607513427734, -9.978586196899414, -9.30556583404541, -8.632545471191406, -7.959524154663086, -7.286503314971924, -6.613482475280762, -5.9404616355896, -5.2674407958984375, -4.594419956207275, -3.9213991165161133, -3.248378276824951, -2.575357437133789, -1.902336597442627, -1.2293157577514648, -0.5562949180603027, 0.11672401428222656, 0.7897448539733887, 1.4627656936645508, 2.135786533355713, 2.808807373046875, 3.481828212738037, 4.154849052429199, 4.827869892120361, 5.500890731811523, 6.1739115715026855, 6.846932411193848, 7.51995325088501, 8.192974090576172, 8.865995407104492, 9.539015769958496, 10.2120361328125, 10.88505744934082, 11.55807876586914, 12.231099128723145, 12.904119491577148, 13.577140808105469, 14.250162124633789, 14.923182487487793, 15.596202850341797, 16.269224166870117, 16.942245483398438, 17.615264892578125, 18.288286209106445, 18.961307525634766, 19.634328842163086, 20.307350158691406, 20.980369567871094, 21.653390884399414]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 5.0, 3.0, 5.0, 10.0, 12.0, 21.0, 27.0, 44.0, 57.0, 112.0, 174.0, 267.0, 451.0, 685.0, 1071.0, 1860.0, 3236.0, 5980.0, 11284.0, 22043.0, 46030.0, 100582.0, 224284.0, 311737.0, 169741.0, 75713.0, 35314.0, 17422.0, 8897.0, 4828.0, 2675.0, 1518.0, 926.0, 551.0, 370.0, 231.0, 138.0, 83.0, 59.0, 34.0, 19.0, 20.0, 16.0, 9.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.888671875, -2.79644775390625, -2.7042236328125, -2.61199951171875, -2.519775390625, -2.42755126953125, -2.3353271484375, -2.24310302734375, -2.15087890625, -2.05865478515625, -1.9664306640625, -1.87420654296875, -1.781982421875, -1.68975830078125, -1.5975341796875, -1.50531005859375, -1.4130859375, -1.32086181640625, -1.2286376953125, -1.13641357421875, -1.044189453125, -0.95196533203125, -0.8597412109375, -0.76751708984375, -0.67529296875, -0.58306884765625, -0.4908447265625, -0.39862060546875, -0.306396484375, -0.21417236328125, -0.1219482421875, -0.02972412109375, 0.0625, 0.15472412109375, 0.2469482421875, 0.33917236328125, 0.431396484375, 0.52362060546875, 0.6158447265625, 0.70806884765625, 0.80029296875, 0.89251708984375, 0.9847412109375, 1.07696533203125, 1.169189453125, 1.26141357421875, 1.3536376953125, 1.44586181640625, 1.5380859375, 1.63031005859375, 1.7225341796875, 1.81475830078125, 1.906982421875, 1.99920654296875, 2.0914306640625, 2.18365478515625, 2.27587890625, 2.36810302734375, 2.4603271484375, 2.55255126953125, 2.644775390625, 2.73699951171875, 2.8292236328125, 2.92144775390625, 3.013671875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 7.0, 2.0, 6.0, 4.0, 19.0, 12.0, 20.0, 14.0, 17.0, 26.0, 27.0, 24.0, 31.0, 31.0, 29.0, 42.0, 41.0, 53.0, 41.0, 43.0, 56.0, 48.0, 41.0, 47.0, 34.0, 27.0, 41.0, 18.0, 38.0, 25.0, 24.0, 22.0, 22.0, 8.0, 12.0, 15.0, 8.0, 11.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.138671875, -2.0694580078125, -2.000244140625, -1.9310302734375, -1.86181640625, -1.7926025390625, -1.723388671875, -1.6541748046875, -1.5849609375, -1.5157470703125, -1.446533203125, -1.3773193359375, -1.30810546875, -1.2388916015625, -1.169677734375, -1.1004638671875, -1.03125, -0.9620361328125, -0.892822265625, -0.8236083984375, -0.75439453125, -0.6851806640625, -0.615966796875, -0.5467529296875, -0.4775390625, -0.4083251953125, -0.339111328125, -0.2698974609375, -0.20068359375, -0.1314697265625, -0.062255859375, 0.0069580078125, 0.076171875, 0.1453857421875, 0.214599609375, 0.2838134765625, 0.35302734375, 0.4222412109375, 0.491455078125, 0.5606689453125, 0.6298828125, 0.6990966796875, 0.768310546875, 0.8375244140625, 0.90673828125, 0.9759521484375, 1.045166015625, 1.1143798828125, 1.18359375, 1.2528076171875, 1.322021484375, 1.3912353515625, 1.46044921875, 1.5296630859375, 1.598876953125, 1.6680908203125, 1.7373046875, 1.8065185546875, 1.875732421875, 1.9449462890625, 2.01416015625, 2.0833740234375, 2.152587890625, 2.2218017578125, 2.291015625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 11.0, 9.0, 12.0, 14.0, 19.0, 18.0, 24.0, 35.0, 45.0, 60.0, 90.0, 95.0, 131.0, 164.0, 277.0, 384.0, 527.0, 891.0, 1649.0, 3591.0, 11235.0, 49495.0, 392552.0, 516107.0, 50987.0, 11738.0, 3752.0, 1616.0, 938.0, 620.0, 400.0, 272.0, 195.0, 140.0, 90.0, 102.0, 53.0, 48.0, 48.0, 28.0, 20.0, 9.0, 13.0, 15.0, 5.0, 10.0, 7.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-6.109375, -5.91851806640625, -5.7276611328125, -5.53680419921875, -5.345947265625, -5.15509033203125, -4.9642333984375, -4.77337646484375, -4.58251953125, -4.39166259765625, -4.2008056640625, -4.00994873046875, -3.819091796875, -3.62823486328125, -3.4373779296875, -3.24652099609375, -3.0556640625, -2.86480712890625, -2.6739501953125, -2.48309326171875, -2.292236328125, -2.10137939453125, -1.9105224609375, -1.71966552734375, -1.52880859375, -1.33795166015625, -1.1470947265625, -0.95623779296875, -0.765380859375, -0.57452392578125, -0.3836669921875, -0.19281005859375, -0.001953125, 0.18890380859375, 0.3797607421875, 0.57061767578125, 0.761474609375, 0.95233154296875, 1.1431884765625, 1.33404541015625, 1.52490234375, 1.71575927734375, 1.9066162109375, 2.09747314453125, 2.288330078125, 2.47918701171875, 2.6700439453125, 2.86090087890625, 3.0517578125, 3.24261474609375, 3.4334716796875, 3.62432861328125, 3.815185546875, 4.00604248046875, 4.1968994140625, 4.38775634765625, 4.57861328125, 4.76947021484375, 4.9603271484375, 5.15118408203125, 5.342041015625, 5.53289794921875, 5.7237548828125, 5.91461181640625, 6.10546875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 7.0, 5.0, 1.0, 7.0, 15.0, 14.0, 11.0, 19.0, 23.0, 32.0, 31.0, 45.0, 38.0, 40.0, 57.0, 65.0, 55.0, 63.0, 61.0, 61.0, 37.0, 41.0, 51.0, 42.0, 24.0, 21.0, 25.0, 17.0, 15.0, 12.0, 16.0, 9.0, 13.0, 6.0, 4.0, 0.0, 2.0, 1.0, 6.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.671875, -9.364013671875, -9.05615234375, -8.748291015625, -8.4404296875, -8.132568359375, -7.82470703125, -7.516845703125, -7.208984375, -6.901123046875, -6.59326171875, -6.285400390625, -5.9775390625, -5.669677734375, -5.36181640625, -5.053955078125, -4.74609375, -4.438232421875, -4.13037109375, -3.822509765625, -3.5146484375, -3.206787109375, -2.89892578125, -2.591064453125, -2.283203125, -1.975341796875, -1.66748046875, -1.359619140625, -1.0517578125, -0.743896484375, -0.43603515625, -0.128173828125, 0.1796875, 0.487548828125, 0.79541015625, 1.103271484375, 1.4111328125, 1.718994140625, 2.02685546875, 2.334716796875, 2.642578125, 2.950439453125, 3.25830078125, 3.566162109375, 3.8740234375, 4.181884765625, 4.48974609375, 4.797607421875, 5.10546875, 5.413330078125, 5.72119140625, 6.029052734375, 6.3369140625, 6.644775390625, 6.95263671875, 7.260498046875, 7.568359375, 7.876220703125, 8.18408203125, 8.491943359375, 8.7998046875, 9.107666015625, 9.41552734375, 9.723388671875, 10.03125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 7.0, 6.0, 5.0, 6.0, 13.0, 15.0, 13.0, 29.0, 34.0, 47.0, 63.0, 109.0, 122.0, 242.0, 430.0, 807.0, 1729.0, 4196.0, 13013.0, 52815.0, 617477.0, 294313.0, 44498.0, 11362.0, 3806.0, 1542.0, 777.0, 383.0, 245.0, 149.0, 72.0, 64.0, 48.0, 32.0, 28.0, 17.0, 9.0, 12.0, 5.0, 2.0, 6.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.71875, -1.6632080078125, -1.607666015625, -1.5521240234375, -1.49658203125, -1.4410400390625, -1.385498046875, -1.3299560546875, -1.2744140625, -1.2188720703125, -1.163330078125, -1.1077880859375, -1.05224609375, -0.9967041015625, -0.941162109375, -0.8856201171875, -0.830078125, -0.7745361328125, -0.718994140625, -0.6634521484375, -0.60791015625, -0.5523681640625, -0.496826171875, -0.4412841796875, -0.3857421875, -0.3302001953125, -0.274658203125, -0.2191162109375, -0.16357421875, -0.1080322265625, -0.052490234375, 0.0030517578125, 0.05859375, 0.1141357421875, 0.169677734375, 0.2252197265625, 0.28076171875, 0.3363037109375, 0.391845703125, 0.4473876953125, 0.5029296875, 0.5584716796875, 0.614013671875, 0.6695556640625, 0.72509765625, 0.7806396484375, 0.836181640625, 0.8917236328125, 0.947265625, 1.0028076171875, 1.058349609375, 1.1138916015625, 1.16943359375, 1.2249755859375, 1.280517578125, 1.3360595703125, 1.3916015625, 1.4471435546875, 1.502685546875, 1.5582275390625, 1.61376953125, 1.6693115234375, 1.724853515625, 1.7803955078125, 1.8359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 4.0, 14.0, 8.0, 15.0, 9.0, 18.0, 28.0, 25.0, 31.0, 49.0, 73.0, 103.0, 130.0, 135.0, 109.0, 60.0, 44.0, 20.0, 21.0, 24.0, 13.0, 12.0, 3.0, 9.0, 5.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0005664825439453125, -0.0005501881241798401, -0.0005338937044143677, -0.0005175992846488953, -0.0005013048648834229, -0.00048501044511795044, -0.00046871602535247803, -0.0004524216055870056, -0.0004361271858215332, -0.0004198327660560608, -0.0004035383462905884, -0.00038724392652511597, -0.00037094950675964355, -0.00035465508699417114, -0.00033836066722869873, -0.0003220662474632263, -0.0003057718276977539, -0.0002894774079322815, -0.0002731829881668091, -0.00025688856840133667, -0.00024059414863586426, -0.00022429972887039185, -0.00020800530910491943, -0.00019171088933944702, -0.0001754164695739746, -0.0001591220498085022, -0.00014282763004302979, -0.00012653321027755737, -0.00011023879051208496, -9.394437074661255e-05, -7.764995098114014e-05, -6.135553121566772e-05, -4.506111145019531e-05, -2.87666916847229e-05, -1.2472271919250488e-05, 3.822147846221924e-06, 2.0116567611694336e-05, 3.641098737716675e-05, 5.270540714263916e-05, 6.899982690811157e-05, 8.529424667358398e-05, 0.0001015886664390564, 0.00011788308620452881, 0.00013417750597000122, 0.00015047192573547363, 0.00016676634550094604, 0.00018306076526641846, 0.00019935518503189087, 0.00021564960479736328, 0.0002319440245628357, 0.0002482384443283081, 0.0002645328640937805, 0.00028082728385925293, 0.00029712170362472534, 0.00031341612339019775, 0.00032971054315567017, 0.0003460049629211426, 0.000362299382686615, 0.0003785938024520874, 0.0003948882222175598, 0.0004111826419830322, 0.00042747706174850464, 0.00044377148151397705, 0.00046006590127944946, 0.0004763603210449219]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 9.0, 6.0, 5.0, 13.0, 14.0, 20.0, 32.0, 55.0, 78.0, 156.0, 219.0, 350.0, 625.0, 1209.0, 2645.0, 6700.0, 20905.0, 88390.0, 680040.0, 189207.0, 39211.0, 10983.0, 4000.0, 1711.0, 829.0, 466.0, 253.0, 143.0, 89.0, 53.0, 45.0, 27.0, 24.0, 14.0, 11.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.4443359375, -1.395751953125, -1.34716796875, -1.298583984375, -1.25, -1.201416015625, -1.15283203125, -1.104248046875, -1.0556640625, -1.007080078125, -0.95849609375, -0.909912109375, -0.861328125, -0.812744140625, -0.76416015625, -0.715576171875, -0.6669921875, -0.618408203125, -0.56982421875, -0.521240234375, -0.47265625, -0.424072265625, -0.37548828125, -0.326904296875, -0.2783203125, -0.229736328125, -0.18115234375, -0.132568359375, -0.083984375, -0.035400390625, 0.01318359375, 0.061767578125, 0.1103515625, 0.158935546875, 0.20751953125, 0.256103515625, 0.3046875, 0.353271484375, 0.40185546875, 0.450439453125, 0.4990234375, 0.547607421875, 0.59619140625, 0.644775390625, 0.693359375, 0.741943359375, 0.79052734375, 0.839111328125, 0.8876953125, 0.936279296875, 0.98486328125, 1.033447265625, 1.08203125, 1.130615234375, 1.17919921875, 1.227783203125, 1.2763671875, 1.324951171875, 1.37353515625, 1.422119140625, 1.470703125, 1.519287109375, 1.56787109375, 1.616455078125, 1.6650390625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 7.0, 3.0, 5.0, 11.0, 6.0, 12.0, 20.0, 28.0, 20.0, 30.0, 54.0, 53.0, 78.0, 108.0, 115.0, 101.0, 83.0, 51.0, 41.0, 34.0, 26.0, 27.0, 26.0, 11.0, 10.0, 15.0, 6.0, 6.0, 5.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9482421875, -1.89215087890625, -1.8360595703125, -1.77996826171875, -1.723876953125, -1.66778564453125, -1.6116943359375, -1.55560302734375, -1.49951171875, -1.44342041015625, -1.3873291015625, -1.33123779296875, -1.275146484375, -1.21905517578125, -1.1629638671875, -1.10687255859375, -1.05078125, -0.99468994140625, -0.9385986328125, -0.88250732421875, -0.826416015625, -0.77032470703125, -0.7142333984375, -0.65814208984375, -0.60205078125, -0.54595947265625, -0.4898681640625, -0.43377685546875, -0.377685546875, -0.32159423828125, -0.2655029296875, -0.20941162109375, -0.1533203125, -0.09722900390625, -0.0411376953125, 0.01495361328125, 0.071044921875, 0.12713623046875, 0.1832275390625, 0.23931884765625, 0.29541015625, 0.35150146484375, 0.4075927734375, 0.46368408203125, 0.519775390625, 0.57586669921875, 0.6319580078125, 0.68804931640625, 0.744140625, 0.80023193359375, 0.8563232421875, 0.91241455078125, 0.968505859375, 1.02459716796875, 1.0806884765625, 1.13677978515625, 1.19287109375, 1.24896240234375, 1.3050537109375, 1.36114501953125, 1.417236328125, 1.47332763671875, 1.5294189453125, 1.58551025390625, 1.6416015625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 17.0, 17.0, 56.0, 160.0, 466.0, 177.0, 66.0, 22.0, 11.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.0081787109375, -59.13188934326172, -56.25559997558594, -53.379310607910156, -50.50302505493164, -47.62673568725586, -44.75044631958008, -41.87416076660156, -38.99787139892578, -36.12158203125, -33.24529266357422, -30.36900520324707, -27.492717742919922, -24.61642837524414, -21.74013900756836, -18.86385154724121, -15.987560272216797, -13.111271858215332, -10.234983444213867, -7.358694076538086, -4.482405662536621, -1.6061172485351562, 1.270172119140625, 4.146459579467773, 7.022748947143555, 9.89903736114502, 12.775325775146484, 15.651615142822266, 18.527904510498047, 21.404191970825195, 24.280481338500977, 27.156768798828125, 30.033058166503906, 32.90934753417969, 35.78563690185547, 38.66192626953125, 41.538211822509766, 44.41450119018555, 47.29079055786133, 50.167076110839844, 53.043365478515625, 55.919654846191406, 58.79594421386719, 61.67223358154297, 64.54852294921875, 67.4248046875, 70.30110168457031, 73.17738342285156, 76.05368041992188, 78.92996978759766, 81.80625915527344, 84.68254852294922, 87.558837890625, 90.43511962890625, 93.31141662597656, 96.18769836425781, 99.0639877319336, 101.94027709960938, 104.81656646728516, 107.69285583496094, 110.56914520263672, 113.4454345703125, 116.32171630859375, 119.19800567626953, 122.07429504394531]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 7.0, 9.0, 8.0, 10.0, 12.0, 15.0, 12.0, 16.0, 25.0, 19.0, 20.0, 23.0, 32.0, 20.0, 41.0, 50.0, 112.0, 124.0, 94.0, 45.0, 36.0, 27.0, 18.0, 26.0, 26.0, 26.0, 11.0, 17.0, 16.0, 14.0, 14.0, 12.0, 7.0, 9.0, 6.0, 7.0, 4.0, 2.0, 3.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-34.63037109375, -33.56171417236328, -32.49305725097656, -31.42440414428711, -30.35574722290039, -29.287090301513672, -28.218435287475586, -27.1497802734375, -26.08112335205078, -25.012466430664062, -23.943811416625977, -22.87515640258789, -21.806499481201172, -20.737842559814453, -19.669187545776367, -18.60053253173828, -17.531875610351562, -16.463218688964844, -15.394563674926758, -14.325907707214355, -13.257251739501953, -12.18859577178955, -11.119939804077148, -10.051283836364746, -8.982627868652344, -7.913971900939941, -6.845315933227539, -5.776659965515137, -4.708003997802734, -3.639348030090332, -2.5706920623779297, -1.5020360946655273, -0.433380126953125, 0.6352758407592773, 1.7039318084716797, 2.772587776184082, 3.8412437438964844, 4.909899711608887, 5.978555679321289, 7.047211647033691, 8.115867614746094, 9.184523582458496, 10.253179550170898, 11.3218355178833, 12.390491485595703, 13.459147453308105, 14.527803421020508, 15.59645938873291, 16.665115356445312, 17.73377227783203, 18.802427291870117, 19.871082305908203, 20.939739227294922, 22.00839614868164, 23.077051162719727, 24.145706176757812, 25.21436309814453, 26.28302001953125, 27.351675033569336, 28.420330047607422, 29.48898696899414, 30.55764389038086, 31.626298904418945, 32.69495391845703, 33.76361083984375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 2.0, 5.0, 8.0, 11.0, 21.0, 28.0, 42.0, 58.0, 89.0, 140.0, 207.0, 333.0, 512.0, 793.0, 1287.0, 2402.0, 4341.0, 8966.0, 21847.0, 62751.0, 213175.0, 698662.0, 1541656.0, 1080777.0, 382267.0, 111700.0, 35600.0, 13247.0, 6031.0, 3044.0, 1739.0, 969.0, 525.0, 366.0, 257.0, 145.0, 98.0, 58.0, 41.0, 28.0, 15.0, 14.0, 12.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.51171875, -2.42999267578125, -2.3482666015625, -2.26654052734375, -2.184814453125, -2.10308837890625, -2.0213623046875, -1.93963623046875, -1.85791015625, -1.77618408203125, -1.6944580078125, -1.61273193359375, -1.531005859375, -1.44927978515625, -1.3675537109375, -1.28582763671875, -1.2041015625, -1.12237548828125, -1.0406494140625, -0.95892333984375, -0.877197265625, -0.79547119140625, -0.7137451171875, -0.63201904296875, -0.55029296875, -0.46856689453125, -0.3868408203125, -0.30511474609375, -0.223388671875, -0.14166259765625, -0.0599365234375, 0.02178955078125, 0.103515625, 0.18524169921875, 0.2669677734375, 0.34869384765625, 0.430419921875, 0.51214599609375, 0.5938720703125, 0.67559814453125, 0.75732421875, 0.83905029296875, 0.9207763671875, 1.00250244140625, 1.084228515625, 1.16595458984375, 1.2476806640625, 1.32940673828125, 1.4111328125, 1.49285888671875, 1.5745849609375, 1.65631103515625, 1.738037109375, 1.81976318359375, 1.9014892578125, 1.98321533203125, 2.06494140625, 2.14666748046875, 2.2283935546875, 2.31011962890625, 2.391845703125, 2.47357177734375, 2.5552978515625, 2.63702392578125, 2.71875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 9.0, 14.0, 12.0, 18.0, 17.0, 18.0, 25.0, 24.0, 36.0, 27.0, 33.0, 30.0, 48.0, 33.0, 44.0, 35.0, 58.0, 51.0, 45.0, 42.0, 47.0, 46.0, 29.0, 34.0, 37.0, 21.0, 25.0, 20.0, 24.0, 15.0, 21.0, 12.0, 5.0, 15.0, 6.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.06640625, -2.0037078857421875, -1.941009521484375, -1.8783111572265625, -1.81561279296875, -1.7529144287109375, -1.690216064453125, -1.6275177001953125, -1.5648193359375, -1.5021209716796875, -1.439422607421875, -1.3767242431640625, -1.31402587890625, -1.2513275146484375, -1.188629150390625, -1.1259307861328125, -1.063232421875, -1.0005340576171875, -0.937835693359375, -0.8751373291015625, -0.81243896484375, -0.7497406005859375, -0.687042236328125, -0.6243438720703125, -0.5616455078125, -0.4989471435546875, -0.436248779296875, -0.3735504150390625, -0.31085205078125, -0.2481536865234375, -0.185455322265625, -0.1227569580078125, -0.06005859375, 0.0026397705078125, 0.065338134765625, 0.1280364990234375, 0.19073486328125, 0.2534332275390625, 0.316131591796875, 0.3788299560546875, 0.4415283203125, 0.5042266845703125, 0.566925048828125, 0.6296234130859375, 0.69232177734375, 0.7550201416015625, 0.817718505859375, 0.8804168701171875, 0.943115234375, 1.0058135986328125, 1.068511962890625, 1.1312103271484375, 1.19390869140625, 1.2566070556640625, 1.319305419921875, 1.3820037841796875, 1.4447021484375, 1.5074005126953125, 1.570098876953125, 1.6327972412109375, 1.69549560546875, 1.7581939697265625, 1.820892333984375, 1.8835906982421875, 1.9462890625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 10.0, 7.0, 9.0, 13.0, 21.0, 24.0, 47.0, 48.0, 70.0, 119.0, 187.0, 297.0, 464.0, 947.0, 2136.0, 6016.0, 38343.0, 1885662.0, 2208749.0, 40411.0, 6175.0, 2127.0, 918.0, 503.0, 326.0, 243.0, 122.0, 88.0, 51.0, 47.0, 41.0, 18.0, 12.0, 10.0, 3.0, 8.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-10.484375, -10.20111083984375, -9.9178466796875, -9.63458251953125, -9.351318359375, -9.06805419921875, -8.7847900390625, -8.50152587890625, -8.21826171875, -7.93499755859375, -7.6517333984375, -7.36846923828125, -7.085205078125, -6.80194091796875, -6.5186767578125, -6.23541259765625, -5.9521484375, -5.66888427734375, -5.3856201171875, -5.10235595703125, -4.819091796875, -4.53582763671875, -4.2525634765625, -3.96929931640625, -3.68603515625, -3.40277099609375, -3.1195068359375, -2.83624267578125, -2.552978515625, -2.26971435546875, -1.9864501953125, -1.70318603515625, -1.419921875, -1.13665771484375, -0.8533935546875, -0.57012939453125, -0.286865234375, -0.00360107421875, 0.2796630859375, 0.56292724609375, 0.84619140625, 1.12945556640625, 1.4127197265625, 1.69598388671875, 1.979248046875, 2.26251220703125, 2.5457763671875, 2.82904052734375, 3.1123046875, 3.39556884765625, 3.6788330078125, 3.96209716796875, 4.245361328125, 4.52862548828125, 4.8118896484375, 5.09515380859375, 5.37841796875, 5.66168212890625, 5.9449462890625, 6.22821044921875, 6.511474609375, 6.79473876953125, 7.0780029296875, 7.36126708984375, 7.64453125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 3.0, 5.0, 2.0, 16.0, 18.0, 16.0, 27.0, 28.0, 41.0, 57.0, 79.0, 95.0, 174.0, 232.0, 260.0, 347.0, 451.0, 542.0, 423.0, 337.0, 245.0, 175.0, 132.0, 95.0, 79.0, 38.0, 45.0, 21.0, 24.0, 23.0, 13.0, 14.0, 6.0, 7.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.42462158203125, -4.2359619140625, -4.04730224609375, -3.858642578125, -3.66998291015625, -3.4813232421875, -3.29266357421875, -3.10400390625, -2.91534423828125, -2.7266845703125, -2.53802490234375, -2.349365234375, -2.16070556640625, -1.9720458984375, -1.78338623046875, -1.5947265625, -1.40606689453125, -1.2174072265625, -1.02874755859375, -0.840087890625, -0.65142822265625, -0.4627685546875, -0.27410888671875, -0.08544921875, 0.10321044921875, 0.2918701171875, 0.48052978515625, 0.669189453125, 0.85784912109375, 1.0465087890625, 1.23516845703125, 1.423828125, 1.61248779296875, 1.8011474609375, 1.98980712890625, 2.178466796875, 2.36712646484375, 2.5557861328125, 2.74444580078125, 2.93310546875, 3.12176513671875, 3.3104248046875, 3.49908447265625, 3.687744140625, 3.87640380859375, 4.0650634765625, 4.25372314453125, 4.4423828125, 4.63104248046875, 4.8197021484375, 5.00836181640625, 5.197021484375, 5.38568115234375, 5.5743408203125, 5.76300048828125, 5.95166015625, 6.14031982421875, 6.3289794921875, 6.51763916015625, 6.706298828125, 6.89495849609375, 7.0836181640625, 7.27227783203125, 7.4609375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 2.0, 2.0, 8.0, 13.0, 20.0, 30.0, 41.0, 86.0, 128.0, 177.0, 159.0, 112.0, 80.0, 52.0, 30.0, 19.0, 12.0, 7.0, 7.0, 4.0, 1.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.1199951171875, -62.79826736450195, -60.47654342651367, -58.154815673828125, -55.833091735839844, -53.5113639831543, -51.18963623046875, -48.86791229248047, -46.54618453979492, -44.224456787109375, -41.902732849121094, -39.58100509643555, -37.25927734375, -34.93755340576172, -32.61582565307617, -30.294099807739258, -27.972373962402344, -25.65064811706543, -23.328922271728516, -21.00719451904297, -18.685468673706055, -16.36374282836914, -14.04201602935791, -11.72028923034668, -9.398563385009766, -7.076837062835693, -4.755110740661621, -2.433384418487549, -0.11165809631347656, 2.2100677490234375, 4.531794548034668, 6.853521347045898, 9.175247192382812, 11.496973037719727, 13.818699836730957, 16.140426635742188, 18.4621524810791, 20.783878326416016, 23.105606079101562, 25.427331924438477, 27.74905776977539, 30.070783615112305, 32.39250946044922, 34.714237213134766, 37.03596496582031, 39.357688903808594, 41.67941665649414, 44.00114440917969, 46.32286834716797, 48.644596099853516, 50.9663200378418, 53.288047790527344, 55.609771728515625, 57.93149948120117, 60.25322723388672, 62.574951171875, 64.89668273925781, 67.2184066772461, 69.5401382446289, 71.86186218261719, 74.18358612060547, 76.50531005859375, 78.82704162597656, 81.14876556396484, 83.47048950195312]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 7.0, 4.0, 2.0, 10.0, 11.0, 14.0, 18.0, 15.0, 22.0, 18.0, 29.0, 33.0, 26.0, 35.0, 42.0, 40.0, 55.0, 45.0, 62.0, 48.0, 44.0, 51.0, 58.0, 43.0, 34.0, 35.0, 34.0, 22.0, 21.0, 15.0, 13.0, 18.0, 14.0, 11.0, 11.0, 6.0, 8.0, 10.0, 3.0, 7.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-33.22328186035156, -32.05840301513672, -30.893524169921875, -29.72864532470703, -28.563766479492188, -27.398887634277344, -26.2340087890625, -25.069129943847656, -23.904251098632812, -22.73937225341797, -21.574493408203125, -20.40961456298828, -19.244735717773438, -18.079856872558594, -16.91497802734375, -15.750099182128906, -14.585220336914062, -13.420341491699219, -12.255462646484375, -11.090583801269531, -9.925704956054688, -8.760826110839844, -7.595947265625, -6.431068420410156, -5.2661895751953125, -4.101310729980469, -2.936431884765625, -1.7715530395507812, -0.6066741943359375, 0.5582046508789062, 1.72308349609375, 2.8879623413085938, 4.052837371826172, 5.217716217041016, 6.382595062255859, 7.547473907470703, 8.712352752685547, 9.87723159790039, 11.042110443115234, 12.206989288330078, 13.371868133544922, 14.536746978759766, 15.70162582397461, 16.866504669189453, 18.031383514404297, 19.19626235961914, 20.361141204833984, 21.526020050048828, 22.690898895263672, 23.855777740478516, 25.02065658569336, 26.185535430908203, 27.350414276123047, 28.51529312133789, 29.680171966552734, 30.845050811767578, 32.00992965698242, 33.174808502197266, 34.33968734741211, 35.50456619262695, 36.6694450378418, 37.83432388305664, 38.999202728271484, 40.16408157348633, 41.32896041870117]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 5.0, 10.0, 11.0, 13.0, 13.0, 29.0, 42.0, 67.0, 99.0, 173.0, 266.0, 466.0, 765.0, 1386.0, 2574.0, 5328.0, 12033.0, 30840.0, 95711.0, 456983.0, 321025.0, 75089.0, 25518.0, 10265.0, 4633.0, 2231.0, 1210.0, 692.0, 397.0, 240.0, 138.0, 120.0, 63.0, 41.0, 19.0, 13.0, 14.0, 12.0, 5.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.560546875, -3.45233154296875, -3.3441162109375, -3.23590087890625, -3.127685546875, -3.01947021484375, -2.9112548828125, -2.80303955078125, -2.69482421875, -2.58660888671875, -2.4783935546875, -2.37017822265625, -2.261962890625, -2.15374755859375, -2.0455322265625, -1.93731689453125, -1.8291015625, -1.72088623046875, -1.6126708984375, -1.50445556640625, -1.396240234375, -1.28802490234375, -1.1798095703125, -1.07159423828125, -0.96337890625, -0.85516357421875, -0.7469482421875, -0.63873291015625, -0.530517578125, -0.42230224609375, -0.3140869140625, -0.20587158203125, -0.09765625, 0.01055908203125, 0.1187744140625, 0.22698974609375, 0.335205078125, 0.44342041015625, 0.5516357421875, 0.65985107421875, 0.76806640625, 0.87628173828125, 0.9844970703125, 1.09271240234375, 1.200927734375, 1.30914306640625, 1.4173583984375, 1.52557373046875, 1.6337890625, 1.74200439453125, 1.8502197265625, 1.95843505859375, 2.066650390625, 2.17486572265625, 2.2830810546875, 2.39129638671875, 2.49951171875, 2.60772705078125, 2.7159423828125, 2.82415771484375, 2.932373046875, 3.04058837890625, 3.1488037109375, 3.25701904296875, 3.365234375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 2.0, 6.0, 7.0, 13.0, 4.0, 22.0, 24.0, 25.0, 23.0, 40.0, 51.0, 36.0, 39.0, 50.0, 52.0, 66.0, 62.0, 59.0, 42.0, 57.0, 48.0, 43.0, 37.0, 52.0, 30.0, 18.0, 16.0, 15.0, 15.0, 8.0, 7.0, 8.0, 6.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.720703125, -2.634185791015625, -2.54766845703125, -2.461151123046875, -2.3746337890625, -2.288116455078125, -2.20159912109375, -2.115081787109375, -2.028564453125, -1.942047119140625, -1.85552978515625, -1.769012451171875, -1.6824951171875, -1.595977783203125, -1.50946044921875, -1.422943115234375, -1.33642578125, -1.249908447265625, -1.16339111328125, -1.076873779296875, -0.9903564453125, -0.903839111328125, -0.81732177734375, -0.730804443359375, -0.644287109375, -0.557769775390625, -0.47125244140625, -0.384735107421875, -0.2982177734375, -0.211700439453125, -0.12518310546875, -0.038665771484375, 0.0478515625, 0.134368896484375, 0.22088623046875, 0.307403564453125, 0.3939208984375, 0.480438232421875, 0.56695556640625, 0.653472900390625, 0.739990234375, 0.826507568359375, 0.91302490234375, 0.999542236328125, 1.0860595703125, 1.172576904296875, 1.25909423828125, 1.345611572265625, 1.43212890625, 1.518646240234375, 1.60516357421875, 1.691680908203125, 1.7781982421875, 1.864715576171875, 1.95123291015625, 2.037750244140625, 2.124267578125, 2.210784912109375, 2.29730224609375, 2.383819580078125, 2.4703369140625, 2.556854248046875, 2.64337158203125, 2.729888916015625, 2.81640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 8.0, 6.0, 9.0, 22.0, 22.0, 39.0, 52.0, 82.0, 104.0, 192.0, 328.0, 644.0, 1496.0, 5758.0, 54784.0, 927186.0, 49536.0, 5478.0, 1414.0, 592.0, 300.0, 172.0, 108.0, 71.0, 53.0, 26.0, 29.0, 16.0, 13.0, 3.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.703125, -7.48602294921875, -7.2689208984375, -7.05181884765625, -6.834716796875, -6.61761474609375, -6.4005126953125, -6.18341064453125, -5.96630859375, -5.74920654296875, -5.5321044921875, -5.31500244140625, -5.097900390625, -4.88079833984375, -4.6636962890625, -4.44659423828125, -4.2294921875, -4.01239013671875, -3.7952880859375, -3.57818603515625, -3.361083984375, -3.14398193359375, -2.9268798828125, -2.70977783203125, -2.49267578125, -2.27557373046875, -2.0584716796875, -1.84136962890625, -1.624267578125, -1.40716552734375, -1.1900634765625, -0.97296142578125, -0.755859375, -0.53875732421875, -0.3216552734375, -0.10455322265625, 0.112548828125, 0.32965087890625, 0.5467529296875, 0.76385498046875, 0.98095703125, 1.19805908203125, 1.4151611328125, 1.63226318359375, 1.849365234375, 2.06646728515625, 2.2835693359375, 2.50067138671875, 2.7177734375, 2.93487548828125, 3.1519775390625, 3.36907958984375, 3.586181640625, 3.80328369140625, 4.0203857421875, 4.23748779296875, 4.45458984375, 4.67169189453125, 4.8887939453125, 5.10589599609375, 5.322998046875, 5.54010009765625, 5.7572021484375, 5.97430419921875, 6.19140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 10.0, 12.0, 13.0, 15.0, 15.0, 24.0, 17.0, 25.0, 27.0, 32.0, 51.0, 43.0, 80.0, 87.0, 90.0, 69.0, 75.0, 56.0, 45.0, 32.0, 28.0, 21.0, 20.0, 15.0, 18.0, 10.0, 9.0, 12.0, 8.0, 5.0, 0.0, 10.0, 11.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.890625, -11.556396484375, -11.22216796875, -10.887939453125, -10.5537109375, -10.219482421875, -9.88525390625, -9.551025390625, -9.216796875, -8.882568359375, -8.54833984375, -8.214111328125, -7.8798828125, -7.545654296875, -7.21142578125, -6.877197265625, -6.54296875, -6.208740234375, -5.87451171875, -5.540283203125, -5.2060546875, -4.871826171875, -4.53759765625, -4.203369140625, -3.869140625, -3.534912109375, -3.20068359375, -2.866455078125, -2.5322265625, -2.197998046875, -1.86376953125, -1.529541015625, -1.1953125, -0.861083984375, -0.52685546875, -0.192626953125, 0.1416015625, 0.475830078125, 0.81005859375, 1.144287109375, 1.478515625, 1.812744140625, 2.14697265625, 2.481201171875, 2.8154296875, 3.149658203125, 3.48388671875, 3.818115234375, 4.15234375, 4.486572265625, 4.82080078125, 5.155029296875, 5.4892578125, 5.823486328125, 6.15771484375, 6.491943359375, 6.826171875, 7.160400390625, 7.49462890625, 7.828857421875, 8.1630859375, 8.497314453125, 8.83154296875, 9.165771484375, 9.5]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 8.0, 9.0, 6.0, 7.0, 9.0, 10.0, 10.0, 21.0, 32.0, 38.0, 89.0, 110.0, 105.0, 233.0, 349.0, 665.0, 1404.0, 3156.0, 8716.0, 28283.0, 160306.0, 776236.0, 47186.0, 13086.0, 4536.0, 1871.0, 875.0, 404.0, 266.0, 151.0, 83.0, 75.0, 58.0, 34.0, 16.0, 22.0, 19.0, 22.0, 16.0, 8.0, 7.0, 7.0, 4.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.8095703125, -0.7851715087890625, -0.760772705078125, -0.7363739013671875, -0.71197509765625, -0.6875762939453125, -0.663177490234375, -0.6387786865234375, -0.6143798828125, -0.5899810791015625, -0.565582275390625, -0.5411834716796875, -0.51678466796875, -0.4923858642578125, -0.467987060546875, -0.4435882568359375, -0.419189453125, -0.3947906494140625, -0.370391845703125, -0.3459930419921875, -0.32159423828125, -0.2971954345703125, -0.272796630859375, -0.2483978271484375, -0.2239990234375, -0.1996002197265625, -0.175201416015625, -0.1508026123046875, -0.12640380859375, -0.1020050048828125, -0.077606201171875, -0.0532073974609375, -0.02880859375, -0.0044097900390625, 0.019989013671875, 0.0443878173828125, 0.06878662109375, 0.0931854248046875, 0.117584228515625, 0.1419830322265625, 0.1663818359375, 0.1907806396484375, 0.215179443359375, 0.2395782470703125, 0.26397705078125, 0.2883758544921875, 0.312774658203125, 0.3371734619140625, 0.361572265625, 0.3859710693359375, 0.410369873046875, 0.4347686767578125, 0.45916748046875, 0.4835662841796875, 0.507965087890625, 0.5323638916015625, 0.5567626953125, 0.5811614990234375, 0.605560302734375, 0.6299591064453125, 0.65435791015625, 0.6787567138671875, 0.703155517578125, 0.7275543212890625, 0.751953125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 4.0, 3.0, 6.0, 4.0, 8.0, 6.0, 13.0, 10.0, 21.0, 32.0, 38.0, 41.0, 58.0, 83.0, 115.0, 104.0, 114.0, 97.0, 55.0, 44.0, 28.0, 28.0, 28.0, 16.0, 10.0, 8.0, 8.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002770423889160156, -0.00026886165142059326, -0.0002606809139251709, -0.00025250017642974854, -0.00024431943893432617, -0.0002361387014389038, -0.00022795796394348145, -0.00021977722644805908, -0.00021159648895263672, -0.00020341575145721436, -0.000195235013961792, -0.00018705427646636963, -0.00017887353897094727, -0.0001706928014755249, -0.00016251206398010254, -0.00015433132648468018, -0.0001461505889892578, -0.00013796985149383545, -0.00012978911399841309, -0.00012160837650299072, -0.00011342763900756836, -0.000105246901512146, -9.706616401672363e-05, -8.888542652130127e-05, -8.07046890258789e-05, -7.252395153045654e-05, -6.434321403503418e-05, -5.6162476539611816e-05, -4.798173904418945e-05, -3.980100154876709e-05, -3.1620264053344727e-05, -2.3439526557922363e-05, -1.52587890625e-05, -7.078051567077637e-06, 1.1026859283447266e-06, 9.28342342376709e-06, 1.7464160919189453e-05, 2.5644898414611816e-05, 3.382563591003418e-05, 4.200637340545654e-05, 5.0187110900878906e-05, 5.836784839630127e-05, 6.654858589172363e-05, 7.4729323387146e-05, 8.291006088256836e-05, 9.109079837799072e-05, 9.927153587341309e-05, 0.00010745227336883545, 0.00011563301086425781, 0.00012381374835968018, 0.00013199448585510254, 0.0001401752233505249, 0.00014835596084594727, 0.00015653669834136963, 0.000164717435836792, 0.00017289817333221436, 0.00018107891082763672, 0.00018925964832305908, 0.00019744038581848145, 0.0002056211233139038, 0.00021380186080932617, 0.00022198259830474854, 0.0002301633358001709, 0.00023834407329559326, 0.0002465248107910156]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 9.0, 11.0, 11.0, 21.0, 30.0, 46.0, 59.0, 95.0, 128.0, 200.0, 295.0, 561.0, 907.0, 1600.0, 3244.0, 6877.0, 15640.0, 44532.0, 215237.0, 673729.0, 52161.0, 17712.0, 7477.0, 3550.0, 1754.0, 1017.0, 588.0, 361.0, 244.0, 138.0, 96.0, 73.0, 44.0, 42.0, 13.0, 10.0, 11.0, 7.0, 7.0, 3.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.66162109375, -0.6427536010742188, -0.6238861083984375, -0.6050186157226562, -0.586151123046875, -0.5672836303710938, -0.5484161376953125, -0.5295486450195312, -0.51068115234375, -0.49181365966796875, -0.4729461669921875, -0.45407867431640625, -0.435211181640625, -0.41634368896484375, -0.3974761962890625, -0.37860870361328125, -0.3597412109375, -0.34087371826171875, -0.3220062255859375, -0.30313873291015625, -0.284271240234375, -0.26540374755859375, -0.2465362548828125, -0.22766876220703125, -0.20880126953125, -0.18993377685546875, -0.1710662841796875, -0.15219879150390625, -0.133331298828125, -0.11446380615234375, -0.0955963134765625, -0.07672882080078125, -0.057861328125, -0.03899383544921875, -0.0201263427734375, -0.00125885009765625, 0.017608642578125, 0.03647613525390625, 0.0553436279296875, 0.07421112060546875, 0.09307861328125, 0.11194610595703125, 0.1308135986328125, 0.14968109130859375, 0.168548583984375, 0.18741607666015625, 0.2062835693359375, 0.22515106201171875, 0.2440185546875, 0.26288604736328125, 0.2817535400390625, 0.30062103271484375, 0.319488525390625, 0.33835601806640625, 0.3572235107421875, 0.37609100341796875, 0.39495849609375, 0.41382598876953125, 0.4326934814453125, 0.45156097412109375, 0.470428466796875, 0.48929595947265625, 0.5081634521484375, 0.5270309448242188, 0.5458984375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 10.0, 3.0, 7.0, 17.0, 15.0, 26.0, 27.0, 28.0, 47.0, 57.0, 88.0, 86.0, 112.0, 107.0, 94.0, 61.0, 35.0, 35.0, 29.0, 18.0, 15.0, 17.0, 11.0, 13.0, 8.0, 3.0, 7.0, 5.0, 6.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8056640625, -0.7765045166015625, -0.747344970703125, -0.7181854248046875, -0.68902587890625, -0.6598663330078125, -0.630706787109375, -0.6015472412109375, -0.5723876953125, -0.5432281494140625, -0.514068603515625, -0.4849090576171875, -0.45574951171875, -0.4265899658203125, -0.397430419921875, -0.3682708740234375, -0.339111328125, -0.3099517822265625, -0.280792236328125, -0.2516326904296875, -0.22247314453125, -0.1933135986328125, -0.164154052734375, -0.1349945068359375, -0.1058349609375, -0.0766754150390625, -0.047515869140625, -0.0183563232421875, 0.01080322265625, 0.0399627685546875, 0.069122314453125, 0.0982818603515625, 0.12744140625, 0.1566009521484375, 0.185760498046875, 0.2149200439453125, 0.24407958984375, 0.2732391357421875, 0.302398681640625, 0.3315582275390625, 0.3607177734375, 0.3898773193359375, 0.419036865234375, 0.4481964111328125, 0.47735595703125, 0.5065155029296875, 0.535675048828125, 0.5648345947265625, 0.593994140625, 0.6231536865234375, 0.652313232421875, 0.6814727783203125, 0.71063232421875, 0.7397918701171875, 0.768951416015625, 0.7981109619140625, 0.8272705078125, 0.8564300537109375, 0.885589599609375, 0.9147491455078125, 0.94390869140625, 0.9730682373046875, 1.002227783203125, 1.0313873291015625, 1.060546875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 9.0, 26.0, 43.0, 80.0, 522.0, 202.0, 62.0, 25.0, 12.0, 9.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.83708953857422, -23.04227066040039, -21.247453689575195, -19.452634811401367, -17.657817840576172, -15.862998962402344, -14.068180084228516, -12.273362159729004, -10.478544235229492, -8.68372631072998, -6.8889079093933105, -5.094089508056641, -3.299271583557129, -1.5044536590576172, 0.29036521911621094, 2.0851831436157227, 3.8800010681152344, 5.674818992614746, 7.469637393951416, 9.264455795288086, 11.059273719787598, 12.85409164428711, 14.648910522460938, 16.443729400634766, 18.23854637145996, 20.03336524963379, 21.828182220458984, 23.623001098632812, 25.41781997680664, 27.212636947631836, 29.007455825805664, 30.80227279663086, 32.59709167480469, 34.391910552978516, 36.186729431152344, 37.981544494628906, 39.776363372802734, 41.57118225097656, 43.36600112915039, 45.16082000732422, 46.95563507080078, 48.75045394897461, 50.54527282714844, 52.340087890625, 54.13490676879883, 55.929725646972656, 57.724544525146484, 59.51936340332031, 61.31418228149414, 63.10900115966797, 64.90381622314453, 66.69863891601562, 68.49345397949219, 70.28826904296875, 72.08309173583984, 73.8779067993164, 75.6727294921875, 77.46754455566406, 79.26236724853516, 81.05718231201172, 82.85200500488281, 84.64682006835938, 86.44163513183594, 88.23645782470703, 90.0312728881836]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 9.0, 4.0, 2.0, 10.0, 8.0, 9.0, 11.0, 9.0, 12.0, 15.0, 16.0, 20.0, 20.0, 12.0, 27.0, 29.0, 65.0, 191.0, 209.0, 77.0, 28.0, 30.0, 15.0, 23.0, 16.0, 23.0, 10.0, 18.0, 12.0, 15.0, 11.0, 7.0, 6.0, 6.0, 4.0, 4.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.27923583984375, -25.485610961914062, -24.691986083984375, -23.898361206054688, -23.104736328125, -22.311111450195312, -21.517486572265625, -20.72386360168457, -19.930238723754883, -19.136613845825195, -18.342988967895508, -17.54936408996582, -16.755739212036133, -15.962115287780762, -15.168490409851074, -14.374866485595703, -13.5812406539917, -12.787615776062012, -11.993990898132324, -11.200366973876953, -10.406742095947266, -9.613117218017578, -8.81949234008789, -8.025867462158203, -7.232243061065674, -6.438618183135986, -5.644993782043457, -4.8513689041137695, -4.057744026184082, -3.2641196250915527, -2.4704947471618652, -1.676870346069336, -0.8832454681396484, -0.08962076902389526, 0.7040039300918579, 1.4976286888122559, 2.2912533283233643, 3.0848779678344727, 3.87850284576416, 4.6721272468566895, 5.465752124786377, 6.2593770027160645, 7.053001403808594, 7.846626281738281, 8.640251159667969, 9.433876037597656, 10.227500915527344, 11.021124839782715, 11.814749717712402, 12.60837459564209, 13.401999473571777, 14.195623397827148, 14.989248275756836, 15.782873153686523, 16.57649803161621, 17.3701229095459, 18.163747787475586, 18.957372665405273, 19.75099754333496, 20.54462242126465, 21.338247299194336, 22.13187026977539, 22.925495147705078, 23.719120025634766, 24.512744903564453]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 6.0, 4.0, 17.0, 5.0, 17.0, 22.0, 30.0, 21.0, 42.0, 59.0, 57.0, 168.0, 259.0, 60.0, 36.0, 39.0, 41.0, 23.0, 22.0, 11.0, 18.0, 14.0, 7.0, 9.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8671875, -3.768402099609375, -3.66961669921875, -3.570831298828125, -3.4720458984375, -3.373260498046875, -3.27447509765625, -3.175689697265625, -3.076904296875, -2.978118896484375, -2.87933349609375, -2.780548095703125, -2.6817626953125, -2.582977294921875, -2.48419189453125, -2.385406494140625, -2.28662109375, -2.187835693359375, -2.08905029296875, -1.990264892578125, -1.8914794921875, -1.792694091796875, -1.69390869140625, -1.595123291015625, -1.496337890625, -1.397552490234375, -1.29876708984375, -1.199981689453125, -1.1011962890625, -1.002410888671875, -0.90362548828125, -0.804840087890625, -0.7060546875, -0.607269287109375, -0.50848388671875, -0.409698486328125, -0.3109130859375, -0.212127685546875, -0.11334228515625, -0.014556884765625, 0.084228515625, 0.183013916015625, 0.28179931640625, 0.380584716796875, 0.4793701171875, 0.578155517578125, 0.67694091796875, 0.775726318359375, 0.87451171875, 0.973297119140625, 1.07208251953125, 1.170867919921875, 1.2696533203125, 1.368438720703125, 1.46722412109375, 1.566009521484375, 1.664794921875, 1.763580322265625, 1.86236572265625, 1.961151123046875, 2.0599365234375, 2.158721923828125, 2.25750732421875, 2.356292724609375, 2.455078125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 8.0, 2.0, 6.0, 4.0, 5.0, 11.0, 6.0, 10.0, 30.0, 39.0, 68.0, 91.0, 127.0, 219.0, 655.0, 1924.0, 7673.0, 8232546.0, 136654.0, 5890.0, 1550.0, 503.0, 221.0, 121.0, 81.0, 43.0, 22.0, 20.0, 12.0, 6.0, 5.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.8878231048584, -24.131732940673828, -23.375642776489258, -22.619552612304688, -21.86346435546875, -21.10737419128418, -20.35128402709961, -19.59519386291504, -18.83910369873047, -18.0830135345459, -17.326923370361328, -16.570833206176758, -15.814743995666504, -15.058653831481934, -14.30256462097168, -13.54647445678711, -12.790384292602539, -12.034294128417969, -11.278203964233398, -10.522114753723145, -9.766024589538574, -9.009934425354004, -8.25384521484375, -7.49775505065918, -6.741664886474609, -5.985574722290039, -5.229485034942627, -4.473395347595215, -3.7173051834106445, -2.9612152576446533, -2.205125331878662, -1.44903564453125, -0.6929454803466797, 0.06314444541931152, 0.8192343711853027, 1.575324296951294, 2.331414222717285, 3.0875041484832764, 3.8435940742492676, 4.59968376159668, 5.35577392578125, 6.11186408996582, 6.867953777313232, 7.6240434646606445, 8.380133628845215, 9.136223793029785, 9.892313003540039, 10.64840316772461, 11.40449333190918, 12.16058349609375, 12.91667366027832, 13.672762870788574, 14.428853034973145, 15.184943199157715, 15.941032409667969, 16.69712257385254, 17.45321273803711, 18.20930290222168, 18.96539306640625, 19.72148323059082, 20.47757339477539, 21.233661651611328, 21.9897518157959, 22.74584197998047, 23.50193214416504]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 1.0, 4.0, 3.0, 5.0, 7.0, 8.0, 6.0, 6.0, 8.0, 4.0, 6.0, 5.0, 7.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-36.54899597167969, -35.15544891357422, -33.761905670166016, -32.36836242675781, -30.974815368652344, -29.581270217895508, -28.187725067138672, -26.794179916381836, -25.400634765625, -24.007089614868164, -22.613544464111328, -21.219999313354492, -19.826454162597656, -18.43290901184082, -17.039363861083984, -15.645818710327148, -14.252273559570312, -12.858728408813477, -11.46518325805664, -10.071638107299805, -8.678092956542969, -7.284547805786133, -5.891002655029297, -4.497457504272461, -3.103912353515625, -1.710367202758789, -0.3168220520019531, 1.0767230987548828, 2.4702682495117188, 3.8638134002685547, 5.257358551025391, 6.650903701782227, 8.044445037841797, 9.437990188598633, 10.831535339355469, 12.225080490112305, 13.61862564086914, 15.012170791625977, 16.405715942382812, 17.79926109313965, 19.192806243896484, 20.58635139465332, 21.979896545410156, 23.373441696166992, 24.766986846923828, 26.160531997680664, 27.5540771484375, 28.947622299194336, 30.341167449951172, 31.734712600708008, 33.128257751464844, 34.52180480957031, 35.915348052978516, 37.30889129638672, 38.70243835449219, 40.095985412597656, 41.48952865600586, 42.88307189941406, 44.27661895751953, 45.670166015625, 47.0637092590332, 48.457252502441406, 49.850799560546875, 51.244346618652344, 52.63788986206055]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 10.0, 10.0, 14.0, 13.0, 25.0, 34.0, 38.0, 66.0, 88.0, 137.0, 204.0, 302.0, 624.0, 1387.0, 3115.0, 7200.0, 17452.0, 43809.0, 107133.0, 174421.0, 99481.0, 40094.0, 16057.0, 6845.0, 2840.0, 1244.0, 635.0, 359.0, 216.0, 112.0, 86.0, 54.0, 37.0, 39.0, 11.0, 11.0, 17.0, 14.0, 10.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-19.71875, -19.1923828125, -18.666015625, -18.1396484375, -17.61328125, -17.0869140625, -16.560546875, -16.0341796875, -15.5078125, -14.9814453125, -14.455078125, -13.9287109375, -13.40234375, -12.8759765625, -12.349609375, -11.8232421875, -11.296875, -10.7705078125, -10.244140625, -9.7177734375, -9.19140625, -8.6650390625, -8.138671875, -7.6123046875, -7.0859375, -6.5595703125, -6.033203125, -5.5068359375, -4.98046875, -4.4541015625, -3.927734375, -3.4013671875, -2.875, -2.3486328125, -1.822265625, -1.2958984375, -0.76953125, -0.2431640625, 0.283203125, 0.8095703125, 1.3359375, 1.8623046875, 2.388671875, 2.9150390625, 3.44140625, 3.9677734375, 4.494140625, 5.0205078125, 5.546875, 6.0732421875, 6.599609375, 7.1259765625, 7.65234375, 8.1787109375, 8.705078125, 9.2314453125, 9.7578125, 10.2841796875, 10.810546875, 11.3369140625, 11.86328125, 12.3896484375, 12.916015625, 13.4423828125, 13.96875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 6.0, 7.0, 10.0, 13.0, 25.0, 24.0, 29.0, 26.0, 32.0, 51.0, 50.0, 46.0, 63.0, 76.0, 72.0, 58.0, 63.0, 64.0, 36.0, 36.0, 31.0, 27.0, 23.0, 20.0, 23.0, 17.0, 14.0, 8.0, 7.0, 7.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7265625, -2.64227294921875, -2.5579833984375, -2.47369384765625, -2.389404296875, -2.30511474609375, -2.2208251953125, -2.13653564453125, -2.05224609375, -1.96795654296875, -1.8836669921875, -1.79937744140625, -1.715087890625, -1.63079833984375, -1.5465087890625, -1.46221923828125, -1.3779296875, -1.29364013671875, -1.2093505859375, -1.12506103515625, -1.040771484375, -0.95648193359375, -0.8721923828125, -0.78790283203125, -0.70361328125, -0.61932373046875, -0.5350341796875, -0.45074462890625, -0.366455078125, -0.28216552734375, -0.1978759765625, -0.11358642578125, -0.029296875, 0.05499267578125, 0.1392822265625, 0.22357177734375, 0.307861328125, 0.39215087890625, 0.4764404296875, 0.56072998046875, 0.64501953125, 0.72930908203125, 0.8135986328125, 0.89788818359375, 0.982177734375, 1.06646728515625, 1.1507568359375, 1.23504638671875, 1.3193359375, 1.40362548828125, 1.4879150390625, 1.57220458984375, 1.656494140625, 1.74078369140625, 1.8250732421875, 1.90936279296875, 1.99365234375, 2.07794189453125, 2.1622314453125, 2.24652099609375, 2.330810546875, 2.41510009765625, 2.4993896484375, 2.58367919921875, 2.66796875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 2.0, 1.0, 5.0, 9.0, 5.0, 12.0, 13.0, 25.0, 41.0, 61.0, 72.0, 63.0, 42.0, 41.0, 28.0, 9.0, 12.0, 12.0, 7.0, 5.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.385527610778809, -11.901786804199219, -11.418045997619629, -10.934305191040039, -10.450565338134766, -9.966824531555176, -9.483083724975586, -8.999342918395996, -8.515602111816406, -8.031861305236816, -7.548120975494385, -7.064380168914795, -6.580639839172363, -6.096899032592773, -5.613158226013184, -5.129417419433594, -4.64567756652832, -4.1619367599487305, -3.678196430206299, -3.194455623626709, -2.7107150554656982, -2.2269744873046875, -1.7432336807250977, -1.259493112564087, -0.7757525444030762, -0.29201191663742065, 0.19172871112823486, 0.6754693984985352, 1.159209966659546, 1.6429505348205566, 2.1266913414001465, 2.6104319095611572, 3.0941734313964844, 3.577913999557495, 4.061654567718506, 4.545395374298096, 5.029135704040527, 5.512876510620117, 5.996617317199707, 6.480358123779297, 6.9640984535217285, 7.447839260101318, 7.93157958984375, 8.41532039642334, 8.89906120300293, 9.382801055908203, 9.86654281616211, 10.350282669067383, 10.834023475646973, 11.317764282226562, 11.801505088806152, 12.285245895385742, 12.768985748291016, 13.252726554870605, 13.736467361450195, 14.220208168029785, 14.703948974609375, 15.187689781188965, 15.671430587768555, 16.155170440673828, 16.638912200927734, 17.122652053833008, 17.60639190673828, 18.090133666992188, 18.57387351989746]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 0.0, 4.0, 7.0, 7.0, 7.0, 12.0, 13.0, 28.0, 46.0, 65.0, 79.0, 65.0, 52.0, 37.0, 18.0, 9.0, 9.0, 5.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.785943031311035, -15.283476829528809, -14.781010627746582, -14.278544425964355, -13.776078224182129, -13.273612022399902, -12.771145820617676, -12.26867961883545, -11.766213417053223, -11.263747215270996, -10.76128101348877, -10.258814811706543, -9.756348609924316, -9.25388240814209, -8.751416206359863, -8.248950004577637, -7.74648380279541, -7.244017601013184, -6.741551399230957, -6.2390851974487305, -5.736618995666504, -5.234152793884277, -4.731686592102051, -4.229220390319824, -3.7267541885375977, -3.224287986755371, -2.7218217849731445, -2.219355583190918, -1.7168893814086914, -1.2144231796264648, -0.7119569778442383, -0.20949077606201172, 0.29297637939453125, 0.7954425811767578, 1.2979087829589844, 1.800374984741211, 2.3028411865234375, 2.805307388305664, 3.3077735900878906, 3.810239791870117, 4.312705993652344, 4.81517219543457, 5.317638397216797, 5.820104598999023, 6.32257080078125, 6.825037002563477, 7.327503204345703, 7.82996940612793, 8.332435607910156, 8.834901809692383, 9.33736801147461, 9.839834213256836, 10.342300415039062, 10.844766616821289, 11.347232818603516, 11.849699020385742, 12.352165222167969, 12.854631423950195, 13.357097625732422, 13.859563827514648, 14.362030029296875, 14.864496231079102, 15.366962432861328, 15.869428634643555, 16.37189483642578]}, "eval/loss": 12.739469528198242, "eval/wer": 2.0272040002381093, "eval/runtime": 953.2256, "eval/samples_per_second": 2.772, "eval/steps_per_second": 0.347} \ No newline at end of file +{"train/loss": 4.7636, "train/learning_rate": 2.137767220902613e-08, "train/epoch": 20.0, "train/global_step": 17840, "_runtime": 120296, "_timestamp": 1647066064, "_step": 17851, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 113.0, 23.0, 14.0, 1.0, 4.0, 8.0, 30110.0, 165.0, 34.0, 14.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.427001953125, -8.15869140625, -7.890380859375, -7.6220703125, -7.353759765625, -7.08544921875, -6.817138671875, -6.548828125, -6.280517578125, -6.01220703125, -5.743896484375, -5.4755859375, -5.207275390625, -4.93896484375, -4.670654296875, -4.40234375, -4.134033203125, -3.86572265625, -3.597412109375, -3.3291015625, -3.060791015625, -2.79248046875, -2.524169921875, -2.255859375, -1.987548828125, -1.71923828125, -1.450927734375, -1.1826171875, -0.914306640625, -0.64599609375, -0.377685546875, -0.109375, 0.158935546875, 0.42724609375, 0.695556640625, 0.9638671875, 1.232177734375, 1.50048828125, 1.768798828125, 2.037109375, 2.305419921875, 2.57373046875, 2.842041015625, 3.1103515625, 3.378662109375, 3.64697265625, 3.915283203125, 4.18359375, 4.451904296875, 4.72021484375, 4.988525390625, 5.2568359375, 5.525146484375, 5.79345703125, 6.061767578125, 6.330078125, 6.598388671875, 6.86669921875, 7.135009765625, 7.4033203125, 7.671630859375, 7.93994140625, 8.208251953125, 8.4765625]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 12.0, 101.0, 461.0, 360.0, 82.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-36.2723388671875, -35.635013580322266, -34.99768829345703, -34.3603630065918, -33.72303771972656, -33.085716247558594, -32.44839096069336, -31.811065673828125, -31.17374038696289, -30.536415100097656, -29.899089813232422, -29.26176643371582, -28.624441146850586, -27.98711585998535, -27.34979248046875, -26.712467193603516, -26.07514190673828, -25.437816619873047, -24.800491333007812, -24.16316795349121, -23.525842666625977, -22.888517379760742, -22.25119400024414, -21.613868713378906, -20.976543426513672, -20.339218139648438, -19.701892852783203, -19.0645694732666, -18.427244186401367, -17.789918899536133, -17.15259552001953, -16.515270233154297, -15.877946853637695, -15.240621566772461, -14.603297233581543, -13.965972900390625, -13.32864761352539, -12.691322326660156, -12.053997993469238, -11.41667366027832, -10.779348373413086, -10.142023086547852, -9.504698753356934, -8.867374420166016, -8.230049133300781, -7.592724323272705, -6.955399513244629, -6.318074703216553, -5.680749893188477, -5.0434250831604, -4.406100273132324, -3.768775463104248, -3.131450653076172, -2.4941258430480957, -1.8568010330200195, -1.2194762229919434, -0.5821514129638672, 0.055173397064208984, 0.6924982070922852, 1.3298230171203613, 1.9671478271484375, 2.6044726371765137, 3.24179744720459, 3.879122257232666, 4.516447067260742]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 3.0, 5.0, 12.0, 7.0, 11.0, 16.0, 15.0, 19.0, 22.0, 23.0, 32.0, 27.0, 38.0, 32.0, 22.0, 28.0, 49.0, 44.0, 44.0, 42.0, 37.0, 45.0, 41.0, 39.0, 36.0, 38.0, 35.0, 31.0, 28.0, 27.0, 22.0, 18.0, 14.0, 18.0, 11.0, 14.0, 9.0, 12.0, 4.0, 4.0, 5.0, 3.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1041932106018066, -3.0013654232025146, -2.8985378742218018, -2.7957100868225098, -2.6928822994232178, -2.590054512023926, -2.487226963043213, -2.384399175643921, -2.281571388244629, -2.178743600845337, -2.075916051864624, -1.973088264465332, -1.87026047706604, -1.7674328088760376, -1.6646051406860352, -1.5617773532867432, -1.4589498043060303, -1.3561221361160278, -1.2532943487167358, -1.1504666805267334, -1.0476388931274414, -0.944811224937439, -0.8419835567474365, -0.7391558289527893, -0.6363281011581421, -0.5335003733634949, -0.43067267537117004, -0.3278449773788452, -0.225017249584198, -0.12218952178955078, -0.01936185359954834, 0.08346587419509888, 0.1862938404083252, 0.2891215682029724, 0.39194926619529724, 0.49477696418762207, 0.5976046919822693, 0.7004324197769165, 0.803260087966919, 0.9060878157615662, 1.0089155435562134, 1.1117432117462158, 1.2145709991455078, 1.3173986673355103, 1.4202263355255127, 1.5230541229248047, 1.6258817911148071, 1.7287094593048096, 1.8315372467041016, 1.934364914894104, 2.0371925830841064, 2.1400203704833984, 2.2428481578826904, 2.3456759452819824, 2.4485034942626953, 2.5513312816619873, 2.6541590690612793, 2.7569868564605713, 2.859814405441284, 2.962642192840576, 3.065469980239868, 3.16829776763916, 3.271125316619873, 3.373953104019165, 3.476780652999878]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 2.0, 4.0, 8.0, 4.0, 8.0, 16.0, 12.0, 18.0, 12.0, 19.0, 34.0, 55.0, 103.0, 202.0, 549.0, 1437.0, 4271.0, 12777.0, 40602.0, 117755.0, 252588.0, 363374.0, 163575.0, 61428.0, 19964.0, 6181.0, 2155.0, 767.0, 290.0, 120.0, 62.0, 37.0, 22.0, 24.0, 19.0, 12.0, 9.0, 8.0, 8.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.1953125, -10.8363037109375, -10.477294921875, -10.1182861328125, -9.75927734375, -9.4002685546875, -9.041259765625, -8.6822509765625, -8.3232421875, -7.9642333984375, -7.605224609375, -7.2462158203125, -6.88720703125, -6.5281982421875, -6.169189453125, -5.8101806640625, -5.451171875, -5.0921630859375, -4.733154296875, -4.3741455078125, -4.01513671875, -3.6561279296875, -3.297119140625, -2.9381103515625, -2.5791015625, -2.2200927734375, -1.861083984375, -1.5020751953125, -1.14306640625, -0.7840576171875, -0.425048828125, -0.0660400390625, 0.29296875, 0.6519775390625, 1.010986328125, 1.3699951171875, 1.72900390625, 2.0880126953125, 2.447021484375, 2.8060302734375, 3.1650390625, 3.5240478515625, 3.883056640625, 4.2420654296875, 4.60107421875, 4.9600830078125, 5.319091796875, 5.6781005859375, 6.037109375, 6.3961181640625, 6.755126953125, 7.1141357421875, 7.47314453125, 7.8321533203125, 8.191162109375, 8.5501708984375, 8.9091796875, 9.2681884765625, 9.627197265625, 9.9862060546875, 10.34521484375, 10.7042236328125, 11.063232421875, 11.4222412109375, 11.78125]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 6.0, 4.0, 7.0, 10.0, 11.0, 7.0, 14.0, 21.0, 15.0, 23.0, 32.0, 28.0, 36.0, 23.0, 28.0, 38.0, 38.0, 36.0, 49.0, 104.0, 50.0, 39.0, 43.0, 40.0, 33.0, 27.0, 35.0, 28.0, 27.0, 19.0, 21.0, 15.0, 16.0, 12.0, 15.0, 10.0, 6.0, 8.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.447265625, -2.356048583984375, -2.26483154296875, -2.173614501953125, -2.0823974609375, -1.991180419921875, -1.89996337890625, -1.808746337890625, -1.717529296875, -1.626312255859375, -1.53509521484375, -1.443878173828125, -1.3526611328125, -1.261444091796875, -1.17022705078125, -1.079010009765625, -0.98779296875, -0.896575927734375, -0.80535888671875, -0.714141845703125, -0.6229248046875, -0.531707763671875, -0.44049072265625, -0.349273681640625, -0.258056640625, -0.166839599609375, -0.07562255859375, 0.015594482421875, 0.1068115234375, 0.198028564453125, 0.28924560546875, 0.380462646484375, 0.4716796875, 0.562896728515625, 0.65411376953125, 0.745330810546875, 0.8365478515625, 0.927764892578125, 1.01898193359375, 1.110198974609375, 1.201416015625, 1.292633056640625, 1.38385009765625, 1.475067138671875, 1.5662841796875, 1.657501220703125, 1.74871826171875, 1.839935302734375, 1.93115234375, 2.022369384765625, 2.11358642578125, 2.204803466796875, 2.2960205078125, 2.387237548828125, 2.47845458984375, 2.569671630859375, 2.660888671875, 2.752105712890625, 2.84332275390625, 2.934539794921875, 3.0257568359375, 3.116973876953125, 3.20819091796875, 3.299407958984375, 3.390625]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [6.0, 4.0, 3.0, 14.0, 18.0, 25.0, 57.0, 63.0, 94.0, 93.0, 117.0, 125.0, 107.0, 90.0, 79.0, 36.0, 23.0, 26.0, 20.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7842276096343994, -2.535231113433838, -2.2862348556518555, -2.037238597869873, -1.7882421016693115, -1.5392457246780396, -1.2902493476867676, -1.0412529706954956, -0.7922565937042236, -0.5432602167129517, -0.2942638397216797, -0.045267462730407715, 0.20372891426086426, 0.45272529125213623, 0.7017216682434082, 0.9507180452346802, 1.1997144222259521, 1.4487107992172241, 1.697707176208496, 1.946703553199768, 2.19569993019104, 2.4446964263916016, 2.693692684173584, 2.9426889419555664, 3.191685438156128, 3.4406819343566895, 3.689678192138672, 3.9386744499206543, 4.187670707702637, 4.436667442321777, 4.68566370010376, 4.934659957885742, 5.183656692504883, 5.432652950286865, 5.681649208068848, 5.930645942687988, 6.179642200469971, 6.428638458251953, 6.677635192871094, 6.926631450653076, 7.175627708435059, 7.424623966217041, 7.673620223999023, 7.922616958618164, 8.171613693237305, 8.420609474182129, 8.66960620880127, 8.918601989746094, 9.167598724365234, 9.416595458984375, 9.6655912399292, 9.91458797454834, 10.163583755493164, 10.412580490112305, 10.661577224731445, 10.91057300567627, 11.15956974029541, 11.40856647491455, 11.657562255859375, 11.906558990478516, 12.155555725097656, 12.40455150604248, 12.653548240661621, 12.902544021606445, 13.151540756225586]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 1.0, 13.0, 9.0, 8.0, 8.0, 10.0, 5.0, 21.0, 12.0, 15.0, 20.0, 25.0, 22.0, 33.0, 36.0, 26.0, 40.0, 29.0, 35.0, 42.0, 44.0, 49.0, 41.0, 41.0, 48.0, 29.0, 30.0, 32.0, 27.0, 28.0, 28.0, 21.0, 21.0, 22.0, 21.0, 21.0, 12.0, 12.0, 19.0, 9.0, 5.0, 6.0, 6.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.554716110229492, -3.439323902130127, -3.3239316940307617, -3.2085394859313965, -3.093147039413452, -2.977754831314087, -2.8623626232147217, -2.7469704151153564, -2.631577968597412, -2.516185760498047, -2.4007935523986816, -2.2854013442993164, -2.170008897781372, -2.054616689682007, -1.9392244815826416, -1.8238322734832764, -1.7084400653839111, -1.593047857284546, -1.4776555299758911, -1.3622633218765259, -1.246870994567871, -1.1314787864685059, -1.0160865783691406, -0.9006943106651306, -0.7853020429611206, -0.6699097752571106, -0.5545175075531006, -0.43912529945373535, -0.32373303174972534, -0.20834076404571533, -0.0929485559463501, 0.022443711757659912, 0.13783597946166992, 0.25322824716567993, 0.36862048506736755, 0.4840127229690552, 0.5994049906730652, 0.7147972583770752, 0.8301894664764404, 0.9455817341804504, 1.0609740018844604, 1.1763662099838257, 1.2917585372924805, 1.4071507453918457, 1.522542953491211, 1.6379352807998657, 1.753327488899231, 1.8687198162078857, 1.984112024307251, 2.099504232406616, 2.2148964405059814, 2.330288887023926, 2.445681095123291, 2.5610733032226562, 2.6764655113220215, 2.7918577194213867, 2.907249927520752, 3.022642135620117, 3.1380343437194824, 3.2534265518188477, 3.368818998336792, 3.4842112064361572, 3.5996034145355225, 3.7149956226348877, 3.830388069152832]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 6.0, 9.0, 6.0, 8.0, 10.0, 22.0, 31.0, 41.0, 46.0, 99.0, 146.0, 260.0, 437.0, 691.0, 1372.0, 2442.0, 4891.0, 10435.0, 23341.0, 61496.0, 425134.0, 3326470.0, 246884.0, 51046.0, 19971.0, 9246.0, 4452.0, 2290.0, 1229.0, 699.0, 398.0, 223.0, 165.0, 87.0, 55.0, 44.0, 26.0, 15.0, 24.0, 13.0, 10.0, 8.0, 2.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.1953125, -6.0098876953125, -5.824462890625, -5.6390380859375, -5.45361328125, -5.2681884765625, -5.082763671875, -4.8973388671875, -4.7119140625, -4.5264892578125, -4.341064453125, -4.1556396484375, -3.97021484375, -3.7847900390625, -3.599365234375, -3.4139404296875, -3.228515625, -3.0430908203125, -2.857666015625, -2.6722412109375, -2.48681640625, -2.3013916015625, -2.115966796875, -1.9305419921875, -1.7451171875, -1.5596923828125, -1.374267578125, -1.1888427734375, -1.00341796875, -0.8179931640625, -0.632568359375, -0.4471435546875, -0.26171875, -0.0762939453125, 0.109130859375, 0.2945556640625, 0.47998046875, 0.6654052734375, 0.850830078125, 1.0362548828125, 1.2216796875, 1.4071044921875, 1.592529296875, 1.7779541015625, 1.96337890625, 2.1488037109375, 2.334228515625, 2.5196533203125, 2.705078125, 2.8905029296875, 3.075927734375, 3.2613525390625, 3.44677734375, 3.6322021484375, 3.817626953125, 4.0030517578125, 4.1884765625, 4.3739013671875, 4.559326171875, 4.7447509765625, 4.93017578125, 5.1156005859375, 5.301025390625, 5.4864501953125, 5.671875]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 9.0, 8.0, 9.0, 6.0, 5.0, 11.0, 11.0, 21.0, 21.0, 17.0, 20.0, 21.0, 34.0, 32.0, 35.0, 36.0, 37.0, 41.0, 42.0, 46.0, 45.0, 37.0, 54.0, 40.0, 36.0, 31.0, 29.0, 27.0, 28.0, 27.0, 33.0, 27.0, 21.0, 19.0, 13.0, 10.0, 19.0, 9.0, 6.0, 7.0, 3.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.51953125, -2.440093994140625, -2.36065673828125, -2.281219482421875, -2.2017822265625, -2.122344970703125, -2.04290771484375, -1.963470458984375, -1.884033203125, -1.804595947265625, -1.72515869140625, -1.645721435546875, -1.5662841796875, -1.486846923828125, -1.40740966796875, -1.327972412109375, -1.24853515625, -1.169097900390625, -1.08966064453125, -1.010223388671875, -0.9307861328125, -0.851348876953125, -0.77191162109375, -0.692474365234375, -0.613037109375, -0.533599853515625, -0.45416259765625, -0.374725341796875, -0.2952880859375, -0.215850830078125, -0.13641357421875, -0.056976318359375, 0.0224609375, 0.101898193359375, 0.18133544921875, 0.260772705078125, 0.3402099609375, 0.419647216796875, 0.49908447265625, 0.578521728515625, 0.657958984375, 0.737396240234375, 0.81683349609375, 0.896270751953125, 0.9757080078125, 1.055145263671875, 1.13458251953125, 1.214019775390625, 1.29345703125, 1.372894287109375, 1.45233154296875, 1.531768798828125, 1.6112060546875, 1.690643310546875, 1.77008056640625, 1.849517822265625, 1.928955078125, 2.008392333984375, 2.08782958984375, 2.167266845703125, 2.2467041015625, 2.326141357421875, 2.40557861328125, 2.485015869140625, 2.564453125]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 4.0, 2.0, 6.0, 10.0, 13.0, 43.0, 76.0, 164.0, 675.0, 31799.0, 4156255.0, 4616.0, 385.0, 117.0, 37.0, 29.0, 15.0, 8.0, 12.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.34375, -46.63720703125, -44.9306640625, -43.22412109375, -41.517578125, -39.81103515625, -38.1044921875, -36.39794921875, -34.69140625, -32.98486328125, -31.2783203125, -29.57177734375, -27.865234375, -26.15869140625, -24.4521484375, -22.74560546875, -21.0390625, -19.33251953125, -17.6259765625, -15.91943359375, -14.212890625, -12.50634765625, -10.7998046875, -9.09326171875, -7.38671875, -5.68017578125, -3.9736328125, -2.26708984375, -0.560546875, 1.14599609375, 2.8525390625, 4.55908203125, 6.265625, 7.97216796875, 9.6787109375, 11.38525390625, 13.091796875, 14.79833984375, 16.5048828125, 18.21142578125, 19.91796875, 21.62451171875, 23.3310546875, 25.03759765625, 26.744140625, 28.45068359375, 30.1572265625, 31.86376953125, 33.5703125, 35.27685546875, 36.9833984375, 38.68994140625, 40.396484375, 42.10302734375, 43.8095703125, 45.51611328125, 47.22265625, 48.92919921875, 50.6357421875, 52.34228515625, 54.048828125, 55.75537109375, 57.4619140625, 59.16845703125, 60.875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 6.0, 12.0, 3.0, 11.0, 22.0, 50.0, 87.0, 151.0, 390.0, 1804.0, 1066.0, 225.0, 105.0, 49.0, 43.0, 22.0, 10.0, 11.0, 9.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.99609375, -2.898834228515625, -2.80157470703125, -2.704315185546875, -2.6070556640625, -2.509796142578125, -2.41253662109375, -2.315277099609375, -2.218017578125, -2.120758056640625, -2.02349853515625, -1.926239013671875, -1.8289794921875, -1.731719970703125, -1.63446044921875, -1.537200927734375, -1.43994140625, -1.342681884765625, -1.24542236328125, -1.148162841796875, -1.0509033203125, -0.953643798828125, -0.85638427734375, -0.759124755859375, -0.661865234375, -0.564605712890625, -0.46734619140625, -0.370086669921875, -0.2728271484375, -0.175567626953125, -0.07830810546875, 0.018951416015625, 0.1162109375, 0.213470458984375, 0.31072998046875, 0.407989501953125, 0.5052490234375, 0.602508544921875, 0.69976806640625, 0.797027587890625, 0.894287109375, 0.991546630859375, 1.08880615234375, 1.186065673828125, 1.2833251953125, 1.380584716796875, 1.47784423828125, 1.575103759765625, 1.67236328125, 1.769622802734375, 1.86688232421875, 1.964141845703125, 2.0614013671875, 2.158660888671875, 2.25592041015625, 2.353179931640625, 2.450439453125, 2.547698974609375, 2.64495849609375, 2.742218017578125, 2.8394775390625, 2.936737060546875, 3.03399658203125, 3.131256103515625, 3.228515625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 6.0, 12.0, 24.0, 37.0, 73.0, 88.0, 112.0, 142.0, 137.0, 130.0, 86.0, 60.0, 46.0, 12.0, 18.0, 13.0, 7.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.436715841293335, -2.235708475112915, -2.034701108932495, -1.8336936235427856, -1.6326862573623657, -1.4316788911819458, -1.2306714057922363, -1.0296640396118164, -0.8286566734313965, -0.6276493072509766, -0.42664188146591187, -0.22563445568084717, -0.024627089500427246, 0.17638027667999268, 0.37738776206970215, 0.5783951282501221, 0.779402494430542, 0.9804098606109619, 1.1814172267913818, 1.3824247121810913, 1.5834320783615112, 1.7844394445419312, 1.9854469299316406, 2.1864542961120605, 2.3874616622924805, 2.5884690284729004, 2.7894763946533203, 2.9904837608337402, 3.19149112701416, 3.39249849319458, 3.593506097793579, 3.794513463973999, 3.99552059173584, 4.19652795791626, 4.39753532409668, 4.5985426902771, 4.7995500564575195, 5.0005574226379395, 5.201564788818359, 5.4025726318359375, 5.603579521179199, 5.804586887359619, 6.005594253540039, 6.206601619720459, 6.407608985900879, 6.608616352081299, 6.809623718261719, 7.010631561279297, 7.211638927459717, 7.412646293640137, 7.613653659820557, 7.814661026000977, 8.015668869018555, 8.216675758361816, 8.417683601379395, 8.618690490722656, 8.819698333740234, 9.020706176757812, 9.221713066101074, 9.422720909118652, 9.623727798461914, 9.824735641479492, 10.025742530822754, 10.226750373840332, 10.427757263183594]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 5.0, 3.0, 1.0, 5.0, 6.0, 4.0, 6.0, 7.0, 12.0, 11.0, 16.0, 14.0, 19.0, 17.0, 18.0, 22.0, 25.0, 26.0, 29.0, 27.0, 33.0, 35.0, 31.0, 34.0, 44.0, 46.0, 33.0, 35.0, 50.0, 26.0, 47.0, 32.0, 37.0, 19.0, 16.0, 26.0, 19.0, 20.0, 27.0, 24.0, 18.0, 12.0, 12.0, 15.0, 8.0, 10.0, 5.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.566723108291626, -2.489471673965454, -2.4122202396392822, -2.3349688053131104, -2.2577173709869385, -2.1804659366607666, -2.1032145023345947, -2.025963306427002, -1.9487117528915405, -1.8714603185653687, -1.7942088842391968, -1.716957449913025, -1.6397061347961426, -1.5624547004699707, -1.4852032661437988, -1.407951831817627, -1.330700397491455, -1.2534489631652832, -1.1761975288391113, -1.0989460945129395, -1.0216946601867676, -0.9444432854652405, -0.8671919107437134, -0.7899404764175415, -0.7126890420913696, -0.6354376077651978, -0.5581861734390259, -0.4809347987174988, -0.4036833643913269, -0.32643193006515503, -0.24918052554130554, -0.17192912101745605, -0.09467744827270508, -0.017426028847694397, 0.059825390577316284, 0.13707681000232697, 0.21432822942733765, 0.2915796637535095, 0.368831068277359, 0.4460824728012085, 0.5233339071273804, 0.6005853414535522, 0.6778367757797241, 0.7550881505012512, 0.8323395848274231, 0.909591019153595, 0.9868423938751221, 1.064093828201294, 1.1413452625274658, 1.2185966968536377, 1.2958481311798096, 1.3730995655059814, 1.4503509998321533, 1.5276024341583252, 1.6048537492752075, 1.6821051836013794, 1.7593566179275513, 1.8366080522537231, 1.913859486579895, 1.991110920906067, 2.068362236022949, 2.145613670349121, 2.222865104675293, 2.300116539001465, 2.3773679733276367]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 9.0, 19.0, 21.0, 23.0, 47.0, 65.0, 97.0, 129.0, 179.0, 310.0, 353.0, 516.0, 732.0, 1031.0, 1510.0, 2144.0, 3088.0, 4396.0, 6522.0, 9867.0, 15531.0, 25143.0, 42113.0, 72815.0, 127249.0, 209550.0, 208945.0, 128018.0, 73444.0, 42599.0, 25374.0, 15457.0, 10148.0, 6611.0, 4422.0, 3029.0, 2064.0, 1488.0, 1028.0, 742.0, 500.0, 364.0, 249.0, 180.0, 133.0, 100.0, 73.0, 36.0, 33.0, 17.0, 15.0, 7.0, 5.0, 6.0, 7.0, 4.0, 2.0], "bins": [-4.75390625, -4.60986328125, -4.4658203125, -4.32177734375, -4.177734375, -4.03369140625, -3.8896484375, -3.74560546875, -3.6015625, -3.45751953125, -3.3134765625, -3.16943359375, -3.025390625, -2.88134765625, -2.7373046875, -2.59326171875, -2.44921875, -2.30517578125, -2.1611328125, -2.01708984375, -1.873046875, -1.72900390625, -1.5849609375, -1.44091796875, -1.296875, -1.15283203125, -1.0087890625, -0.86474609375, -0.720703125, -0.57666015625, -0.4326171875, -0.28857421875, -0.14453125, -0.00048828125, 0.1435546875, 0.28759765625, 0.431640625, 0.57568359375, 0.7197265625, 0.86376953125, 1.0078125, 1.15185546875, 1.2958984375, 1.43994140625, 1.583984375, 1.72802734375, 1.8720703125, 2.01611328125, 2.16015625, 2.30419921875, 2.4482421875, 2.59228515625, 2.736328125, 2.88037109375, 3.0244140625, 3.16845703125, 3.3125, 3.45654296875, 3.6005859375, 3.74462890625, 3.888671875, 4.03271484375, 4.1767578125, 4.32080078125, 4.46484375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 7.0, 8.0, 6.0, 12.0, 11.0, 15.0, 18.0, 17.0, 18.0, 23.0, 20.0, 27.0, 33.0, 30.0, 27.0, 37.0, 24.0, 45.0, 54.0, 43.0, 51.0, 32.0, 38.0, 41.0, 24.0, 37.0, 31.0, 26.0, 28.0, 20.0, 27.0, 26.0, 20.0, 21.0, 13.0, 17.0, 12.0, 7.0, 6.0, 6.0, 11.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-2.302734375, -2.235443115234375, -2.16815185546875, -2.100860595703125, -2.0335693359375, -1.966278076171875, -1.89898681640625, -1.831695556640625, -1.764404296875, -1.697113037109375, -1.62982177734375, -1.562530517578125, -1.4952392578125, -1.427947998046875, -1.36065673828125, -1.293365478515625, -1.22607421875, -1.158782958984375, -1.09149169921875, -1.024200439453125, -0.9569091796875, -0.889617919921875, -0.82232666015625, -0.755035400390625, -0.687744140625, -0.620452880859375, -0.55316162109375, -0.485870361328125, -0.4185791015625, -0.351287841796875, -0.28399658203125, -0.216705322265625, -0.1494140625, -0.082122802734375, -0.01483154296875, 0.052459716796875, 0.1197509765625, 0.187042236328125, 0.25433349609375, 0.321624755859375, 0.388916015625, 0.456207275390625, 0.52349853515625, 0.590789794921875, 0.6580810546875, 0.725372314453125, 0.79266357421875, 0.859954833984375, 0.92724609375, 0.994537353515625, 1.06182861328125, 1.129119873046875, 1.1964111328125, 1.263702392578125, 1.33099365234375, 1.398284912109375, 1.465576171875, 1.532867431640625, 1.60015869140625, 1.667449951171875, 1.7347412109375, 1.802032470703125, 1.86932373046875, 1.936614990234375, 2.00390625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 3.0, 3.0, 4.0, 9.0, 13.0, 10.0, 20.0, 27.0, 41.0, 47.0, 39.0, 71.0, 113.0, 146.0, 222.0, 318.0, 523.0, 971.0, 1911.0, 4490.0, 13437.0, 61959.0, 735199.0, 188251.0, 27081.0, 7322.0, 2846.0, 1414.0, 664.0, 428.0, 302.0, 202.0, 103.0, 83.0, 68.0, 55.0, 25.0, 31.0, 20.0, 31.0, 16.0, 8.0, 5.0, 8.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.3671875, -12.9461669921875, -12.525146484375, -12.1041259765625, -11.68310546875, -11.2620849609375, -10.841064453125, -10.4200439453125, -9.9990234375, -9.5780029296875, -9.156982421875, -8.7359619140625, -8.31494140625, -7.8939208984375, -7.472900390625, -7.0518798828125, -6.630859375, -6.2098388671875, -5.788818359375, -5.3677978515625, -4.94677734375, -4.5257568359375, -4.104736328125, -3.6837158203125, -3.2626953125, -2.8416748046875, -2.420654296875, -1.9996337890625, -1.57861328125, -1.1575927734375, -0.736572265625, -0.3155517578125, 0.10546875, 0.5264892578125, 0.947509765625, 1.3685302734375, 1.78955078125, 2.2105712890625, 2.631591796875, 3.0526123046875, 3.4736328125, 3.8946533203125, 4.315673828125, 4.7366943359375, 5.15771484375, 5.5787353515625, 5.999755859375, 6.4207763671875, 6.841796875, 7.2628173828125, 7.683837890625, 8.1048583984375, 8.52587890625, 8.9468994140625, 9.367919921875, 9.7889404296875, 10.2099609375, 10.6309814453125, 11.052001953125, 11.4730224609375, 11.89404296875, 12.3150634765625, 12.736083984375, 13.1571044921875, 13.578125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 4.0, 10.0, 11.0, 9.0, 15.0, 17.0, 27.0, 16.0, 27.0, 17.0, 42.0, 33.0, 42.0, 46.0, 46.0, 43.0, 54.0, 41.0, 34.0, 47.0, 48.0, 49.0, 43.0, 40.0, 32.0, 27.0, 23.0, 25.0, 20.0, 23.0, 16.0, 18.0, 12.0, 12.0, 9.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6298828125, -1.574249267578125, -1.51861572265625, -1.462982177734375, -1.4073486328125, -1.351715087890625, -1.29608154296875, -1.240447998046875, -1.184814453125, -1.129180908203125, -1.07354736328125, -1.017913818359375, -0.9622802734375, -0.906646728515625, -0.85101318359375, -0.795379638671875, -0.73974609375, -0.684112548828125, -0.62847900390625, -0.572845458984375, -0.5172119140625, -0.461578369140625, -0.40594482421875, -0.350311279296875, -0.294677734375, -0.239044189453125, -0.18341064453125, -0.127777099609375, -0.0721435546875, -0.016510009765625, 0.03912353515625, 0.094757080078125, 0.150390625, 0.206024169921875, 0.26165771484375, 0.317291259765625, 0.3729248046875, 0.428558349609375, 0.48419189453125, 0.539825439453125, 0.595458984375, 0.651092529296875, 0.70672607421875, 0.762359619140625, 0.8179931640625, 0.873626708984375, 0.92926025390625, 0.984893798828125, 1.04052734375, 1.096160888671875, 1.15179443359375, 1.207427978515625, 1.2630615234375, 1.318695068359375, 1.37432861328125, 1.429962158203125, 1.485595703125, 1.541229248046875, 1.59686279296875, 1.652496337890625, 1.7081298828125, 1.763763427734375, 1.81939697265625, 1.875030517578125, 1.9306640625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 4.0, 3.0, 4.0, 7.0, 10.0, 10.0, 22.0, 17.0, 27.0, 39.0, 51.0, 97.0, 106.0, 148.0, 261.0, 404.0, 577.0, 1022.0, 2010.0, 4319.0, 10871.0, 36542.0, 333255.0, 592988.0, 43213.0, 12487.0, 4769.0, 2209.0, 1174.0, 671.0, 403.0, 235.0, 149.0, 109.0, 78.0, 76.0, 52.0, 42.0, 22.0, 24.0, 17.0, 8.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.71875, -11.328857421875, -10.93896484375, -10.549072265625, -10.1591796875, -9.769287109375, -9.37939453125, -8.989501953125, -8.599609375, -8.209716796875, -7.81982421875, -7.429931640625, -7.0400390625, -6.650146484375, -6.26025390625, -5.870361328125, -5.48046875, -5.090576171875, -4.70068359375, -4.310791015625, -3.9208984375, -3.531005859375, -3.14111328125, -2.751220703125, -2.361328125, -1.971435546875, -1.58154296875, -1.191650390625, -0.8017578125, -0.411865234375, -0.02197265625, 0.367919921875, 0.7578125, 1.147705078125, 1.53759765625, 1.927490234375, 2.3173828125, 2.707275390625, 3.09716796875, 3.487060546875, 3.876953125, 4.266845703125, 4.65673828125, 5.046630859375, 5.4365234375, 5.826416015625, 6.21630859375, 6.606201171875, 6.99609375, 7.385986328125, 7.77587890625, 8.165771484375, 8.5556640625, 8.945556640625, 9.33544921875, 9.725341796875, 10.115234375, 10.505126953125, 10.89501953125, 11.284912109375, 11.6748046875, 12.064697265625, 12.45458984375, 12.844482421875, 13.234375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 3.0, 6.0, 5.0, 8.0, 6.0, 17.0, 16.0, 24.0, 36.0, 54.0, 97.0, 120.0, 162.0, 130.0, 84.0, 71.0, 42.0, 24.0, 22.0, 12.0, 13.0, 6.0, 7.0, 6.0, 4.0, 5.0, 1.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00046539306640625, -0.00044793635606765747, -0.00043047964572906494, -0.0004130229353904724, -0.0003955662250518799, -0.00037810951471328735, -0.0003606528043746948, -0.0003431960940361023, -0.00032573938369750977, -0.00030828267335891724, -0.0002908259630203247, -0.0002733692526817322, -0.00025591254234313965, -0.00023845583200454712, -0.0002209991216659546, -0.00020354241132736206, -0.00018608570098876953, -0.000168628990650177, -0.00015117228031158447, -0.00013371556997299194, -0.00011625885963439941, -9.880214929580688e-05, -8.134543895721436e-05, -6.388872861862183e-05, -4.64320182800293e-05, -2.8975307941436768e-05, -1.1518597602844238e-05, 5.938112735748291e-06, 2.339482307434082e-05, 4.085153341293335e-05, 5.830824375152588e-05, 7.576495409011841e-05, 9.322166442871094e-05, 0.00011067837476730347, 0.000128135085105896, 0.00014559179544448853, 0.00016304850578308105, 0.00018050521612167358, 0.0001979619264602661, 0.00021541863679885864, 0.00023287534713745117, 0.0002503320574760437, 0.00026778876781463623, 0.00028524547815322876, 0.0003027021884918213, 0.0003201588988304138, 0.00033761560916900635, 0.0003550723195075989, 0.0003725290298461914, 0.00038998574018478394, 0.00040744245052337646, 0.000424899160861969, 0.0004423558712005615, 0.00045981258153915405, 0.0004772692918777466, 0.0004947260022163391, 0.0005121827125549316, 0.0005296394228935242, 0.0005470961332321167, 0.0005645528435707092, 0.0005820095539093018, 0.0005994662642478943, 0.0006169229745864868, 0.0006343796849250793, 0.0006518363952636719]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 3.0, 6.0, 3.0, 10.0, 17.0, 13.0, 24.0, 34.0, 60.0, 293.0, 23370.0, 1021437.0, 2990.0, 122.0, 39.0, 38.0, 22.0, 11.0, 10.0, 6.0, 6.0, 7.0, 8.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-62.0, -60.33837890625, -58.6767578125, -57.01513671875, -55.353515625, -53.69189453125, -52.0302734375, -50.36865234375, -48.70703125, -47.04541015625, -45.3837890625, -43.72216796875, -42.060546875, -40.39892578125, -38.7373046875, -37.07568359375, -35.4140625, -33.75244140625, -32.0908203125, -30.42919921875, -28.767578125, -27.10595703125, -25.4443359375, -23.78271484375, -22.12109375, -20.45947265625, -18.7978515625, -17.13623046875, -15.474609375, -13.81298828125, -12.1513671875, -10.48974609375, -8.828125, -7.16650390625, -5.5048828125, -3.84326171875, -2.181640625, -0.52001953125, 1.1416015625, 2.80322265625, 4.46484375, 6.12646484375, 7.7880859375, 9.44970703125, 11.111328125, 12.77294921875, 14.4345703125, 16.09619140625, 17.7578125, 19.41943359375, 21.0810546875, 22.74267578125, 24.404296875, 26.06591796875, 27.7275390625, 29.38916015625, 31.05078125, 32.71240234375, 34.3740234375, 36.03564453125, 37.697265625, 39.35888671875, 41.0205078125, 42.68212890625, 44.34375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 6.0, 4.0, 6.0, 20.0, 20.0, 26.0, 34.0, 59.0, 103.0, 153.0, 187.0, 138.0, 76.0, 44.0, 41.0, 15.0, 17.0, 8.0, 9.0, 5.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.71875, -2.6476898193359375, -2.576629638671875, -2.5055694580078125, -2.43450927734375, -2.3634490966796875, -2.292388916015625, -2.2213287353515625, -2.1502685546875, -2.0792083740234375, -2.008148193359375, -1.9370880126953125, -1.86602783203125, -1.7949676513671875, -1.723907470703125, -1.6528472900390625, -1.581787109375, -1.5107269287109375, -1.439666748046875, -1.3686065673828125, -1.29754638671875, -1.2264862060546875, -1.155426025390625, -1.0843658447265625, -1.0133056640625, -0.9422454833984375, -0.871185302734375, -0.8001251220703125, -0.72906494140625, -0.6580047607421875, -0.586944580078125, -0.5158843994140625, -0.44482421875, -0.3737640380859375, -0.302703857421875, -0.2316436767578125, -0.16058349609375, -0.0895233154296875, -0.018463134765625, 0.0525970458984375, 0.1236572265625, 0.1947174072265625, 0.265777587890625, 0.3368377685546875, 0.40789794921875, 0.4789581298828125, 0.550018310546875, 0.6210784912109375, 0.692138671875, 0.7631988525390625, 0.834259033203125, 0.9053192138671875, 0.97637939453125, 1.0474395751953125, 1.118499755859375, 1.1895599365234375, 1.2606201171875, 1.3316802978515625, 1.402740478515625, 1.4738006591796875, 1.54486083984375, 1.6159210205078125, 1.686981201171875, 1.7580413818359375, 1.8291015625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 7.0, 10.0, 17.0, 16.0, 24.0, 19.0, 33.0, 31.0, 41.0, 34.0, 58.0, 48.0, 61.0, 47.0, 62.0, 59.0, 52.0, 50.0, 51.0, 51.0, 35.0, 33.0, 33.0, 21.0, 11.0, 28.0, 10.0, 8.0, 6.0, 3.0, 8.0, 3.0, 4.0, 2.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.616600751876831, -2.5319411754608154, -2.447281837463379, -2.3626222610473633, -2.2779626846313477, -2.193303108215332, -2.1086437702178955, -2.02398419380188, -1.9393247365951538, -1.8546652793884277, -1.770005702972412, -1.685346245765686, -1.60068678855896, -1.5160272121429443, -1.4313677549362183, -1.3467082977294922, -1.2620487213134766, -1.1773892641067505, -1.0927296876907349, -1.0080702304840088, -0.9234107136726379, -0.8387511968612671, -0.754091739654541, -0.6694322228431702, -0.5847727060317993, -0.5001131892204285, -0.41545370221138, -0.33079421520233154, -0.2461346983909607, -0.16147518157958984, -0.07681572437286377, 0.00784379243850708, 0.09250354766845703, 0.1771630495786667, 0.26182255148887634, 0.3464820384979248, 0.43114155530929565, 0.5158010721206665, 0.6004605293273926, 0.6851200461387634, 0.7697795629501343, 0.8544390797615051, 0.939098596572876, 1.023758053779602, 1.1084175109863281, 1.1930770874023438, 1.2777365446090698, 1.362396001815796, 1.4470555782318115, 1.5317150354385376, 1.6163746118545532, 1.7010340690612793, 1.785693645477295, 1.870353102684021, 1.955012559890747, 2.0396721363067627, 2.124331474304199, 2.208991050720215, 2.2936503887176514, 2.378309965133667, 2.4629695415496826, 2.547628879547119, 2.6322884559631348, 2.7169480323791504, 2.801607608795166]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 13.0, 5.0, 8.0, 11.0, 10.0, 9.0, 14.0, 17.0, 23.0, 23.0, 42.0, 21.0, 34.0, 27.0, 36.0, 42.0, 42.0, 42.0, 31.0, 28.0, 41.0, 52.0, 29.0, 40.0, 38.0, 27.0, 36.0, 40.0, 32.0, 16.0, 35.0, 19.0, 16.0, 19.0, 16.0, 11.0, 10.0, 13.0, 11.0, 9.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.6463916301727295, -2.5615241527557373, -2.476656675338745, -2.391789197921753, -2.3069217205047607, -2.2220542430877686, -2.1371870040893555, -2.0523195266723633, -1.9674519300460815, -1.8825844526290894, -1.7977169752120972, -1.7128496170043945, -1.6279821395874023, -1.5431146621704102, -1.458247184753418, -1.3733797073364258, -1.2885122299194336, -1.2036447525024414, -1.1187772750854492, -1.033909797668457, -0.9490423798561096, -0.8641749024391174, -0.77930748462677, -0.6944400072097778, -0.6095725297927856, -0.5247050523757935, -0.43983760476112366, -0.35497015714645386, -0.27010267972946167, -0.18523520231246948, -0.10036778450012207, -0.015500307083129883, 0.0693674087524414, 0.1542348712682724, 0.2391023337841034, 0.3239697813987732, 0.4088372588157654, 0.49370473623275757, 0.578572154045105, 0.6634396314620972, 0.7483071088790894, 0.8331745862960815, 0.9180420637130737, 1.0029094219207764, 1.0877768993377686, 1.1726443767547607, 1.257511854171753, 1.3423793315887451, 1.4272468090057373, 1.5121142864227295, 1.5969817638397217, 1.6818492412567139, 1.766716718673706, 1.8515841960906982, 1.9364515542984009, 2.0213189125061035, 2.1061863899230957, 2.191053867340088, 2.27592134475708, 2.3607888221740723, 2.4456562995910645, 2.5305237770080566, 2.615391254425049, 2.700258731842041, 2.785126209259033]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 5.0, 10.0, 13.0, 21.0, 31.0, 35.0, 77.0, 102.0, 111.0, 185.0, 311.0, 472.0, 849.0, 1387.0, 2670.0, 5105.0, 9740.0, 19010.0, 36189.0, 67107.0, 115658.0, 170718.0, 197443.0, 167995.0, 112855.0, 65829.0, 35460.0, 18585.0, 9451.0, 4943.0, 2585.0, 1459.0, 795.0, 481.0, 285.0, 187.0, 128.0, 77.0, 54.0, 47.0, 22.0, 17.0, 19.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.599609375, -3.485260009765625, -3.37091064453125, -3.256561279296875, -3.1422119140625, -3.027862548828125, -2.91351318359375, -2.799163818359375, -2.684814453125, -2.570465087890625, -2.45611572265625, -2.341766357421875, -2.2274169921875, -2.113067626953125, -1.99871826171875, -1.884368896484375, -1.77001953125, -1.655670166015625, -1.54132080078125, -1.426971435546875, -1.3126220703125, -1.198272705078125, -1.08392333984375, -0.969573974609375, -0.855224609375, -0.740875244140625, -0.62652587890625, -0.512176513671875, -0.3978271484375, -0.283477783203125, -0.16912841796875, -0.054779052734375, 0.0595703125, 0.173919677734375, 0.28826904296875, 0.402618408203125, 0.5169677734375, 0.631317138671875, 0.74566650390625, 0.860015869140625, 0.974365234375, 1.088714599609375, 1.20306396484375, 1.317413330078125, 1.4317626953125, 1.546112060546875, 1.66046142578125, 1.774810791015625, 1.88916015625, 2.003509521484375, 2.11785888671875, 2.232208251953125, 2.3465576171875, 2.460906982421875, 2.57525634765625, 2.689605712890625, 2.803955078125, 2.918304443359375, 3.03265380859375, 3.147003173828125, 3.2613525390625, 3.375701904296875, 3.49005126953125, 3.604400634765625, 3.71875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 8.0, 8.0, 13.0, 14.0, 11.0, 16.0, 21.0, 20.0, 27.0, 25.0, 36.0, 33.0, 28.0, 32.0, 38.0, 41.0, 33.0, 40.0, 46.0, 40.0, 43.0, 42.0, 34.0, 42.0, 40.0, 34.0, 36.0, 16.0, 17.0, 27.0, 23.0, 20.0, 21.0, 12.0, 11.0, 10.0, 5.0, 10.0, 7.0, 4.0, 2.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.84375, -1.7862091064453125, -1.728668212890625, -1.6711273193359375, -1.61358642578125, -1.5560455322265625, -1.498504638671875, -1.4409637451171875, -1.3834228515625, -1.3258819580078125, -1.268341064453125, -1.2108001708984375, -1.15325927734375, -1.0957183837890625, -1.038177490234375, -0.9806365966796875, -0.923095703125, -0.8655548095703125, -0.808013916015625, -0.7504730224609375, -0.69293212890625, -0.6353912353515625, -0.577850341796875, -0.5203094482421875, -0.4627685546875, -0.4052276611328125, -0.347686767578125, -0.2901458740234375, -0.23260498046875, -0.1750640869140625, -0.117523193359375, -0.0599822998046875, -0.00244140625, 0.0550994873046875, 0.112640380859375, 0.1701812744140625, 0.22772216796875, 0.2852630615234375, 0.342803955078125, 0.4003448486328125, 0.4578857421875, 0.5154266357421875, 0.572967529296875, 0.6305084228515625, 0.68804931640625, 0.7455902099609375, 0.803131103515625, 0.8606719970703125, 0.918212890625, 0.9757537841796875, 1.033294677734375, 1.0908355712890625, 1.14837646484375, 1.2059173583984375, 1.263458251953125, 1.3209991455078125, 1.3785400390625, 1.4360809326171875, 1.493621826171875, 1.5511627197265625, 1.60870361328125, 1.6662445068359375, 1.723785400390625, 1.7813262939453125, 1.8388671875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 9.0, 6.0, 16.0, 10.0, 15.0, 18.0, 16.0, 16.0, 28.0, 23.0, 35.0, 31.0, 32.0, 33.0, 26.0, 29.0, 46.0, 463.0, 25209.0, 936074.0, 84998.0, 990.0, 62.0, 36.0, 26.0, 36.0, 30.0, 20.0, 30.0, 25.0, 26.0, 17.0, 19.0, 13.0, 14.0, 15.0, 7.0, 7.0, 7.0, 11.0, 6.0, 2.0, 4.0, 4.0, 1.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-32.28125, -31.26025390625, -30.2392578125, -29.21826171875, -28.197265625, -27.17626953125, -26.1552734375, -25.13427734375, -24.11328125, -23.09228515625, -22.0712890625, -21.05029296875, -20.029296875, -19.00830078125, -17.9873046875, -16.96630859375, -15.9453125, -14.92431640625, -13.9033203125, -12.88232421875, -11.861328125, -10.84033203125, -9.8193359375, -8.79833984375, -7.77734375, -6.75634765625, -5.7353515625, -4.71435546875, -3.693359375, -2.67236328125, -1.6513671875, -0.63037109375, 0.390625, 1.41162109375, 2.4326171875, 3.45361328125, 4.474609375, 5.49560546875, 6.5166015625, 7.53759765625, 8.55859375, 9.57958984375, 10.6005859375, 11.62158203125, 12.642578125, 13.66357421875, 14.6845703125, 15.70556640625, 16.7265625, 17.74755859375, 18.7685546875, 19.78955078125, 20.810546875, 21.83154296875, 22.8525390625, 23.87353515625, 24.89453125, 25.91552734375, 26.9365234375, 27.95751953125, 28.978515625, 29.99951171875, 31.0205078125, 32.04150390625, 33.0625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 6.0, 6.0, 10.0, 15.0, 19.0, 8.0, 19.0, 27.0, 24.0, 15.0, 33.0, 34.0, 28.0, 30.0, 38.0, 26.0, 29.0, 42.0, 45.0, 36.0, 43.0, 45.0, 38.0, 39.0, 42.0, 24.0, 31.0, 32.0, 24.0, 26.0, 27.0, 19.0, 17.0, 9.0, 16.0, 14.0, 12.0, 8.0, 8.0, 6.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.283203125, -2.211578369140625, -2.13995361328125, -2.068328857421875, -1.9967041015625, -1.925079345703125, -1.85345458984375, -1.781829833984375, -1.710205078125, -1.638580322265625, -1.56695556640625, -1.495330810546875, -1.4237060546875, -1.352081298828125, -1.28045654296875, -1.208831787109375, -1.13720703125, -1.065582275390625, -0.99395751953125, -0.922332763671875, -0.8507080078125, -0.779083251953125, -0.70745849609375, -0.635833740234375, -0.564208984375, -0.492584228515625, -0.42095947265625, -0.349334716796875, -0.2777099609375, -0.206085205078125, -0.13446044921875, -0.062835693359375, 0.0087890625, 0.080413818359375, 0.15203857421875, 0.223663330078125, 0.2952880859375, 0.366912841796875, 0.43853759765625, 0.510162353515625, 0.581787109375, 0.653411865234375, 0.72503662109375, 0.796661376953125, 0.8682861328125, 0.939910888671875, 1.01153564453125, 1.083160400390625, 1.15478515625, 1.226409912109375, 1.29803466796875, 1.369659423828125, 1.4412841796875, 1.512908935546875, 1.58453369140625, 1.656158447265625, 1.727783203125, 1.799407958984375, 1.87103271484375, 1.942657470703125, 2.0142822265625, 2.085906982421875, 2.15753173828125, 2.229156494140625, 2.30078125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 14.0, 9.0, 31.0, 38.0, 57.0, 90.0, 122.0, 157.0, 247.0, 502.0, 985.0, 2292.0, 6375.0, 20414.0, 86584.0, 728846.0, 155917.0, 30817.0, 9154.0, 3174.0, 1218.0, 595.0, 333.0, 183.0, 128.0, 90.0, 61.0, 36.0, 32.0, 20.0, 15.0, 6.0, 8.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.59375, -8.35931396484375, -8.1248779296875, -7.89044189453125, -7.656005859375, -7.42156982421875, -7.1871337890625, -6.95269775390625, -6.71826171875, -6.48382568359375, -6.2493896484375, -6.01495361328125, -5.780517578125, -5.54608154296875, -5.3116455078125, -5.07720947265625, -4.8427734375, -4.60833740234375, -4.3739013671875, -4.13946533203125, -3.905029296875, -3.67059326171875, -3.4361572265625, -3.20172119140625, -2.96728515625, -2.73284912109375, -2.4984130859375, -2.26397705078125, -2.029541015625, -1.79510498046875, -1.5606689453125, -1.32623291015625, -1.091796875, -0.85736083984375, -0.6229248046875, -0.38848876953125, -0.154052734375, 0.08038330078125, 0.3148193359375, 0.54925537109375, 0.78369140625, 1.01812744140625, 1.2525634765625, 1.48699951171875, 1.721435546875, 1.95587158203125, 2.1903076171875, 2.42474365234375, 2.6591796875, 2.89361572265625, 3.1280517578125, 3.36248779296875, 3.596923828125, 3.83135986328125, 4.0657958984375, 4.30023193359375, 4.53466796875, 4.76910400390625, 5.0035400390625, 5.23797607421875, 5.472412109375, 5.70684814453125, 5.9412841796875, 6.17572021484375, 6.41015625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 5.0, 12.0, 15.0, 15.0, 17.0, 25.0, 49.0, 60.0, 95.0, 174.0, 192.0, 108.0, 70.0, 50.0, 25.0, 18.0, 24.0, 8.0, 13.0, 6.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00034689903259277344, -0.00033119693398475647, -0.0003154948353767395, -0.00029979273676872253, -0.00028409063816070557, -0.0002683885395526886, -0.00025268644094467163, -0.00023698434233665466, -0.0002212822437286377, -0.00020558014512062073, -0.00018987804651260376, -0.0001741759479045868, -0.00015847384929656982, -0.00014277175068855286, -0.0001270696520805359, -0.00011136755347251892, -9.566545486450195e-05, -7.996335625648499e-05, -6.426125764846802e-05, -4.855915904045105e-05, -3.285706043243408e-05, -1.7154961824417114e-05, -1.4528632164001465e-06, 1.4249235391616821e-05, 2.995133399963379e-05, 4.565343260765076e-05, 6.135553121566772e-05, 7.705762982368469e-05, 9.275972843170166e-05, 0.00010846182703971863, 0.0001241639256477356, 0.00013986602425575256, 0.00015556812286376953, 0.0001712702214717865, 0.00018697232007980347, 0.00020267441868782043, 0.0002183765172958374, 0.00023407861590385437, 0.00024978071451187134, 0.0002654828131198883, 0.0002811849117279053, 0.00029688701033592224, 0.0003125891089439392, 0.0003282912075519562, 0.00034399330615997314, 0.0003596954047679901, 0.0003753975033760071, 0.00039109960198402405, 0.000406801700592041, 0.000422503799200058, 0.00043820589780807495, 0.0004539079964160919, 0.0004696100950241089, 0.00048531219363212585, 0.0005010142922401428, 0.0005167163908481598, 0.0005324184894561768, 0.0005481205880641937, 0.0005638226866722107, 0.0005795247852802277, 0.0005952268838882446, 0.0006109289824962616, 0.0006266310811042786, 0.0006423331797122955, 0.0006580352783203125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 2.0, 6.0, 7.0, 6.0, 14.0, 12.0, 16.0, 26.0, 22.0, 30.0, 45.0, 156.0, 1670.0, 865828.0, 179374.0, 1045.0, 99.0, 46.0, 35.0, 33.0, 17.0, 17.0, 11.0, 10.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.0625, -32.8427734375, -31.623046875, -30.4033203125, -29.18359375, -27.9638671875, -26.744140625, -25.5244140625, -24.3046875, -23.0849609375, -21.865234375, -20.6455078125, -19.42578125, -18.2060546875, -16.986328125, -15.7666015625, -14.546875, -13.3271484375, -12.107421875, -10.8876953125, -9.66796875, -8.4482421875, -7.228515625, -6.0087890625, -4.7890625, -3.5693359375, -2.349609375, -1.1298828125, 0.08984375, 1.3095703125, 2.529296875, 3.7490234375, 4.96875, 6.1884765625, 7.408203125, 8.6279296875, 9.84765625, 11.0673828125, 12.287109375, 13.5068359375, 14.7265625, 15.9462890625, 17.166015625, 18.3857421875, 19.60546875, 20.8251953125, 22.044921875, 23.2646484375, 24.484375, 25.7041015625, 26.923828125, 28.1435546875, 29.36328125, 30.5830078125, 31.802734375, 33.0224609375, 34.2421875, 35.4619140625, 36.681640625, 37.9013671875, 39.12109375, 40.3408203125, 41.560546875, 42.7802734375, 44.0]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 5.0, 4.0, 5.0, 6.0, 7.0, 10.0, 14.0, 16.0, 22.0, 24.0, 30.0, 41.0, 55.0, 67.0, 179.0, 200.0, 76.0, 45.0, 48.0, 29.0, 38.0, 16.0, 20.0, 14.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.421875, -2.335418701171875, -2.24896240234375, -2.162506103515625, -2.0760498046875, -1.989593505859375, -1.90313720703125, -1.816680908203125, -1.730224609375, -1.643768310546875, -1.55731201171875, -1.470855712890625, -1.3843994140625, -1.297943115234375, -1.21148681640625, -1.125030517578125, -1.03857421875, -0.952117919921875, -0.86566162109375, -0.779205322265625, -0.6927490234375, -0.606292724609375, -0.51983642578125, -0.433380126953125, -0.346923828125, -0.260467529296875, -0.17401123046875, -0.087554931640625, -0.0010986328125, 0.085357666015625, 0.17181396484375, 0.258270263671875, 0.3447265625, 0.431182861328125, 0.51763916015625, 0.604095458984375, 0.6905517578125, 0.777008056640625, 0.86346435546875, 0.949920654296875, 1.036376953125, 1.122833251953125, 1.20928955078125, 1.295745849609375, 1.3822021484375, 1.468658447265625, 1.55511474609375, 1.641571044921875, 1.72802734375, 1.814483642578125, 1.90093994140625, 1.987396240234375, 2.0738525390625, 2.160308837890625, 2.24676513671875, 2.333221435546875, 2.419677734375, 2.506134033203125, 2.59259033203125, 2.679046630859375, 2.7655029296875, 2.851959228515625, 2.93841552734375, 3.024871826171875, 3.111328125]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 332.0, 688.0], "bins": [-174.1782684326172, -171.41941833496094, -168.6605682373047, -165.90171813964844, -163.1428680419922, -160.38401794433594, -157.6251678466797, -154.86630249023438, -152.10745239257812, -149.34860229492188, -146.58975219726562, -143.83090209960938, -141.07205200195312, -138.31320190429688, -135.55435180664062, -132.79550170898438, -130.03665161132812, -127.27780151367188, -124.51895141601562, -121.76010131835938, -119.00125122070312, -116.24239349365234, -113.4835433959961, -110.72469329833984, -107.9658432006836, -105.20699310302734, -102.4481430053711, -99.68929290771484, -96.93043518066406, -94.17158508300781, -91.41273498535156, -88.65388488769531, -85.89502716064453, -83.13617706298828, -80.37732696533203, -77.61847686767578, -74.859619140625, -72.10076904296875, -69.3419189453125, -66.58306884765625, -63.82421875, -61.06536865234375, -58.3065185546875, -55.547664642333984, -52.788814544677734, -50.029964447021484, -47.27111053466797, -44.51226043701172, -41.75341033935547, -38.99456024169922, -36.23571014404297, -33.47685623168945, -30.718006134033203, -27.959156036376953, -25.20030403137207, -22.441452026367188, -19.682601928710938, -16.923751831054688, -14.164899826049805, -11.406048774719238, -8.647197723388672, -5.8883466720581055, -3.129495620727539, -0.37064361572265625, 2.3882064819335938]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 23.0, 25.0, 39.0, 74.0, 73.0, 90.0, 110.0, 127.0, 102.0, 94.0, 72.0, 67.0, 46.0, 29.0, 18.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.505906105041504, -13.101679801940918, -12.697453498840332, -12.293228149414062, -11.889001846313477, -11.48477554321289, -11.080549240112305, -10.676322937011719, -10.272096633911133, -9.867870330810547, -9.463644027709961, -9.059417724609375, -8.655192375183105, -8.25096607208252, -7.846739768981934, -7.442513465881348, -7.03828763961792, -6.634061336517334, -6.229835510253906, -5.82560920715332, -5.421382904052734, -5.017156600952148, -4.612930774688721, -4.208704471588135, -3.804478406906128, -3.400252342224121, -2.996026039123535, -2.5917999744415283, -2.1875739097595215, -1.7833476066589355, -1.3791215419769287, -0.9748952388763428, -0.5706691741943359, -0.16644302010536194, 0.23778313398361206, 0.6420092582702637, 1.04623544216156, 1.4504616260528564, 1.8546876907348633, 2.258913993835449, 2.663140058517456, 3.067366123199463, 3.471592426300049, 3.8758184909820557, 4.2800445556640625, 4.684270858764648, 5.088497161865234, 5.49272346496582, 5.896949291229248, 6.301175594329834, 6.705401420593262, 7.109627723693848, 7.513854026794434, 7.9180803298950195, 8.322305679321289, 8.726531982421875, 9.130758285522461, 9.534984588623047, 9.939210891723633, 10.343437194824219, 10.747662544250488, 11.151888847351074, 11.55611515045166, 11.960341453552246, 12.364567756652832]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 5.0, 6.0, 6.0, 4.0, 20.0, 11.0, 23.0, 36.0, 61.0, 57.0, 99.0, 124.0, 175.0, 217.0, 296.0, 420.0, 641.0, 944.0, 1301.0, 1988.0, 3140.0, 4836.0, 7832.0, 12891.0, 23121.0, 45383.0, 133335.0, 962302.0, 2468085.0, 372590.0, 76683.0, 32531.0, 17350.0, 9883.0, 6131.0, 3808.0, 2461.0, 1612.0, 1104.0, 818.0, 563.0, 397.0, 272.0, 183.0, 164.0, 100.0, 88.0, 66.0, 45.0, 18.0, 26.0, 14.0, 15.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0], "bins": [-3.841796875, -3.7227783203125, -3.603759765625, -3.4847412109375, -3.36572265625, -3.2467041015625, -3.127685546875, -3.0086669921875, -2.8896484375, -2.7706298828125, -2.651611328125, -2.5325927734375, -2.41357421875, -2.2945556640625, -2.175537109375, -2.0565185546875, -1.9375, -1.8184814453125, -1.699462890625, -1.5804443359375, -1.46142578125, -1.3424072265625, -1.223388671875, -1.1043701171875, -0.9853515625, -0.8663330078125, -0.747314453125, -0.6282958984375, -0.50927734375, -0.3902587890625, -0.271240234375, -0.1522216796875, -0.033203125, 0.0858154296875, 0.204833984375, 0.3238525390625, 0.44287109375, 0.5618896484375, 0.680908203125, 0.7999267578125, 0.9189453125, 1.0379638671875, 1.156982421875, 1.2760009765625, 1.39501953125, 1.5140380859375, 1.633056640625, 1.7520751953125, 1.87109375, 1.9901123046875, 2.109130859375, 2.2281494140625, 2.34716796875, 2.4661865234375, 2.585205078125, 2.7042236328125, 2.8232421875, 2.9422607421875, 3.061279296875, 3.1802978515625, 3.29931640625, 3.4183349609375, 3.537353515625, 3.6563720703125, 3.775390625]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 6.0, 8.0, 6.0, 2.0, 5.0, 15.0, 14.0, 19.0, 20.0, 21.0, 16.0, 23.0, 21.0, 20.0, 37.0, 24.0, 40.0, 29.0, 40.0, 36.0, 37.0, 48.0, 30.0, 39.0, 41.0, 28.0, 38.0, 32.0, 34.0, 30.0, 22.0, 23.0, 31.0, 26.0, 26.0, 26.0, 11.0, 14.0, 13.0, 11.0, 7.0, 8.0, 10.0, 2.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.509765625, -2.432647705078125, -2.35552978515625, -2.278411865234375, -2.2012939453125, -2.124176025390625, -2.04705810546875, -1.969940185546875, -1.892822265625, -1.815704345703125, -1.73858642578125, -1.661468505859375, -1.5843505859375, -1.507232666015625, -1.43011474609375, -1.352996826171875, -1.27587890625, -1.198760986328125, -1.12164306640625, -1.044525146484375, -0.9674072265625, -0.890289306640625, -0.81317138671875, -0.736053466796875, -0.658935546875, -0.581817626953125, -0.50469970703125, -0.427581787109375, -0.3504638671875, -0.273345947265625, -0.19622802734375, -0.119110107421875, -0.0419921875, 0.035125732421875, 0.11224365234375, 0.189361572265625, 0.2664794921875, 0.343597412109375, 0.42071533203125, 0.497833251953125, 0.574951171875, 0.652069091796875, 0.72918701171875, 0.806304931640625, 0.8834228515625, 0.960540771484375, 1.03765869140625, 1.114776611328125, 1.19189453125, 1.269012451171875, 1.34613037109375, 1.423248291015625, 1.5003662109375, 1.577484130859375, 1.65460205078125, 1.731719970703125, 1.808837890625, 1.885955810546875, 1.96307373046875, 2.040191650390625, 2.1173095703125, 2.194427490234375, 2.27154541015625, 2.348663330078125, 2.42578125]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 6.0, 5.0, 11.0, 14.0, 24.0, 16.0, 20.0, 43.0, 88.0, 180.0, 661.0, 85261.0, 4105123.0, 2285.0, 237.0, 98.0, 65.0, 44.0, 25.0, 16.0, 18.0, 8.0, 5.0, 6.0, 7.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.03125, -48.60986328125, -47.1884765625, -45.76708984375, -44.345703125, -42.92431640625, -41.5029296875, -40.08154296875, -38.66015625, -37.23876953125, -35.8173828125, -34.39599609375, -32.974609375, -31.55322265625, -30.1318359375, -28.71044921875, -27.2890625, -25.86767578125, -24.4462890625, -23.02490234375, -21.603515625, -20.18212890625, -18.7607421875, -17.33935546875, -15.91796875, -14.49658203125, -13.0751953125, -11.65380859375, -10.232421875, -8.81103515625, -7.3896484375, -5.96826171875, -4.546875, -3.12548828125, -1.7041015625, -0.28271484375, 1.138671875, 2.56005859375, 3.9814453125, 5.40283203125, 6.82421875, 8.24560546875, 9.6669921875, 11.08837890625, 12.509765625, 13.93115234375, 15.3525390625, 16.77392578125, 18.1953125, 19.61669921875, 21.0380859375, 22.45947265625, 23.880859375, 25.30224609375, 26.7236328125, 28.14501953125, 29.56640625, 30.98779296875, 32.4091796875, 33.83056640625, 35.251953125, 36.67333984375, 38.0947265625, 39.51611328125, 40.9375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 1.0, 3.0, 6.0, 10.0, 9.0, 17.0, 25.0, 21.0, 34.0, 67.0, 130.0, 225.0, 552.0, 1201.0, 952.0, 394.0, 162.0, 72.0, 70.0, 30.0, 23.0, 24.0, 9.0, 8.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.294921875, -2.23077392578125, -2.1666259765625, -2.10247802734375, -2.038330078125, -1.97418212890625, -1.9100341796875, -1.84588623046875, -1.78173828125, -1.71759033203125, -1.6534423828125, -1.58929443359375, -1.525146484375, -1.46099853515625, -1.3968505859375, -1.33270263671875, -1.2685546875, -1.20440673828125, -1.1402587890625, -1.07611083984375, -1.011962890625, -0.94781494140625, -0.8836669921875, -0.81951904296875, -0.75537109375, -0.69122314453125, -0.6270751953125, -0.56292724609375, -0.498779296875, -0.43463134765625, -0.3704833984375, -0.30633544921875, -0.2421875, -0.17803955078125, -0.1138916015625, -0.04974365234375, 0.014404296875, 0.07855224609375, 0.1427001953125, 0.20684814453125, 0.27099609375, 0.33514404296875, 0.3992919921875, 0.46343994140625, 0.527587890625, 0.59173583984375, 0.6558837890625, 0.72003173828125, 0.7841796875, 0.84832763671875, 0.9124755859375, 0.97662353515625, 1.040771484375, 1.10491943359375, 1.1690673828125, 1.23321533203125, 1.29736328125, 1.36151123046875, 1.4256591796875, 1.48980712890625, 1.553955078125, 1.61810302734375, 1.6822509765625, 1.74639892578125, 1.810546875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 8.0, 14.0, 14.0, 22.0, 21.0, 48.0, 58.0, 83.0, 111.0, 119.0, 114.0, 132.0, 83.0, 60.0, 48.0, 20.0, 21.0, 12.0, 11.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.991671562194824, -3.859605312347412, -3.727539300918579, -3.595473051071167, -3.463407039642334, -3.331340789794922, -3.1992745399475098, -3.0672085285186768, -2.9351425170898438, -2.8030762672424316, -2.6710102558135986, -2.5389440059661865, -2.4068779945373535, -2.2748117446899414, -2.1427454948425293, -2.0106794834136963, -1.8786132335662842, -1.7465471029281616, -1.614480972290039, -1.482414722442627, -1.350348711013794, -1.2182824611663818, -1.0862163305282593, -0.9541501998901367, -0.8220840692520142, -0.6900179386138916, -0.557951807975769, -0.4258856177330017, -0.29381948709487915, -0.1617533564567566, -0.029687166213989258, 0.1023789644241333, 0.23444509506225586, 0.3665112257003784, 0.49857738614082336, 0.6306435465812683, 0.7627096772193909, 0.8947758078575134, 1.0268419981002808, 1.1589081287384033, 1.2909742593765259, 1.4230403900146484, 1.555106520652771, 1.6871726512908936, 1.8192389011383057, 1.9513049125671387, 2.083371162414551, 2.215437412261963, 2.347503423690796, 2.479569673538208, 2.611635684967041, 2.743701934814453, 2.875767946243286, 3.0078341960906982, 3.1399002075195312, 3.2719664573669434, 3.4040327072143555, 3.5360989570617676, 3.6681649684906006, 3.8002312183380127, 3.9322972297668457, 4.064363479614258, 4.19642972946167, 4.328495979309082, 4.460561752319336]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 3.0, 4.0, 7.0, 10.0, 5.0, 12.0, 13.0, 13.0, 14.0, 22.0, 14.0, 25.0, 20.0, 22.0, 31.0, 26.0, 37.0, 38.0, 34.0, 31.0, 28.0, 42.0, 34.0, 40.0, 45.0, 26.0, 29.0, 37.0, 36.0, 30.0, 42.0, 27.0, 36.0, 24.0, 16.0, 19.0, 14.0, 14.0, 13.0, 13.0, 10.0, 9.0, 7.0, 5.0, 10.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-2.7402760982513428, -2.654853105545044, -2.569430112838745, -2.4840073585510254, -2.3985843658447266, -2.3131613731384277, -2.227738380432129, -2.14231538772583, -2.0568923950195312, -1.9714694023132324, -1.8860465288162231, -1.8006235361099243, -1.715200662612915, -1.6297776699066162, -1.5443546772003174, -1.4589316844940186, -1.3735089302062988, -1.2880859375, -1.2026630640029907, -1.117240071296692, -1.0318171977996826, -0.9463942050933838, -0.860971212387085, -0.7755482792854309, -0.6901253461837769, -0.6047024130821228, -0.5192794799804688, -0.4338564872741699, -0.34843355417251587, -0.2630106210708618, -0.177587628364563, -0.09216469526290894, -0.006742000579833984, 0.07868094742298126, 0.1641038954257965, 0.24952685832977295, 0.334949791431427, 0.42037272453308105, 0.5057957172393799, 0.5912186503410339, 0.676641583442688, 0.762064516544342, 0.8474874496459961, 0.9329104423522949, 1.0183334350585938, 1.103756308555603, 1.1891793012619019, 1.2746021747589111, 1.36002516746521, 1.4454481601715088, 1.530871033668518, 1.616294026374817, 1.7017168998718262, 1.787139892578125, 1.8725628852844238, 1.9579858779907227, 2.0434088706970215, 2.1288318634033203, 2.214254856109619, 2.299677848815918, 2.3851006031036377, 2.4705235958099365, 2.5559465885162354, 2.641369581222534, 2.726792335510254]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 11.0, 12.0, 23.0, 39.0, 55.0, 112.0, 182.0, 344.0, 598.0, 1222.0, 2395.0, 5062.0, 11643.0, 28880.0, 78502.0, 254323.0, 432133.0, 148943.0, 49539.0, 19104.0, 8103.0, 3613.0, 1812.0, 878.0, 412.0, 270.0, 149.0, 61.0, 56.0, 24.0, 16.0, 18.0, 10.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.71484375, -7.45135498046875, -7.1878662109375, -6.92437744140625, -6.660888671875, -6.39739990234375, -6.1339111328125, -5.87042236328125, -5.60693359375, -5.34344482421875, -5.0799560546875, -4.81646728515625, -4.552978515625, -4.28948974609375, -4.0260009765625, -3.76251220703125, -3.4990234375, -3.23553466796875, -2.9720458984375, -2.70855712890625, -2.445068359375, -2.18157958984375, -1.9180908203125, -1.65460205078125, -1.39111328125, -1.12762451171875, -0.8641357421875, -0.60064697265625, -0.337158203125, -0.07366943359375, 0.1898193359375, 0.45330810546875, 0.716796875, 0.98028564453125, 1.2437744140625, 1.50726318359375, 1.770751953125, 2.03424072265625, 2.2977294921875, 2.56121826171875, 2.82470703125, 3.08819580078125, 3.3516845703125, 3.61517333984375, 3.878662109375, 4.14215087890625, 4.4056396484375, 4.66912841796875, 4.9326171875, 5.19610595703125, 5.4595947265625, 5.72308349609375, 5.986572265625, 6.25006103515625, 6.5135498046875, 6.77703857421875, 7.04052734375, 7.30401611328125, 7.5675048828125, 7.83099365234375, 8.094482421875, 8.35797119140625, 8.6214599609375, 8.88494873046875, 9.1484375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 11.0, 3.0, 11.0, 12.0, 3.0, 24.0, 17.0, 9.0, 17.0, 34.0, 23.0, 21.0, 28.0, 30.0, 39.0, 35.0, 30.0, 28.0, 37.0, 31.0, 44.0, 33.0, 40.0, 31.0, 33.0, 33.0, 37.0, 31.0, 23.0, 38.0, 27.0, 35.0, 24.0, 11.0, 12.0, 19.0, 10.0, 8.0, 14.0, 12.0, 8.0, 7.0, 7.0, 6.0, 2.0, 1.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.060546875, -1.9983978271484375, -1.936248779296875, -1.8740997314453125, -1.81195068359375, -1.7498016357421875, -1.687652587890625, -1.6255035400390625, -1.5633544921875, -1.5012054443359375, -1.439056396484375, -1.3769073486328125, -1.31475830078125, -1.2526092529296875, -1.190460205078125, -1.1283111572265625, -1.066162109375, -1.0040130615234375, -0.941864013671875, -0.8797149658203125, -0.81756591796875, -0.7554168701171875, -0.693267822265625, -0.6311187744140625, -0.5689697265625, -0.5068206787109375, -0.444671630859375, -0.3825225830078125, -0.32037353515625, -0.2582244873046875, -0.196075439453125, -0.1339263916015625, -0.07177734375, -0.0096282958984375, 0.052520751953125, 0.1146697998046875, 0.17681884765625, 0.2389678955078125, 0.301116943359375, 0.3632659912109375, 0.4254150390625, 0.4875640869140625, 0.549713134765625, 0.6118621826171875, 0.67401123046875, 0.7361602783203125, 0.798309326171875, 0.8604583740234375, 0.922607421875, 0.9847564697265625, 1.046905517578125, 1.1090545654296875, 1.17120361328125, 1.2333526611328125, 1.295501708984375, 1.3576507568359375, 1.4197998046875, 1.4819488525390625, 1.544097900390625, 1.6062469482421875, 1.66839599609375, 1.7305450439453125, 1.792694091796875, 1.8548431396484375, 1.9169921875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 9.0, 13.0, 15.0, 17.0, 29.0, 31.0, 46.0, 65.0, 76.0, 112.0, 145.0, 202.0, 307.0, 431.0, 661.0, 1054.0, 1675.0, 2905.0, 5427.0, 11443.0, 28424.0, 97646.0, 642444.0, 181355.0, 41916.0, 15424.0, 7069.0, 3692.0, 2004.0, 1288.0, 814.0, 520.0, 371.0, 263.0, 171.0, 137.0, 91.0, 75.0, 48.0, 42.0, 25.0, 22.0, 13.0, 6.0, 10.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.921875, -6.69622802734375, -6.4705810546875, -6.24493408203125, -6.019287109375, -5.79364013671875, -5.5679931640625, -5.34234619140625, -5.11669921875, -4.89105224609375, -4.6654052734375, -4.43975830078125, -4.214111328125, -3.98846435546875, -3.7628173828125, -3.53717041015625, -3.3115234375, -3.08587646484375, -2.8602294921875, -2.63458251953125, -2.408935546875, -2.18328857421875, -1.9576416015625, -1.73199462890625, -1.50634765625, -1.28070068359375, -1.0550537109375, -0.82940673828125, -0.603759765625, -0.37811279296875, -0.1524658203125, 0.07318115234375, 0.298828125, 0.52447509765625, 0.7501220703125, 0.97576904296875, 1.201416015625, 1.42706298828125, 1.6527099609375, 1.87835693359375, 2.10400390625, 2.32965087890625, 2.5552978515625, 2.78094482421875, 3.006591796875, 3.23223876953125, 3.4578857421875, 3.68353271484375, 3.9091796875, 4.13482666015625, 4.3604736328125, 4.58612060546875, 4.811767578125, 5.03741455078125, 5.2630615234375, 5.48870849609375, 5.71435546875, 5.94000244140625, 6.1656494140625, 6.39129638671875, 6.616943359375, 6.84259033203125, 7.0682373046875, 7.29388427734375, 7.51953125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 6.0, 11.0, 11.0, 14.0, 12.0, 19.0, 23.0, 22.0, 28.0, 33.0, 39.0, 29.0, 41.0, 51.0, 51.0, 50.0, 50.0, 44.0, 47.0, 46.0, 53.0, 48.0, 26.0, 32.0, 42.0, 20.0, 30.0, 33.0, 17.0, 14.0, 10.0, 9.0, 5.0, 4.0, 5.0, 3.0, 3.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.484375, -1.43011474609375, -1.3758544921875, -1.32159423828125, -1.267333984375, -1.21307373046875, -1.1588134765625, -1.10455322265625, -1.05029296875, -0.99603271484375, -0.9417724609375, -0.88751220703125, -0.833251953125, -0.77899169921875, -0.7247314453125, -0.67047119140625, -0.6162109375, -0.56195068359375, -0.5076904296875, -0.45343017578125, -0.399169921875, -0.34490966796875, -0.2906494140625, -0.23638916015625, -0.18212890625, -0.12786865234375, -0.0736083984375, -0.01934814453125, 0.034912109375, 0.08917236328125, 0.1434326171875, 0.19769287109375, 0.251953125, 0.30621337890625, 0.3604736328125, 0.41473388671875, 0.468994140625, 0.52325439453125, 0.5775146484375, 0.63177490234375, 0.68603515625, 0.74029541015625, 0.7945556640625, 0.84881591796875, 0.903076171875, 0.95733642578125, 1.0115966796875, 1.06585693359375, 1.1201171875, 1.17437744140625, 1.2286376953125, 1.28289794921875, 1.337158203125, 1.39141845703125, 1.4456787109375, 1.49993896484375, 1.55419921875, 1.60845947265625, 1.6627197265625, 1.71697998046875, 1.771240234375, 1.82550048828125, 1.8797607421875, 1.93402099609375, 1.98828125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 5.0, 6.0, 8.0, 14.0, 11.0, 12.0, 20.0, 23.0, 44.0, 41.0, 60.0, 78.0, 104.0, 164.0, 249.0, 370.0, 704.0, 1391.0, 3065.0, 9221.0, 57166.0, 924297.0, 38520.0, 7424.0, 2644.0, 1187.0, 609.0, 349.0, 211.0, 135.0, 102.0, 79.0, 50.0, 25.0, 32.0, 30.0, 22.0, 16.0, 9.0, 11.0, 4.0, 6.0, 12.0, 3.0, 3.0, 9.0, 1.0, 2.0, 1.0], "bins": [-25.6875, -24.982177734375, -24.27685546875, -23.571533203125, -22.8662109375, -22.160888671875, -21.45556640625, -20.750244140625, -20.044921875, -19.339599609375, -18.63427734375, -17.928955078125, -17.2236328125, -16.518310546875, -15.81298828125, -15.107666015625, -14.40234375, -13.697021484375, -12.99169921875, -12.286376953125, -11.5810546875, -10.875732421875, -10.17041015625, -9.465087890625, -8.759765625, -8.054443359375, -7.34912109375, -6.643798828125, -5.9384765625, -5.233154296875, -4.52783203125, -3.822509765625, -3.1171875, -2.411865234375, -1.70654296875, -1.001220703125, -0.2958984375, 0.409423828125, 1.11474609375, 1.820068359375, 2.525390625, 3.230712890625, 3.93603515625, 4.641357421875, 5.3466796875, 6.052001953125, 6.75732421875, 7.462646484375, 8.16796875, 8.873291015625, 9.57861328125, 10.283935546875, 10.9892578125, 11.694580078125, 12.39990234375, 13.105224609375, 13.810546875, 14.515869140625, 15.22119140625, 15.926513671875, 16.6318359375, 17.337158203125, 18.04248046875, 18.747802734375, 19.453125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 4.0, 6.0, 3.0, 12.0, 16.0, 28.0, 30.0, 51.0, 96.0, 183.0, 189.0, 149.0, 89.0, 44.0, 28.0, 12.0, 10.0, 10.0, 10.0, 4.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003502368927001953, -0.0003413371741771698, -0.0003324374556541443, -0.0003235377371311188, -0.00031463801860809326, -0.00030573830008506775, -0.00029683858156204224, -0.0002879388630390167, -0.0002790391445159912, -0.0002701394259929657, -0.0002612397074699402, -0.00025233998894691467, -0.00024344027042388916, -0.00023454055190086365, -0.00022564083337783813, -0.00021674111485481262, -0.0002078413963317871, -0.0001989416778087616, -0.00019004195928573608, -0.00018114224076271057, -0.00017224252223968506, -0.00016334280371665955, -0.00015444308519363403, -0.00014554336667060852, -0.000136643648147583, -0.0001277439296245575, -0.00011884421110153198, -0.00010994449257850647, -0.00010104477405548096, -9.214505553245544e-05, -8.324533700942993e-05, -7.434561848640442e-05, -6.54458999633789e-05, -5.6546181440353394e-05, -4.764646291732788e-05, -3.874674439430237e-05, -2.9847025871276855e-05, -2.0947307348251343e-05, -1.204758882522583e-05, -3.1478703022003174e-06, 5.751848220825195e-06, 1.4651566743850708e-05, 2.355128526687622e-05, 3.2451003789901733e-05, 4.1350722312927246e-05, 5.025044083595276e-05, 5.915015935897827e-05, 6.804987788200378e-05, 7.69495964050293e-05, 8.584931492805481e-05, 9.474903345108032e-05, 0.00010364875197410583, 0.00011254847049713135, 0.00012144818902015686, 0.00013034790754318237, 0.00013924762606620789, 0.0001481473445892334, 0.0001570470631122589, 0.00016594678163528442, 0.00017484650015830994, 0.00018374621868133545, 0.00019264593720436096, 0.00020154565572738647, 0.000210445374250412, 0.0002193450927734375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 11.0, 18.0, 28.0, 84.0, 1589.0, 1045717.0, 953.0, 80.0, 23.0, 14.0, 9.0, 12.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-161.0, -156.7001953125, -152.400390625, -148.1005859375, -143.80078125, -139.5009765625, -135.201171875, -130.9013671875, -126.6015625, -122.3017578125, -118.001953125, -113.7021484375, -109.40234375, -105.1025390625, -100.802734375, -96.5029296875, -92.203125, -87.9033203125, -83.603515625, -79.3037109375, -75.00390625, -70.7041015625, -66.404296875, -62.1044921875, -57.8046875, -53.5048828125, -49.205078125, -44.9052734375, -40.60546875, -36.3056640625, -32.005859375, -27.7060546875, -23.40625, -19.1064453125, -14.806640625, -10.5068359375, -6.20703125, -1.9072265625, 2.392578125, 6.6923828125, 10.9921875, 15.2919921875, 19.591796875, 23.8916015625, 28.19140625, 32.4912109375, 36.791015625, 41.0908203125, 45.390625, 49.6904296875, 53.990234375, 58.2900390625, 62.58984375, 66.8896484375, 71.189453125, 75.4892578125, 79.7890625, 84.0888671875, 88.388671875, 92.6884765625, 96.98828125, 101.2880859375, 105.587890625, 109.8876953125, 114.1875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 12.0, 21.0, 34.0, 46.0, 153.0, 370.0, 189.0, 88.0, 38.0, 13.0, 10.0, 14.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.63671875, -5.486602783203125, -5.33648681640625, -5.186370849609375, -5.0362548828125, -4.886138916015625, -4.73602294921875, -4.585906982421875, -4.435791015625, -4.285675048828125, -4.13555908203125, -3.985443115234375, -3.8353271484375, -3.685211181640625, -3.53509521484375, -3.384979248046875, -3.23486328125, -3.084747314453125, -2.93463134765625, -2.784515380859375, -2.6343994140625, -2.484283447265625, -2.33416748046875, -2.184051513671875, -2.033935546875, -1.883819580078125, -1.73370361328125, -1.583587646484375, -1.4334716796875, -1.283355712890625, -1.13323974609375, -0.983123779296875, -0.8330078125, -0.682891845703125, -0.53277587890625, -0.382659912109375, -0.2325439453125, -0.082427978515625, 0.06768798828125, 0.217803955078125, 0.367919921875, 0.518035888671875, 0.66815185546875, 0.818267822265625, 0.9683837890625, 1.118499755859375, 1.26861572265625, 1.418731689453125, 1.56884765625, 1.718963623046875, 1.86907958984375, 2.019195556640625, 2.1693115234375, 2.319427490234375, 2.46954345703125, 2.619659423828125, 2.769775390625, 2.919891357421875, 3.07000732421875, 3.220123291015625, 3.3702392578125, 3.520355224609375, 3.67047119140625, 3.820587158203125, 3.970703125]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 3.0, 8.0, 12.0, 28.0, 79.0, 143.0, 202.0, 232.0, 142.0, 75.0, 44.0, 23.0, 8.0, 7.0, 5.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6682015657424927, -1.4578100442886353, -1.2474186420440674, -1.03702712059021, -0.8266355991363525, -0.6162440776824951, -0.40585267543792725, -0.19546115398406982, 0.014930367469787598, 0.22532185912132263, 0.43571335077285767, 0.6461048126220703, 0.8564963340759277, 1.0668878555297852, 1.277279257774353, 1.4876707792282104, 1.6980623006820679, 1.9084538221359253, 2.118845224380493, 2.3292367458343506, 2.539628267288208, 2.7500197887420654, 2.9604110717773438, 3.170802593231201, 3.3811941146850586, 3.591585636138916, 3.8019771575927734, 4.012368679046631, 4.222760200500488, 4.433151721954346, 4.643543243408203, 4.853934288024902, 5.064326286315918, 5.274717807769775, 5.485109329223633, 5.69550085067749, 5.905892372131348, 6.116283893585205, 6.3266754150390625, 6.537066459655762, 6.747458457946777, 6.957849979400635, 7.168241500854492, 7.37863302230835, 7.589024543762207, 7.7994160652160645, 8.009807586669922, 8.220198631286621, 8.43058967590332, 8.64098072052002, 8.851372718811035, 9.061763763427734, 9.27215576171875, 9.48254680633545, 9.692938804626465, 9.903329849243164, 10.11372184753418, 10.324112892150879, 10.534504890441895, 10.744895935058594, 10.95528793334961, 11.165678977966309, 11.376070976257324, 11.586462020874023, 11.796854019165039]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 1.0, 10.0, 11.0, 8.0, 8.0, 8.0, 37.0, 15.0, 16.0, 24.0, 25.0, 20.0, 15.0, 22.0, 34.0, 26.0, 40.0, 45.0, 42.0, 29.0, 37.0, 37.0, 39.0, 34.0, 43.0, 33.0, 35.0, 42.0, 25.0, 31.0, 17.0, 31.0, 28.0, 21.0, 13.0, 11.0, 10.0, 12.0, 12.0, 10.0, 6.0, 3.0, 0.0, 7.0, 2.0, 7.0, 4.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.3453330993652344, -2.270292282104492, -2.19525146484375, -2.120210647583008, -2.0451698303222656, -1.9701288938522339, -1.8950879573822021, -1.82004714012146, -1.7450063228607178, -1.6699655055999756, -1.5949246883392334, -1.5198837518692017, -1.4448429346084595, -1.3698021173477173, -1.2947611808776855, -1.2197203636169434, -1.1446795463562012, -1.069638729095459, -0.994597852230072, -0.9195569753646851, -0.8445161581039429, -0.7694753408432007, -0.6944344639778137, -0.6193935871124268, -0.5443527698516846, -0.46931192278862, -0.3942710757255554, -0.31923022866249084, -0.24418938159942627, -0.1691485345363617, -0.09410768747329712, -0.019066810607910156, 0.05597400665283203, 0.1310148537158966, 0.20605570077896118, 0.28109654784202576, 0.35613739490509033, 0.4311782419681549, 0.5062190890312195, 0.5812599658966064, 0.6563007831573486, 0.7313416004180908, 0.8063824772834778, 0.8814233541488647, 0.9564641714096069, 1.0315049886703491, 1.1065459251403809, 1.181586742401123, 1.2566275596618652, 1.3316683769226074, 1.4067091941833496, 1.4817501306533813, 1.5567909479141235, 1.6318317651748657, 1.7068727016448975, 1.7819135189056396, 1.8569543361663818, 1.931995153427124, 2.007035970687866, 2.0820767879486084, 2.1571178436279297, 2.232158660888672, 2.307199478149414, 2.3822402954101562, 2.4572811126708984]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 6.0, 10.0, 16.0, 22.0, 26.0, 30.0, 48.0, 54.0, 64.0, 85.0, 110.0, 170.0, 224.0, 291.0, 350.0, 491.0, 669.0, 993.0, 1392.0, 2192.0, 3595.0, 6415.0, 12152.0, 24941.0, 57303.0, 145913.0, 309512.0, 272594.0, 115930.0, 46256.0, 20788.0, 10364.0, 5622.0, 3247.0, 2019.0, 1288.0, 897.0, 637.0, 504.0, 304.0, 254.0, 199.0, 164.0, 95.0, 77.0, 65.0, 42.0, 34.0, 26.0, 24.0, 13.0, 10.0, 13.0, 4.0, 3.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-4.953125, -4.787353515625, -4.62158203125, -4.455810546875, -4.2900390625, -4.124267578125, -3.95849609375, -3.792724609375, -3.626953125, -3.461181640625, -3.29541015625, -3.129638671875, -2.9638671875, -2.798095703125, -2.63232421875, -2.466552734375, -2.30078125, -2.135009765625, -1.96923828125, -1.803466796875, -1.6376953125, -1.471923828125, -1.30615234375, -1.140380859375, -0.974609375, -0.808837890625, -0.64306640625, -0.477294921875, -0.3115234375, -0.145751953125, 0.02001953125, 0.185791015625, 0.3515625, 0.517333984375, 0.68310546875, 0.848876953125, 1.0146484375, 1.180419921875, 1.34619140625, 1.511962890625, 1.677734375, 1.843505859375, 2.00927734375, 2.175048828125, 2.3408203125, 2.506591796875, 2.67236328125, 2.838134765625, 3.00390625, 3.169677734375, 3.33544921875, 3.501220703125, 3.6669921875, 3.832763671875, 3.99853515625, 4.164306640625, 4.330078125, 4.495849609375, 4.66162109375, 4.827392578125, 4.9931640625, 5.158935546875, 5.32470703125, 5.490478515625, 5.65625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 2.0, 5.0, 8.0, 8.0, 7.0, 14.0, 16.0, 17.0, 15.0, 21.0, 26.0, 32.0, 30.0, 35.0, 57.0, 42.0, 41.0, 58.0, 37.0, 35.0, 56.0, 54.0, 46.0, 47.0, 38.0, 35.0, 27.0, 38.0, 30.0, 23.0, 14.0, 20.0, 17.0, 9.0, 8.0, 10.0, 6.0, 2.0, 7.0, 5.0, 1.0, 1.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.271484375, -2.20196533203125, -2.1324462890625, -2.06292724609375, -1.993408203125, -1.92388916015625, -1.8543701171875, -1.78485107421875, -1.71533203125, -1.64581298828125, -1.5762939453125, -1.50677490234375, -1.437255859375, -1.36773681640625, -1.2982177734375, -1.22869873046875, -1.1591796875, -1.08966064453125, -1.0201416015625, -0.95062255859375, -0.881103515625, -0.81158447265625, -0.7420654296875, -0.67254638671875, -0.60302734375, -0.53350830078125, -0.4639892578125, -0.39447021484375, -0.324951171875, -0.25543212890625, -0.1859130859375, -0.11639404296875, -0.046875, 0.02264404296875, 0.0921630859375, 0.16168212890625, 0.231201171875, 0.30072021484375, 0.3702392578125, 0.43975830078125, 0.50927734375, 0.57879638671875, 0.6483154296875, 0.71783447265625, 0.787353515625, 0.85687255859375, 0.9263916015625, 0.99591064453125, 1.0654296875, 1.13494873046875, 1.2044677734375, 1.27398681640625, 1.343505859375, 1.41302490234375, 1.4825439453125, 1.55206298828125, 1.62158203125, 1.69110107421875, 1.7606201171875, 1.83013916015625, 1.899658203125, 1.96917724609375, 2.0386962890625, 2.10821533203125, 2.177734375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 5.0, 7.0, 10.0, 17.0, 22.0, 25.0, 21.0, 48.0, 50.0, 81.0, 237.0, 3224.0, 991080.0, 52579.0, 765.0, 113.0, 63.0, 44.0, 37.0, 37.0, 19.0, 14.0, 10.0, 12.0, 11.0, 2.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-62.375, -60.34765625, -58.3203125, -56.29296875, -54.265625, -52.23828125, -50.2109375, -48.18359375, -46.15625, -44.12890625, -42.1015625, -40.07421875, -38.046875, -36.01953125, -33.9921875, -31.96484375, -29.9375, -27.91015625, -25.8828125, -23.85546875, -21.828125, -19.80078125, -17.7734375, -15.74609375, -13.71875, -11.69140625, -9.6640625, -7.63671875, -5.609375, -3.58203125, -1.5546875, 0.47265625, 2.5, 4.52734375, 6.5546875, 8.58203125, 10.609375, 12.63671875, 14.6640625, 16.69140625, 18.71875, 20.74609375, 22.7734375, 24.80078125, 26.828125, 28.85546875, 30.8828125, 32.91015625, 34.9375, 36.96484375, 38.9921875, 41.01953125, 43.046875, 45.07421875, 47.1015625, 49.12890625, 51.15625, 53.18359375, 55.2109375, 57.23828125, 59.265625, 61.29296875, 63.3203125, 65.34765625, 67.375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 5.0, 7.0, 6.0, 13.0, 23.0, 25.0, 24.0, 34.0, 45.0, 71.0, 76.0, 70.0, 99.0, 83.0, 86.0, 66.0, 60.0, 47.0, 42.0, 35.0, 19.0, 12.0, 15.0, 9.0, 8.0, 2.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.2890625, -5.1180419921875, -4.947021484375, -4.7760009765625, -4.60498046875, -4.4339599609375, -4.262939453125, -4.0919189453125, -3.9208984375, -3.7498779296875, -3.578857421875, -3.4078369140625, -3.23681640625, -3.0657958984375, -2.894775390625, -2.7237548828125, -2.552734375, -2.3817138671875, -2.210693359375, -2.0396728515625, -1.86865234375, -1.6976318359375, -1.526611328125, -1.3555908203125, -1.1845703125, -1.0135498046875, -0.842529296875, -0.6715087890625, -0.50048828125, -0.3294677734375, -0.158447265625, 0.0125732421875, 0.18359375, 0.3546142578125, 0.525634765625, 0.6966552734375, 0.86767578125, 1.0386962890625, 1.209716796875, 1.3807373046875, 1.5517578125, 1.7227783203125, 1.893798828125, 2.0648193359375, 2.23583984375, 2.4068603515625, 2.577880859375, 2.7489013671875, 2.919921875, 3.0909423828125, 3.261962890625, 3.4329833984375, 3.60400390625, 3.7750244140625, 3.946044921875, 4.1170654296875, 4.2880859375, 4.4591064453125, 4.630126953125, 4.8011474609375, 4.97216796875, 5.1431884765625, 5.314208984375, 5.4852294921875, 5.65625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 7.0, 7.0, 16.0, 16.0, 14.0, 40.0, 38.0, 33.0, 90.0, 128.0, 206.0, 340.0, 512.0, 842.0, 1659.0, 3249.0, 6551.0, 15926.0, 47736.0, 261919.0, 608240.0, 64520.0, 20234.0, 8159.0, 3604.0, 1812.0, 1006.0, 588.0, 355.0, 217.0, 137.0, 101.0, 66.0, 51.0, 38.0, 19.0, 10.0, 18.0, 17.0, 9.0, 9.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.91015625, -1.8557586669921875, -1.801361083984375, -1.7469635009765625, -1.69256591796875, -1.6381683349609375, -1.583770751953125, -1.5293731689453125, -1.4749755859375, -1.4205780029296875, -1.366180419921875, -1.3117828369140625, -1.25738525390625, -1.2029876708984375, -1.148590087890625, -1.0941925048828125, -1.039794921875, -0.9853973388671875, -0.930999755859375, -0.8766021728515625, -0.82220458984375, -0.7678070068359375, -0.713409423828125, -0.6590118408203125, -0.6046142578125, -0.5502166748046875, -0.495819091796875, -0.4414215087890625, -0.38702392578125, -0.3326263427734375, -0.278228759765625, -0.2238311767578125, -0.16943359375, -0.1150360107421875, -0.060638427734375, -0.0062408447265625, 0.04815673828125, 0.1025543212890625, 0.156951904296875, 0.2113494873046875, 0.2657470703125, 0.3201446533203125, 0.374542236328125, 0.4289398193359375, 0.48333740234375, 0.5377349853515625, 0.592132568359375, 0.6465301513671875, 0.700927734375, 0.7553253173828125, 0.809722900390625, 0.8641204833984375, 0.91851806640625, 0.9729156494140625, 1.027313232421875, 1.0817108154296875, 1.1361083984375, 1.1905059814453125, 1.244903564453125, 1.2993011474609375, 1.35369873046875, 1.4080963134765625, 1.462493896484375, 1.5168914794921875, 1.5712890625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 3.0, 3.0, 12.0, 12.0, 10.0, 22.0, 39.0, 47.0, 59.0, 100.0, 111.0, 199.0, 115.0, 60.0, 56.0, 35.0, 33.0, 16.0, 18.0, 10.0, 2.0, 7.0, 5.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.26120376586914e-05, -7.956754416227341e-05, -7.652305066585541e-05, -7.347855716943741e-05, -7.043406367301941e-05, -6.738957017660141e-05, -6.434507668018341e-05, -6.130058318376541e-05, -5.825608968734741e-05, -5.521159619092941e-05, -5.2167102694511414e-05, -4.9122609198093414e-05, -4.6078115701675415e-05, -4.3033622205257416e-05, -3.9989128708839417e-05, -3.694463521242142e-05, -3.390014171600342e-05, -3.085564821958542e-05, -2.781115472316742e-05, -2.476666122674942e-05, -2.172216773033142e-05, -1.867767423391342e-05, -1.5633180737495422e-05, -1.2588687241077423e-05, -9.544193744659424e-06, -6.4997002482414246e-06, -3.4552067518234253e-06, -4.10713255405426e-07, 2.6337802410125732e-06, 5.6782737374305725e-06, 8.722767233848572e-06, 1.1767260730266571e-05, 1.481175422668457e-05, 1.785624772310257e-05, 2.090074121952057e-05, 2.3945234715938568e-05, 2.6989728212356567e-05, 3.0034221708774567e-05, 3.3078715205192566e-05, 3.6123208701610565e-05, 3.9167702198028564e-05, 4.2212195694446564e-05, 4.525668919086456e-05, 4.830118268728256e-05, 5.134567618370056e-05, 5.439016968011856e-05, 5.743466317653656e-05, 6.047915667295456e-05, 6.352365016937256e-05, 6.656814366579056e-05, 6.961263716220856e-05, 7.265713065862656e-05, 7.570162415504456e-05, 7.874611765146255e-05, 8.179061114788055e-05, 8.483510464429855e-05, 8.787959814071655e-05, 9.092409163713455e-05, 9.396858513355255e-05, 9.701307862997055e-05, 0.00010005757212638855, 0.00010310206562280655, 0.00010614655911922455, 0.00010919105261564255, 0.00011223554611206055]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 0.0, 1.0, 4.0, 10.0, 9.0, 13.0, 14.0, 18.0, 26.0, 31.0, 59.0, 317.0, 14312.0, 1031050.0, 2353.0, 151.0, 57.0, 29.0, 25.0, 20.0, 14.0, 15.0, 7.0, 5.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.671875, -18.03515625, -17.3984375, -16.76171875, -16.125, -15.48828125, -14.8515625, -14.21484375, -13.578125, -12.94140625, -12.3046875, -11.66796875, -11.03125, -10.39453125, -9.7578125, -9.12109375, -8.484375, -7.84765625, -7.2109375, -6.57421875, -5.9375, -5.30078125, -4.6640625, -4.02734375, -3.390625, -2.75390625, -2.1171875, -1.48046875, -0.84375, -0.20703125, 0.4296875, 1.06640625, 1.703125, 2.33984375, 2.9765625, 3.61328125, 4.25, 4.88671875, 5.5234375, 6.16015625, 6.796875, 7.43359375, 8.0703125, 8.70703125, 9.34375, 9.98046875, 10.6171875, 11.25390625, 11.890625, 12.52734375, 13.1640625, 13.80078125, 14.4375, 15.07421875, 15.7109375, 16.34765625, 16.984375, 17.62109375, 18.2578125, 18.89453125, 19.53125, 20.16796875, 20.8046875, 21.44140625, 22.078125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 7.0, 11.0, 8.0, 12.0, 18.0, 16.0, 30.0, 30.0, 48.0, 75.0, 128.0, 277.0, 89.0, 75.0, 51.0, 27.0, 21.0, 27.0, 10.0, 15.0, 5.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2451171875, -1.2024383544921875, -1.159759521484375, -1.1170806884765625, -1.07440185546875, -1.0317230224609375, -0.989044189453125, -0.9463653564453125, -0.9036865234375, -0.8610076904296875, -0.818328857421875, -0.7756500244140625, -0.73297119140625, -0.6902923583984375, -0.647613525390625, -0.6049346923828125, -0.562255859375, -0.5195770263671875, -0.476898193359375, -0.4342193603515625, -0.39154052734375, -0.3488616943359375, -0.306182861328125, -0.2635040283203125, -0.2208251953125, -0.1781463623046875, -0.135467529296875, -0.0927886962890625, -0.05010986328125, -0.0074310302734375, 0.035247802734375, 0.0779266357421875, 0.12060546875, 0.1632843017578125, 0.205963134765625, 0.2486419677734375, 0.29132080078125, 0.3339996337890625, 0.376678466796875, 0.4193572998046875, 0.4620361328125, 0.5047149658203125, 0.547393798828125, 0.5900726318359375, 0.63275146484375, 0.6754302978515625, 0.718109130859375, 0.7607879638671875, 0.803466796875, 0.8461456298828125, 0.888824462890625, 0.9315032958984375, 0.97418212890625, 1.0168609619140625, 1.059539794921875, 1.1022186279296875, 1.1448974609375, 1.1875762939453125, 1.230255126953125, 1.2729339599609375, 1.31561279296875, 1.3582916259765625, 1.400970458984375, 1.4436492919921875, 1.486328125]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 87.0, 918.0, 14.0], "bins": [-81.04156494140625, -79.7428970336914, -78.4442367553711, -77.14556884765625, -75.8469009399414, -74.5482406616211, -73.24957275390625, -71.9509048461914, -70.65223693847656, -69.35356903076172, -68.0549087524414, -66.75624084472656, -65.45757293701172, -64.1589126586914, -62.86024475097656, -61.56157684326172, -60.262916564941406, -58.96425247192383, -57.665584564208984, -56.366920471191406, -55.06825256347656, -53.769588470458984, -52.470924377441406, -51.17225646972656, -49.873592376708984, -48.574928283691406, -47.27626037597656, -45.977596282958984, -44.678932189941406, -43.38026428222656, -42.081600189208984, -40.782936096191406, -39.48426818847656, -38.185604095458984, -36.88693618774414, -35.58827209472656, -34.28960418701172, -32.99094009399414, -31.692276000976562, -30.39361000061035, -29.094945907592773, -27.796279907226562, -26.497615814208984, -25.198949813842773, -23.900283813476562, -22.60161781311035, -21.30295181274414, -20.004287719726562, -18.70562171936035, -17.40695571899414, -16.108291625976562, -14.809625625610352, -13.51095962524414, -12.21229362487793, -10.913628578186035, -9.61496353149414, -8.31629753112793, -7.017632007598877, -5.718966484069824, -4.4203009605407715, -3.1216354370117188, -1.822969913482666, -0.5243043899536133, 0.7743606567382812, 2.0730271339416504]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 10.0, 23.0, 28.0, 46.0, 76.0, 106.0, 122.0, 132.0, 119.0, 118.0, 94.0, 51.0, 40.0, 21.0, 12.0, 10.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.45428991317749, -7.229437828063965, -7.004586219787598, -6.779734134674072, -6.554882049560547, -6.33003044128418, -6.105178356170654, -5.880326271057129, -5.655474662780762, -5.430622577667236, -5.205770969390869, -4.980918884277344, -4.756067276000977, -4.531215190887451, -4.306363105773926, -4.081511497497559, -3.856659412384033, -3.631807565689087, -3.4069557189941406, -3.1821036338806152, -2.957251787185669, -2.7323999404907227, -2.5075478553771973, -2.282696008682251, -2.0578441619873047, -1.8329923152923584, -1.6081403493881226, -1.3832883834838867, -1.1584365367889404, -0.9335846900939941, -0.7087327241897583, -0.48388075828552246, -0.2590293884277344, -0.03417748212814331, 0.19067442417144775, 0.4155263304710388, 0.6403782367706299, 0.8652300834655762, 1.090082049369812, 1.3149340152740479, 1.5397858619689941, 1.7646377086639404, 1.9894896745681763, 2.214341640472412, 2.4391934871673584, 2.6640453338623047, 2.88889741897583, 3.1137492656707764, 3.3386011123657227, 3.563452959060669, 3.7883048057556152, 4.013156890869141, 4.238008499145508, 4.462860584259033, 4.687712669372559, 4.912564277648926, 5.137416362762451, 5.362268447875977, 5.587120056152344, 5.811972141265869, 6.0368242263793945, 6.261675834655762, 6.486527919769287, 6.7113800048828125, 6.93623161315918]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 8.0, 7.0, 14.0, 15.0, 29.0, 48.0, 46.0, 68.0, 90.0, 133.0, 200.0, 293.0, 378.0, 618.0, 943.0, 1476.0, 2422.0, 4200.0, 7799.0, 16492.0, 59780.0, 431113.0, 2534575.0, 971664.0, 115146.0, 24406.0, 9829.0, 4918.0, 2759.0, 1672.0, 1025.0, 658.0, 433.0, 303.0, 175.0, 179.0, 98.0, 73.0, 42.0, 56.0, 40.0, 22.0, 13.0, 9.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.22265625, -2.15020751953125, -2.0777587890625, -2.00531005859375, -1.932861328125, -1.86041259765625, -1.7879638671875, -1.71551513671875, -1.64306640625, -1.57061767578125, -1.4981689453125, -1.42572021484375, -1.353271484375, -1.28082275390625, -1.2083740234375, -1.13592529296875, -1.0634765625, -0.99102783203125, -0.9185791015625, -0.84613037109375, -0.773681640625, -0.70123291015625, -0.6287841796875, -0.55633544921875, -0.48388671875, -0.41143798828125, -0.3389892578125, -0.26654052734375, -0.194091796875, -0.12164306640625, -0.0491943359375, 0.02325439453125, 0.095703125, 0.16815185546875, 0.2406005859375, 0.31304931640625, 0.385498046875, 0.45794677734375, 0.5303955078125, 0.60284423828125, 0.67529296875, 0.74774169921875, 0.8201904296875, 0.89263916015625, 0.965087890625, 1.03753662109375, 1.1099853515625, 1.18243408203125, 1.2548828125, 1.32733154296875, 1.3997802734375, 1.47222900390625, 1.544677734375, 1.61712646484375, 1.6895751953125, 1.76202392578125, 1.83447265625, 1.90692138671875, 1.9793701171875, 2.05181884765625, 2.124267578125, 2.19671630859375, 2.2691650390625, 2.34161376953125, 2.4140625]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 5.0, 9.0, 4.0, 8.0, 8.0, 5.0, 11.0, 18.0, 13.0, 20.0, 18.0, 17.0, 23.0, 38.0, 41.0, 34.0, 33.0, 41.0, 34.0, 47.0, 36.0, 30.0, 34.0, 49.0, 56.0, 38.0, 41.0, 35.0, 22.0, 39.0, 33.0, 21.0, 19.0, 24.0, 19.0, 9.0, 12.0, 10.0, 9.0, 6.0, 6.0, 8.0, 5.0, 3.0, 0.0, 7.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.44921875, -1.405242919921875, -1.36126708984375, -1.317291259765625, -1.2733154296875, -1.229339599609375, -1.18536376953125, -1.141387939453125, -1.097412109375, -1.053436279296875, -1.00946044921875, -0.965484619140625, -0.9215087890625, -0.877532958984375, -0.83355712890625, -0.789581298828125, -0.74560546875, -0.701629638671875, -0.65765380859375, -0.613677978515625, -0.5697021484375, -0.525726318359375, -0.48175048828125, -0.437774658203125, -0.393798828125, -0.349822998046875, -0.30584716796875, -0.261871337890625, -0.2178955078125, -0.173919677734375, -0.12994384765625, -0.085968017578125, -0.0419921875, 0.001983642578125, 0.04595947265625, 0.089935302734375, 0.1339111328125, 0.177886962890625, 0.22186279296875, 0.265838623046875, 0.309814453125, 0.353790283203125, 0.39776611328125, 0.441741943359375, 0.4857177734375, 0.529693603515625, 0.57366943359375, 0.617645263671875, 0.66162109375, 0.705596923828125, 0.74957275390625, 0.793548583984375, 0.8375244140625, 0.881500244140625, 0.92547607421875, 0.969451904296875, 1.013427734375, 1.057403564453125, 1.10137939453125, 1.145355224609375, 1.1893310546875, 1.233306884765625, 1.27728271484375, 1.321258544921875, 1.365234375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 6.0, 8.0, 9.0, 8.0, 26.0, 21.0, 37.0, 58.0, 89.0, 228.0, 548.0, 4373.0, 4114883.0, 71982.0, 1208.0, 345.0, 159.0, 72.0, 47.0, 41.0, 29.0, 19.0, 11.0, 14.0, 12.0, 6.0, 5.0, 4.0, 2.0, 1.0, 7.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.5546875, -15.0321044921875, -14.509521484375, -13.9869384765625, -13.46435546875, -12.9417724609375, -12.419189453125, -11.8966064453125, -11.3740234375, -10.8514404296875, -10.328857421875, -9.8062744140625, -9.28369140625, -8.7611083984375, -8.238525390625, -7.7159423828125, -7.193359375, -6.6707763671875, -6.148193359375, -5.6256103515625, -5.10302734375, -4.5804443359375, -4.057861328125, -3.5352783203125, -3.0126953125, -2.4901123046875, -1.967529296875, -1.4449462890625, -0.92236328125, -0.3997802734375, 0.122802734375, 0.6453857421875, 1.16796875, 1.6905517578125, 2.213134765625, 2.7357177734375, 3.25830078125, 3.7808837890625, 4.303466796875, 4.8260498046875, 5.3486328125, 5.8712158203125, 6.393798828125, 6.9163818359375, 7.43896484375, 7.9615478515625, 8.484130859375, 9.0067138671875, 9.529296875, 10.0518798828125, 10.574462890625, 11.0970458984375, 11.61962890625, 12.1422119140625, 12.664794921875, 13.1873779296875, 13.7099609375, 14.2325439453125, 14.755126953125, 15.2777099609375, 15.80029296875, 16.3228759765625, 16.845458984375, 17.3680419921875, 17.890625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 3.0, 9.0, 11.0, 10.0, 19.0, 32.0, 32.0, 43.0, 89.0, 193.0, 342.0, 627.0, 857.0, 730.0, 467.0, 223.0, 124.0, 64.0, 39.0, 41.0, 18.0, 24.0, 16.0, 11.0, 12.0, 2.0, 4.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.658203125, -0.6352691650390625, -0.612335205078125, -0.5894012451171875, -0.56646728515625, -0.5435333251953125, -0.520599365234375, -0.4976654052734375, -0.4747314453125, -0.4517974853515625, -0.428863525390625, -0.4059295654296875, -0.38299560546875, -0.3600616455078125, -0.337127685546875, -0.3141937255859375, -0.291259765625, -0.2683258056640625, -0.245391845703125, -0.2224578857421875, -0.19952392578125, -0.1765899658203125, -0.153656005859375, -0.1307220458984375, -0.1077880859375, -0.0848541259765625, -0.061920166015625, -0.0389862060546875, -0.01605224609375, 0.0068817138671875, 0.029815673828125, 0.0527496337890625, 0.07568359375, 0.0986175537109375, 0.121551513671875, 0.1444854736328125, 0.16741943359375, 0.1903533935546875, 0.213287353515625, 0.2362213134765625, 0.2591552734375, 0.2820892333984375, 0.305023193359375, 0.3279571533203125, 0.35089111328125, 0.3738250732421875, 0.396759033203125, 0.4196929931640625, 0.442626953125, 0.4655609130859375, 0.488494873046875, 0.5114288330078125, 0.53436279296875, 0.5572967529296875, 0.580230712890625, 0.6031646728515625, 0.6260986328125, 0.6490325927734375, 0.671966552734375, 0.6949005126953125, 0.71783447265625, 0.7407684326171875, 0.763702392578125, 0.7866363525390625, 0.8095703125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 6.0, 15.0, 44.0, 116.0, 188.0, 268.0, 230.0, 90.0, 38.0, 14.0, 4.0, 0.0, 2.0, 0.0, 2.0], "bins": [-8.143775939941406, -7.994078636169434, -7.844381332397461, -7.69468355178833, -7.544986248016357, -7.395288944244385, -7.245591163635254, -7.095893859863281, -6.946196556091309, -6.796499252319336, -6.646801948547363, -6.497104167938232, -6.34740686416626, -6.197709560394287, -6.048011779785156, -5.898314476013184, -5.748617172241211, -5.598919868469238, -5.449222564697266, -5.299524784088135, -5.149827480316162, -5.0001301765441895, -4.850432395935059, -4.700735092163086, -4.551037788391113, -4.401340484619141, -4.251643180847168, -4.101945400238037, -3.9522480964660645, -3.802550792694092, -3.65285325050354, -3.5031557083129883, -3.3534586429595947, -3.203761100769043, -3.0540637969970703, -2.9043664932250977, -2.754668951034546, -2.604971408843994, -2.4552741050720215, -2.305576801300049, -2.155879259109497, -2.0061817169189453, -1.8564844131469727, -1.7067869901657104, -1.5570895671844482, -1.407392144203186, -1.2576947212219238, -1.1079972982406616, -0.9582998752593994, -0.8086024522781372, -0.658905029296875, -0.5092076063156128, -0.3595101833343506, -0.20981276035308838, -0.06011533737182617, 0.08958208560943604, 0.23927950859069824, 0.38897693157196045, 0.5386743545532227, 0.6883717775344849, 0.8380692005157471, 0.9877666234970093, 1.1374640464782715, 1.2871614694595337, 1.436858892440796]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 7.0, 7.0, 7.0, 7.0, 6.0, 17.0, 8.0, 16.0, 13.0, 27.0, 21.0, 26.0, 37.0, 30.0, 32.0, 35.0, 27.0, 47.0, 47.0, 38.0, 39.0, 43.0, 34.0, 27.0, 39.0, 42.0, 33.0, 25.0, 33.0, 33.0, 26.0, 25.0, 25.0, 16.0, 18.0, 4.0, 12.0, 13.0, 7.0, 8.0, 10.0, 8.0, 7.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.4196873903274536, -1.3755905628204346, -1.331493616104126, -1.287396788597107, -1.243299961090088, -1.1992031335830688, -1.1551063060760498, -1.1110093593597412, -1.0669125318527222, -1.0228157043457031, -0.9787188172340393, -0.9346219301223755, -0.8905251026153564, -0.8464282751083374, -0.8023313879966736, -0.7582345008850098, -0.7141376733779907, -0.6700408458709717, -0.6259439587593079, -0.581847071647644, -0.537750244140625, -0.49365338683128357, -0.44955652952194214, -0.4054596722126007, -0.3613628149032593, -0.31726595759391785, -0.2731691002845764, -0.22907224297523499, -0.18497538566589355, -0.14087852835655212, -0.0967816710472107, -0.05268481373786926, -0.008587837219238281, 0.03550902009010315, 0.07960587739944458, 0.12370273470878601, 0.16779959201812744, 0.21189644932746887, 0.2559933066368103, 0.30009016394615173, 0.34418702125549316, 0.3882838785648346, 0.432380735874176, 0.47647759318351746, 0.5205744504928589, 0.5646712779998779, 0.6087681651115417, 0.6528650522232056, 0.6969618797302246, 0.7410587072372437, 0.7851555943489075, 0.8292524814605713, 0.8733493089675903, 0.9174461364746094, 0.9615430235862732, 1.005639910697937, 1.049736738204956, 1.093833565711975, 1.1379303932189941, 1.1820273399353027, 1.2261241674423218, 1.2702209949493408, 1.3143179416656494, 1.3584147691726685, 1.4025115966796875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 1.0, 9.0, 13.0, 26.0, 40.0, 43.0, 68.0, 93.0, 126.0, 167.0, 262.0, 352.0, 502.0, 720.0, 1083.0, 1618.0, 2275.0, 3543.0, 5476.0, 8421.0, 14935.0, 29640.0, 71075.0, 214735.0, 409504.0, 165740.0, 57492.0, 25082.0, 12907.0, 7691.0, 4891.0, 3184.0, 2173.0, 1438.0, 998.0, 689.0, 473.0, 281.0, 230.0, 167.0, 102.0, 85.0, 65.0, 37.0, 20.0, 26.0, 17.0, 22.0, 5.0, 4.0, 3.0, 1.0, 4.0], "bins": [-3.9375, -3.82623291015625, -3.7149658203125, -3.60369873046875, -3.492431640625, -3.38116455078125, -3.2698974609375, -3.15863037109375, -3.04736328125, -2.93609619140625, -2.8248291015625, -2.71356201171875, -2.602294921875, -2.49102783203125, -2.3797607421875, -2.26849365234375, -2.1572265625, -2.04595947265625, -1.9346923828125, -1.82342529296875, -1.712158203125, -1.60089111328125, -1.4896240234375, -1.37835693359375, -1.26708984375, -1.15582275390625, -1.0445556640625, -0.93328857421875, -0.822021484375, -0.71075439453125, -0.5994873046875, -0.48822021484375, -0.376953125, -0.26568603515625, -0.1544189453125, -0.04315185546875, 0.068115234375, 0.17938232421875, 0.2906494140625, 0.40191650390625, 0.51318359375, 0.62445068359375, 0.7357177734375, 0.84698486328125, 0.958251953125, 1.06951904296875, 1.1807861328125, 1.29205322265625, 1.4033203125, 1.51458740234375, 1.6258544921875, 1.73712158203125, 1.848388671875, 1.95965576171875, 2.0709228515625, 2.18218994140625, 2.29345703125, 2.40472412109375, 2.5159912109375, 2.62725830078125, 2.738525390625, 2.84979248046875, 2.9610595703125, 3.07232666015625, 3.18359375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 0.0, 8.0, 9.0, 6.0, 10.0, 6.0, 5.0, 16.0, 14.0, 16.0, 25.0, 15.0, 26.0, 28.0, 34.0, 42.0, 32.0, 35.0, 38.0, 40.0, 29.0, 39.0, 41.0, 34.0, 46.0, 39.0, 28.0, 50.0, 28.0, 20.0, 22.0, 45.0, 37.0, 14.0, 16.0, 14.0, 11.0, 13.0, 6.0, 11.0, 11.0, 8.0, 4.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.9375, -0.9084930419921875, -0.879486083984375, -0.8504791259765625, -0.82147216796875, -0.7924652099609375, -0.763458251953125, -0.7344512939453125, -0.7054443359375, -0.6764373779296875, -0.647430419921875, -0.6184234619140625, -0.58941650390625, -0.5604095458984375, -0.531402587890625, -0.5023956298828125, -0.473388671875, -0.4443817138671875, -0.415374755859375, -0.3863677978515625, -0.35736083984375, -0.3283538818359375, -0.299346923828125, -0.2703399658203125, -0.2413330078125, -0.2123260498046875, -0.183319091796875, -0.1543121337890625, -0.12530517578125, -0.0962982177734375, -0.067291259765625, -0.0382843017578125, -0.00927734375, 0.0197296142578125, 0.048736572265625, 0.0777435302734375, 0.10675048828125, 0.1357574462890625, 0.164764404296875, 0.1937713623046875, 0.2227783203125, 0.2517852783203125, 0.280792236328125, 0.3097991943359375, 0.33880615234375, 0.3678131103515625, 0.396820068359375, 0.4258270263671875, 0.454833984375, 0.4838409423828125, 0.512847900390625, 0.5418548583984375, 0.57086181640625, 0.5998687744140625, 0.628875732421875, 0.6578826904296875, 0.6868896484375, 0.7158966064453125, 0.744903564453125, 0.7739105224609375, 0.80291748046875, 0.8319244384765625, 0.860931396484375, 0.8899383544921875, 0.9189453125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 11.0, 13.0, 16.0, 21.0, 28.0, 57.0, 53.0, 68.0, 108.0, 166.0, 197.0, 300.0, 406.0, 626.0, 978.0, 1416.0, 2242.0, 3794.0, 6802.0, 13340.0, 30331.0, 88682.0, 526553.0, 264531.0, 58700.0, 23025.0, 10853.0, 5768.0, 3224.0, 2068.0, 1318.0, 873.0, 615.0, 413.0, 287.0, 181.0, 136.0, 106.0, 60.0, 58.0, 34.0, 27.0, 20.0, 15.0, 7.0, 1.0, 12.0, 0.0, 5.0, 0.0, 1.0, 2.0, 3.0], "bins": [-2.849609375, -2.765380859375, -2.68115234375, -2.596923828125, -2.5126953125, -2.428466796875, -2.34423828125, -2.260009765625, -2.17578125, -2.091552734375, -2.00732421875, -1.923095703125, -1.8388671875, -1.754638671875, -1.67041015625, -1.586181640625, -1.501953125, -1.417724609375, -1.33349609375, -1.249267578125, -1.1650390625, -1.080810546875, -0.99658203125, -0.912353515625, -0.828125, -0.743896484375, -0.65966796875, -0.575439453125, -0.4912109375, -0.406982421875, -0.32275390625, -0.238525390625, -0.154296875, -0.070068359375, 0.01416015625, 0.098388671875, 0.1826171875, 0.266845703125, 0.35107421875, 0.435302734375, 0.51953125, 0.603759765625, 0.68798828125, 0.772216796875, 0.8564453125, 0.940673828125, 1.02490234375, 1.109130859375, 1.193359375, 1.277587890625, 1.36181640625, 1.446044921875, 1.5302734375, 1.614501953125, 1.69873046875, 1.782958984375, 1.8671875, 1.951416015625, 2.03564453125, 2.119873046875, 2.2041015625, 2.288330078125, 2.37255859375, 2.456787109375, 2.541015625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 5.0, 7.0, 6.0, 11.0, 13.0, 4.0, 8.0, 20.0, 15.0, 26.0, 11.0, 18.0, 26.0, 34.0, 35.0, 43.0, 41.0, 31.0, 48.0, 35.0, 45.0, 43.0, 48.0, 41.0, 42.0, 39.0, 41.0, 38.0, 26.0, 22.0, 24.0, 19.0, 20.0, 14.0, 12.0, 14.0, 17.0, 12.0, 10.0, 4.0, 5.0, 1.0, 5.0, 1.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.6513671875, -0.63006591796875, -0.6087646484375, -0.58746337890625, -0.566162109375, -0.54486083984375, -0.5235595703125, -0.50225830078125, -0.48095703125, -0.45965576171875, -0.4383544921875, -0.41705322265625, -0.395751953125, -0.37445068359375, -0.3531494140625, -0.33184814453125, -0.310546875, -0.28924560546875, -0.2679443359375, -0.24664306640625, -0.225341796875, -0.20404052734375, -0.1827392578125, -0.16143798828125, -0.14013671875, -0.11883544921875, -0.0975341796875, -0.07623291015625, -0.054931640625, -0.03363037109375, -0.0123291015625, 0.00897216796875, 0.0302734375, 0.05157470703125, 0.0728759765625, 0.09417724609375, 0.115478515625, 0.13677978515625, 0.1580810546875, 0.17938232421875, 0.20068359375, 0.22198486328125, 0.2432861328125, 0.26458740234375, 0.285888671875, 0.30718994140625, 0.3284912109375, 0.34979248046875, 0.37109375, 0.39239501953125, 0.4136962890625, 0.43499755859375, 0.456298828125, 0.47760009765625, 0.4989013671875, 0.52020263671875, 0.54150390625, 0.56280517578125, 0.5841064453125, 0.60540771484375, 0.626708984375, 0.64801025390625, 0.6693115234375, 0.69061279296875, 0.7119140625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 6.0, 6.0, 9.0, 11.0, 9.0, 12.0, 25.0, 53.0, 67.0, 112.0, 192.0, 326.0, 714.0, 1457.0, 4337.0, 19662.0, 968420.0, 43314.0, 5941.0, 2007.0, 859.0, 420.0, 212.0, 114.0, 73.0, 60.0, 38.0, 17.0, 22.0, 17.0, 13.0, 9.0, 3.0, 4.0, 4.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.6875, -13.2408447265625, -12.794189453125, -12.3475341796875, -11.90087890625, -11.4542236328125, -11.007568359375, -10.5609130859375, -10.1142578125, -9.6676025390625, -9.220947265625, -8.7742919921875, -8.32763671875, -7.8809814453125, -7.434326171875, -6.9876708984375, -6.541015625, -6.0943603515625, -5.647705078125, -5.2010498046875, -4.75439453125, -4.3077392578125, -3.861083984375, -3.4144287109375, -2.9677734375, -2.5211181640625, -2.074462890625, -1.6278076171875, -1.18115234375, -0.7344970703125, -0.287841796875, 0.1588134765625, 0.60546875, 1.0521240234375, 1.498779296875, 1.9454345703125, 2.39208984375, 2.8387451171875, 3.285400390625, 3.7320556640625, 4.1787109375, 4.6253662109375, 5.072021484375, 5.5186767578125, 5.96533203125, 6.4119873046875, 6.858642578125, 7.3052978515625, 7.751953125, 8.1986083984375, 8.645263671875, 9.0919189453125, 9.53857421875, 9.9852294921875, 10.431884765625, 10.8785400390625, 11.3251953125, 11.7718505859375, 12.218505859375, 12.6651611328125, 13.11181640625, 13.5584716796875, 14.005126953125, 14.4517822265625, 14.8984375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 3.0, 5.0, 10.0, 18.0, 13.0, 22.0, 39.0, 64.0, 126.0, 240.0, 183.0, 95.0, 49.0, 47.0, 21.0, 18.0, 8.0, 11.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.818771362304688e-05, -6.436929106712341e-05, -6.055086851119995e-05, -5.673244595527649e-05, -5.291402339935303e-05, -4.9095600843429565e-05, -4.5277178287506104e-05, -4.145875573158264e-05, -3.764033317565918e-05, -3.382191061973572e-05, -3.0003488063812256e-05, -2.6185065507888794e-05, -2.2366642951965332e-05, -1.854822039604187e-05, -1.4729797840118408e-05, -1.0911375284194946e-05, -7.092952728271484e-06, -3.2745301723480225e-06, 5.438923835754395e-07, 4.362314939498901e-06, 8.180737495422363e-06, 1.1999160051345825e-05, 1.5817582607269287e-05, 1.963600516319275e-05, 2.345442771911621e-05, 2.7272850275039673e-05, 3.1091272830963135e-05, 3.49096953868866e-05, 3.872811794281006e-05, 4.254654049873352e-05, 4.636496305465698e-05, 5.0183385610580444e-05, 5.4001808166503906e-05, 5.782023072242737e-05, 6.163865327835083e-05, 6.545707583427429e-05, 6.927549839019775e-05, 7.309392094612122e-05, 7.691234350204468e-05, 8.073076605796814e-05, 8.45491886138916e-05, 8.836761116981506e-05, 9.218603372573853e-05, 9.600445628166199e-05, 9.982287883758545e-05, 0.00010364130139350891, 0.00010745972394943237, 0.00011127814650535583, 0.0001150965690612793, 0.00011891499161720276, 0.00012273341417312622, 0.00012655183672904968, 0.00013037025928497314, 0.0001341886818408966, 0.00013800710439682007, 0.00014182552695274353, 0.000145643949508667, 0.00014946237206459045, 0.00015328079462051392, 0.00015709921717643738, 0.00016091763973236084, 0.0001647360622882843, 0.00016855448484420776, 0.00017237290740013123, 0.0001761913299560547]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 15.0, 13.0, 25.0, 24.0, 98.0, 1472.0, 1045507.0, 1188.0, 73.0, 38.0, 19.0, 12.0, 5.0, 12.0, 4.0, 6.0, 4.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.375, -69.919921875, -67.46484375, -65.009765625, -62.5546875, -60.099609375, -57.64453125, -55.189453125, -52.734375, -50.279296875, -47.82421875, -45.369140625, -42.9140625, -40.458984375, -38.00390625, -35.548828125, -33.09375, -30.638671875, -28.18359375, -25.728515625, -23.2734375, -20.818359375, -18.36328125, -15.908203125, -13.453125, -10.998046875, -8.54296875, -6.087890625, -3.6328125, -1.177734375, 1.27734375, 3.732421875, 6.1875, 8.642578125, 11.09765625, 13.552734375, 16.0078125, 18.462890625, 20.91796875, 23.373046875, 25.828125, 28.283203125, 30.73828125, 33.193359375, 35.6484375, 38.103515625, 40.55859375, 43.013671875, 45.46875, 47.923828125, 50.37890625, 52.833984375, 55.2890625, 57.744140625, 60.19921875, 62.654296875, 65.109375, 67.564453125, 70.01953125, 72.474609375, 74.9296875, 77.384765625, 79.83984375, 82.294921875, 84.75]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 10.0, 12.0, 16.0, 13.0, 15.0, 51.0, 107.0, 522.0, 106.0, 38.0, 26.0, 15.0, 12.0, 5.0, 10.0, 4.0, 5.0, 5.0, 9.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1484375, -2.0755615234375, -2.002685546875, -1.9298095703125, -1.85693359375, -1.7840576171875, -1.711181640625, -1.6383056640625, -1.5654296875, -1.4925537109375, -1.419677734375, -1.3468017578125, -1.27392578125, -1.2010498046875, -1.128173828125, -1.0552978515625, -0.982421875, -0.9095458984375, -0.836669921875, -0.7637939453125, -0.69091796875, -0.6180419921875, -0.545166015625, -0.4722900390625, -0.3994140625, -0.3265380859375, -0.253662109375, -0.1807861328125, -0.10791015625, -0.0350341796875, 0.037841796875, 0.1107177734375, 0.18359375, 0.2564697265625, 0.329345703125, 0.4022216796875, 0.47509765625, 0.5479736328125, 0.620849609375, 0.6937255859375, 0.7666015625, 0.8394775390625, 0.912353515625, 0.9852294921875, 1.05810546875, 1.1309814453125, 1.203857421875, 1.2767333984375, 1.349609375, 1.4224853515625, 1.495361328125, 1.5682373046875, 1.64111328125, 1.7139892578125, 1.786865234375, 1.8597412109375, 1.9326171875, 2.0054931640625, 2.078369140625, 2.1512451171875, 2.22412109375, 2.2969970703125, 2.369873046875, 2.4427490234375, 2.515625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 9.0, 47.0, 325.0, 529.0, 93.0, 14.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3648936748504639, -1.0398458242416382, -0.7147979140281677, -0.38975000381469727, -0.06470215320587158, 0.2603456974029541, 0.5853936672210693, 0.9104413986206055, 1.2354893684387207, 1.5605372190475464, 1.885585069656372, 2.2106330394744873, 2.5356807708740234, 2.8607287406921387, 3.185776710510254, 3.51082444190979, 3.8358724117279053, 4.160920143127441, 4.485968112945557, 4.811016082763672, 5.136064052581787, 5.461112022399902, 5.786159515380859, 6.111207485198975, 6.43625545501709, 6.761303424835205, 7.08635139465332, 7.411398887634277, 7.736446857452393, 8.061494827270508, 8.386543273925781, 8.711590766906738, 9.036639213562012, 9.361686706542969, 9.686735153198242, 10.0117826461792, 10.336831092834473, 10.66187858581543, 10.986927032470703, 11.31197452545166, 11.637022018432617, 11.962069511413574, 12.287117958068848, 12.612165451049805, 12.937213897705078, 13.262261390686035, 13.587308883666992, 13.912357330322266, 14.237405776977539, 14.562453269958496, 14.88750171661377, 15.212549209594727, 15.53759765625, 15.862645149230957, 16.187692642211914, 16.512741088867188, 16.837787628173828, 17.1628360748291, 17.487882614135742, 17.812931060791016, 18.13797950744629, 18.463027954101562, 18.788074493408203, 19.113122940063477, 19.43817138671875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 7.0, 8.0, 18.0, 18.0, 13.0, 17.0, 15.0, 28.0, 42.0, 47.0, 36.0, 37.0, 37.0, 36.0, 45.0, 49.0, 40.0, 42.0, 37.0, 45.0, 32.0, 27.0, 34.0, 45.0, 42.0, 30.0, 27.0, 19.0, 21.0, 19.0, 13.0, 10.0, 12.0, 7.0, 6.0, 4.0, 2.0, 9.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.245413899421692, -1.2084311246871948, -1.1714483499526978, -1.1344655752182007, -1.0974828004837036, -1.0605000257492065, -1.0235172510147095, -0.9865344166755676, -0.9495516419410706, -0.9125688672065735, -0.8755860924720764, -0.8386033177375793, -0.8016204833984375, -0.7646377086639404, -0.7276549339294434, -0.6906721591949463, -0.6536893844604492, -0.6167066097259521, -0.5797238349914551, -0.542741060256958, -0.5057582855224609, -0.4687754809856415, -0.431792676448822, -0.39480990171432495, -0.3578271269798279, -0.3208443522453308, -0.28386157751083374, -0.24687877297401428, -0.2098959982395172, -0.17291322350502014, -0.13593043386936188, -0.09894764423370361, -0.06196486949920654, -0.024982087314128876, 0.012000694870948792, 0.04898347705602646, 0.08596625924110413, 0.1229490339756012, 0.15993182361125946, 0.19691461324691772, 0.2338973879814148, 0.27088016271591187, 0.30786293745040894, 0.3448457419872284, 0.38182851672172546, 0.41881129145622253, 0.455794095993042, 0.49277687072753906, 0.5297596454620361, 0.5667424201965332, 0.6037251949310303, 0.6407079696655273, 0.6776907444000244, 0.7146735191345215, 0.7516563534736633, 0.7886391282081604, 0.8256219029426575, 0.8626046776771545, 0.8995874524116516, 0.9365702271461487, 0.9735530614852905, 1.0105358362197876, 1.0475186109542847, 1.0845013856887817, 1.1214841604232788]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 16.0, 24.0, 31.0, 63.0, 77.0, 137.0, 225.0, 386.0, 653.0, 1165.0, 2238.0, 4454.0, 10019.0, 26552.0, 83690.0, 316790.0, 419809.0, 120979.0, 36202.0, 13393.0, 5608.0, 2804.0, 1368.0, 723.0, 463.0, 247.0, 151.0, 78.0, 64.0, 45.0, 29.0, 15.0, 13.0, 11.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.2265625, -5.08953857421875, -4.9525146484375, -4.81549072265625, -4.678466796875, -4.54144287109375, -4.4044189453125, -4.26739501953125, -4.13037109375, -3.99334716796875, -3.8563232421875, -3.71929931640625, -3.582275390625, -3.44525146484375, -3.3082275390625, -3.17120361328125, -3.0341796875, -2.89715576171875, -2.7601318359375, -2.62310791015625, -2.486083984375, -2.34906005859375, -2.2120361328125, -2.07501220703125, -1.93798828125, -1.80096435546875, -1.6639404296875, -1.52691650390625, -1.389892578125, -1.25286865234375, -1.1158447265625, -0.97882080078125, -0.841796875, -0.70477294921875, -0.5677490234375, -0.43072509765625, -0.293701171875, -0.15667724609375, -0.0196533203125, 0.11737060546875, 0.25439453125, 0.39141845703125, 0.5284423828125, 0.66546630859375, 0.802490234375, 0.93951416015625, 1.0765380859375, 1.21356201171875, 1.3505859375, 1.48760986328125, 1.6246337890625, 1.76165771484375, 1.898681640625, 2.03570556640625, 2.1727294921875, 2.30975341796875, 2.44677734375, 2.58380126953125, 2.7208251953125, 2.85784912109375, 2.994873046875, 3.13189697265625, 3.2689208984375, 3.40594482421875, 3.54296875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 4.0, 12.0, 14.0, 19.0, 25.0, 23.0, 45.0, 37.0, 58.0, 56.0, 65.0, 58.0, 54.0, 49.0, 65.0, 58.0, 35.0, 53.0, 54.0, 46.0, 37.0, 30.0, 21.0, 21.0, 14.0, 12.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1982421875, -1.15106201171875, -1.1038818359375, -1.05670166015625, -1.009521484375, -0.96234130859375, -0.9151611328125, -0.86798095703125, -0.82080078125, -0.77362060546875, -0.7264404296875, -0.67926025390625, -0.632080078125, -0.58489990234375, -0.5377197265625, -0.49053955078125, -0.443359375, -0.39617919921875, -0.3489990234375, -0.30181884765625, -0.254638671875, -0.20745849609375, -0.1602783203125, -0.11309814453125, -0.06591796875, -0.01873779296875, 0.0284423828125, 0.07562255859375, 0.122802734375, 0.16998291015625, 0.2171630859375, 0.26434326171875, 0.3115234375, 0.35870361328125, 0.4058837890625, 0.45306396484375, 0.500244140625, 0.54742431640625, 0.5946044921875, 0.64178466796875, 0.68896484375, 0.73614501953125, 0.7833251953125, 0.83050537109375, 0.877685546875, 0.92486572265625, 0.9720458984375, 1.01922607421875, 1.06640625, 1.11358642578125, 1.1607666015625, 1.20794677734375, 1.255126953125, 1.30230712890625, 1.3494873046875, 1.39666748046875, 1.44384765625, 1.49102783203125, 1.5382080078125, 1.58538818359375, 1.632568359375, 1.67974853515625, 1.7269287109375, 1.77410888671875, 1.8212890625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 6.0, 5.0, 3.0, 2.0, 8.0, 14.0, 9.0, 18.0, 28.0, 30.0, 27.0, 43.0, 43.0, 69.0, 135.0, 798.0, 8593.0, 337118.0, 683606.0, 16230.0, 1214.0, 219.0, 72.0, 55.0, 34.0, 43.0, 21.0, 36.0, 19.0, 12.0, 12.0, 10.0, 13.0, 4.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.73974609375, -11.3623046875, -10.98486328125, -10.607421875, -10.22998046875, -9.8525390625, -9.47509765625, -9.09765625, -8.72021484375, -8.3427734375, -7.96533203125, -7.587890625, -7.21044921875, -6.8330078125, -6.45556640625, -6.078125, -5.70068359375, -5.3232421875, -4.94580078125, -4.568359375, -4.19091796875, -3.8134765625, -3.43603515625, -3.05859375, -2.68115234375, -2.3037109375, -1.92626953125, -1.548828125, -1.17138671875, -0.7939453125, -0.41650390625, -0.0390625, 0.33837890625, 0.7158203125, 1.09326171875, 1.470703125, 1.84814453125, 2.2255859375, 2.60302734375, 2.98046875, 3.35791015625, 3.7353515625, 4.11279296875, 4.490234375, 4.86767578125, 5.2451171875, 5.62255859375, 6.0, 6.37744140625, 6.7548828125, 7.13232421875, 7.509765625, 7.88720703125, 8.2646484375, 8.64208984375, 9.01953125, 9.39697265625, 9.7744140625, 10.15185546875, 10.529296875, 10.90673828125, 11.2841796875, 11.66162109375, 12.0390625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 5.0, 5.0, 5.0, 16.0, 16.0, 20.0, 22.0, 24.0, 28.0, 31.0, 40.0, 38.0, 57.0, 47.0, 53.0, 59.0, 73.0, 61.0, 53.0, 52.0, 55.0, 38.0, 47.0, 35.0, 29.0, 20.0, 20.0, 17.0, 13.0, 10.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6328125, -1.583343505859375, -1.53387451171875, -1.484405517578125, -1.4349365234375, -1.385467529296875, -1.33599853515625, -1.286529541015625, -1.237060546875, -1.187591552734375, -1.13812255859375, -1.088653564453125, -1.0391845703125, -0.989715576171875, -0.94024658203125, -0.890777587890625, -0.84130859375, -0.791839599609375, -0.74237060546875, -0.692901611328125, -0.6434326171875, -0.593963623046875, -0.54449462890625, -0.495025634765625, -0.445556640625, -0.396087646484375, -0.34661865234375, -0.297149658203125, -0.2476806640625, -0.198211669921875, -0.14874267578125, -0.099273681640625, -0.0498046875, -0.000335693359375, 0.04913330078125, 0.098602294921875, 0.1480712890625, 0.197540283203125, 0.24700927734375, 0.296478271484375, 0.345947265625, 0.395416259765625, 0.44488525390625, 0.494354248046875, 0.5438232421875, 0.593292236328125, 0.64276123046875, 0.692230224609375, 0.74169921875, 0.791168212890625, 0.84063720703125, 0.890106201171875, 0.9395751953125, 0.989044189453125, 1.03851318359375, 1.087982177734375, 1.137451171875, 1.186920166015625, 1.23638916015625, 1.285858154296875, 1.3353271484375, 1.384796142578125, 1.43426513671875, 1.483734130859375, 1.533203125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 1.0, 7.0, 6.0, 13.0, 16.0, 25.0, 44.0, 77.0, 175.0, 539.0, 1278.0, 3435.0, 14047.0, 130454.0, 853302.0, 35357.0, 6370.0, 2072.0, 753.0, 303.0, 118.0, 71.0, 35.0, 12.0, 9.0, 9.0, 2.0, 2.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.015625, -0.98089599609375, -0.9461669921875, -0.91143798828125, -0.876708984375, -0.84197998046875, -0.8072509765625, -0.77252197265625, -0.73779296875, -0.70306396484375, -0.6683349609375, -0.63360595703125, -0.598876953125, -0.56414794921875, -0.5294189453125, -0.49468994140625, -0.4599609375, -0.42523193359375, -0.3905029296875, -0.35577392578125, -0.321044921875, -0.28631591796875, -0.2515869140625, -0.21685791015625, -0.18212890625, -0.14739990234375, -0.1126708984375, -0.07794189453125, -0.043212890625, -0.00848388671875, 0.0262451171875, 0.06097412109375, 0.095703125, 0.13043212890625, 0.1651611328125, 0.19989013671875, 0.234619140625, 0.26934814453125, 0.3040771484375, 0.33880615234375, 0.37353515625, 0.40826416015625, 0.4429931640625, 0.47772216796875, 0.512451171875, 0.54718017578125, 0.5819091796875, 0.61663818359375, 0.6513671875, 0.68609619140625, 0.7208251953125, 0.75555419921875, 0.790283203125, 0.82501220703125, 0.8597412109375, 0.89447021484375, 0.92919921875, 0.96392822265625, 0.9986572265625, 1.03338623046875, 1.068115234375, 1.10284423828125, 1.1375732421875, 1.17230224609375, 1.20703125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 6.0, 3.0, 6.0, 20.0, 11.0, 25.0, 48.0, 65.0, 103.0, 306.0, 191.0, 83.0, 46.0, 36.0, 12.0, 9.0, 11.0, 5.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.194280624389648e-05, -6.878841668367386e-05, -6.563402712345123e-05, -6.247963756322861e-05, -5.932524800300598e-05, -5.6170858442783356e-05, -5.301646888256073e-05, -4.9862079322338104e-05, -4.670768976211548e-05, -4.355330020189285e-05, -4.039891064167023e-05, -3.72445210814476e-05, -3.4090131521224976e-05, -3.093574196100235e-05, -2.7781352400779724e-05, -2.46269628405571e-05, -2.1472573280334473e-05, -1.8318183720111847e-05, -1.5163794159889221e-05, -1.2009404599666595e-05, -8.85501503944397e-06, -5.700625479221344e-06, -2.5462359189987183e-06, 6.081536412239075e-07, 3.762543201446533e-06, 6.916932761669159e-06, 1.0071322321891785e-05, 1.322571188211441e-05, 1.6380101442337036e-05, 1.9534491002559662e-05, 2.2688880562782288e-05, 2.5843270123004913e-05, 2.899765968322754e-05, 3.2152049243450165e-05, 3.530643880367279e-05, 3.8460828363895416e-05, 4.161521792411804e-05, 4.476960748434067e-05, 4.7923997044563293e-05, 5.107838660478592e-05, 5.4232776165008545e-05, 5.738716572523117e-05, 6.0541555285453796e-05, 6.369594484567642e-05, 6.685033440589905e-05, 7.000472396612167e-05, 7.31591135263443e-05, 7.631350308656693e-05, 7.946789264678955e-05, 8.262228220701218e-05, 8.57766717672348e-05, 8.893106132745743e-05, 9.208545088768005e-05, 9.523984044790268e-05, 9.83942300081253e-05, 0.00010154861956834793, 0.00010470300912857056, 0.00010785739868879318, 0.00011101178824901581, 0.00011416617780923843, 0.00011732056736946106, 0.00012047495692968369, 0.0001236293464899063, 0.00012678373605012894, 0.00012993812561035156]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 4.0, 5.0, 9.0, 16.0, 23.0, 80.0, 520.0, 27338.0, 1018268.0, 2006.0, 192.0, 47.0, 11.0, 7.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.8515625, -4.717620849609375, -4.58367919921875, -4.449737548828125, -4.3157958984375, -4.181854248046875, -4.04791259765625, -3.913970947265625, -3.780029296875, -3.646087646484375, -3.51214599609375, -3.378204345703125, -3.2442626953125, -3.110321044921875, -2.97637939453125, -2.842437744140625, -2.70849609375, -2.574554443359375, -2.44061279296875, -2.306671142578125, -2.1727294921875, -2.038787841796875, -1.90484619140625, -1.770904541015625, -1.636962890625, -1.503021240234375, -1.36907958984375, -1.235137939453125, -1.1011962890625, -0.967254638671875, -0.83331298828125, -0.699371337890625, -0.5654296875, -0.431488037109375, -0.29754638671875, -0.163604736328125, -0.0296630859375, 0.104278564453125, 0.23822021484375, 0.372161865234375, 0.506103515625, 0.640045166015625, 0.77398681640625, 0.907928466796875, 1.0418701171875, 1.175811767578125, 1.30975341796875, 1.443695068359375, 1.57763671875, 1.711578369140625, 1.84552001953125, 1.979461669921875, 2.1134033203125, 2.247344970703125, 2.38128662109375, 2.515228271484375, 2.649169921875, 2.783111572265625, 2.91705322265625, 3.050994873046875, 3.1849365234375, 3.318878173828125, 3.45281982421875, 3.586761474609375, 3.720703125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 7.0, 4.0, 7.0, 12.0, 33.0, 48.0, 142.0, 522.0, 105.0, 49.0, 25.0, 10.0, 9.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.52734375, -0.512847900390625, -0.49835205078125, -0.483856201171875, -0.4693603515625, -0.454864501953125, -0.44036865234375, -0.425872802734375, -0.411376953125, -0.396881103515625, -0.38238525390625, -0.367889404296875, -0.3533935546875, -0.338897705078125, -0.32440185546875, -0.309906005859375, -0.29541015625, -0.280914306640625, -0.26641845703125, -0.251922607421875, -0.2374267578125, -0.222930908203125, -0.20843505859375, -0.193939208984375, -0.179443359375, -0.164947509765625, -0.15045166015625, -0.135955810546875, -0.1214599609375, -0.106964111328125, -0.09246826171875, -0.077972412109375, -0.0634765625, -0.048980712890625, -0.03448486328125, -0.019989013671875, -0.0054931640625, 0.009002685546875, 0.02349853515625, 0.037994384765625, 0.052490234375, 0.066986083984375, 0.08148193359375, 0.095977783203125, 0.1104736328125, 0.124969482421875, 0.13946533203125, 0.153961181640625, 0.16845703125, 0.182952880859375, 0.19744873046875, 0.211944580078125, 0.2264404296875, 0.240936279296875, 0.25543212890625, 0.269927978515625, 0.284423828125, 0.298919677734375, 0.31341552734375, 0.327911376953125, 0.3424072265625, 0.356903076171875, 0.37139892578125, 0.385894775390625, 0.400390625]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 10.0, 54.0, 366.0, 519.0, 58.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.349918842315674, -5.084228038787842, -4.81853723526001, -4.552846431732178, -4.287155628204346, -4.021464824676514, -3.7557740211486816, -3.4900832176208496, -3.2243924140930176, -2.9587016105651855, -2.6930108070373535, -2.4273200035095215, -2.1616291999816895, -1.8959383964538574, -1.6302475929260254, -1.3645567893981934, -1.0988659858703613, -0.8331751823425293, -0.5674843788146973, -0.30179357528686523, -0.0361027717590332, 0.22958803176879883, 0.49527883529663086, 0.7609696388244629, 1.026660442352295, 1.292351245880127, 1.558042049407959, 1.823732852935791, 2.089423656463623, 2.355114459991455, 2.620805263519287, 2.886496067047119, 3.152186393737793, 3.417877197265625, 3.683568000793457, 3.949258804321289, 4.214949607849121, 4.480640411376953, 4.746331214904785, 5.012022018432617, 5.277712821960449, 5.543403625488281, 5.809094429016113, 6.074785232543945, 6.340476036071777, 6.606166839599609, 6.871857643127441, 7.137548446655273, 7.4032392501831055, 7.6689300537109375, 7.9346208572387695, 8.200311660766602, 8.466002464294434, 8.731693267822266, 8.997384071350098, 9.26307487487793, 9.528765678405762, 9.794456481933594, 10.060147285461426, 10.325838088989258, 10.59152889251709, 10.857219696044922, 11.122910499572754, 11.388601303100586, 11.654292106628418]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 3.0, 4.0, 11.0, 15.0, 12.0, 19.0, 13.0, 22.0, 32.0, 18.0, 39.0, 25.0, 43.0, 37.0, 35.0, 47.0, 48.0, 44.0, 39.0, 46.0, 38.0, 37.0, 42.0, 45.0, 25.0, 42.0, 30.0, 23.0, 33.0, 27.0, 21.0, 13.0, 16.0, 12.0, 7.0, 7.0, 9.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.332074522972107, -1.2864357233047485, -1.2407970428466797, -1.1951582431793213, -1.149519443511963, -1.1038806438446045, -1.0582419633865356, -1.0126031637191772, -0.9669644236564636, -0.92132568359375, -0.8756868839263916, -0.830048143863678, -0.7844094038009644, -0.738770604133606, -0.6931318640708923, -0.6474931240081787, -0.6018543243408203, -0.5562155842781067, -0.5105767846107483, -0.46493804454803467, -0.41929927468299866, -0.37366050481796265, -0.328021764755249, -0.282382994890213, -0.236744225025177, -0.191105455160141, -0.14546670019626617, -0.09982794523239136, -0.05418917536735535, -0.008550405502319336, 0.03708833456039429, 0.0827271044254303, 0.12836575508117676, 0.17400452494621277, 0.21964327991008759, 0.2652820348739624, 0.3109208047389984, 0.3565595746040344, 0.40219831466674805, 0.44783708453178406, 0.49347585439682007, 0.5391145944595337, 0.5847533941268921, 0.6303921341896057, 0.6760308742523193, 0.7216696739196777, 0.7673084139823914, 0.812947154045105, 0.8585859537124634, 0.904224693775177, 0.9498634934425354, 0.995502233505249, 1.0411410331726074, 1.0867798328399658, 1.1324185132980347, 1.178057312965393, 1.223695993423462, 1.2693347930908203, 1.3149734735488892, 1.3606122732162476, 1.406251072883606, 1.4518897533416748, 1.4975285530090332, 1.5431673526763916, 1.58880615234375]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [7.0, 3.0, 5.0, 7.0, 3.0, 11.0, 11.0, 14.0, 23.0, 31.0, 37.0, 53.0, 64.0, 72.0, 108.0, 184.0, 206.0, 296.0, 387.0, 654.0, 956.0, 1516.0, 2534.0, 4518.0, 8606.0, 19158.0, 77528.0, 3265632.0, 746557.0, 36289.0, 13342.0, 6286.0, 3311.0, 2031.0, 1152.0, 777.0, 544.0, 396.0, 268.0, 189.0, 152.0, 94.0, 75.0, 52.0, 49.0, 38.0, 21.0, 7.0, 6.0, 14.0, 11.0, 4.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7685546875, -1.7049102783203125, -1.641265869140625, -1.5776214599609375, -1.51397705078125, -1.4503326416015625, -1.386688232421875, -1.3230438232421875, -1.2593994140625, -1.1957550048828125, -1.132110595703125, -1.0684661865234375, -1.00482177734375, -0.9411773681640625, -0.877532958984375, -0.8138885498046875, -0.750244140625, -0.6865997314453125, -0.622955322265625, -0.5593109130859375, -0.49566650390625, -0.4320220947265625, -0.368377685546875, -0.3047332763671875, -0.2410888671875, -0.1774444580078125, -0.113800048828125, -0.0501556396484375, 0.01348876953125, 0.0771331787109375, 0.140777587890625, 0.2044219970703125, 0.26806640625, 0.3317108154296875, 0.395355224609375, 0.4589996337890625, 0.52264404296875, 0.5862884521484375, 0.649932861328125, 0.7135772705078125, 0.7772216796875, 0.8408660888671875, 0.904510498046875, 0.9681549072265625, 1.03179931640625, 1.0954437255859375, 1.159088134765625, 1.2227325439453125, 1.286376953125, 1.3500213623046875, 1.413665771484375, 1.4773101806640625, 1.54095458984375, 1.6045989990234375, 1.668243408203125, 1.7318878173828125, 1.7955322265625, 1.8591766357421875, 1.922821044921875, 1.9864654541015625, 2.05010986328125, 2.1137542724609375, 2.177398681640625, 2.2410430908203125, 2.3046875]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 6.0, 5.0, 6.0, 14.0, 10.0, 7.0, 14.0, 25.0, 21.0, 26.0, 25.0, 30.0, 38.0, 30.0, 38.0, 46.0, 35.0, 46.0, 48.0, 41.0, 41.0, 47.0, 37.0, 37.0, 38.0, 39.0, 30.0, 31.0, 29.0, 35.0, 15.0, 17.0, 14.0, 19.0, 15.0, 11.0, 7.0, 4.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56689453125, -0.5489120483398438, -0.5309295654296875, -0.5129470825195312, -0.494964599609375, -0.47698211669921875, -0.4589996337890625, -0.44101715087890625, -0.42303466796875, -0.40505218505859375, -0.3870697021484375, -0.36908721923828125, -0.351104736328125, -0.33312225341796875, -0.3151397705078125, -0.29715728759765625, -0.2791748046875, -0.26119232177734375, -0.2432098388671875, -0.22522735595703125, -0.207244873046875, -0.18926239013671875, -0.1712799072265625, -0.15329742431640625, -0.13531494140625, -0.11733245849609375, -0.0993499755859375, -0.08136749267578125, -0.063385009765625, -0.04540252685546875, -0.0274200439453125, -0.00943756103515625, 0.008544921875, 0.02652740478515625, 0.0445098876953125, 0.06249237060546875, 0.080474853515625, 0.09845733642578125, 0.1164398193359375, 0.13442230224609375, 0.15240478515625, 0.17038726806640625, 0.1883697509765625, 0.20635223388671875, 0.224334716796875, 0.24231719970703125, 0.2602996826171875, 0.27828216552734375, 0.2962646484375, 0.31424713134765625, 0.3322296142578125, 0.35021209716796875, 0.368194580078125, 0.38617706298828125, 0.4041595458984375, 0.42214202880859375, 0.44012451171875, 0.45810699462890625, 0.4760894775390625, 0.49407196044921875, 0.512054443359375, 0.5300369262695312, 0.5480194091796875, 0.5660018920898438, 0.583984375]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 16.0, 14.0, 22.0, 47.0, 131.0, 485.0, 13346.0, 4176384.0, 3325.0, 265.0, 93.0, 59.0, 25.0, 13.0, 17.0, 12.0, 7.0, 7.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2734375, -11.6988525390625, -11.124267578125, -10.5496826171875, -9.97509765625, -9.4005126953125, -8.825927734375, -8.2513427734375, -7.6767578125, -7.1021728515625, -6.527587890625, -5.9530029296875, -5.37841796875, -4.8038330078125, -4.229248046875, -3.6546630859375, -3.080078125, -2.5054931640625, -1.930908203125, -1.3563232421875, -0.78173828125, -0.2071533203125, 0.367431640625, 0.9420166015625, 1.5166015625, 2.0911865234375, 2.665771484375, 3.2403564453125, 3.81494140625, 4.3895263671875, 4.964111328125, 5.5386962890625, 6.11328125, 6.6878662109375, 7.262451171875, 7.8370361328125, 8.41162109375, 8.9862060546875, 9.560791015625, 10.1353759765625, 10.7099609375, 11.2845458984375, 11.859130859375, 12.4337158203125, 13.00830078125, 13.5828857421875, 14.157470703125, 14.7320556640625, 15.306640625, 15.8812255859375, 16.455810546875, 17.0303955078125, 17.60498046875, 18.1795654296875, 18.754150390625, 19.3287353515625, 19.9033203125, 20.4779052734375, 21.052490234375, 21.6270751953125, 22.20166015625, 22.7762451171875, 23.350830078125, 23.9254150390625, 24.5]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 15.0, 19.0, 23.0, 39.0, 65.0, 212.0, 1190.0, 1849.0, 396.0, 83.0, 54.0, 42.0, 17.0, 13.0, 16.0, 8.0, 8.0, 4.0, 5.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66650390625, -0.6400375366210938, -0.6135711669921875, -0.5871047973632812, -0.560638427734375, -0.5341720581054688, -0.5077056884765625, -0.48123931884765625, -0.45477294921875, -0.42830657958984375, -0.4018402099609375, -0.37537384033203125, -0.348907470703125, -0.32244110107421875, -0.2959747314453125, -0.26950836181640625, -0.2430419921875, -0.21657562255859375, -0.1901092529296875, -0.16364288330078125, -0.137176513671875, -0.11071014404296875, -0.0842437744140625, -0.05777740478515625, -0.03131103515625, -0.00484466552734375, 0.0216217041015625, 0.04808807373046875, 0.074554443359375, 0.10102081298828125, 0.1274871826171875, 0.15395355224609375, 0.180419921875, 0.20688629150390625, 0.2333526611328125, 0.25981903076171875, 0.286285400390625, 0.31275177001953125, 0.3392181396484375, 0.36568450927734375, 0.39215087890625, 0.41861724853515625, 0.4450836181640625, 0.47154998779296875, 0.498016357421875, 0.5244827270507812, 0.5509490966796875, 0.5774154663085938, 0.6038818359375, 0.6303482055664062, 0.6568145751953125, 0.6832809448242188, 0.709747314453125, 0.7362136840820312, 0.7626800537109375, 0.7891464233398438, 0.81561279296875, 0.8420791625976562, 0.8685455322265625, 0.8950119018554688, 0.921478271484375, 0.9479446411132812, 0.9744110107421875, 1.0008773803710938, 1.02734375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 2.0, 2.0, 3.0, 8.0, 18.0, 30.0, 45.0, 79.0, 113.0, 171.0, 210.0, 111.0, 80.0, 53.0, 18.0, 22.0, 13.0, 4.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0824494361877441, -1.0354136228561401, -0.9883776903152466, -0.9413418173789978, -0.894305944442749, -0.8472700715065002, -0.8002341985702515, -0.7531983852386475, -0.7061624526977539, -0.6591265797615051, -0.6120907068252563, -0.5650548338890076, -0.5180189609527588, -0.47098308801651, -0.4239472448825836, -0.37691137194633484, -0.32987552881240845, -0.28283965587615967, -0.2358037829399109, -0.1887679249048233, -0.14173205196857452, -0.09469617903232574, -0.04766032099723816, -0.0006244480609893799, 0.0464114248752594, 0.09344729781150818, 0.14048317074775696, 0.18751902878284454, 0.23455490171909332, 0.2815907597541809, 0.3286266326904297, 0.37566250562667847, 0.42269837856292725, 0.469734251499176, 0.5167701244354248, 0.5638059973716736, 0.6108418703079224, 0.6578777432441711, 0.7049136161804199, 0.7519494295120239, 0.7989853620529175, 0.8460212349891663, 0.893057107925415, 0.9400929808616638, 0.9871288537979126, 1.0341646671295166, 1.0812005996704102, 1.1282364130020142, 1.1752722263336182, 1.2223080396652222, 1.2693439722061157, 1.3163797855377197, 1.3634157180786133, 1.4104515314102173, 1.4574874639511108, 1.5045232772827148, 1.5515592098236084, 1.5985950231552124, 1.645630955696106, 1.69266676902771, 1.7397027015686035, 1.7867385149002075, 1.833774447441101, 1.880810260772705, 1.9278461933135986]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 4.0, 3.0, 11.0, 10.0, 7.0, 13.0, 12.0, 16.0, 11.0, 20.0, 15.0, 33.0, 35.0, 27.0, 33.0, 30.0, 29.0, 32.0, 36.0, 29.0, 42.0, 26.0, 32.0, 32.0, 36.0, 33.0, 30.0, 32.0, 42.0, 26.0, 24.0, 26.0, 33.0, 27.0, 25.0, 20.0, 19.0, 12.0, 14.0, 9.0, 8.0, 9.0, 6.0, 4.0, 4.0, 2.0, 5.0, 10.0, 3.0, 0.0, 1.0], "bins": [-0.7235569357872009, -0.7030559778213501, -0.6825549602508545, -0.6620539426803589, -0.6415529847145081, -0.6210520267486572, -0.6005510091781616, -0.580049991607666, -0.5595490336418152, -0.5390480756759644, -0.5185470581054688, -0.49804607033729553, -0.4775450825691223, -0.4570440948009491, -0.4365431070327759, -0.41604211926460266, -0.39554113149642944, -0.3750401437282562, -0.354539155960083, -0.3340381681919098, -0.3135371804237366, -0.29303619265556335, -0.27253520488739014, -0.2520342171192169, -0.2315332293510437, -0.21103224158287048, -0.19053125381469727, -0.17003026604652405, -0.14952927827835083, -0.1290282905101776, -0.1085273027420044, -0.08802631497383118, -0.06752532720565796, -0.04702433943748474, -0.026523351669311523, -0.006022363901138306, 0.014478623867034912, 0.03497961163520813, 0.05548059940338135, 0.07598158717155457, 0.09648257493972778, 0.116983562707901, 0.13748455047607422, 0.15798553824424744, 0.17848652601242065, 0.19898751378059387, 0.2194885015487671, 0.2399894893169403, 0.2604904770851135, 0.28099146485328674, 0.30149245262145996, 0.3219934403896332, 0.3424944281578064, 0.3629954159259796, 0.38349640369415283, 0.40399739146232605, 0.42449837923049927, 0.4449993669986725, 0.4655003547668457, 0.4860013425350189, 0.5065023303031921, 0.527003288269043, 0.5475043058395386, 0.5680053234100342, 0.588506281375885]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 9.0, 15.0, 20.0, 29.0, 46.0, 76.0, 126.0, 159.0, 209.0, 326.0, 470.0, 661.0, 947.0, 1404.0, 2085.0, 2997.0, 4418.0, 6891.0, 10573.0, 17338.0, 28605.0, 50458.0, 93121.0, 181770.0, 287712.0, 159475.0, 82601.0, 45284.0, 26011.0, 15399.0, 9779.0, 6383.0, 4212.0, 2792.0, 1887.0, 1291.0, 833.0, 645.0, 411.0, 304.0, 256.0, 156.0, 112.0, 80.0, 66.0, 32.0, 28.0, 16.0, 17.0, 10.0, 6.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6748046875, -1.6214752197265625, -1.568145751953125, -1.5148162841796875, -1.46148681640625, -1.4081573486328125, -1.354827880859375, -1.3014984130859375, -1.2481689453125, -1.1948394775390625, -1.141510009765625, -1.0881805419921875, -1.03485107421875, -0.9815216064453125, -0.928192138671875, -0.8748626708984375, -0.821533203125, -0.7682037353515625, -0.714874267578125, -0.6615447998046875, -0.60821533203125, -0.5548858642578125, -0.501556396484375, -0.4482269287109375, -0.3948974609375, -0.3415679931640625, -0.288238525390625, -0.2349090576171875, -0.18157958984375, -0.1282501220703125, -0.074920654296875, -0.0215911865234375, 0.03173828125, 0.0850677490234375, 0.138397216796875, 0.1917266845703125, 0.24505615234375, 0.2983856201171875, 0.351715087890625, 0.4050445556640625, 0.4583740234375, 0.5117034912109375, 0.565032958984375, 0.6183624267578125, 0.67169189453125, 0.7250213623046875, 0.778350830078125, 0.8316802978515625, 0.885009765625, 0.9383392333984375, 0.991668701171875, 1.0449981689453125, 1.09832763671875, 1.1516571044921875, 1.204986572265625, 1.2583160400390625, 1.3116455078125, 1.3649749755859375, 1.418304443359375, 1.4716339111328125, 1.52496337890625, 1.5782928466796875, 1.631622314453125, 1.6849517822265625, 1.73828125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 11.0, 7.0, 6.0, 9.0, 9.0, 11.0, 11.0, 6.0, 18.0, 11.0, 32.0, 30.0, 27.0, 28.0, 37.0, 22.0, 34.0, 41.0, 33.0, 33.0, 49.0, 28.0, 28.0, 33.0, 45.0, 31.0, 32.0, 35.0, 34.0, 36.0, 32.0, 26.0, 23.0, 24.0, 26.0, 16.0, 19.0, 13.0, 12.0, 11.0, 10.0, 6.0, 3.0, 2.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3564453125, -0.34601593017578125, -0.3355865478515625, -0.32515716552734375, -0.314727783203125, -0.30429840087890625, -0.2938690185546875, -0.28343963623046875, -0.27301025390625, -0.26258087158203125, -0.2521514892578125, -0.24172210693359375, -0.231292724609375, -0.22086334228515625, -0.2104339599609375, -0.20000457763671875, -0.1895751953125, -0.17914581298828125, -0.1687164306640625, -0.15828704833984375, -0.147857666015625, -0.13742828369140625, -0.1269989013671875, -0.11656951904296875, -0.10614013671875, -0.09571075439453125, -0.0852813720703125, -0.07485198974609375, -0.064422607421875, -0.05399322509765625, -0.0435638427734375, -0.03313446044921875, -0.022705078125, -0.01227569580078125, -0.0018463134765625, 0.00858306884765625, 0.019012451171875, 0.02944183349609375, 0.0398712158203125, 0.05030059814453125, 0.06072998046875, 0.07115936279296875, 0.0815887451171875, 0.09201812744140625, 0.102447509765625, 0.11287689208984375, 0.1233062744140625, 0.13373565673828125, 0.1441650390625, 0.15459442138671875, 0.1650238037109375, 0.17545318603515625, 0.185882568359375, 0.19631195068359375, 0.2067413330078125, 0.21717071533203125, 0.22760009765625, 0.23802947998046875, 0.2484588623046875, 0.25888824462890625, 0.269317626953125, 0.27974700927734375, 0.2901763916015625, 0.30060577392578125, 0.31103515625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 8.0, 13.0, 21.0, 31.0, 44.0, 54.0, 65.0, 100.0, 175.0, 227.0, 314.0, 452.0, 647.0, 985.0, 1556.0, 2419.0, 3668.0, 5859.0, 9741.0, 16580.0, 31261.0, 72732.0, 630074.0, 163689.0, 49129.0, 23720.0, 13188.0, 7905.0, 4805.0, 3148.0, 1947.0, 1276.0, 878.0, 555.0, 372.0, 262.0, 189.0, 128.0, 96.0, 54.0, 48.0, 40.0, 25.0, 18.0, 19.0, 10.0, 14.0, 6.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.8125, -2.721160888671875, -2.62982177734375, -2.538482666015625, -2.4471435546875, -2.355804443359375, -2.26446533203125, -2.173126220703125, -2.081787109375, -1.990447998046875, -1.89910888671875, -1.807769775390625, -1.7164306640625, -1.625091552734375, -1.53375244140625, -1.442413330078125, -1.35107421875, -1.259735107421875, -1.16839599609375, -1.077056884765625, -0.9857177734375, -0.894378662109375, -0.80303955078125, -0.711700439453125, -0.620361328125, -0.529022216796875, -0.43768310546875, -0.346343994140625, -0.2550048828125, -0.163665771484375, -0.07232666015625, 0.019012451171875, 0.1103515625, 0.201690673828125, 0.29302978515625, 0.384368896484375, 0.4757080078125, 0.567047119140625, 0.65838623046875, 0.749725341796875, 0.841064453125, 0.932403564453125, 1.02374267578125, 1.115081787109375, 1.2064208984375, 1.297760009765625, 1.38909912109375, 1.480438232421875, 1.57177734375, 1.663116455078125, 1.75445556640625, 1.845794677734375, 1.9371337890625, 2.028472900390625, 2.11981201171875, 2.211151123046875, 2.302490234375, 2.393829345703125, 2.48516845703125, 2.576507568359375, 2.6678466796875, 2.759185791015625, 2.85052490234375, 2.941864013671875, 3.033203125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 5.0, 9.0, 14.0, 12.0, 12.0, 13.0, 12.0, 18.0, 23.0, 22.0, 25.0, 25.0, 29.0, 40.0, 25.0, 27.0, 34.0, 32.0, 37.0, 47.0, 41.0, 30.0, 32.0, 30.0, 36.0, 36.0, 34.0, 33.0, 31.0, 31.0, 26.0, 28.0, 26.0, 12.0, 21.0, 21.0, 13.0, 12.0, 9.0, 9.0, 4.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.332275390625, -0.3222618103027344, -0.31224822998046875, -0.3022346496582031, -0.2922210693359375, -0.2822074890136719, -0.27219390869140625, -0.2621803283691406, -0.252166748046875, -0.24215316772460938, -0.23213958740234375, -0.22212600708007812, -0.2121124267578125, -0.20209884643554688, -0.19208526611328125, -0.18207168579101562, -0.17205810546875, -0.16204452514648438, -0.15203094482421875, -0.14201736450195312, -0.1320037841796875, -0.12199020385742188, -0.11197662353515625, -0.10196304321289062, -0.091949462890625, -0.08193588256835938, -0.07192230224609375, -0.061908721923828125, -0.0518951416015625, -0.041881561279296875, -0.03186798095703125, -0.021854400634765625, -0.0118408203125, -0.001827239990234375, 0.00818634033203125, 0.018199920654296875, 0.0282135009765625, 0.038227081298828125, 0.04824066162109375, 0.058254241943359375, 0.068267822265625, 0.07828140258789062, 0.08829498291015625, 0.09830856323242188, 0.1083221435546875, 0.11833572387695312, 0.12834930419921875, 0.13836288452148438, 0.14837646484375, 0.15839004516601562, 0.16840362548828125, 0.17841720581054688, 0.1884307861328125, 0.19844436645507812, 0.20845794677734375, 0.21847152709960938, 0.228485107421875, 0.23849868774414062, 0.24851226806640625, 0.2585258483886719, 0.2685394287109375, 0.2785530090332031, 0.28856658935546875, 0.2985801696777344, 0.30859375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 2.0, 7.0, 11.0, 13.0, 20.0, 15.0, 30.0, 25.0, 48.0, 61.0, 81.0, 96.0, 154.0, 203.0, 308.0, 429.0, 670.0, 1161.0, 2029.0, 4552.0, 13547.0, 94762.0, 897127.0, 20622.0, 6225.0, 2514.0, 1336.0, 808.0, 512.0, 335.0, 208.0, 151.0, 114.0, 99.0, 57.0, 53.0, 35.0, 25.0, 17.0, 24.0, 12.0, 11.0, 10.0, 6.0, 8.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.572265625, -3.45758056640625, -3.3428955078125, -3.22821044921875, -3.113525390625, -2.99884033203125, -2.8841552734375, -2.76947021484375, -2.65478515625, -2.54010009765625, -2.4254150390625, -2.31072998046875, -2.196044921875, -2.08135986328125, -1.9666748046875, -1.85198974609375, -1.7373046875, -1.62261962890625, -1.5079345703125, -1.39324951171875, -1.278564453125, -1.16387939453125, -1.0491943359375, -0.93450927734375, -0.81982421875, -0.70513916015625, -0.5904541015625, -0.47576904296875, -0.361083984375, -0.24639892578125, -0.1317138671875, -0.01702880859375, 0.09765625, 0.21234130859375, 0.3270263671875, 0.44171142578125, 0.556396484375, 0.67108154296875, 0.7857666015625, 0.90045166015625, 1.01513671875, 1.12982177734375, 1.2445068359375, 1.35919189453125, 1.473876953125, 1.58856201171875, 1.7032470703125, 1.81793212890625, 1.9326171875, 2.04730224609375, 2.1619873046875, 2.27667236328125, 2.391357421875, 2.50604248046875, 2.6207275390625, 2.73541259765625, 2.85009765625, 2.96478271484375, 3.0794677734375, 3.19415283203125, 3.308837890625, 3.42352294921875, 3.5382080078125, 3.65289306640625, 3.767578125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 10.0, 22.0, 23.0, 70.0, 305.0, 397.0, 89.0, 28.0, 15.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010353326797485352, -9.971018880605698e-05, -9.588710963726044e-05, -9.20640304684639e-05, -8.824095129966736e-05, -8.441787213087082e-05, -8.059479296207428e-05, -7.677171379327774e-05, -7.29486346244812e-05, -6.912555545568466e-05, -6.530247628688812e-05, -6.147939711809158e-05, -5.7656317949295044e-05, -5.3833238780498505e-05, -5.0010159611701965e-05, -4.6187080442905426e-05, -4.236400127410889e-05, -3.854092210531235e-05, -3.471784293651581e-05, -3.089476376771927e-05, -2.707168459892273e-05, -2.324860543012619e-05, -1.942552626132965e-05, -1.560244709253311e-05, -1.1779367923736572e-05, -7.956288754940033e-06, -4.133209586143494e-06, -3.1013041734695435e-07, 3.512948751449585e-06, 7.336027920246124e-06, 1.1159107089042664e-05, 1.4982186257839203e-05, 1.8805265426635742e-05, 2.262834459543228e-05, 2.645142376422882e-05, 3.027450293302536e-05, 3.40975821018219e-05, 3.792066127061844e-05, 4.174374043941498e-05, 4.556681960821152e-05, 4.938989877700806e-05, 5.3212977945804596e-05, 5.7036057114601135e-05, 6.0859136283397675e-05, 6.468221545219421e-05, 6.850529462099075e-05, 7.232837378978729e-05, 7.615145295858383e-05, 7.997453212738037e-05, 8.379761129617691e-05, 8.762069046497345e-05, 9.144376963376999e-05, 9.526684880256653e-05, 9.908992797136307e-05, 0.00010291300714015961, 0.00010673608630895615, 0.00011055916547775269, 0.00011438224464654922, 0.00011820532381534576, 0.0001220284029841423, 0.00012585148215293884, 0.00012967456132173538, 0.00013349764049053192, 0.00013732071965932846, 0.000141143798828125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 6.0, 4.0, 6.0, 10.0, 14.0, 42.0, 243.0, 2249.0, 1038733.0, 6649.0, 439.0, 71.0, 22.0, 13.0, 6.0, 3.0, 10.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.5625, -70.4072265625, -68.251953125, -66.0966796875, -63.94140625, -61.7861328125, -59.630859375, -57.4755859375, -55.3203125, -53.1650390625, -51.009765625, -48.8544921875, -46.69921875, -44.5439453125, -42.388671875, -40.2333984375, -38.078125, -35.9228515625, -33.767578125, -31.6123046875, -29.45703125, -27.3017578125, -25.146484375, -22.9912109375, -20.8359375, -18.6806640625, -16.525390625, -14.3701171875, -12.21484375, -10.0595703125, -7.904296875, -5.7490234375, -3.59375, -1.4384765625, 0.716796875, 2.8720703125, 5.02734375, 7.1826171875, 9.337890625, 11.4931640625, 13.6484375, 15.8037109375, 17.958984375, 20.1142578125, 22.26953125, 24.4248046875, 26.580078125, 28.7353515625, 30.890625, 33.0458984375, 35.201171875, 37.3564453125, 39.51171875, 41.6669921875, 43.822265625, 45.9775390625, 48.1328125, 50.2880859375, 52.443359375, 54.5986328125, 56.75390625, 58.9091796875, 61.064453125, 63.2197265625, 65.375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 8.0, 888.0, 66.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.263671875, -3.166778564453125, -3.06988525390625, -2.972991943359375, -2.8760986328125, -2.779205322265625, -2.68231201171875, -2.585418701171875, -2.488525390625, -2.391632080078125, -2.29473876953125, -2.197845458984375, -2.1009521484375, -2.004058837890625, -1.90716552734375, -1.810272216796875, -1.71337890625, -1.616485595703125, -1.51959228515625, -1.422698974609375, -1.3258056640625, -1.228912353515625, -1.13201904296875, -1.035125732421875, -0.938232421875, -0.841339111328125, -0.74444580078125, -0.647552490234375, -0.5506591796875, -0.453765869140625, -0.35687255859375, -0.259979248046875, -0.1630859375, -0.066192626953125, 0.03070068359375, 0.127593994140625, 0.2244873046875, 0.321380615234375, 0.41827392578125, 0.515167236328125, 0.612060546875, 0.708953857421875, 0.80584716796875, 0.902740478515625, 0.9996337890625, 1.096527099609375, 1.19342041015625, 1.290313720703125, 1.38720703125, 1.484100341796875, 1.58099365234375, 1.677886962890625, 1.7747802734375, 1.871673583984375, 1.96856689453125, 2.065460205078125, 2.162353515625, 2.259246826171875, 2.35614013671875, 2.453033447265625, 2.5499267578125, 2.646820068359375, 2.74371337890625, 2.840606689453125, 2.9375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 9.0, 27.0, 178.0, 655.0, 84.0, 29.0, 9.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.655416488647461, -9.42729377746582, -9.19917106628418, -8.971047401428223, -8.742924690246582, -8.514801979064941, -8.2866792678833, -8.058555603027344, -7.830432891845703, -7.6023101806640625, -7.374186992645264, -7.146064281463623, -6.917941093444824, -6.689818382263184, -6.461695671081543, -6.233572483062744, -6.0054497718811035, -5.777327060699463, -5.549203872680664, -5.321081161499023, -5.092957973480225, -4.864835262298584, -4.636712074279785, -4.4085893630981445, -4.180466651916504, -3.952343702316284, -3.7242207527160645, -3.496098041534424, -3.267974853515625, -3.0398521423339844, -2.8117291927337646, -2.583606243133545, -2.3554835319519043, -2.1273605823516846, -1.8992376327514648, -1.6711148023605347, -1.442991852760315, -1.2148689031600952, -0.986746072769165, -0.7586231231689453, -0.5305001735687256, -0.30237725377082825, -0.07425433397293091, 0.15386855602264404, 0.38199150562286377, 0.6101144552230835, 0.8382372856140137, 1.0663602352142334, 1.2944831848144531, 1.5226061344146729, 1.7507290840148926, 1.9788519144058228, 2.206974983215332, 2.4350976943969727, 2.6632206439971924, 2.891343593597412, 3.119466543197632, 3.3475894927978516, 3.5757124423980713, 3.803835391998291, 4.031958103179932, 4.2600812911987305, 4.488204002380371, 4.716326713562012, 4.9444499015808105]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 11.0, 15.0, 16.0, 20.0, 20.0, 30.0, 24.0, 34.0, 38.0, 39.0, 37.0, 42.0, 57.0, 47.0, 53.0, 55.0, 50.0, 51.0, 43.0, 45.0, 34.0, 40.0, 34.0, 39.0, 24.0, 26.0, 14.0, 12.0, 5.0, 8.0, 6.0, 5.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9778990149497986, -0.9487543106079102, -0.919609546661377, -0.8904648423194885, -0.8613201379776001, -0.8321753740310669, -0.8030306696891785, -0.77388596534729, -0.7447412014007568, -0.7155964970588684, -0.6864517331123352, -0.6573070287704468, -0.6281622648239136, -0.5990175604820251, -0.5698728561401367, -0.5407280921936035, -0.5115833878517151, -0.4824386537075043, -0.45329391956329346, -0.42414921522140503, -0.3950044810771942, -0.3658597469329834, -0.33671504259109497, -0.30757030844688416, -0.27842557430267334, -0.24928084015846252, -0.2201361209154129, -0.19099140167236328, -0.16184666752815247, -0.13270193338394165, -0.10355721414089203, -0.07441249489784241, -0.045267701148986816, -0.016122974455356598, 0.01302175223827362, 0.04216647893190384, 0.07131120562553406, 0.10045593976974487, 0.1296006590127945, 0.15874537825584412, 0.18789011240005493, 0.21703484654426575, 0.24617956578731537, 0.275324285030365, 0.3044690191745758, 0.3336137533187866, 0.36275845766067505, 0.39190319180488586, 0.4210479259490967, 0.4501926600933075, 0.4793373942375183, 0.5084820985794067, 0.5376268625259399, 0.5667715668678284, 0.5959162712097168, 0.62506103515625, 0.6542057394981384, 0.6833504438400269, 0.7124952077865601, 0.7416399121284485, 0.7707846164703369, 0.7999293804168701, 0.8290740847587585, 0.858218789100647, 0.8873635530471802]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 2.0, 6.0, 1.0, 7.0, 10.0, 4.0, 17.0, 11.0, 19.0, 18.0, 23.0, 23.0, 37.0, 61.0, 56.0, 113.0, 161.0, 302.0, 561.0, 1185.0, 3167.0, 10348.0, 44089.0, 404413.0, 516082.0, 50490.0, 11080.0, 3541.0, 1245.0, 556.0, 305.0, 184.0, 122.0, 79.0, 55.0, 42.0, 24.0, 23.0, 14.0, 16.0, 8.0, 9.0, 9.0, 7.0, 10.0, 2.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.869140625, -3.744476318359375, -3.61981201171875, -3.495147705078125, -3.3704833984375, -3.245819091796875, -3.12115478515625, -2.996490478515625, -2.871826171875, -2.747161865234375, -2.62249755859375, -2.497833251953125, -2.3731689453125, -2.248504638671875, -2.12384033203125, -1.999176025390625, -1.87451171875, -1.749847412109375, -1.62518310546875, -1.500518798828125, -1.3758544921875, -1.251190185546875, -1.12652587890625, -1.001861572265625, -0.877197265625, -0.752532958984375, -0.62786865234375, -0.503204345703125, -0.3785400390625, -0.253875732421875, -0.12921142578125, -0.004547119140625, 0.1201171875, 0.244781494140625, 0.36944580078125, 0.494110107421875, 0.6187744140625, 0.743438720703125, 0.86810302734375, 0.992767333984375, 1.117431640625, 1.242095947265625, 1.36676025390625, 1.491424560546875, 1.6160888671875, 1.740753173828125, 1.86541748046875, 1.990081787109375, 2.11474609375, 2.239410400390625, 2.36407470703125, 2.488739013671875, 2.6134033203125, 2.738067626953125, 2.86273193359375, 2.987396240234375, 3.112060546875, 3.236724853515625, 3.36138916015625, 3.486053466796875, 3.6107177734375, 3.735382080078125, 3.86004638671875, 3.984710693359375, 4.109375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 6.0, 12.0, 36.0, 62.0, 65.0, 96.0, 137.0, 151.0, 145.0, 108.0, 64.0, 56.0, 31.0, 12.0, 9.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5302734375, -1.48590087890625, -1.4415283203125, -1.39715576171875, -1.352783203125, -1.30841064453125, -1.2640380859375, -1.21966552734375, -1.17529296875, -1.13092041015625, -1.0865478515625, -1.04217529296875, -0.997802734375, -0.95343017578125, -0.9090576171875, -0.86468505859375, -0.8203125, -0.77593994140625, -0.7315673828125, -0.68719482421875, -0.642822265625, -0.59844970703125, -0.5540771484375, -0.50970458984375, -0.46533203125, -0.42095947265625, -0.3765869140625, -0.33221435546875, -0.287841796875, -0.24346923828125, -0.1990966796875, -0.15472412109375, -0.1103515625, -0.06597900390625, -0.0216064453125, 0.02276611328125, 0.067138671875, 0.11151123046875, 0.1558837890625, 0.20025634765625, 0.24462890625, 0.28900146484375, 0.3333740234375, 0.37774658203125, 0.422119140625, 0.46649169921875, 0.5108642578125, 0.55523681640625, 0.599609375, 0.64398193359375, 0.6883544921875, 0.73272705078125, 0.777099609375, 0.82147216796875, 0.8658447265625, 0.91021728515625, 0.95458984375, 0.99896240234375, 1.0433349609375, 1.08770751953125, 1.132080078125, 1.17645263671875, 1.2208251953125, 1.26519775390625, 1.3095703125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 3.0, 5.0, 4.0, 7.0, 11.0, 8.0, 13.0, 14.0, 27.0, 29.0, 35.0, 63.0, 174.0, 566.0, 2318.0, 13641.0, 117573.0, 819273.0, 81677.0, 10391.0, 1872.0, 463.0, 161.0, 73.0, 31.0, 32.0, 16.0, 15.0, 11.0, 13.0, 7.0, 8.0, 6.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.115234375, -3.009368896484375, -2.90350341796875, -2.797637939453125, -2.6917724609375, -2.585906982421875, -2.48004150390625, -2.374176025390625, -2.268310546875, -2.162445068359375, -2.05657958984375, -1.950714111328125, -1.8448486328125, -1.738983154296875, -1.63311767578125, -1.527252197265625, -1.42138671875, -1.315521240234375, -1.20965576171875, -1.103790283203125, -0.9979248046875, -0.892059326171875, -0.78619384765625, -0.680328369140625, -0.574462890625, -0.468597412109375, -0.36273193359375, -0.256866455078125, -0.1510009765625, -0.045135498046875, 0.06072998046875, 0.166595458984375, 0.2724609375, 0.378326416015625, 0.48419189453125, 0.590057373046875, 0.6959228515625, 0.801788330078125, 0.90765380859375, 1.013519287109375, 1.119384765625, 1.225250244140625, 1.33111572265625, 1.436981201171875, 1.5428466796875, 1.648712158203125, 1.75457763671875, 1.860443115234375, 1.96630859375, 2.072174072265625, 2.17803955078125, 2.283905029296875, 2.3897705078125, 2.495635986328125, 2.60150146484375, 2.707366943359375, 2.813232421875, 2.919097900390625, 3.02496337890625, 3.130828857421875, 3.2366943359375, 3.342559814453125, 3.44842529296875, 3.554290771484375, 3.66015625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 2.0, 6.0, 12.0, 14.0, 11.0, 9.0, 12.0, 16.0, 19.0, 23.0, 18.0, 21.0, 30.0, 29.0, 33.0, 42.0, 28.0, 35.0, 32.0, 52.0, 50.0, 55.0, 35.0, 37.0, 37.0, 41.0, 36.0, 37.0, 27.0, 27.0, 17.0, 20.0, 20.0, 24.0, 15.0, 19.0, 15.0, 9.0, 8.0, 5.0, 4.0, 7.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.488525390625, -0.4742431640625, -0.4599609375, -0.4456787109375, -0.431396484375, -0.4171142578125, -0.40283203125, -0.3885498046875, -0.374267578125, -0.3599853515625, -0.345703125, -0.3314208984375, -0.317138671875, -0.3028564453125, -0.28857421875, -0.2742919921875, -0.260009765625, -0.2457275390625, -0.2314453125, -0.2171630859375, -0.202880859375, -0.1885986328125, -0.17431640625, -0.1600341796875, -0.145751953125, -0.1314697265625, -0.1171875, -0.1029052734375, -0.088623046875, -0.0743408203125, -0.06005859375, -0.0457763671875, -0.031494140625, -0.0172119140625, -0.0029296875, 0.0113525390625, 0.025634765625, 0.0399169921875, 0.05419921875, 0.0684814453125, 0.082763671875, 0.0970458984375, 0.111328125, 0.1256103515625, 0.139892578125, 0.1541748046875, 0.16845703125, 0.1827392578125, 0.197021484375, 0.2113037109375, 0.2255859375, 0.2398681640625, 0.254150390625, 0.2684326171875, 0.28271484375, 0.2969970703125, 0.311279296875, 0.3255615234375, 0.33984375, 0.3541259765625, 0.368408203125, 0.3826904296875, 0.39697265625, 0.4112548828125, 0.425537109375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 10.0, 6.0, 5.0, 2.0, 7.0, 10.0, 10.0, 14.0, 32.0, 65.0, 122.0, 428.0, 2154.0, 17217.0, 930619.0, 91368.0, 5126.0, 879.0, 246.0, 79.0, 39.0, 24.0, 20.0, 14.0, 5.0, 6.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1690673828125, -0.16390419006347656, -0.15874099731445312, -0.1535778045654297, -0.14841461181640625, -0.1432514190673828, -0.13808822631835938, -0.13292503356933594, -0.1277618408203125, -0.12259864807128906, -0.11743545532226562, -0.11227226257324219, -0.10710906982421875, -0.10194587707519531, -0.09678268432617188, -0.09161949157714844, -0.086456298828125, -0.08129310607910156, -0.07612991333007812, -0.07096672058105469, -0.06580352783203125, -0.06064033508300781, -0.055477142333984375, -0.05031394958496094, -0.0451507568359375, -0.03998756408691406, -0.034824371337890625, -0.029661178588867188, -0.02449798583984375, -0.019334793090820312, -0.014171600341796875, -0.009008407592773438, -0.00384521484375, 0.0013179779052734375, 0.006481170654296875, 0.011644363403320312, 0.01680755615234375, 0.021970748901367188, 0.027133941650390625, 0.03229713439941406, 0.0374603271484375, 0.04262351989746094, 0.047786712646484375, 0.05294990539550781, 0.05811309814453125, 0.06327629089355469, 0.06843948364257812, 0.07360267639160156, 0.078765869140625, 0.08392906188964844, 0.08909225463867188, 0.09425544738769531, 0.09941864013671875, 0.10458183288574219, 0.10974502563476562, 0.11490821838378906, 0.1200714111328125, 0.12523460388183594, 0.13039779663085938, 0.1355609893798828, 0.14072418212890625, 0.1458873748779297, 0.15105056762695312, 0.15621376037597656, 0.161376953125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 8.0, 6.0, 11.0, 15.0, 10.0, 22.0, 39.0, 60.0, 98.0, 251.0, 208.0, 115.0, 49.0, 27.0, 20.0, 17.0, 13.0, 9.0, 6.0, 9.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.2709369659423828e-05, -2.1721236407756805e-05, -2.0733103156089783e-05, -1.974496990442276e-05, -1.8756836652755737e-05, -1.7768703401088715e-05, -1.6780570149421692e-05, -1.579243689775467e-05, -1.4804303646087646e-05, -1.3816170394420624e-05, -1.2828037142753601e-05, -1.1839903891086578e-05, -1.0851770639419556e-05, -9.863637387752533e-06, -8.87550413608551e-06, -7.887370884418488e-06, -6.899237632751465e-06, -5.911104381084442e-06, -4.9229711294174194e-06, -3.934837877750397e-06, -2.946704626083374e-06, -1.9585713744163513e-06, -9.704381227493286e-07, 1.7695128917694092e-08, 1.0058283805847168e-06, 1.9939616322517395e-06, 2.982094883918762e-06, 3.970228135585785e-06, 4.958361387252808e-06, 5.94649463891983e-06, 6.934627890586853e-06, 7.922761142253876e-06, 8.910894393920898e-06, 9.899027645587921e-06, 1.0887160897254944e-05, 1.1875294148921967e-05, 1.286342740058899e-05, 1.3851560652256012e-05, 1.4839693903923035e-05, 1.5827827155590057e-05, 1.681596040725708e-05, 1.7804093658924103e-05, 1.8792226910591125e-05, 1.9780360162258148e-05, 2.076849341392517e-05, 2.1756626665592194e-05, 2.2744759917259216e-05, 2.373289316892624e-05, 2.4721026420593262e-05, 2.5709159672260284e-05, 2.6697292923927307e-05, 2.768542617559433e-05, 2.8673559427261353e-05, 2.9661692678928375e-05, 3.06498259305954e-05, 3.163795918226242e-05, 3.262609243392944e-05, 3.3614225685596466e-05, 3.460235893726349e-05, 3.559049218893051e-05, 3.6578625440597534e-05, 3.756675869226456e-05, 3.855489194393158e-05, 3.95430251955986e-05, 4.0531158447265625e-05]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 6.0, 9.0, 12.0, 10.0, 17.0, 37.0, 79.0, 218.0, 985.0, 10357.0, 718051.0, 310664.0, 7026.0, 744.0, 156.0, 75.0, 30.0, 23.0, 14.0, 11.0, 9.0, 7.0, 4.0, 2.0, 1.0, 0.0, 5.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0697021484375, -0.06729316711425781, -0.06488418579101562, -0.06247520446777344, -0.06006622314453125, -0.05765724182128906, -0.055248260498046875, -0.05283927917480469, -0.0504302978515625, -0.04802131652832031, -0.045612335205078125, -0.04320335388183594, -0.04079437255859375, -0.03838539123535156, -0.035976409912109375, -0.03356742858886719, -0.031158447265625, -0.028749465942382812, -0.026340484619140625, -0.023931503295898438, -0.02152252197265625, -0.019113540649414062, -0.016704559326171875, -0.014295578002929688, -0.0118865966796875, -0.009477615356445312, -0.007068634033203125, -0.0046596527099609375, -0.00225067138671875, 0.0001583099365234375, 0.002567291259765625, 0.0049762725830078125, 0.00738525390625, 0.009794235229492188, 0.012203216552734375, 0.014612197875976562, 0.01702117919921875, 0.019430160522460938, 0.021839141845703125, 0.024248123168945312, 0.0266571044921875, 0.029066085815429688, 0.031475067138671875, 0.03388404846191406, 0.03629302978515625, 0.03870201110839844, 0.041110992431640625, 0.04351997375488281, 0.045928955078125, 0.04833793640136719, 0.050746917724609375, 0.05315589904785156, 0.05556488037109375, 0.05797386169433594, 0.060382843017578125, 0.06279182434082031, 0.0652008056640625, 0.06760978698730469, 0.07001876831054688, 0.07242774963378906, 0.07483673095703125, 0.07724571228027344, 0.07965469360351562, 0.08206367492675781, 0.08447265625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 6.0, 9.0, 15.0, 13.0, 24.0, 25.0, 26.0, 57.0, 60.0, 69.0, 82.0, 102.0, 80.0, 101.0, 66.0, 66.0, 38.0, 34.0, 21.0, 23.0, 12.0, 13.0, 11.0, 8.0, 5.0, 8.0, 6.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006893157958984375, -0.006605088710784912, -0.006317019462585449, -0.006028950214385986, -0.0057408809661865234, -0.0054528117179870605, -0.005164742469787598, -0.004876673221588135, -0.004588603973388672, -0.004300534725189209, -0.004012465476989746, -0.003724396228790283, -0.0034363269805908203, -0.0031482577323913574, -0.0028601884841918945, -0.0025721192359924316, -0.0022840499877929688, -0.001995980739593506, -0.001707911491394043, -0.00141984224319458, -0.0011317729949951172, -0.0008437037467956543, -0.0005556344985961914, -0.0002675652503967285, 2.0503997802734375e-05, 0.00030857324600219727, 0.0005966424942016602, 0.000884711742401123, 0.001172780990600586, 0.0014608502388000488, 0.0017489194869995117, 0.0020369887351989746, 0.0023250579833984375, 0.0026131272315979004, 0.0029011964797973633, 0.003189265727996826, 0.003477334976196289, 0.003765404224395752, 0.004053473472595215, 0.004341542720794678, 0.004629611968994141, 0.0049176812171936035, 0.005205750465393066, 0.005493819713592529, 0.005781888961791992, 0.006069958209991455, 0.006358027458190918, 0.006646096706390381, 0.006934165954589844, 0.007222235202789307, 0.0075103044509887695, 0.007798373699188232, 0.008086442947387695, 0.008374512195587158, 0.008662581443786621, 0.008950650691986084, 0.009238719940185547, 0.00952678918838501, 0.009814858436584473, 0.010102927684783936, 0.010390996932983398, 0.010679066181182861, 0.010967135429382324, 0.011255204677581787, 0.01154327392578125]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 30.0, 441.0, 497.0, 35.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.017688751220703, -3.826444625854492, -3.635200262069702, -3.443956136703491, -3.252711772918701, -3.0614676475524902, -2.8702235221862793, -2.6789793968200684, -2.4877350330352783, -2.2964909076690674, -2.1052465438842773, -1.9140024185180664, -1.722758173942566, -1.5315139293670654, -1.3402698040008545, -1.149025559425354, -0.9577813148498535, -0.766537070274353, -0.5752928853034973, -0.3840487003326416, -0.1928044557571411, -0.001560211181640625, 0.1896839141845703, 0.3809281587600708, 0.5721724033355713, 0.7634166479110718, 0.9546608328819275, 1.1459050178527832, 1.3371492624282837, 1.5283935070037842, 1.7196376323699951, 1.9108818769454956, 2.102126121520996, 2.293370246887207, 2.484614610671997, 2.675858736038208, 2.867103099822998, 3.058347225189209, 3.24959135055542, 3.440835475921631, 3.632079839706421, 3.823323965072632, 4.014568328857422, 4.205812454223633, 4.397056579589844, 4.588300704956055, 4.779544830322266, 4.970789432525635, 5.162033557891846, 5.353277683258057, 5.544521808624268, 5.735766410827637, 5.927010536193848, 6.118254661560059, 6.3094987869262695, 6.5007429122924805, 6.691987037658691, 6.883231163024902, 7.074475288391113, 7.265719413757324, 7.456964015960693, 7.648208141326904, 7.839452266693115, 8.030696868896484, 8.221940994262695]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 9.0, 12.0, 29.0, 45.0, 61.0, 73.0, 80.0, 91.0, 94.0, 87.0, 78.0, 82.0, 63.0, 54.0, 42.0, 40.0, 24.0, 19.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6532704830169678, -1.6077730655670166, -1.5622756481170654, -1.5167783498764038, -1.4712809324264526, -1.4257835149765015, -1.3802860975265503, -1.3347887992858887, -1.2892913818359375, -1.2437939643859863, -1.1982965469360352, -1.1527992486953735, -1.1073018312454224, -1.0618044137954712, -1.01630699634552, -0.9708096385002136, -0.9253122210502625, -0.8798148036003113, -0.8343174457550049, -0.7888200283050537, -0.7433226704597473, -0.6978252530097961, -0.6523278951644897, -0.6068304777145386, -0.5613330602645874, -0.5158356428146362, -0.47033828496932983, -0.42484086751937866, -0.37934350967407227, -0.3338460922241211, -0.2883487045764923, -0.24285131692886353, -0.19735395908355713, -0.15185657143592834, -0.10635917633771896, -0.06086178123950958, -0.015364393591880798, 0.030132994055747986, 0.07563039660453796, 0.12112778425216675, 0.16662517189979553, 0.21212255954742432, 0.2576199471950531, 0.3031173348426819, 0.34861475229263306, 0.39411211013793945, 0.4396095275878906, 0.4851069152355194, 0.5306043028831482, 0.5761017203330994, 0.6215990781784058, 0.6670964956283569, 0.7125938534736633, 0.7580912709236145, 0.8035886287689209, 0.8490860462188721, 0.8945834636688232, 0.9400808811187744, 0.9855782389640808, 1.0310755968093872, 1.0765730142593384, 1.1220704317092896, 1.1675678491592407, 1.2130651473999023, 1.2585625648498535]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 17.0, 16.0, 10.0, 19.0, 32.0, 57.0, 66.0, 106.0, 166.0, 280.0, 614.0, 1271.0, 3689.0, 33201.0, 4144156.0, 6738.0, 1940.0, 838.0, 423.0, 232.0, 115.0, 70.0, 45.0, 50.0, 31.0, 21.0, 20.0, 14.0, 7.0, 7.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.01171875, -4.86932373046875, -4.7269287109375, -4.58453369140625, -4.442138671875, -4.29974365234375, -4.1573486328125, -4.01495361328125, -3.87255859375, -3.73016357421875, -3.5877685546875, -3.44537353515625, -3.302978515625, -3.16058349609375, -3.0181884765625, -2.87579345703125, -2.7333984375, -2.59100341796875, -2.4486083984375, -2.30621337890625, -2.163818359375, -2.02142333984375, -1.8790283203125, -1.73663330078125, -1.59423828125, -1.45184326171875, -1.3094482421875, -1.16705322265625, -1.024658203125, -0.88226318359375, -0.7398681640625, -0.59747314453125, -0.455078125, -0.31268310546875, -0.1702880859375, -0.02789306640625, 0.114501953125, 0.25689697265625, 0.3992919921875, 0.54168701171875, 0.68408203125, 0.82647705078125, 0.9688720703125, 1.11126708984375, 1.253662109375, 1.39605712890625, 1.5384521484375, 1.68084716796875, 1.8232421875, 1.96563720703125, 2.1080322265625, 2.25042724609375, 2.392822265625, 2.53521728515625, 2.6776123046875, 2.82000732421875, 2.96240234375, 3.10479736328125, 3.2471923828125, 3.38958740234375, 3.531982421875, 3.67437744140625, 3.8167724609375, 3.95916748046875, 4.1015625]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 5.0, 12.0, 12.0, 7.0, 16.0, 19.0, 38.0, 27.0, 42.0, 37.0, 47.0, 56.0, 42.0, 55.0, 57.0, 48.0, 52.0, 54.0, 45.0, 41.0, 36.0, 33.0, 35.0, 25.0, 40.0, 30.0, 14.0, 17.0, 17.0, 10.0, 5.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.325439453125, -0.31600189208984375, -0.3065643310546875, -0.29712677001953125, -0.287689208984375, -0.27825164794921875, -0.2688140869140625, -0.25937652587890625, -0.24993896484375, -0.24050140380859375, -0.2310638427734375, -0.22162628173828125, -0.212188720703125, -0.20275115966796875, -0.1933135986328125, -0.18387603759765625, -0.1744384765625, -0.16500091552734375, -0.1555633544921875, -0.14612579345703125, -0.136688232421875, -0.12725067138671875, -0.1178131103515625, -0.10837554931640625, -0.09893798828125, -0.08950042724609375, -0.0800628662109375, -0.07062530517578125, -0.061187744140625, -0.05175018310546875, -0.0423126220703125, -0.03287506103515625, -0.0234375, -0.01399993896484375, -0.0045623779296875, 0.00487518310546875, 0.014312744140625, 0.02375030517578125, 0.0331878662109375, 0.04262542724609375, 0.05206298828125, 0.06150054931640625, 0.0709381103515625, 0.08037567138671875, 0.089813232421875, 0.09925079345703125, 0.1086883544921875, 0.11812591552734375, 0.1275634765625, 0.13700103759765625, 0.1464385986328125, 0.15587615966796875, 0.165313720703125, 0.17475128173828125, 0.1841888427734375, 0.19362640380859375, 0.20306396484375, 0.21250152587890625, 0.2219390869140625, 0.23137664794921875, 0.240814208984375, 0.25025177001953125, 0.2596893310546875, 0.26912689208984375, 0.278564453125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 5.0, 11.0, 11.0, 18.0, 28.0, 34.0, 61.0, 124.0, 274.0, 889.0, 4844.0, 204958.0, 3975001.0, 6296.0, 1096.0, 331.0, 129.0, 64.0, 41.0, 19.0, 17.0, 8.0, 6.0, 6.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76953125, -4.6295166015625, -4.489501953125, -4.3494873046875, -4.20947265625, -4.0694580078125, -3.929443359375, -3.7894287109375, -3.6494140625, -3.5093994140625, -3.369384765625, -3.2293701171875, -3.08935546875, -2.9493408203125, -2.809326171875, -2.6693115234375, -2.529296875, -2.3892822265625, -2.249267578125, -2.1092529296875, -1.96923828125, -1.8292236328125, -1.689208984375, -1.5491943359375, -1.4091796875, -1.2691650390625, -1.129150390625, -0.9891357421875, -0.84912109375, -0.7091064453125, -0.569091796875, -0.4290771484375, -0.2890625, -0.1490478515625, -0.009033203125, 0.1309814453125, 0.27099609375, 0.4110107421875, 0.551025390625, 0.6910400390625, 0.8310546875, 0.9710693359375, 1.111083984375, 1.2510986328125, 1.39111328125, 1.5311279296875, 1.671142578125, 1.8111572265625, 1.951171875, 2.0911865234375, 2.231201171875, 2.3712158203125, 2.51123046875, 2.6512451171875, 2.791259765625, 2.9312744140625, 3.0712890625, 3.2113037109375, 3.351318359375, 3.4913330078125, 3.63134765625, 3.7713623046875, 3.911376953125, 4.0513916015625, 4.19140625]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 2.0, 7.0, 10.0, 15.0, 56.0, 738.0, 3054.0, 105.0, 25.0, 16.0, 9.0, 12.0, 10.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.258544921875, -0.24428176879882812, -0.23001861572265625, -0.21575546264648438, -0.2014923095703125, -0.18722915649414062, -0.17296600341796875, -0.15870285034179688, -0.144439697265625, -0.13017654418945312, -0.11591339111328125, -0.10165023803710938, -0.0873870849609375, -0.07312393188476562, -0.05886077880859375, -0.044597625732421875, -0.03033447265625, -0.016071319580078125, -0.00180816650390625, 0.012454986572265625, 0.0267181396484375, 0.040981292724609375, 0.05524444580078125, 0.06950759887695312, 0.083770751953125, 0.09803390502929688, 0.11229705810546875, 0.12656021118164062, 0.1408233642578125, 0.15508651733398438, 0.16934967041015625, 0.18361282348632812, 0.1978759765625, 0.21213912963867188, 0.22640228271484375, 0.24066543579101562, 0.2549285888671875, 0.2691917419433594, 0.28345489501953125, 0.2977180480957031, 0.311981201171875, 0.3262443542480469, 0.34050750732421875, 0.3547706604003906, 0.3690338134765625, 0.3832969665527344, 0.39756011962890625, 0.4118232727050781, 0.42608642578125, 0.4403495788574219, 0.45461273193359375, 0.4688758850097656, 0.4831390380859375, 0.4974021911621094, 0.5116653442382812, 0.5259284973144531, 0.540191650390625, 0.5544548034667969, 0.5687179565429688, 0.5829811096191406, 0.5972442626953125, 0.6115074157714844, 0.6257705688476562, 0.6400337219238281, 0.654296875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 11.0, 10.0, 10.0, 16.0, 25.0, 30.0, 54.0, 104.0, 247.0, 229.0, 97.0, 49.0, 32.0, 24.0, 10.0, 11.0, 6.0, 6.0, 7.0, 2.0, 2.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.871871829032898, -0.8461560010910034, -0.8204401135444641, -0.7947242856025696, -0.7690083980560303, -0.7432925701141357, -0.7175767421722412, -0.6918609142303467, -0.6661450266838074, -0.6404291987419128, -0.6147133111953735, -0.588997483253479, -0.5632816553115845, -0.5375657677650452, -0.5118499398231506, -0.4861340820789337, -0.4604182243347168, -0.4347023665904999, -0.40898650884628296, -0.3832706809043884, -0.3575548231601715, -0.3318389654159546, -0.30612313747406006, -0.28040727972984314, -0.2546914219856262, -0.2289755642414093, -0.20325972139835358, -0.17754387855529785, -0.15182802081108093, -0.126112163066864, -0.10039632022380829, -0.07468047738075256, -0.04896456003189087, -0.023248709738254547, 0.002467140555381775, 0.028182990849018097, 0.05389884114265442, 0.07961469888687134, 0.10533054172992706, 0.1310463845729828, 0.1567622423171997, 0.18247810006141663, 0.20819394290447235, 0.23390978574752808, 0.259625643491745, 0.2853415012359619, 0.31105732917785645, 0.33677318692207336, 0.3624890446662903, 0.3882049024105072, 0.4139207601547241, 0.43963658809661865, 0.46535244584083557, 0.4910683035850525, 0.516784131526947, 0.5425000190734863, 0.5682158470153809, 0.5939316749572754, 0.6196475625038147, 0.6453633904457092, 0.6710792779922485, 0.6967951059341431, 0.7225109338760376, 0.7482267618179321, 0.7739426493644714]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 5.0, 15.0, 15.0, 19.0, 26.0, 25.0, 35.0, 37.0, 60.0, 70.0, 67.0, 62.0, 57.0, 61.0, 59.0, 46.0, 57.0, 59.0, 38.0, 32.0, 35.0, 25.0, 25.0, 15.0, 13.0, 13.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.5420538783073425, -0.5289170145988464, -0.5157801508903503, -0.5026432871818542, -0.48950639367103577, -0.4763695299625397, -0.4632326364517212, -0.4500957727432251, -0.436958909034729, -0.4238220453262329, -0.4106851816177368, -0.39754828810691833, -0.38441142439842224, -0.37127456068992615, -0.35813766717910767, -0.3450008034706116, -0.3318639397621155, -0.3187270760536194, -0.3055902123451233, -0.2924533188343048, -0.2793164551258087, -0.2661795914173126, -0.25304269790649414, -0.23990583419799805, -0.22676897048950195, -0.21363210678100586, -0.20049522817134857, -0.18735834956169128, -0.1742214858531952, -0.1610846221446991, -0.1479477435350418, -0.13481086492538452, -0.12167400121688843, -0.10853713005781174, -0.09540025889873505, -0.08226338773965836, -0.06912651658058167, -0.055989645421504974, -0.042852774262428284, -0.029715903103351593, -0.016579031944274902, -0.0034421607851982117, 0.009694710373878479, 0.02283158153295517, 0.03596845269203186, 0.04910532385110855, 0.06224219501018524, 0.07537906616926193, 0.08851593732833862, 0.10165280848741531, 0.114789679646492, 0.1279265582561493, 0.14106342196464539, 0.15420028567314148, 0.16733716428279877, 0.18047404289245605, 0.19361090660095215, 0.20674777030944824, 0.21988464891910553, 0.23302152752876282, 0.2461583912372589, 0.259295254945755, 0.2724321484565735, 0.2855690121650696, 0.2987058758735657]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 12.0, 12.0, 16.0, 19.0, 35.0, 50.0, 78.0, 131.0, 219.0, 335.0, 617.0, 1148.0, 2276.0, 4737.0, 10959.0, 28950.0, 93128.0, 501136.0, 300892.0, 65199.0, 21941.0, 8699.0, 3830.0, 1833.0, 966.0, 528.0, 312.0, 184.0, 105.0, 53.0, 48.0, 37.0, 17.0, 15.0, 8.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3740234375, -1.329498291015625, -1.28497314453125, -1.240447998046875, -1.1959228515625, -1.151397705078125, -1.10687255859375, -1.062347412109375, -1.017822265625, -0.973297119140625, -0.92877197265625, -0.884246826171875, -0.8397216796875, -0.795196533203125, -0.75067138671875, -0.706146240234375, -0.66162109375, -0.617095947265625, -0.57257080078125, -0.528045654296875, -0.4835205078125, -0.438995361328125, -0.39447021484375, -0.349945068359375, -0.305419921875, -0.260894775390625, -0.21636962890625, -0.171844482421875, -0.1273193359375, -0.082794189453125, -0.03826904296875, 0.006256103515625, 0.05078125, 0.095306396484375, 0.13983154296875, 0.184356689453125, 0.2288818359375, 0.273406982421875, 0.31793212890625, 0.362457275390625, 0.406982421875, 0.451507568359375, 0.49603271484375, 0.540557861328125, 0.5850830078125, 0.629608154296875, 0.67413330078125, 0.718658447265625, 0.76318359375, 0.807708740234375, 0.85223388671875, 0.896759033203125, 0.9412841796875, 0.985809326171875, 1.03033447265625, 1.074859619140625, 1.119384765625, 1.163909912109375, 1.20843505859375, 1.252960205078125, 1.2974853515625, 1.342010498046875, 1.38653564453125, 1.431060791015625, 1.4755859375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 10.0, 11.0, 9.0, 19.0, 26.0, 29.0, 32.0, 44.0, 55.0, 70.0, 75.0, 73.0, 68.0, 63.0, 69.0, 61.0, 62.0, 43.0, 31.0, 36.0, 30.0, 22.0, 15.0, 12.0, 9.0, 5.0, 10.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.19091796875, -0.1861114501953125, -0.181304931640625, -0.1764984130859375, -0.17169189453125, -0.1668853759765625, -0.162078857421875, -0.1572723388671875, -0.1524658203125, -0.1476593017578125, -0.142852783203125, -0.1380462646484375, -0.13323974609375, -0.1284332275390625, -0.123626708984375, -0.1188201904296875, -0.114013671875, -0.1092071533203125, -0.104400634765625, -0.0995941162109375, -0.09478759765625, -0.0899810791015625, -0.085174560546875, -0.0803680419921875, -0.0755615234375, -0.0707550048828125, -0.065948486328125, -0.0611419677734375, -0.05633544921875, -0.0515289306640625, -0.046722412109375, -0.0419158935546875, -0.037109375, -0.0323028564453125, -0.027496337890625, -0.0226898193359375, -0.01788330078125, -0.0130767822265625, -0.008270263671875, -0.0034637451171875, 0.0013427734375, 0.0061492919921875, 0.010955810546875, 0.0157623291015625, 0.02056884765625, 0.0253753662109375, 0.030181884765625, 0.0349884033203125, 0.039794921875, 0.0446014404296875, 0.049407958984375, 0.0542144775390625, 0.05902099609375, 0.0638275146484375, 0.068634033203125, 0.0734405517578125, 0.0782470703125, 0.0830535888671875, 0.087860107421875, 0.0926666259765625, 0.09747314453125, 0.1022796630859375, 0.107086181640625, 0.1118927001953125, 0.11669921875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 4.0, 11.0, 20.0, 32.0, 32.0, 41.0, 49.0, 71.0, 105.0, 138.0, 187.0, 238.0, 378.0, 507.0, 743.0, 999.0, 1522.0, 2157.0, 3374.0, 4957.0, 7805.0, 12629.0, 21188.0, 40832.0, 112347.0, 676046.0, 78694.0, 33576.0, 18052.0, 10928.0, 6984.0, 4386.0, 2933.0, 1979.0, 1321.0, 929.0, 674.0, 505.0, 324.0, 239.0, 188.0, 127.0, 73.0, 52.0, 37.0, 50.0, 30.0, 25.0, 16.0, 11.0, 5.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.5478515625, -0.5309219360351562, -0.5139923095703125, -0.49706268310546875, -0.480133056640625, -0.46320343017578125, -0.4462738037109375, -0.42934417724609375, -0.41241455078125, -0.39548492431640625, -0.3785552978515625, -0.36162567138671875, -0.344696044921875, -0.32776641845703125, -0.3108367919921875, -0.29390716552734375, -0.2769775390625, -0.26004791259765625, -0.2431182861328125, -0.22618865966796875, -0.209259033203125, -0.19232940673828125, -0.1753997802734375, -0.15847015380859375, -0.14154052734375, -0.12461090087890625, -0.1076812744140625, -0.09075164794921875, -0.073822021484375, -0.05689239501953125, -0.0399627685546875, -0.02303314208984375, -0.006103515625, 0.01082611083984375, 0.0277557373046875, 0.04468536376953125, 0.061614990234375, 0.07854461669921875, 0.0954742431640625, 0.11240386962890625, 0.12933349609375, 0.14626312255859375, 0.1631927490234375, 0.18012237548828125, 0.197052001953125, 0.21398162841796875, 0.2309112548828125, 0.24784088134765625, 0.2647705078125, 0.28170013427734375, 0.2986297607421875, 0.31555938720703125, 0.332489013671875, 0.34941864013671875, 0.3663482666015625, 0.38327789306640625, 0.40020751953125, 0.41713714599609375, 0.4340667724609375, 0.45099639892578125, 0.467926025390625, 0.48485565185546875, 0.5017852783203125, 0.5187149047851562, 0.53564453125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 5.0, 2.0, 3.0, 11.0, 2.0, 13.0, 19.0, 11.0, 33.0, 23.0, 25.0, 25.0, 28.0, 38.0, 28.0, 31.0, 32.0, 36.0, 41.0, 50.0, 35.0, 37.0, 31.0, 35.0, 40.0, 41.0, 33.0, 29.0, 23.0, 29.0, 24.0, 26.0, 20.0, 25.0, 22.0, 15.0, 15.0, 15.0, 11.0, 9.0, 13.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054412841796875, -0.05255746841430664, -0.05070209503173828, -0.04884672164916992, -0.04699134826660156, -0.0451359748840332, -0.043280601501464844, -0.041425228118896484, -0.039569854736328125, -0.037714481353759766, -0.035859107971191406, -0.03400373458862305, -0.03214836120605469, -0.030292987823486328, -0.02843761444091797, -0.02658224105834961, -0.02472686767578125, -0.02287149429321289, -0.02101612091064453, -0.019160747528076172, -0.017305374145507812, -0.015450000762939453, -0.013594627380371094, -0.011739253997802734, -0.009883880615234375, -0.008028507232666016, -0.006173133850097656, -0.004317760467529297, -0.0024623870849609375, -0.0006070137023925781, 0.0012483596801757812, 0.0031037330627441406, 0.0049591064453125, 0.006814479827880859, 0.008669853210449219, 0.010525226593017578, 0.012380599975585938, 0.014235973358154297, 0.016091346740722656, 0.017946720123291016, 0.019802093505859375, 0.021657466888427734, 0.023512840270996094, 0.025368213653564453, 0.027223587036132812, 0.029078960418701172, 0.03093433380126953, 0.03278970718383789, 0.03464508056640625, 0.03650045394897461, 0.03835582733154297, 0.04021120071411133, 0.04206657409667969, 0.04392194747924805, 0.045777320861816406, 0.047632694244384766, 0.049488067626953125, 0.051343441009521484, 0.053198814392089844, 0.0550541877746582, 0.05690956115722656, 0.05876493453979492, 0.06062030792236328, 0.06247568130493164, 0.0643310546875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 7.0, 5.0, 7.0, 12.0, 19.0, 21.0, 36.0, 40.0, 52.0, 87.0, 103.0, 132.0, 218.0, 353.0, 624.0, 1105.0, 2271.0, 5022.0, 14379.0, 104002.0, 881643.0, 24500.0, 7312.0, 3079.0, 1458.0, 811.0, 431.0, 235.0, 164.0, 126.0, 85.0, 51.0, 45.0, 29.0, 27.0, 16.0, 10.0, 12.0, 8.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1495361328125, -0.14458274841308594, -0.13962936401367188, -0.1346759796142578, -0.12972259521484375, -0.12476921081542969, -0.11981582641601562, -0.11486244201660156, -0.1099090576171875, -0.10495567321777344, -0.10000228881835938, -0.09504890441894531, -0.09009552001953125, -0.08514213562011719, -0.08018875122070312, -0.07523536682128906, -0.070281982421875, -0.06532859802246094, -0.060375213623046875, -0.05542182922363281, -0.05046844482421875, -0.04551506042480469, -0.040561676025390625, -0.03560829162597656, -0.0306549072265625, -0.025701522827148438, -0.020748138427734375, -0.015794754028320312, -0.01084136962890625, -0.0058879852294921875, -0.000934600830078125, 0.0040187835693359375, 0.00897216796875, 0.013925552368164062, 0.018878936767578125, 0.023832321166992188, 0.02878570556640625, 0.03373908996582031, 0.038692474365234375, 0.04364585876464844, 0.0485992431640625, 0.05355262756347656, 0.058506011962890625, 0.06345939636230469, 0.06841278076171875, 0.07336616516113281, 0.07831954956054688, 0.08327293395996094, 0.088226318359375, 0.09317970275878906, 0.09813308715820312, 0.10308647155761719, 0.10803985595703125, 0.11299324035644531, 0.11794662475585938, 0.12290000915527344, 0.1278533935546875, 0.13280677795410156, 0.13776016235351562, 0.1427135467529297, 0.14766693115234375, 0.1526203155517578, 0.15757369995117188, 0.16252708435058594, 0.16748046875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 3.0, 4.0, 4.0, 8.0, 13.0, 6.0, 5.0, 16.0, 10.0, 16.0, 27.0, 17.0, 42.0, 36.0, 83.0, 109.0, 182.0, 143.0, 61.0, 54.0, 31.0, 19.0, 20.0, 18.0, 21.0, 4.0, 4.0, 9.0, 5.0, 8.0, 8.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0], "bins": [-9.47713851928711e-06, -9.203329682350159e-06, -8.929520845413208e-06, -8.655712008476257e-06, -8.381903171539307e-06, -8.108094334602356e-06, -7.834285497665405e-06, -7.560476660728455e-06, -7.286667823791504e-06, -7.012858986854553e-06, -6.7390501499176025e-06, -6.465241312980652e-06, -6.191432476043701e-06, -5.9176236391067505e-06, -5.6438148021698e-06, -5.370005965232849e-06, -5.0961971282958984e-06, -4.822388291358948e-06, -4.548579454421997e-06, -4.274770617485046e-06, -4.000961780548096e-06, -3.727152943611145e-06, -3.4533441066741943e-06, -3.1795352697372437e-06, -2.905726432800293e-06, -2.6319175958633423e-06, -2.3581087589263916e-06, -2.084299921989441e-06, -1.8104910850524902e-06, -1.5366822481155396e-06, -1.2628734111785889e-06, -9.890645742416382e-07, -7.152557373046875e-07, -4.414469003677368e-07, -1.6763806343078613e-07, 1.0617077350616455e-07, 3.7997961044311523e-07, 6.537884473800659e-07, 9.275972843170166e-07, 1.2014061212539673e-06, 1.475214958190918e-06, 1.7490237951278687e-06, 2.0228326320648193e-06, 2.29664146900177e-06, 2.5704503059387207e-06, 2.8442591428756714e-06, 3.118067979812622e-06, 3.3918768167495728e-06, 3.6656856536865234e-06, 3.939494490623474e-06, 4.213303327560425e-06, 4.4871121644973755e-06, 4.760921001434326e-06, 5.034729838371277e-06, 5.3085386753082275e-06, 5.582347512245178e-06, 5.856156349182129e-06, 6.12996518611908e-06, 6.40377402305603e-06, 6.677582859992981e-06, 6.951391696929932e-06, 7.225200533866882e-06, 7.499009370803833e-06, 7.772818207740784e-06, 8.046627044677734e-06]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 6.0, 10.0, 5.0, 10.0, 11.0, 18.0, 19.0, 31.0, 60.0, 134.0, 364.0, 1591.0, 12363.0, 1014650.0, 16594.0, 1877.0, 452.0, 161.0, 61.0, 34.0, 23.0, 14.0, 15.0, 11.0, 10.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2003173828125, -0.19451904296875, -0.188720703125, -0.18292236328125, -0.1771240234375, -0.17132568359375, -0.16552734375, -0.15972900390625, -0.1539306640625, -0.14813232421875, -0.142333984375, -0.13653564453125, -0.1307373046875, -0.12493896484375, -0.119140625, -0.11334228515625, -0.1075439453125, -0.10174560546875, -0.095947265625, -0.09014892578125, -0.0843505859375, -0.07855224609375, -0.07275390625, -0.06695556640625, -0.0611572265625, -0.05535888671875, -0.049560546875, -0.04376220703125, -0.0379638671875, -0.03216552734375, -0.0263671875, -0.02056884765625, -0.0147705078125, -0.00897216796875, -0.003173828125, 0.00262451171875, 0.0084228515625, 0.01422119140625, 0.02001953125, 0.02581787109375, 0.0316162109375, 0.03741455078125, 0.043212890625, 0.04901123046875, 0.0548095703125, 0.06060791015625, 0.06640625, 0.07220458984375, 0.0780029296875, 0.08380126953125, 0.089599609375, 0.09539794921875, 0.1011962890625, 0.10699462890625, 0.11279296875, 0.11859130859375, 0.1243896484375, 0.13018798828125, 0.135986328125, 0.14178466796875, 0.1475830078125, 0.15338134765625, 0.1591796875, 0.16497802734375, 0.1707763671875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 0.0, 3.0, 2.0, 1.0, 8.0, 9.0, 10.0, 12.0, 37.0, 47.0, 129.0, 457.0, 128.0, 70.0, 22.0, 21.0, 10.0, 8.0, 7.0, 3.0, 6.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0142822265625, -0.013869047164916992, -0.013455867767333984, -0.013042688369750977, -0.012629508972167969, -0.012216329574584961, -0.011803150177001953, -0.011389970779418945, -0.010976791381835938, -0.01056361198425293, -0.010150432586669922, -0.009737253189086914, -0.009324073791503906, -0.008910894393920898, -0.00849771499633789, -0.008084535598754883, -0.007671356201171875, -0.007258176803588867, -0.006844997406005859, -0.0064318180084228516, -0.006018638610839844, -0.005605459213256836, -0.005192279815673828, -0.00477910041809082, -0.0043659210205078125, -0.003952741622924805, -0.003539562225341797, -0.003126382827758789, -0.0027132034301757812, -0.0023000240325927734, -0.0018868446350097656, -0.0014736652374267578, -0.00106048583984375, -0.0006473064422607422, -0.00023412704467773438, 0.00017905235290527344, 0.0005922317504882812, 0.001005411148071289, 0.0014185905456542969, 0.0018317699432373047, 0.0022449493408203125, 0.0026581287384033203, 0.003071308135986328, 0.003484487533569336, 0.0038976669311523438, 0.0043108463287353516, 0.004724025726318359, 0.005137205123901367, 0.005550384521484375, 0.005963563919067383, 0.006376743316650391, 0.0067899227142333984, 0.007203102111816406, 0.007616281509399414, 0.008029460906982422, 0.00844264030456543, 0.008855819702148438, 0.009268999099731445, 0.009682178497314453, 0.010095357894897461, 0.010508537292480469, 0.010921716690063477, 0.011334896087646484, 0.011748075485229492, 0.0121612548828125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 13.0, 74.0, 618.0, 236.0, 54.0, 12.0, 6.0, 2.0, 3.0], "bins": [-1.804661512374878, -1.7734200954437256, -1.7421786785125732, -1.710937261581421, -1.679695963859558, -1.6484545469284058, -1.6172131299972534, -1.585971713066101, -1.5547302961349487, -1.5234888792037964, -1.492247462272644, -1.4610060453414917, -1.429764747619629, -1.3985233306884766, -1.3672819137573242, -1.3360404968261719, -1.3047990798950195, -1.2735576629638672, -1.2423162460327148, -1.2110748291015625, -1.1798335313796997, -1.1485921144485474, -1.117350697517395, -1.0861092805862427, -1.0548678636550903, -1.023626446723938, -0.9923850893974304, -0.9611436724662781, -0.9299022555351257, -0.8986608982086182, -0.8674194812774658, -0.8361780643463135, -0.8049367070198059, -0.7736952900886536, -0.742453932762146, -0.7112125158309937, -0.6799710988998413, -0.648729681968689, -0.6174883246421814, -0.586246907711029, -0.5550054907798767, -0.5237640738487244, -0.4925226867198944, -0.46128129959106445, -0.4300398826599121, -0.39879849553108215, -0.3675571084022522, -0.33631569147109985, -0.3050742745399475, -0.27383288741111755, -0.2425914704799652, -0.21135008335113525, -0.1801086664199829, -0.14886727929115295, -0.1176258772611618, -0.08638447523117065, -0.0551430881023407, -0.023901687934994698, 0.007339712232351303, 0.038581110537052155, 0.0698225125670433, 0.10106390714645386, 0.132305309176445, 0.16354671120643616, 0.1947881132364273]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 5.0, 6.0, 6.0, 15.0, 14.0, 19.0, 27.0, 26.0, 35.0, 43.0, 56.0, 67.0, 61.0, 66.0, 59.0, 58.0, 61.0, 47.0, 50.0, 53.0, 50.0, 30.0, 32.0, 29.0, 20.0, 18.0, 18.0, 9.0, 7.0, 4.0, 6.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.17152650654315948, -0.1673574447631836, -0.1631883829832077, -0.1590193212032318, -0.15485024452209473, -0.15068118274211884, -0.14651212096214294, -0.14234305918216705, -0.13817399740219116, -0.13400493562221527, -0.12983587384223938, -0.1256668120622635, -0.121497742831707, -0.11732868105173111, -0.11315961182117462, -0.10899055004119873, -0.10482148826122284, -0.10065242648124695, -0.09648336470127106, -0.09231429547071457, -0.08814523369073868, -0.08397617191076279, -0.0798071026802063, -0.07563804090023041, -0.07146897912025452, -0.06729991734027863, -0.06313085556030273, -0.058961786329746246, -0.054792724549770355, -0.050623662769794464, -0.046454597264528275, -0.042285531759262085, -0.038116469979286194, -0.0339474081993103, -0.029778342694044113, -0.025609279051423073, -0.021440215408802032, -0.017271151766180992, -0.013102088123559952, -0.008933024480938911, -0.004763960838317871, -0.0005948971956968307, 0.0035741664469242096, 0.00774323008954525, 0.01191229373216629, 0.01608135737478733, 0.02025042101740837, 0.02441948466002941, 0.02858854830265045, 0.03275761008262634, 0.03692667558789253, 0.04109574109315872, 0.04526480287313461, 0.049433864653110504, 0.053602930158376694, 0.05777199566364288, 0.061941057443618774, 0.06611011922359467, 0.07027918100357056, 0.07444825023412704, 0.07861731201410294, 0.08278637379407883, 0.08695544302463531, 0.0911245048046112, 0.0952935665845871]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 1.0, 6.0, 9.0, 11.0, 14.0, 19.0, 21.0, 27.0, 29.0, 49.0, 83.0, 142.0, 383.0, 1057.0, 3730.0, 18385.0, 138697.0, 782579.0, 86193.0, 12765.0, 2839.0, 856.0, 273.0, 132.0, 63.0, 40.0, 30.0, 22.0, 23.0, 22.0, 10.0, 8.0, 10.0, 7.0, 4.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48193359375, -0.46367645263671875, -0.4454193115234375, -0.42716217041015625, -0.408905029296875, -0.39064788818359375, -0.3723907470703125, -0.35413360595703125, -0.33587646484375, -0.31761932373046875, -0.2993621826171875, -0.28110504150390625, -0.262847900390625, -0.24459075927734375, -0.2263336181640625, -0.20807647705078125, -0.1898193359375, -0.17156219482421875, -0.1533050537109375, -0.13504791259765625, -0.116790771484375, -0.09853363037109375, -0.0802764892578125, -0.06201934814453125, -0.04376220703125, -0.02550506591796875, -0.0072479248046875, 0.01100921630859375, 0.029266357421875, 0.04752349853515625, 0.0657806396484375, 0.08403778076171875, 0.102294921875, 0.12055206298828125, 0.1388092041015625, 0.15706634521484375, 0.175323486328125, 0.19358062744140625, 0.2118377685546875, 0.23009490966796875, 0.24835205078125, 0.26660919189453125, 0.2848663330078125, 0.30312347412109375, 0.321380615234375, 0.33963775634765625, 0.3578948974609375, 0.37615203857421875, 0.3944091796875, 0.41266632080078125, 0.4309234619140625, 0.44918060302734375, 0.467437744140625, 0.48569488525390625, 0.5039520263671875, 0.5222091674804688, 0.54046630859375, 0.5587234497070312, 0.5769805908203125, 0.5952377319335938, 0.613494873046875, 0.6317520141601562, 0.6500091552734375, 0.6682662963867188, 0.6865234375]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 9.0, 11.0, 13.0, 22.0, 37.0, 64.0, 84.0, 108.0, 135.0, 112.0, 112.0, 92.0, 61.0, 68.0, 35.0, 20.0, 11.0, 7.0, 7.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0943603515625, -0.09232425689697266, -0.09028816223144531, -0.08825206756591797, -0.08621597290039062, -0.08417987823486328, -0.08214378356933594, -0.0801076889038086, -0.07807159423828125, -0.0760354995727539, -0.07399940490722656, -0.07196331024169922, -0.06992721557617188, -0.06789112091064453, -0.06585502624511719, -0.06381893157958984, -0.0617828369140625, -0.059746742248535156, -0.05771064758300781, -0.05567455291748047, -0.053638458251953125, -0.05160236358642578, -0.04956626892089844, -0.047530174255371094, -0.04549407958984375, -0.043457984924316406, -0.04142189025878906, -0.03938579559326172, -0.037349700927734375, -0.03531360626220703, -0.03327751159667969, -0.031241416931152344, -0.029205322265625, -0.027169227600097656, -0.025133132934570312, -0.02309703826904297, -0.021060943603515625, -0.01902484893798828, -0.016988754272460938, -0.014952659606933594, -0.01291656494140625, -0.010880470275878906, -0.008844375610351562, -0.006808280944824219, -0.004772186279296875, -0.0027360916137695312, -0.0006999969482421875, 0.0013360977172851562, 0.0033721923828125, 0.005408287048339844, 0.0074443817138671875, 0.009480476379394531, 0.011516571044921875, 0.013552665710449219, 0.015588760375976562, 0.017624855041503906, 0.01966094970703125, 0.021697044372558594, 0.023733139038085938, 0.02576923370361328, 0.027805328369140625, 0.02984142303466797, 0.03187751770019531, 0.033913612365722656, 0.03594970703125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 10.0, 15.0, 25.0, 18.0, 42.0, 60.0, 84.0, 151.0, 245.0, 393.0, 728.0, 1265.0, 2421.0, 4781.0, 9280.0, 19145.0, 40905.0, 98706.0, 310550.0, 360925.0, 111447.0, 45381.0, 20754.0, 10092.0, 5167.0, 2712.0, 1316.0, 787.0, 421.0, 254.0, 166.0, 101.0, 63.0, 48.0, 28.0, 20.0, 10.0, 15.0, 5.0, 5.0, 6.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.10443115234375, -0.1012725830078125, -0.098114013671875, -0.0949554443359375, -0.091796875, -0.0886383056640625, -0.085479736328125, -0.0823211669921875, -0.07916259765625, -0.0760040283203125, -0.072845458984375, -0.0696868896484375, -0.0665283203125, -0.0633697509765625, -0.060211181640625, -0.0570526123046875, -0.05389404296875, -0.0507354736328125, -0.047576904296875, -0.0444183349609375, -0.041259765625, -0.0381011962890625, -0.034942626953125, -0.0317840576171875, -0.02862548828125, -0.0254669189453125, -0.022308349609375, -0.0191497802734375, -0.0159912109375, -0.0128326416015625, -0.009674072265625, -0.0065155029296875, -0.00335693359375, -0.0001983642578125, 0.002960205078125, 0.0061187744140625, 0.00927734375, 0.0124359130859375, 0.015594482421875, 0.0187530517578125, 0.02191162109375, 0.0250701904296875, 0.028228759765625, 0.0313873291015625, 0.0345458984375, 0.0377044677734375, 0.040863037109375, 0.0440216064453125, 0.04718017578125, 0.0503387451171875, 0.053497314453125, 0.0566558837890625, 0.059814453125, 0.0629730224609375, 0.066131591796875, 0.0692901611328125, 0.07244873046875, 0.0756072998046875, 0.078765869140625, 0.0819244384765625, 0.0850830078125, 0.0882415771484375, 0.091400146484375, 0.0945587158203125, 0.09771728515625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 8.0, 7.0, 4.0, 16.0, 16.0, 14.0, 15.0, 20.0, 27.0, 20.0, 24.0, 27.0, 34.0, 38.0, 37.0, 37.0, 44.0, 36.0, 42.0, 43.0, 38.0, 34.0, 38.0, 47.0, 35.0, 37.0, 37.0, 38.0, 35.0, 18.0, 24.0, 24.0, 15.0, 11.0, 8.0, 11.0, 9.0, 6.0, 9.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0219573974609375, -0.021258831024169922, -0.020560264587402344, -0.019861698150634766, -0.019163131713867188, -0.01846456527709961, -0.01776599884033203, -0.017067432403564453, -0.016368865966796875, -0.015670299530029297, -0.014971733093261719, -0.01427316665649414, -0.013574600219726562, -0.012876033782958984, -0.012177467346191406, -0.011478900909423828, -0.01078033447265625, -0.010081768035888672, -0.009383201599121094, -0.008684635162353516, -0.007986068725585938, -0.007287502288818359, -0.006588935852050781, -0.005890369415283203, -0.005191802978515625, -0.004493236541748047, -0.0037946701049804688, -0.0030961036682128906, -0.0023975372314453125, -0.0016989707946777344, -0.0010004043579101562, -0.0003018379211425781, 0.000396728515625, 0.0010952949523925781, 0.0017938613891601562, 0.0024924278259277344, 0.0031909942626953125, 0.0038895606994628906, 0.004588127136230469, 0.005286693572998047, 0.005985260009765625, 0.006683826446533203, 0.007382392883300781, 0.00808095932006836, 0.008779525756835938, 0.009478092193603516, 0.010176658630371094, 0.010875225067138672, 0.01157379150390625, 0.012272357940673828, 0.012970924377441406, 0.013669490814208984, 0.014368057250976562, 0.01506662368774414, 0.01576519012451172, 0.016463756561279297, 0.017162322998046875, 0.017860889434814453, 0.01855945587158203, 0.01925802230834961, 0.019956588745117188, 0.020655155181884766, 0.021353721618652344, 0.022052288055419922, 0.0227508544921875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 2.0, 11.0, 9.0, 25.0, 34.0, 62.0, 104.0, 185.0, 355.0, 863.0, 2054.0, 6183.0, 30487.0, 752068.0, 229893.0, 18773.0, 4555.0, 1575.0, 629.0, 309.0, 155.0, 73.0, 48.0, 32.0, 23.0, 11.0, 17.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01084136962890625, -0.010478377342224121, -0.010115385055541992, -0.009752392768859863, -0.009389400482177734, -0.009026408195495605, -0.008663415908813477, -0.008300423622131348, -0.007937431335449219, -0.00757443904876709, -0.007211446762084961, -0.006848454475402832, -0.006485462188720703, -0.006122469902038574, -0.005759477615356445, -0.005396485328674316, -0.0050334930419921875, -0.004670500755310059, -0.00430750846862793, -0.003944516181945801, -0.003581523895263672, -0.003218531608581543, -0.002855539321899414, -0.002492547035217285, -0.0021295547485351562, -0.0017665624618530273, -0.0014035701751708984, -0.0010405778884887695, -0.0006775856018066406, -0.0003145933151245117, 4.839897155761719e-05, 0.0004113912582397461, 0.000774383544921875, 0.001137375831604004, 0.0015003681182861328, 0.0018633604049682617, 0.0022263526916503906, 0.0025893449783325195, 0.0029523372650146484, 0.0033153295516967773, 0.0036783218383789062, 0.004041314125061035, 0.004404306411743164, 0.004767298698425293, 0.005130290985107422, 0.005493283271789551, 0.00585627555847168, 0.006219267845153809, 0.0065822601318359375, 0.006945252418518066, 0.007308244705200195, 0.007671236991882324, 0.008034229278564453, 0.008397221565246582, 0.008760213851928711, 0.00912320613861084, 0.009486198425292969, 0.009849190711975098, 0.010212182998657227, 0.010575175285339355, 0.010938167572021484, 0.011301159858703613, 0.011664152145385742, 0.012027144432067871, 0.01239013671875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 8.0, 9.0, 9.0, 9.0, 16.0, 16.0, 30.0, 49.0, 74.0, 104.0, 131.0, 167.0, 126.0, 65.0, 59.0, 30.0, 19.0, 13.0, 17.0, 11.0, 5.0, 10.0, 5.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.2351741790771484e-05, -2.1678395569324493e-05, -2.1005049347877502e-05, -2.033170312643051e-05, -1.965835690498352e-05, -1.898501068353653e-05, -1.831166446208954e-05, -1.7638318240642548e-05, -1.6964972019195557e-05, -1.6291625797748566e-05, -1.5618279576301575e-05, -1.4944933354854584e-05, -1.4271587133407593e-05, -1.3598240911960602e-05, -1.292489469051361e-05, -1.225154846906662e-05, -1.1578202247619629e-05, -1.0904856026172638e-05, -1.0231509804725647e-05, -9.558163583278656e-06, -8.884817361831665e-06, -8.211471140384674e-06, -7.538124918937683e-06, -6.864778697490692e-06, -6.191432476043701e-06, -5.51808625459671e-06, -4.844740033149719e-06, -4.171393811702728e-06, -3.4980475902557373e-06, -2.8247013688087463e-06, -2.1513551473617554e-06, -1.4780089259147644e-06, -8.046627044677734e-07, -1.3131648302078247e-07, 5.420297384262085e-07, 1.2153759598731995e-06, 1.8887221813201904e-06, 2.5620684027671814e-06, 3.2354146242141724e-06, 3.908760845661163e-06, 4.582107067108154e-06, 5.255453288555145e-06, 5.928799510002136e-06, 6.602145731449127e-06, 7.275491952896118e-06, 7.948838174343109e-06, 8.6221843957901e-06, 9.295530617237091e-06, 9.968876838684082e-06, 1.0642223060131073e-05, 1.1315569281578064e-05, 1.1988915503025055e-05, 1.2662261724472046e-05, 1.3335607945919037e-05, 1.4008954167366028e-05, 1.4682300388813019e-05, 1.535564661026001e-05, 1.6028992831707e-05, 1.6702339053153992e-05, 1.7375685274600983e-05, 1.8049031496047974e-05, 1.8722377717494965e-05, 1.9395723938941956e-05, 2.0069070160388947e-05, 2.0742416381835938e-05]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 8.0, 12.0, 7.0, 28.0, 35.0, 50.0, 80.0, 131.0, 177.0, 329.0, 491.0, 903.0, 1693.0, 2954.0, 5707.0, 11740.0, 26503.0, 68395.0, 241509.0, 481911.0, 127408.0, 42691.0, 17939.0, 8384.0, 4199.0, 2213.0, 1228.0, 720.0, 430.0, 248.0, 163.0, 92.0, 48.0, 37.0, 29.0, 21.0, 15.0, 6.0, 9.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00241851806640625, -0.002349942922592163, -0.002281367778778076, -0.0022127926349639893, -0.0021442174911499023, -0.0020756423473358154, -0.0020070672035217285, -0.0019384920597076416, -0.0018699169158935547, -0.0018013417720794678, -0.0017327666282653809, -0.001664191484451294, -0.001595616340637207, -0.0015270411968231201, -0.0014584660530090332, -0.0013898909091949463, -0.0013213157653808594, -0.0012527406215667725, -0.0011841654777526855, -0.0011155903339385986, -0.0010470151901245117, -0.0009784400463104248, -0.0009098649024963379, -0.000841289758682251, -0.0007727146148681641, -0.0007041394710540771, -0.0006355643272399902, -0.0005669891834259033, -0.0004984140396118164, -0.0004298388957977295, -0.0003612637519836426, -0.00029268860816955566, -0.00022411346435546875, -0.00015553832054138184, -8.696317672729492e-05, -1.8388032913208008e-05, 5.0187110900878906e-05, 0.00011876225471496582, 0.00018733739852905273, 0.00025591254234313965, 0.00032448768615722656, 0.0003930628299713135, 0.0004616379737854004, 0.0005302131175994873, 0.0005987882614135742, 0.0006673634052276611, 0.000735938549041748, 0.000804513692855835, 0.0008730888366699219, 0.0009416639804840088, 0.0010102391242980957, 0.0010788142681121826, 0.0011473894119262695, 0.0012159645557403564, 0.0012845396995544434, 0.0013531148433685303, 0.0014216899871826172, 0.001490265130996704, 0.001558840274810791, 0.001627415418624878, 0.0016959905624389648, 0.0017645657062530518, 0.0018331408500671387, 0.0019017159938812256, 0.0019702911376953125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 8.0, 5.0, 8.0, 18.0, 15.0, 14.0, 19.0, 24.0, 33.0, 35.0, 54.0, 41.0, 60.0, 49.0, 66.0, 62.0, 64.0, 50.0, 62.0, 52.0, 40.0, 40.0, 35.0, 20.0, 26.0, 19.0, 13.0, 22.0, 7.0, 7.0, 9.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005540847778320312, -0.0005375519394874573, -0.0005210191011428833, -0.0005044862627983093, -0.00048795342445373535, -0.0004714205861091614, -0.0004548877477645874, -0.00043835490942001343, -0.00042182207107543945, -0.0004052892327308655, -0.0003887563943862915, -0.00037222355604171753, -0.00035569071769714355, -0.0003391578793525696, -0.0003226250410079956, -0.00030609220266342163, -0.00028955936431884766, -0.0002730265259742737, -0.0002564936876296997, -0.00023996084928512573, -0.00022342801094055176, -0.00020689517259597778, -0.0001903623342514038, -0.00017382949590682983, -0.00015729665756225586, -0.00014076381921768188, -0.0001242309808731079, -0.00010769814252853394, -9.116530418395996e-05, -7.463246583938599e-05, -5.809962749481201e-05, -4.156678915023804e-05, -2.5033950805664062e-05, -8.501112461090088e-06, 8.031725883483887e-06, 2.456456422805786e-05, 4.1097402572631836e-05, 5.763024091720581e-05, 7.416307926177979e-05, 9.069591760635376e-05, 0.00010722875595092773, 0.0001237615942955017, 0.00014029443264007568, 0.00015682727098464966, 0.00017336010932922363, 0.0001898929476737976, 0.00020642578601837158, 0.00022295862436294556, 0.00023949146270751953, 0.0002560243010520935, 0.0002725571393966675, 0.00028908997774124146, 0.00030562281608581543, 0.0003221556544303894, 0.0003386884927749634, 0.00035522133111953735, 0.00037175416946411133, 0.0003882870078086853, 0.0004048198461532593, 0.00042135268449783325, 0.0004378855228424072, 0.0004544183611869812, 0.0004709511995315552, 0.00048748403787612915, 0.0005040168762207031]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 21.0, 73.0, 395.0, 398.0, 74.0, 34.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4317481219768524, -0.4237499535083771, -0.41575175523757935, -0.407753586769104, -0.39975541830062866, -0.3917572498321533, -0.3837590515613556, -0.37576088309288025, -0.3677627146244049, -0.35976454615592957, -0.35176634788513184, -0.3437681794166565, -0.33577001094818115, -0.3277718424797058, -0.3197736442089081, -0.31177547574043274, -0.303777277469635, -0.29577910900115967, -0.28778091073036194, -0.2797827422618866, -0.27178457379341125, -0.2637864053249359, -0.2557882070541382, -0.24779003858566284, -0.2397918701171875, -0.23179368674755096, -0.22379551827907562, -0.2157973349094391, -0.20779916644096375, -0.1998009830713272, -0.19180279970169067, -0.18380463123321533, -0.17580646276474, -0.16780827939510345, -0.1598101109266281, -0.15181192755699158, -0.14381375908851624, -0.1358155757188797, -0.12781739234924316, -0.11981922388076782, -0.11182104051113129, -0.10382286459207535, -0.09582468867301941, -0.08782650530338287, -0.07982833683490753, -0.071830153465271, -0.06383197754621506, -0.05583380162715912, -0.04783562570810318, -0.03983744978904724, -0.0318392738699913, -0.023841094225645065, -0.015842918306589127, -0.007844742387533188, 0.00015343725681304932, 0.008151613175868988, 0.016149789094924927, 0.024147965013980865, 0.032146140933036804, 0.04014432057738304, 0.04814249649643898, 0.05614067241549492, 0.06413885205984116, 0.0721370279788971, 0.08013520389795303]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 14.0, 11.0, 17.0, 31.0, 31.0, 43.0, 58.0, 60.0, 87.0, 89.0, 78.0, 84.0, 65.0, 74.0, 58.0, 49.0, 39.0, 30.0, 26.0, 25.0, 13.0, 5.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07888586819171906, -0.07712051272392273, -0.0753551498055458, -0.07358979433774948, -0.07182443886995316, -0.07005907595157623, -0.06829372048377991, -0.06652836501598358, -0.06476300209760666, -0.06299764662981033, -0.06123228743672371, -0.059466928243637085, -0.05770156905055046, -0.055936213582754135, -0.05417085438966751, -0.052405498921871185, -0.05064014345407486, -0.048874784260988235, -0.04710942879319191, -0.045344069600105286, -0.04357871040701866, -0.041813354939222336, -0.04004799574613571, -0.038282640278339386, -0.03651727735996246, -0.03475191816687584, -0.032986562699079514, -0.03122120350599289, -0.029455846175551414, -0.02769048884510994, -0.025925129652023315, -0.02415977232158184, -0.022394414991140366, -0.02062905766069889, -0.018863698467612267, -0.01709834113717079, -0.015332983806729317, -0.013567625544965267, -0.011802267283201218, -0.010036909952759743, -0.008271551690995693, -0.006506193894892931, -0.004740836098790169, -0.0029754778370261192, -0.001210120040923357, 0.0005552377551794052, 0.0023205960169434547, 0.00408595334738493, 0.005851311609148979, 0.007616669405251741, 0.009382027201354504, 0.011147385463118553, 0.012912742793560028, 0.014678101055324078, 0.016443459317088127, 0.018208816647529602, 0.019974175840616226, 0.0217395331710577, 0.023504892364144325, 0.0252702496945858, 0.027035607025027275, 0.02880096435546875, 0.030566323548555374, 0.032331682741642, 0.034097038209438324]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 7.0, 22.0, 53.0, 123.0, 550.0, 2791.0, 4175239.0, 13277.0, 1749.0, 314.0, 101.0, 33.0, 4.0, 7.0, 2.0, 2.0], "bins": [-0.71923828125, -0.7061147689819336, -0.6929912567138672, -0.6798677444458008, -0.6667442321777344, -0.653620719909668, -0.6404972076416016, -0.6273736953735352, -0.6142501831054688, -0.6011266708374023, -0.5880031585693359, -0.5748796463012695, -0.5617561340332031, -0.5486326217651367, -0.5355091094970703, -0.5223855972290039, -0.5092620849609375, -0.4961385726928711, -0.4830150604248047, -0.4698915481567383, -0.4567680358886719, -0.44364452362060547, -0.43052101135253906, -0.41739749908447266, -0.40427398681640625, -0.39115047454833984, -0.37802696228027344, -0.36490345001220703, -0.3517799377441406, -0.3386564254760742, -0.3255329132080078, -0.3124094009399414, -0.299285888671875, -0.2861623764038086, -0.2730388641357422, -0.2599153518676758, -0.24679183959960938, -0.23366832733154297, -0.22054481506347656, -0.20742130279541016, -0.19429779052734375, -0.18117427825927734, -0.16805076599121094, -0.15492725372314453, -0.14180374145507812, -0.12868022918701172, -0.11555671691894531, -0.1024332046508789, -0.0893096923828125, -0.0761861801147461, -0.06306266784667969, -0.04993915557861328, -0.036815643310546875, -0.02369213104248047, -0.010568618774414062, 0.0025548934936523438, 0.01567840576171875, 0.028801918029785156, 0.04192543029785156, 0.05504894256591797, 0.06817245483398438, 0.08129596710205078, 0.09441947937011719, 0.1075429916381836, 0.12066650390625]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 25.0, 32.0, 65.0, 102.0, 182.0, 173.0, 159.0, 117.0, 82.0, 45.0, 20.0, 4.0, 5.0, 3.0, 2.0], "bins": [-0.146728515625, -0.1440420150756836, -0.1413555145263672, -0.13866901397705078, -0.13598251342773438, -0.13329601287841797, -0.13060951232910156, -0.12792301177978516, -0.12523651123046875, -0.12255001068115234, -0.11986351013183594, -0.11717700958251953, -0.11449050903320312, -0.11180400848388672, -0.10911750793457031, -0.1064310073852539, -0.1037445068359375, -0.1010580062866211, -0.09837150573730469, -0.09568500518798828, -0.09299850463867188, -0.09031200408935547, -0.08762550354003906, -0.08493900299072266, -0.08225250244140625, -0.07956600189208984, -0.07687950134277344, -0.07419300079345703, -0.07150650024414062, -0.06881999969482422, -0.06613349914550781, -0.0634469985961914, -0.060760498046875, -0.058073997497558594, -0.05538749694824219, -0.05270099639892578, -0.050014495849609375, -0.04732799530029297, -0.04464149475097656, -0.041954994201660156, -0.03926849365234375, -0.036581993103027344, -0.03389549255371094, -0.03120899200439453, -0.028522491455078125, -0.02583599090576172, -0.023149490356445312, -0.020462989807128906, -0.0177764892578125, -0.015089988708496094, -0.012403488159179688, -0.009716987609863281, -0.007030487060546875, -0.004343986511230469, -0.0016574859619140625, 0.0010290145874023438, 0.00371551513671875, 0.006402015686035156, 0.009088516235351562, 0.011775016784667969, 0.014461517333984375, 0.01714801788330078, 0.019834518432617188, 0.022521018981933594, 0.02520751953125]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 1.0, 6.0, 1.0, 9.0, 10.0, 21.0, 28.0, 31.0, 42.0, 70.0, 88.0, 107.0, 148.0, 216.0, 313.0, 458.0, 645.0, 1109.0, 1773.0, 3929.0, 12893.0, 3840483.0, 313288.0, 10340.0, 3449.0, 1706.0, 1003.0, 621.0, 434.0, 310.0, 203.0, 137.0, 102.0, 90.0, 64.0, 39.0, 33.0, 20.0, 18.0, 12.0, 8.0, 4.0, 1.0, 8.0, 1.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0811767578125, -0.07846450805664062, -0.07575225830078125, -0.07304000854492188, -0.0703277587890625, -0.06761550903320312, -0.06490325927734375, -0.062191009521484375, -0.059478759765625, -0.056766510009765625, -0.05405426025390625, -0.051342010498046875, -0.0486297607421875, -0.045917510986328125, -0.04320526123046875, -0.040493011474609375, -0.03778076171875, -0.035068511962890625, -0.03235626220703125, -0.029644012451171875, -0.0269317626953125, -0.024219512939453125, -0.02150726318359375, -0.018795013427734375, -0.016082763671875, -0.013370513916015625, -0.01065826416015625, -0.007946014404296875, -0.0052337646484375, -0.002521514892578125, 0.00019073486328125, 0.002902984619140625, 0.005615234375, 0.008327484130859375, 0.01103973388671875, 0.013751983642578125, 0.0164642333984375, 0.019176483154296875, 0.02188873291015625, 0.024600982666015625, 0.027313232421875, 0.030025482177734375, 0.03273773193359375, 0.035449981689453125, 0.0381622314453125, 0.040874481201171875, 0.04358673095703125, 0.046298980712890625, 0.04901123046875, 0.051723480224609375, 0.05443572998046875, 0.057147979736328125, 0.0598602294921875, 0.06257247924804688, 0.06528472900390625, 0.06799697875976562, 0.070709228515625, 0.07342147827148438, 0.07613372802734375, 0.07884597778320312, 0.0815582275390625, 0.08427047729492188, 0.08698272705078125, 0.08969497680664062, 0.0924072265625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 15.0, 86.0, 509.0, 3259.0, 132.0, 27.0, 10.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0224456787109375, -0.021767854690551758, -0.021090030670166016, -0.020412206649780273, -0.01973438262939453, -0.01905655860900879, -0.018378734588623047, -0.017700910568237305, -0.017023086547851562, -0.01634526252746582, -0.015667438507080078, -0.014989614486694336, -0.014311790466308594, -0.013633966445922852, -0.01295614242553711, -0.012278318405151367, -0.011600494384765625, -0.010922670364379883, -0.01024484634399414, -0.009567022323608398, -0.008889198303222656, -0.008211374282836914, -0.007533550262451172, -0.00685572624206543, -0.0061779022216796875, -0.005500078201293945, -0.004822254180908203, -0.004144430160522461, -0.0034666061401367188, -0.0027887821197509766, -0.0021109580993652344, -0.0014331340789794922, -0.00075531005859375, -7.748603820800781e-05, 0.0006003379821777344, 0.0012781620025634766, 0.0019559860229492188, 0.002633810043334961, 0.003311634063720703, 0.003989458084106445, 0.0046672821044921875, 0.00534510612487793, 0.006022930145263672, 0.006700754165649414, 0.007378578186035156, 0.008056402206420898, 0.00873422622680664, 0.009412050247192383, 0.010089874267578125, 0.010767698287963867, 0.01144552230834961, 0.012123346328735352, 0.012801170349121094, 0.013478994369506836, 0.014156818389892578, 0.01483464241027832, 0.015512466430664062, 0.016190290451049805, 0.016868114471435547, 0.01754593849182129, 0.01822376251220703, 0.018901586532592773, 0.019579410552978516, 0.020257234573364258, 0.02093505859375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 13.0, 30.0, 66.0, 152.0, 469.0, 163.0, 52.0, 29.0, 18.0, 5.0, 7.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18576115369796753, -0.18185198307037354, -0.17794282734394073, -0.17403365671634674, -0.17012448608875275, -0.16621531546115875, -0.16230615973472595, -0.15839698910713196, -0.15448781847953796, -0.15057864785194397, -0.14666949212551117, -0.14276032149791718, -0.13885115087032318, -0.1349419802427292, -0.1310328245162964, -0.1271236538887024, -0.123214490711689, -0.1193053275346756, -0.1153961569070816, -0.1114869937300682, -0.10757782310247421, -0.10366865992546082, -0.09975948929786682, -0.09585032612085342, -0.09194116294384003, -0.08803199976682663, -0.08412282913923264, -0.08021366596221924, -0.07630449533462524, -0.07239533215761185, -0.06848616898059845, -0.06457699835300446, -0.06066783517599106, -0.05675866827368736, -0.05284950137138367, -0.04894033819437027, -0.045031167566776276, -0.04112200438976288, -0.03721283748745918, -0.03330367058515549, -0.02939450368285179, -0.025485336780548096, -0.0215761698782444, -0.017667004838585854, -0.013757837936282158, -0.009848671033978462, -0.005939505994319916, -0.00203033909201622, 0.0018788278102874756, 0.005787994246929884, 0.009697160683572292, 0.013606326654553413, 0.01751549355685711, 0.021424660459160805, 0.02533382549881935, 0.029242992401123047, 0.03315215930342674, 0.03706132620573044, 0.040970493108034134, 0.04487966001033783, 0.04878882318735123, 0.05269799381494522, 0.05660715699195862, 0.060516323894262314, 0.06442549079656601]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 5.0, 4.0, 10.0, 17.0, 20.0, 21.0, 28.0, 38.0, 63.0, 51.0, 65.0, 54.0, 93.0, 83.0, 64.0, 56.0, 71.0, 60.0, 51.0, 50.0, 27.0, 22.0, 19.0, 16.0, 6.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.053395695984363556, -0.05222116783261299, -0.05104663968086243, -0.04987211525440216, -0.048697587102651596, -0.04752305895090103, -0.04634853079915047, -0.0451740026473999, -0.043999478220939636, -0.04282495006918907, -0.04165042191743851, -0.04047589749097824, -0.039301369339227676, -0.03812684118747711, -0.03695231303572655, -0.03577778488397598, -0.03460326045751572, -0.03342873230576515, -0.03225420415401459, -0.031079677864909172, -0.029905151575803757, -0.028730623424053192, -0.027556095272302628, -0.026381568983197212, -0.0252070389688015, -0.024032510817050934, -0.02285798452794552, -0.021683456376194954, -0.02050893008708954, -0.019334401935338974, -0.01815987378358841, -0.016985347494482994, -0.01581081934273243, -0.01463629212230444, -0.01346176490187645, -0.012287236750125885, -0.01111271046102047, -0.009938182309269905, -0.008763655088841915, -0.007589127868413925, -0.006414600647985935, -0.005240073427557945, -0.004065546207129955, -0.002891018521040678, -0.001716491300612688, -0.0005419640801846981, 0.0006325636059045792, 0.0018070908263325691, 0.002981618046760559, 0.004156145267188549, 0.005330672487616539, 0.006505200173705816, 0.007679727394133806, 0.008854255080223083, 0.010028782300651073, 0.011203309521079063, 0.012377836741507053, 0.013552363961935043, 0.014726891182363033, 0.015901418402791023, 0.017075946554541588, 0.018250472843647003, 0.019425000995397568, 0.020599529147148132, 0.021774055436253548]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 5.0, 12.0, 8.0, 18.0, 20.0, 28.0, 52.0, 81.0, 163.0, 331.0, 729.0, 2183.0, 7654.0, 37045.0, 377895.0, 560909.0, 48251.0, 8948.0, 2500.0, 932.0, 374.0, 176.0, 81.0, 56.0, 40.0, 23.0, 11.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.149658203125, -0.14412879943847656, -0.13859939575195312, -0.1330699920654297, -0.12754058837890625, -0.12201118469238281, -0.11648178100585938, -0.11095237731933594, -0.1054229736328125, -0.09989356994628906, -0.09436416625976562, -0.08883476257324219, -0.08330535888671875, -0.07777595520019531, -0.07224655151367188, -0.06671714782714844, -0.061187744140625, -0.05565834045410156, -0.050128936767578125, -0.04459953308105469, -0.03907012939453125, -0.03354072570800781, -0.028011322021484375, -0.022481918334960938, -0.0169525146484375, -0.011423110961914062, -0.005893707275390625, -0.0003643035888671875, 0.00516510009765625, 0.010694503784179688, 0.016223907470703125, 0.021753311157226562, 0.02728271484375, 0.03281211853027344, 0.038341522216796875, 0.04387092590332031, 0.04940032958984375, 0.05492973327636719, 0.060459136962890625, 0.06598854064941406, 0.0715179443359375, 0.07704734802246094, 0.08257675170898438, 0.08810615539550781, 0.09363555908203125, 0.09916496276855469, 0.10469436645507812, 0.11022377014160156, 0.115753173828125, 0.12128257751464844, 0.12681198120117188, 0.1323413848876953, 0.13787078857421875, 0.1434001922607422, 0.14892959594726562, 0.15445899963378906, 0.1599884033203125, 0.16551780700683594, 0.17104721069335938, 0.1765766143798828, 0.18210601806640625, 0.1876354217529297, 0.19316482543945312, 0.19869422912597656, 0.2042236328125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 8.0, 9.0, 11.0, 22.0, 26.0, 45.0, 51.0, 60.0, 62.0, 107.0, 89.0, 85.0, 82.0, 79.0, 59.0, 69.0, 55.0, 30.0, 23.0, 10.0, 5.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.02227783203125, -0.02178359031677246, -0.021289348602294922, -0.020795106887817383, -0.020300865173339844, -0.019806623458862305, -0.019312381744384766, -0.018818140029907227, -0.018323898315429688, -0.01782965660095215, -0.01733541488647461, -0.01684117317199707, -0.01634693145751953, -0.015852689743041992, -0.015358448028564453, -0.014864206314086914, -0.014369964599609375, -0.013875722885131836, -0.013381481170654297, -0.012887239456176758, -0.012392997741699219, -0.01189875602722168, -0.01140451431274414, -0.010910272598266602, -0.010416030883789062, -0.009921789169311523, -0.009427547454833984, -0.008933305740356445, -0.008439064025878906, -0.007944822311401367, -0.007450580596923828, -0.006956338882446289, -0.00646209716796875, -0.005967855453491211, -0.005473613739013672, -0.004979372024536133, -0.004485130310058594, -0.003990888595581055, -0.0034966468811035156, -0.0030024051666259766, -0.0025081634521484375, -0.0020139217376708984, -0.0015196800231933594, -0.0010254383087158203, -0.0005311965942382812, -3.695487976074219e-05, 0.0004572868347167969, 0.0009515285491943359, 0.001445770263671875, 0.001940011978149414, 0.002434253692626953, 0.002928495407104492, 0.0034227371215820312, 0.00391697883605957, 0.004411220550537109, 0.0049054622650146484, 0.0053997039794921875, 0.0058939456939697266, 0.006388187408447266, 0.006882429122924805, 0.007376670837402344, 0.007870912551879883, 0.008365154266357422, 0.008859395980834961, 0.0093536376953125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 9.0, 5.0, 7.0, 13.0, 21.0, 31.0, 45.0, 52.0, 74.0, 101.0, 173.0, 214.0, 300.0, 511.0, 713.0, 1035.0, 1539.0, 2420.0, 3961.0, 6581.0, 11235.0, 20656.0, 43342.0, 137284.0, 669100.0, 78012.0, 31386.0, 16033.0, 8907.0, 5345.0, 3299.0, 2035.0, 1357.0, 913.0, 601.0, 426.0, 227.0, 174.0, 99.0, 92.0, 65.0, 51.0, 34.0, 22.0, 29.0, 10.0, 6.0, 6.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.05084228515625, -0.04921770095825195, -0.047593116760253906, -0.04596853256225586, -0.04434394836425781, -0.042719364166259766, -0.04109477996826172, -0.03947019577026367, -0.037845611572265625, -0.03622102737426758, -0.03459644317626953, -0.032971858978271484, -0.03134727478027344, -0.02972269058227539, -0.028098106384277344, -0.026473522186279297, -0.02484893798828125, -0.023224353790283203, -0.021599769592285156, -0.01997518539428711, -0.018350601196289062, -0.016726016998291016, -0.015101432800292969, -0.013476848602294922, -0.011852264404296875, -0.010227680206298828, -0.008603096008300781, -0.006978511810302734, -0.0053539276123046875, -0.0037293434143066406, -0.0021047592163085938, -0.0004801750183105469, 0.0011444091796875, 0.002768993377685547, 0.004393577575683594, 0.006018161773681641, 0.0076427459716796875, 0.009267330169677734, 0.010891914367675781, 0.012516498565673828, 0.014141082763671875, 0.015765666961669922, 0.01739025115966797, 0.019014835357666016, 0.020639419555664062, 0.02226400375366211, 0.023888587951660156, 0.025513172149658203, 0.02713775634765625, 0.028762340545654297, 0.030386924743652344, 0.03201150894165039, 0.03363609313964844, 0.035260677337646484, 0.03688526153564453, 0.03850984573364258, 0.040134429931640625, 0.04175901412963867, 0.04338359832763672, 0.045008182525634766, 0.04663276672363281, 0.04825735092163086, 0.049881935119628906, 0.05150651931762695, 0.053131103515625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 6.0, 7.0, 12.0, 10.0, 17.0, 22.0, 24.0, 26.0, 31.0, 26.0, 37.0, 26.0, 56.0, 35.0, 45.0, 46.0, 51.0, 38.0, 55.0, 46.0, 36.0, 41.0, 41.0, 36.0, 43.0, 33.0, 23.0, 29.0, 22.0, 19.0, 14.0, 14.0, 8.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006427764892578125, -0.0062348246574401855, -0.006041884422302246, -0.005848944187164307, -0.005656003952026367, -0.005463063716888428, -0.005270123481750488, -0.005077183246612549, -0.004884243011474609, -0.00469130277633667, -0.0044983625411987305, -0.004305422306060791, -0.0041124820709228516, -0.003919541835784912, -0.0037266016006469727, -0.003533661365509033, -0.0033407211303710938, -0.0031477808952331543, -0.002954840660095215, -0.0027619004249572754, -0.002568960189819336, -0.0023760199546813965, -0.002183079719543457, -0.0019901394844055176, -0.0017971992492675781, -0.0016042590141296387, -0.0014113187789916992, -0.0012183785438537598, -0.0010254383087158203, -0.0008324980735778809, -0.0006395578384399414, -0.00044661760330200195, -0.0002536773681640625, -6.073713302612305e-05, 0.0001322031021118164, 0.00032514333724975586, 0.0005180835723876953, 0.0007110238075256348, 0.0009039640426635742, 0.0010969042778015137, 0.0012898445129394531, 0.0014827847480773926, 0.001675724983215332, 0.0018686652183532715, 0.002061605453491211, 0.0022545456886291504, 0.00244748592376709, 0.0026404261589050293, 0.0028333663940429688, 0.003026306629180908, 0.0032192468643188477, 0.003412187099456787, 0.0036051273345947266, 0.003798067569732666, 0.0039910078048706055, 0.004183948040008545, 0.004376888275146484, 0.004569828510284424, 0.004762768745422363, 0.004955708980560303, 0.005148649215698242, 0.005341589450836182, 0.005534529685974121, 0.0057274699211120605, 0.00592041015625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 6.0, 11.0, 12.0, 16.0, 35.0, 34.0, 44.0, 72.0, 88.0, 93.0, 107.0, 144.0, 179.0, 261.0, 321.0, 434.0, 597.0, 854.0, 1000.0, 1415.0, 2177.0, 3939.0, 8115.0, 27159.0, 916642.0, 59022.0, 11611.0, 4937.0, 2837.0, 1681.0, 1111.0, 890.0, 652.0, 493.0, 359.0, 276.0, 186.0, 148.0, 118.0, 114.0, 79.0, 68.0, 63.0, 48.0, 32.0, 17.0, 11.0, 15.0, 11.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.01506805419921875, -0.014592409133911133, -0.014116764068603516, -0.013641119003295898, -0.013165473937988281, -0.012689828872680664, -0.012214183807373047, -0.01173853874206543, -0.011262893676757812, -0.010787248611450195, -0.010311603546142578, -0.009835958480834961, -0.009360313415527344, -0.008884668350219727, -0.00840902328491211, -0.007933378219604492, -0.007457733154296875, -0.006982088088989258, -0.006506443023681641, -0.0060307979583740234, -0.005555152893066406, -0.005079507827758789, -0.004603862762451172, -0.004128217697143555, -0.0036525726318359375, -0.0031769275665283203, -0.002701282501220703, -0.002225637435913086, -0.0017499923706054688, -0.0012743473052978516, -0.0007987022399902344, -0.0003230571746826172, 0.000152587890625, 0.0006282329559326172, 0.0011038780212402344, 0.0015795230865478516, 0.0020551681518554688, 0.002530813217163086, 0.003006458282470703, 0.0034821033477783203, 0.0039577484130859375, 0.004433393478393555, 0.004909038543701172, 0.005384683609008789, 0.005860328674316406, 0.0063359737396240234, 0.006811618804931641, 0.007287263870239258, 0.007762908935546875, 0.008238554000854492, 0.00871419906616211, 0.009189844131469727, 0.009665489196777344, 0.010141134262084961, 0.010616779327392578, 0.011092424392700195, 0.011568069458007812, 0.01204371452331543, 0.012519359588623047, 0.012995004653930664, 0.013470649719238281, 0.013946294784545898, 0.014421939849853516, 0.014897584915161133, 0.01537322998046875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 7.0, 5.0, 7.0, 7.0, 9.0, 12.0, 5.0, 17.0, 19.0, 14.0, 27.0, 18.0, 17.0, 17.0, 30.0, 24.0, 39.0, 41.0, 60.0, 68.0, 42.0, 77.0, 65.0, 56.0, 42.0, 34.0, 29.0, 11.0, 28.0, 19.0, 25.0, 20.0, 14.0, 14.0, 8.0, 7.0, 10.0, 9.0, 7.0, 7.0, 7.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.159046173095703e-06, -3.048218786716461e-06, -2.9373914003372192e-06, -2.8265640139579773e-06, -2.7157366275787354e-06, -2.6049092411994934e-06, -2.4940818548202515e-06, -2.3832544684410095e-06, -2.2724270820617676e-06, -2.1615996956825256e-06, -2.0507723093032837e-06, -1.9399449229240417e-06, -1.8291175365447998e-06, -1.7182901501655579e-06, -1.607462763786316e-06, -1.496635377407074e-06, -1.385807991027832e-06, -1.27498060464859e-06, -1.1641532182693481e-06, -1.0533258318901062e-06, -9.424984455108643e-07, -8.316710591316223e-07, -7.208436727523804e-07, -6.100162863731384e-07, -4.991888999938965e-07, -3.8836151361465454e-07, -2.775341272354126e-07, -1.6670674085617065e-07, -5.587935447692871e-08, 5.494803190231323e-08, 1.6577541828155518e-07, 2.766028046607971e-07, 3.8743019104003906e-07, 4.98257577419281e-07, 6.09084963798523e-07, 7.199123501777649e-07, 8.307397365570068e-07, 9.415671229362488e-07, 1.0523945093154907e-06, 1.1632218956947327e-06, 1.2740492820739746e-06, 1.3848766684532166e-06, 1.4957040548324585e-06, 1.6065314412117004e-06, 1.7173588275909424e-06, 1.8281862139701843e-06, 1.9390136003494263e-06, 2.0498409867286682e-06, 2.16066837310791e-06, 2.271495759487152e-06, 2.382323145866394e-06, 2.493150532245636e-06, 2.603977918624878e-06, 2.71480530500412e-06, 2.825632691383362e-06, 2.9364600777626038e-06, 3.0472874641418457e-06, 3.1581148505210876e-06, 3.2689422369003296e-06, 3.3797696232795715e-06, 3.4905970096588135e-06, 3.6014243960380554e-06, 3.7122517824172974e-06, 3.823079168796539e-06, 3.933906555175781e-06]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 8.0, 8.0, 15.0, 20.0, 41.0, 103.0, 259.0, 686.0, 1998.0, 7114.0, 32624.0, 964134.0, 31494.0, 6900.0, 2052.0, 649.0, 247.0, 87.0, 50.0, 20.0, 10.0, 5.0, 3.0, 8.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0136566162109375, -0.013120889663696289, -0.012585163116455078, -0.012049436569213867, -0.011513710021972656, -0.010977983474731445, -0.010442256927490234, -0.009906530380249023, -0.009370803833007812, -0.008835077285766602, -0.00829935073852539, -0.00776362419128418, -0.007227897644042969, -0.006692171096801758, -0.006156444549560547, -0.005620718002319336, -0.005084991455078125, -0.004549264907836914, -0.004013538360595703, -0.003477811813354492, -0.0029420852661132812, -0.0024063587188720703, -0.0018706321716308594, -0.0013349056243896484, -0.0007991790771484375, -0.00026345252990722656, 0.0002722740173339844, 0.0008080005645751953, 0.0013437271118164062, 0.0018794536590576172, 0.002415180206298828, 0.002950906753540039, 0.00348663330078125, 0.004022359848022461, 0.004558086395263672, 0.005093812942504883, 0.005629539489746094, 0.006165266036987305, 0.006700992584228516, 0.0072367191314697266, 0.0077724456787109375, 0.008308172225952148, 0.00884389877319336, 0.00937962532043457, 0.009915351867675781, 0.010451078414916992, 0.010986804962158203, 0.011522531509399414, 0.012058258056640625, 0.012593984603881836, 0.013129711151123047, 0.013665437698364258, 0.014201164245605469, 0.01473689079284668, 0.01527261734008789, 0.0158083438873291, 0.016344070434570312, 0.016879796981811523, 0.017415523529052734, 0.017951250076293945, 0.018486976623535156, 0.019022703170776367, 0.019558429718017578, 0.02009415626525879, 0.0206298828125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 6.0, 4.0, 8.0, 6.0, 6.0, 10.0, 19.0, 35.0, 54.0, 479.0, 199.0, 49.0, 22.0, 13.0, 8.0, 5.0, 8.0, 5.0, 7.0, 3.0, 7.0, 8.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0020294189453125, -0.001977190375328064, -0.001924961805343628, -0.001872733235359192, -0.0018205046653747559, -0.0017682760953903198, -0.0017160475254058838, -0.0016638189554214478, -0.0016115903854370117, -0.0015593618154525757, -0.0015071332454681396, -0.0014549046754837036, -0.0014026761054992676, -0.0013504475355148315, -0.0012982189655303955, -0.0012459903955459595, -0.0011937618255615234, -0.0011415332555770874, -0.0010893046855926514, -0.0010370761156082153, -0.0009848475456237793, -0.0009326189756393433, -0.0008803904056549072, -0.0008281618356704712, -0.0007759332656860352, -0.0007237046957015991, -0.0006714761257171631, -0.000619247555732727, -0.000567018985748291, -0.000514790415763855, -0.00046256184577941895, -0.0004103332757949829, -0.0003581047058105469, -0.00030587613582611084, -0.0002536475658416748, -0.00020141899585723877, -0.00014919042587280273, -9.69618558883667e-05, -4.4733285903930664e-05, 7.495284080505371e-06, 5.9723854064941406e-05, 0.00011195242404937744, 0.00016418099403381348, 0.0002164095640182495, 0.00026863813400268555, 0.0003208667039871216, 0.0003730952739715576, 0.00042532384395599365, 0.0004775524139404297, 0.0005297809839248657, 0.0005820095539093018, 0.0006342381238937378, 0.0006864666938781738, 0.0007386952638626099, 0.0007909238338470459, 0.0008431524038314819, 0.000895380973815918, 0.000947609543800354, 0.00099983811378479, 0.001052066683769226, 0.0011042952537536621, 0.0011565238237380981, 0.0012087523937225342, 0.0012609809637069702, 0.0013132095336914062]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 5.0, 8.0, 7.0, 14.0, 27.0, 30.0, 51.0, 64.0, 154.0, 210.0, 162.0, 75.0, 62.0, 40.0, 26.0, 12.0, 11.0, 13.0, 12.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016007574275135994, -0.015460353344678879, -0.014913132414221764, -0.014365912415087223, -0.013818691484630108, -0.013271470554172993, -0.012724250555038452, -0.012177029624581337, -0.011629808694124222, -0.011082587763667107, -0.010535366833209991, -0.009988146834075451, -0.009440925903618336, -0.00889370497316122, -0.00834648497402668, -0.007799264043569565, -0.00725204311311245, -0.0067048221826553345, -0.006157601717859507, -0.005610381253063679, -0.005063160322606564, -0.004515939392149448, -0.0039687189273536205, -0.003421498229727149, -0.0028742775321006775, -0.002327056834474206, -0.0017798361368477345, -0.001232615439221263, -0.0006853947415947914, -0.0001381740439683199, 0.0004090466536581516, 0.0009562673512846231, 0.001503489911556244, 0.0020507106091827154, 0.002597931306809187, 0.0031451520044356585, 0.00369237270206213, 0.004239593632519245, 0.004786814097315073, 0.005334034562110901, 0.005881255492568016, 0.006428476423025131, 0.006975696887820959, 0.007522917352616787, 0.008070138283073902, 0.008617359213531017, 0.009164579212665558, 0.009711800143122673, 0.010259021073579788, 0.010806242004036903, 0.011353462934494019, 0.011900682933628559, 0.012447903864085674, 0.01299512479454279, 0.01354234479367733, 0.014089565724134445, 0.01463678665459156, 0.015184007585048676, 0.01573122851550579, 0.016278449445962906, 0.016825668513774872, 0.017372889444231987, 0.017920110374689102, 0.018467331305146217, 0.019014552235603333]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 15.0, 17.0, 26.0, 30.0, 31.0, 46.0, 53.0, 76.0, 50.0, 78.0, 81.0, 64.0, 74.0, 69.0, 61.0, 43.0, 49.0, 32.0, 29.0, 19.0, 15.0, 18.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.017659498378634453, -0.017265256494283676, -0.01687101647257805, -0.016476774588227272, -0.016082534566521645, -0.015688292682170868, -0.015294051729142666, -0.014899810776114464, -0.014505568891763687, -0.014111327938735485, -0.013717086985707283, -0.013322845101356506, -0.012928604148328304, -0.012534363195300102, -0.0121401222422719, -0.011745881289243698, -0.011351639404892921, -0.01095739845186472, -0.010563157498836517, -0.01016891561448574, -0.009774674661457539, -0.009380433708429337, -0.008986192755401134, -0.008591951802372932, -0.00819771084934473, -0.007803469896316528, -0.007409228477627039, -0.007014987524598837, -0.0066207461059093475, -0.0062265051528811455, -0.005832264199852943, -0.005438022781163454, -0.005043780896812677, -0.004649539943784475, -0.004255298525094986, -0.003861057572066784, -0.0034668161533772945, -0.0030725752003490925, -0.0026783340144902468, -0.002284092828631401, -0.0018898516427725554, -0.0014956104569137096, -0.001101369271054864, -0.00070712820161134, -0.00031288701575249434, 8.135405369102955e-05, 0.00047559523954987526, 0.000869836425408721, 0.0012640776112675667, 0.0016583187971264124, 0.002052559982985258, 0.00244680093601346, 0.0028410423547029495, 0.0032352833077311516, 0.0036295244935899973, 0.004023765679448843, 0.004418007098138332, 0.004812248051166534, 0.005206489469856024, 0.005600730422884226, 0.005994971841573715, 0.006389212794601917, 0.006783453747630119, 0.007177695166319609, 0.007571936119347811]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 5.0, 4.0, 4.0, 3.0, 7.0, 17.0, 23.0, 23.0, 32.0, 36.0, 66.0, 137.0, 338.0, 1006.0, 3846.0, 21724.0, 204036.0, 739122.0, 65413.0, 9555.0, 2005.0, 627.0, 206.0, 101.0, 60.0, 34.0, 23.0, 27.0, 19.0, 14.0, 14.0, 7.0, 9.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.050628662109375, -0.04915142059326172, -0.04767417907714844, -0.046196937561035156, -0.044719696044921875, -0.043242454528808594, -0.04176521301269531, -0.04028797149658203, -0.03881072998046875, -0.03733348846435547, -0.03585624694824219, -0.034379005432128906, -0.032901763916015625, -0.031424522399902344, -0.029947280883789062, -0.02847003936767578, -0.0269927978515625, -0.02551555633544922, -0.024038314819335938, -0.022561073303222656, -0.021083831787109375, -0.019606590270996094, -0.018129348754882812, -0.01665210723876953, -0.01517486572265625, -0.013697624206542969, -0.012220382690429688, -0.010743141174316406, -0.009265899658203125, -0.007788658142089844, -0.0063114166259765625, -0.004834175109863281, -0.00335693359375, -0.0018796920776367188, -0.0004024505615234375, 0.0010747909545898438, 0.002552032470703125, 0.004029273986816406, 0.0055065155029296875, 0.006983757019042969, 0.00846099853515625, 0.009938240051269531, 0.011415481567382812, 0.012892723083496094, 0.014369964599609375, 0.015847206115722656, 0.017324447631835938, 0.01880168914794922, 0.0202789306640625, 0.02175617218017578, 0.023233413696289062, 0.024710655212402344, 0.026187896728515625, 0.027665138244628906, 0.029142379760742188, 0.03061962127685547, 0.03209686279296875, 0.03357410430908203, 0.03505134582519531, 0.036528587341308594, 0.038005828857421875, 0.039483070373535156, 0.04096031188964844, 0.04243755340576172, 0.043914794921875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 10.0, 18.0, 25.0, 29.0, 49.0, 60.0, 87.0, 105.0, 127.0, 106.0, 105.0, 80.0, 69.0, 53.0, 35.0, 20.0, 15.0, 7.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00862884521484375, -0.008444875478744507, -0.008260905742645264, -0.00807693600654602, -0.007892966270446777, -0.007708996534347534, -0.007525026798248291, -0.007341057062149048, -0.007157087326049805, -0.0069731175899505615, -0.006789147853851318, -0.006605178117752075, -0.006421208381652832, -0.006237238645553589, -0.006053268909454346, -0.0058692991733551025, -0.005685329437255859, -0.005501359701156616, -0.005317389965057373, -0.00513342022895813, -0.004949450492858887, -0.0047654807567596436, -0.0045815110206604, -0.004397541284561157, -0.004213571548461914, -0.004029601812362671, -0.0038456320762634277, -0.0036616623401641846, -0.0034776926040649414, -0.0032937228679656982, -0.003109753131866455, -0.002925783395767212, -0.0027418136596679688, -0.0025578439235687256, -0.0023738741874694824, -0.0021899044513702393, -0.002005934715270996, -0.001821964979171753, -0.0016379952430725098, -0.0014540255069732666, -0.0012700557708740234, -0.0010860860347747803, -0.0009021162986755371, -0.0007181465625762939, -0.0005341768264770508, -0.0003502070903778076, -0.00016623735427856445, 1.773238182067871e-05, 0.00020170211791992188, 0.00038567185401916504, 0.0005696415901184082, 0.0007536113262176514, 0.0009375810623168945, 0.0011215507984161377, 0.0013055205345153809, 0.001489490270614624, 0.0016734600067138672, 0.0018574297428131104, 0.0020413994789123535, 0.0022253692150115967, 0.00240933895111084, 0.002593308687210083, 0.002777278423309326, 0.0029612481594085693, 0.0031452178955078125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 6.0, 9.0, 12.0, 28.0, 21.0, 45.0, 72.0, 111.0, 194.0, 277.0, 501.0, 790.0, 1433.0, 2328.0, 3937.0, 6908.0, 12155.0, 21844.0, 41235.0, 81636.0, 176845.0, 329450.0, 186921.0, 86133.0, 42719.0, 22762.0, 12853.0, 7156.0, 4149.0, 2387.0, 1472.0, 838.0, 523.0, 309.0, 188.0, 108.0, 77.0, 33.0, 26.0, 21.0, 16.0, 13.0, 8.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0071258544921875, -0.0069068074226379395, -0.006687760353088379, -0.006468713283538818, -0.006249666213989258, -0.006030619144439697, -0.005811572074890137, -0.005592525005340576, -0.005373477935791016, -0.005154430866241455, -0.0049353837966918945, -0.004716336727142334, -0.0044972896575927734, -0.004278242588043213, -0.004059195518493652, -0.003840148448944092, -0.0036211013793945312, -0.0034020543098449707, -0.00318300724029541, -0.0029639601707458496, -0.002744913101196289, -0.0025258660316467285, -0.002306818962097168, -0.0020877718925476074, -0.0018687248229980469, -0.0016496777534484863, -0.0014306306838989258, -0.0012115836143493652, -0.0009925365447998047, -0.0007734894752502441, -0.0005544424057006836, -0.00033539533615112305, -0.0001163482666015625, 0.00010269880294799805, 0.0003217458724975586, 0.0005407929420471191, 0.0007598400115966797, 0.0009788870811462402, 0.0011979341506958008, 0.0014169812202453613, 0.0016360282897949219, 0.0018550753593444824, 0.002074122428894043, 0.0022931694984436035, 0.002512216567993164, 0.0027312636375427246, 0.002950310707092285, 0.0031693577766418457, 0.0033884048461914062, 0.003607451915740967, 0.0038264989852905273, 0.004045546054840088, 0.0042645931243896484, 0.004483640193939209, 0.0047026872634887695, 0.00492173433303833, 0.005140781402587891, 0.005359828472137451, 0.005578875541687012, 0.005797922611236572, 0.006016969680786133, 0.006236016750335693, 0.006455063819885254, 0.0066741108894348145, 0.006893157958984375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 8.0, 5.0, 5.0, 6.0, 5.0, 14.0, 19.0, 17.0, 16.0, 20.0, 29.0, 20.0, 22.0, 30.0, 32.0, 35.0, 40.0, 46.0, 25.0, 49.0, 28.0, 45.0, 41.0, 39.0, 34.0, 45.0, 42.0, 37.0, 37.0, 18.0, 35.0, 20.0, 25.0, 22.0, 21.0, 8.0, 12.0, 12.0, 9.0, 10.0, 8.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0018033981323242188, -0.0017411857843399048, -0.0016789734363555908, -0.0016167610883712769, -0.0015545487403869629, -0.001492336392402649, -0.001430124044418335, -0.001367911696434021, -0.001305699348449707, -0.001243487000465393, -0.001181274652481079, -0.0011190623044967651, -0.0010568499565124512, -0.0009946376085281372, -0.0009324252605438232, -0.0008702129125595093, -0.0008080005645751953, -0.0007457882165908813, -0.0006835758686065674, -0.0006213635206222534, -0.0005591511726379395, -0.0004969388246536255, -0.0004347264766693115, -0.00037251412868499756, -0.0003103017807006836, -0.00024808943271636963, -0.00018587708473205566, -0.0001236647367477417, -6.145238876342773e-05, 7.599592208862305e-07, 6.29723072052002e-05, 0.00012518465518951416, 0.00018739700317382812, 0.0002496093511581421, 0.00031182169914245605, 0.00037403404712677, 0.000436246395111084, 0.000498458743095398, 0.0005606710910797119, 0.0006228834390640259, 0.0006850957870483398, 0.0007473081350326538, 0.0008095204830169678, 0.0008717328310012817, 0.0009339451789855957, 0.0009961575269699097, 0.0010583698749542236, 0.0011205822229385376, 0.0011827945709228516, 0.0012450069189071655, 0.0013072192668914795, 0.0013694316148757935, 0.0014316439628601074, 0.0014938563108444214, 0.0015560686588287354, 0.0016182810068130493, 0.0016804933547973633, 0.0017427057027816772, 0.0018049180507659912, 0.0018671303987503052, 0.0019293427467346191, 0.001991555094718933, 0.002053767442703247, 0.002115979790687561, 0.002178192138671875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 5.0, 6.0, 8.0, 22.0, 14.0, 23.0, 25.0, 37.0, 60.0, 67.0, 110.0, 190.0, 244.0, 412.0, 751.0, 1394.0, 2447.0, 5201.0, 13463.0, 45535.0, 402029.0, 500075.0, 50430.0, 14300.0, 5620.0, 2655.0, 1394.0, 783.0, 442.0, 269.0, 176.0, 106.0, 95.0, 39.0, 43.0, 20.0, 23.0, 12.0, 11.0, 6.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006265640258789062, -0.0006063729524612427, -0.0005861818790435791, -0.0005659908056259155, -0.000545799732208252, -0.0005256086587905884, -0.0005054175853729248, -0.00048522651195526123, -0.00046503543853759766, -0.0004448443651199341, -0.0004246532917022705, -0.00040446221828460693, -0.00038427114486694336, -0.0003640800714492798, -0.0003438889980316162, -0.00032369792461395264, -0.00030350685119628906, -0.0002833157777786255, -0.0002631247043609619, -0.00024293363094329834, -0.00022274255752563477, -0.0002025514841079712, -0.00018236041069030762, -0.00016216933727264404, -0.00014197826385498047, -0.0001217871904373169, -0.00010159611701965332, -8.140504360198975e-05, -6.121397018432617e-05, -4.10228967666626e-05, -2.0831823348999023e-05, -6.407499313354492e-07, 1.9550323486328125e-05, 3.97413969039917e-05, 5.9932470321655273e-05, 8.012354373931885e-05, 0.00010031461715698242, 0.000120505690574646, 0.00014069676399230957, 0.00016088783740997314, 0.00018107891082763672, 0.0002012699842453003, 0.00022146105766296387, 0.00024165213108062744, 0.000261843204498291, 0.0002820342779159546, 0.00030222535133361816, 0.00032241642475128174, 0.0003426074981689453, 0.0003627985715866089, 0.00038298964500427246, 0.00040318071842193604, 0.0004233717918395996, 0.0004435628652572632, 0.00046375393867492676, 0.00048394501209259033, 0.0005041360855102539, 0.0005243271589279175, 0.0005445182323455811, 0.0005647093057632446, 0.0005849003791809082, 0.0006050914525985718, 0.0006252825260162354, 0.0006454735994338989, 0.0006656646728515625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 7.0, 10.0, 8.0, 11.0, 20.0, 19.0, 42.0, 77.0, 110.0, 207.0, 173.0, 132.0, 70.0, 33.0, 27.0, 12.0, 11.0, 7.0, 4.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6450881958007812e-05, -1.5902332961559296e-05, -1.535378396511078e-05, -1.4805234968662262e-05, -1.4256685972213745e-05, -1.3708136975765228e-05, -1.3159587979316711e-05, -1.2611038982868195e-05, -1.2062489986419678e-05, -1.1513940989971161e-05, -1.0965391993522644e-05, -1.0416842997074127e-05, -9.86829400062561e-06, -9.319745004177094e-06, -8.771196007728577e-06, -8.22264701128006e-06, -7.674098014831543e-06, -7.125549018383026e-06, -6.577000021934509e-06, -6.0284510254859924e-06, -5.479902029037476e-06, -4.931353032588959e-06, -4.382804036140442e-06, -3.834255039691925e-06, -3.285706043243408e-06, -2.7371570467948914e-06, -2.1886080503463745e-06, -1.6400590538978577e-06, -1.0915100574493408e-06, -5.42961061000824e-07, 5.587935447692871e-09, 5.541369318962097e-07, 1.1026859283447266e-06, 1.6512349247932434e-06, 2.1997839212417603e-06, 2.748332917690277e-06, 3.296881914138794e-06, 3.845430910587311e-06, 4.393979907035828e-06, 4.9425289034843445e-06, 5.491077899932861e-06, 6.039626896381378e-06, 6.588175892829895e-06, 7.136724889278412e-06, 7.685273885726929e-06, 8.233822882175446e-06, 8.782371878623962e-06, 9.33092087507248e-06, 9.879469871520996e-06, 1.0428018867969513e-05, 1.097656786441803e-05, 1.1525116860866547e-05, 1.2073665857315063e-05, 1.262221485376358e-05, 1.3170763850212097e-05, 1.3719312846660614e-05, 1.4267861843109131e-05, 1.4816410839557648e-05, 1.5364959836006165e-05, 1.591350883245468e-05, 1.6462057828903198e-05, 1.7010606825351715e-05, 1.7559155821800232e-05, 1.810770481824875e-05, 1.8656253814697266e-05]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 8.0, 7.0, 1.0, 9.0, 15.0, 25.0, 27.0, 45.0, 66.0, 102.0, 156.0, 209.0, 314.0, 523.0, 783.0, 1250.0, 1911.0, 3204.0, 5152.0, 9361.0, 16623.0, 32109.0, 69067.0, 172726.0, 400326.0, 187438.0, 72230.0, 33845.0, 17386.0, 9408.0, 5424.0, 3265.0, 1982.0, 1214.0, 785.0, 543.0, 349.0, 230.0, 135.0, 95.0, 63.0, 45.0, 35.0, 29.0, 17.0, 8.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016009807586669922, -0.00015502050518989563, -0.00014994293451309204, -0.00014486536383628845, -0.00013978779315948486, -0.00013471022248268127, -0.00012963265180587769, -0.0001245550811290741, -0.00011947751045227051, -0.00011439993977546692, -0.00010932236909866333, -0.00010424479842185974, -9.916722774505615e-05, -9.408965706825256e-05, -8.901208639144897e-05, -8.393451571464539e-05, -7.88569450378418e-05, -7.377937436103821e-05, -6.870180368423462e-05, -6.362423300743103e-05, -5.854666233062744e-05, -5.346909165382385e-05, -4.8391520977020264e-05, -4.3313950300216675e-05, -3.8236379623413086e-05, -3.31588089466095e-05, -2.8081238269805908e-05, -2.300366759300232e-05, -1.792609691619873e-05, -1.2848526239395142e-05, -7.770955562591553e-06, -2.693384885787964e-06, 2.384185791015625e-06, 7.461756467819214e-06, 1.2539327144622803e-05, 1.761689782142639e-05, 2.269446849822998e-05, 2.777203917503357e-05, 3.284960985183716e-05, 3.792718052864075e-05, 4.3004751205444336e-05, 4.8082321882247925e-05, 5.3159892559051514e-05, 5.82374632358551e-05, 6.331503391265869e-05, 6.839260458946228e-05, 7.347017526626587e-05, 7.854774594306946e-05, 8.362531661987305e-05, 8.870288729667664e-05, 9.378045797348022e-05, 9.885802865028381e-05, 0.0001039355993270874, 0.00010901317000389099, 0.00011409074068069458, 0.00011916831135749817, 0.00012424588203430176, 0.00012932345271110535, 0.00013440102338790894, 0.00013947859406471252, 0.0001445561647415161, 0.0001496337354183197, 0.0001547113060951233, 0.00015978887677192688, 0.00016486644744873047]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 9.0, 9.0, 3.0, 20.0, 15.0, 16.0, 25.0, 18.0, 26.0, 32.0, 51.0, 30.0, 41.0, 50.0, 55.0, 59.0, 58.0, 59.0, 50.0, 51.0, 46.0, 38.0, 39.0, 36.0, 28.0, 15.0, 21.0, 13.0, 19.0, 8.0, 6.0, 8.0, 8.0, 3.0, 4.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-4.756450653076172e-05, -4.609767347574234e-05, -4.463084042072296e-05, -4.316400736570358e-05, -4.1697174310684204e-05, -4.0230341255664825e-05, -3.876350820064545e-05, -3.729667514562607e-05, -3.582984209060669e-05, -3.436300903558731e-05, -3.289617598056793e-05, -3.1429342925548553e-05, -2.9962509870529175e-05, -2.8495676815509796e-05, -2.7028843760490417e-05, -2.556201070547104e-05, -2.409517765045166e-05, -2.262834459543228e-05, -2.1161511540412903e-05, -1.9694678485393524e-05, -1.8227845430374146e-05, -1.6761012375354767e-05, -1.5294179320335388e-05, -1.382734626531601e-05, -1.2360513210296631e-05, -1.0893680155277252e-05, -9.426847100257874e-06, -7.960014045238495e-06, -6.493180990219116e-06, -5.0263479351997375e-06, -3.559514880180359e-06, -2.0926818251609802e-06, -6.258487701416016e-07, 8.409842848777771e-07, 2.3078173398971558e-06, 3.7746503949165344e-06, 5.241483449935913e-06, 6.708316504955292e-06, 8.17514955997467e-06, 9.641982614994049e-06, 1.1108815670013428e-05, 1.2575648725032806e-05, 1.4042481780052185e-05, 1.5509314835071564e-05, 1.6976147890090942e-05, 1.844298094511032e-05, 1.99098140001297e-05, 2.137664705514908e-05, 2.2843480110168457e-05, 2.4310313165187836e-05, 2.5777146220207214e-05, 2.7243979275226593e-05, 2.871081233024597e-05, 3.017764538526535e-05, 3.164447844028473e-05, 3.311131149530411e-05, 3.4578144550323486e-05, 3.6044977605342865e-05, 3.7511810660362244e-05, 3.897864371538162e-05, 4.0445476770401e-05, 4.191230982542038e-05, 4.337914288043976e-05, 4.484597593545914e-05, 4.6312808990478516e-05]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 13.0, 19.0, 36.0, 112.0, 214.0, 319.0, 144.0, 63.0, 36.0, 24.0, 11.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017428388819098473, -0.017043830826878548, -0.016659272834658623, -0.016274714842438698, -0.015890156850218773, -0.015505598857998848, -0.015121040865778923, -0.014736483804881573, -0.014351925812661648, -0.013967367820441723, -0.013582809828221798, -0.013198251836001873, -0.012813693843781948, -0.012429136782884598, -0.012044578790664673, -0.011660020798444748, -0.011275462806224823, -0.010890904814004898, -0.010506346821784973, -0.010121788829565048, -0.009737230837345123, -0.009352672845125198, -0.008968114852905273, -0.008583557792007923, -0.008198998868465424, -0.007814440876245499, -0.007429882884025574, -0.007045324891805649, -0.006660767365247011, -0.006276209373027086, -0.005891651380807161, -0.005507093854248524, -0.005122535862028599, -0.004737977869808674, -0.004353419877588749, -0.003968861885368824, -0.0035843043588101864, -0.0031997463665902615, -0.0028151883743703365, -0.0024306306149810553, -0.0020460726227611303, -0.0016615147469565272, -0.0012769568711519241, -0.0008923988789319992, -0.0005078410031273961, -0.000123283127322793, 0.0002612748648971319, 0.0006458326242864132, 0.0010303906165063381, 0.0014149484923109412, 0.0017995063681155443, 0.0021840643603354692, 0.0025686221197247505, 0.0029531801119446754, 0.0033377381041646004, 0.0037222958635538816, 0.00410685408860445, 0.004491412080824375, 0.0048759700730443, 0.005260528065264225, 0.005645085591822863, 0.0060296435840427876, 0.0064142015762627125, 0.00679875910282135, 0.007183317095041275]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 10.0, 11.0, 13.0, 19.0, 35.0, 38.0, 49.0, 62.0, 71.0, 79.0, 84.0, 79.0, 75.0, 64.0, 67.0, 53.0, 50.0, 46.0, 31.0, 24.0, 26.0, 14.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00773725938051939, -0.00757012702524662, -0.00740299466997385, -0.007235862780362368, -0.007068730425089598, -0.006901598069816828, -0.006734466180205345, -0.006567333824932575, -0.006400201469659805, -0.006233069114387035, -0.0060659367591142654, -0.005898804869502783, -0.005731672514230013, -0.005564540158957243, -0.00539740826934576, -0.00523027591407299, -0.0050631435588002205, -0.0048960112035274506, -0.004728878848254681, -0.004561746958643198, -0.004394614603370428, -0.004227482248097658, -0.0040603503584861755, -0.0038932180032134056, -0.0037260856479406357, -0.0035589532926678658, -0.0033918211702257395, -0.003224689047783613, -0.0030575566925108433, -0.0028904243372380733, -0.002723292214795947, -0.002556160092353821, -0.0023890272714197636, -0.0022218949161469936, -0.0020547627937048674, -0.0018876305548474193, -0.0017204983159899712, -0.001553366077132523, -0.001386233838275075, -0.0012191015994176269, -0.0010519693605601788, -0.0008848371217027307, -0.0007177048828452826, -0.0005505726439878345, -0.00038344040513038635, -0.00021630816627293825, -4.917592741549015e-05, 0.00011795631144195795, 0.00028508855029940605, 0.00045222078915685415, 0.0006193530280143023, 0.0007864852668717504, 0.0009536175057291985, 0.0011207497445866466, 0.0012878819834440947, 0.0014550142223015428, 0.0016221464611589909, 0.001789278700016439, 0.001956410938873887, 0.0021235430613160133, 0.0022906754165887833, 0.002457807771861553, 0.0026249398943036795, 0.0027920720167458057, 0.0029592043720185757]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 13.0, 17.0, 38.0, 52.0, 96.0, 187.0, 420.0, 1018.0, 3062.0, 92781.0, 4088498.0, 5368.0, 1599.0, 566.0, 283.0, 130.0, 63.0, 37.0, 29.0, 9.0, 8.0, 2.0, 2.0, 2.0], "bins": [-0.019256591796875, -0.018872737884521484, -0.01848888397216797, -0.018105030059814453, -0.017721176147460938, -0.017337322235107422, -0.016953468322753906, -0.01656961441040039, -0.016185760498046875, -0.01580190658569336, -0.015418052673339844, -0.015034198760986328, -0.014650344848632812, -0.014266490936279297, -0.013882637023925781, -0.013498783111572266, -0.01311492919921875, -0.012731075286865234, -0.012347221374511719, -0.011963367462158203, -0.011579513549804688, -0.011195659637451172, -0.010811805725097656, -0.01042795181274414, -0.010044097900390625, -0.00966024398803711, -0.009276390075683594, -0.008892536163330078, -0.008508682250976562, -0.008124828338623047, -0.007740974426269531, -0.007357120513916016, -0.0069732666015625, -0.006589412689208984, -0.006205558776855469, -0.005821704864501953, -0.0054378509521484375, -0.005053997039794922, -0.004670143127441406, -0.004286289215087891, -0.003902435302734375, -0.0035185813903808594, -0.0031347274780273438, -0.002750873565673828, -0.0023670196533203125, -0.001983165740966797, -0.0015993118286132812, -0.0012154579162597656, -0.00083160400390625, -0.0004477500915527344, -6.389617919921875e-05, 0.0003199577331542969, 0.0007038116455078125, 0.0010876655578613281, 0.0014715194702148438, 0.0018553733825683594, 0.002239227294921875, 0.0026230812072753906, 0.0030069351196289062, 0.003390789031982422, 0.0037746429443359375, 0.004158496856689453, 0.004542350769042969, 0.004926204681396484, 0.00531005859375]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 10.0, 14.0, 15.0, 21.0, 36.0, 42.0, 59.0, 73.0, 70.0, 92.0, 91.0, 75.0, 73.0, 72.0, 57.0, 57.0, 57.0, 27.0, 18.0, 18.0, 16.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00673675537109375, -0.006592810153961182, -0.006448864936828613, -0.006304919719696045, -0.0061609745025634766, -0.006017029285430908, -0.00587308406829834, -0.0057291388511657715, -0.005585193634033203, -0.005441248416900635, -0.005297303199768066, -0.005153357982635498, -0.00500941276550293, -0.004865467548370361, -0.004721522331237793, -0.004577577114105225, -0.004433631896972656, -0.004289686679840088, -0.0041457414627075195, -0.004001796245574951, -0.003857851028442383, -0.0037139058113098145, -0.003569960594177246, -0.0034260153770446777, -0.0032820701599121094, -0.003138124942779541, -0.0029941797256469727, -0.0028502345085144043, -0.002706289291381836, -0.0025623440742492676, -0.0024183988571166992, -0.002274453639984131, -0.0021305084228515625, -0.001986563205718994, -0.0018426179885864258, -0.0016986727714538574, -0.001554727554321289, -0.0014107823371887207, -0.0012668371200561523, -0.001122891902923584, -0.0009789466857910156, -0.0008350014686584473, -0.0006910562515258789, -0.0005471110343933105, -0.0004031658172607422, -0.00025922060012817383, -0.00011527538299560547, 2.866983413696289e-05, 0.00017261505126953125, 0.0003165602684020996, 0.00046050548553466797, 0.0006044507026672363, 0.0007483959197998047, 0.000892341136932373, 0.0010362863540649414, 0.0011802315711975098, 0.0013241767883300781, 0.0014681220054626465, 0.0016120672225952148, 0.0017560124397277832, 0.0018999576568603516, 0.00204390287399292, 0.0021878480911254883, 0.0023317933082580566, 0.002475738525390625]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 12.0, 21.0, 28.0, 34.0, 87.0, 154.0, 315.0, 657.0, 1757.0, 5474.0, 48577.0, 4117891.0, 13982.0, 3208.0, 1134.0, 458.0, 206.0, 118.0, 61.0, 45.0, 19.0, 20.0, 10.0, 6.0, 4.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0147857666015625, -0.014389276504516602, -0.013992786407470703, -0.013596296310424805, -0.013199806213378906, -0.012803316116333008, -0.01240682601928711, -0.012010335922241211, -0.011613845825195312, -0.011217355728149414, -0.010820865631103516, -0.010424375534057617, -0.010027885437011719, -0.00963139533996582, -0.009234905242919922, -0.008838415145874023, -0.008441925048828125, -0.008045434951782227, -0.007648944854736328, -0.00725245475769043, -0.006855964660644531, -0.006459474563598633, -0.006062984466552734, -0.005666494369506836, -0.0052700042724609375, -0.004873514175415039, -0.004477024078369141, -0.004080533981323242, -0.0036840438842773438, -0.0032875537872314453, -0.002891063690185547, -0.0024945735931396484, -0.00209808349609375, -0.0017015933990478516, -0.0013051033020019531, -0.0009086132049560547, -0.0005121231079101562, -0.00011563301086425781, 0.0002808570861816406, 0.0006773471832275391, 0.0010738372802734375, 0.001470327377319336, 0.0018668174743652344, 0.002263307571411133, 0.0026597976684570312, 0.0030562877655029297, 0.003452777862548828, 0.0038492679595947266, 0.004245758056640625, 0.0046422481536865234, 0.005038738250732422, 0.00543522834777832, 0.005831718444824219, 0.006228208541870117, 0.006624698638916016, 0.007021188735961914, 0.0074176788330078125, 0.007814168930053711, 0.00821065902709961, 0.008607149124145508, 0.009003639221191406, 0.009400129318237305, 0.009796619415283203, 0.010193109512329102, 0.010589599609375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 5.0, 4.0, 10.0, 10.0, 35.0, 204.0, 3366.0, 312.0, 65.0, 22.0, 17.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013113021850585938, -0.00125788152217865, -0.001204460859298706, -0.0011510401964187622, -0.0010976195335388184, -0.0010441988706588745, -0.0009907782077789307, -0.0009373575448989868, -0.000883936882019043, -0.0008305162191390991, -0.0007770955562591553, -0.0007236748933792114, -0.0006702542304992676, -0.0006168335676193237, -0.0005634129047393799, -0.000509992241859436, -0.0004565715789794922, -0.00040315091609954834, -0.0003497302532196045, -0.00029630959033966064, -0.0002428889274597168, -0.00018946826457977295, -0.0001360476016998291, -8.262693881988525e-05, -2.9206275939941406e-05, 2.421438694000244e-05, 7.763504981994629e-05, 0.00013105571269989014, 0.00018447637557983398, 0.00023789703845977783, 0.0002913177013397217, 0.00034473836421966553, 0.0003981590270996094, 0.0004515796899795532, 0.0005050003528594971, 0.0005584210157394409, 0.0006118416786193848, 0.0006652623414993286, 0.0007186830043792725, 0.0007721036672592163, 0.0008255243301391602, 0.000878944993019104, 0.0009323656558990479, 0.0009857863187789917, 0.0010392069816589355, 0.0010926276445388794, 0.0011460483074188232, 0.001199468970298767, 0.001252889633178711, 0.0013063102960586548, 0.0013597309589385986, 0.0014131516218185425, 0.0014665722846984863, 0.0015199929475784302, 0.001573413610458374, 0.0016268342733383179, 0.0016802549362182617, 0.0017336755990982056, 0.0017870962619781494, 0.0018405169248580933, 0.0018939375877380371, 0.001947358250617981, 0.002000778913497925, 0.0020541995763778687, 0.0021076202392578125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 9.0, 14.0, 24.0, 41.0, 78.0, 118.0, 228.0, 183.0, 130.0, 48.0, 50.0, 22.0, 14.0, 14.0, 7.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007670904975384474, -0.007463676854968071, -0.007256448734551668, -0.007049220614135265, -0.0068419924937188625, -0.00663476437330246, -0.006427536718547344, -0.006220308132469654, -0.006013080477714539, -0.005805852357298136, -0.005598624236881733, -0.00539139611646533, -0.005184167996048927, -0.0049769398756325245, -0.004769711755216122, -0.004562484100461006, -0.004355255514383316, -0.004148027393966913, -0.00394079927355051, -0.0037335711531341076, -0.0035263430327177048, -0.003319114912301302, -0.003111887024715543, -0.00290465890429914, -0.002697430783882737, -0.0024902026634663343, -0.0022829745430499315, -0.0020757466554641724, -0.0018685184186324477, -0.001661290298216045, -0.001454062294214964, -0.001246834173798561, -0.0010396065190434456, -0.0008323783986270428, -0.0006251503364183009, -0.00041792227420955896, -0.00021069415379315615, -3.4660333767533302e-06, 0.00020376197062432766, 0.0004109900910407305, 0.0006182182114571333, 0.0008254463318735361, 0.001032674452289939, 0.00123990245629102, 0.0014471305767074227, 0.0016543586971238256, 0.0018615867011249065, 0.0020688148215413094, 0.002276042941957712, 0.002483271062374115, 0.002690499182790518, 0.0028977273032069206, 0.0031049554236233234, 0.0033121835440397263, 0.0035194114316254854, 0.0037266395520418882, 0.003933867439627647, 0.00414109556004405, 0.004348323680460453, 0.004555551800876856, 0.004762779921293259, 0.0049700080417096615, 0.005177236162126064, 0.00538446381688118, 0.00559169240295887]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 9.0, 13.0, 15.0, 25.0, 29.0, 27.0, 33.0, 34.0, 52.0, 56.0, 62.0, 54.0, 65.0, 67.0, 49.0, 54.0, 54.0, 50.0, 34.0, 35.0, 46.0, 27.0, 20.0, 19.0, 21.0, 24.0, 11.0, 5.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0038289313670247793, -0.003729134565219283, -0.0036293375305831432, -0.003529540728777647, -0.003429743694141507, -0.003329946892336011, -0.003230149857699871, -0.003130353055894375, -0.003030556021258235, -0.0029307592194527388, -0.002830962184816599, -0.0027311653830111027, -0.002631368348374963, -0.0025315715465694666, -0.0024317745119333267, -0.0023319777101278305, -0.0022321809083223343, -0.002132384106516838, -0.002032587071880698, -0.0019327901536598802, -0.0018329932354390621, -0.001733196433633566, -0.001633399398997426, -0.0015336025971919298, -0.00143380556255579, -0.001334008644334972, -0.0012342117261141539, -0.0011344148078933358, -0.0010346178896725178, -0.0009348210296593606, -0.0008350241114385426, -0.0007352271932177246, -0.0006354302167892456, -0.0005356332985684276, -0.0004358363803476095, -0.00033603949123062193, -0.0002362425730098039, -0.0001364456838928163, -3.664876567199826e-05, 6.314815254881978e-05, 0.00016294507076963782, 0.00026274198899045587, 0.0003625389072112739, 0.0004623357963282615, 0.0005621326854452491, 0.0006619296036660671, 0.0007617265218868852, 0.0008615234401077032, 0.0009613203583285213, 0.0010611172765493393, 0.0011609141947701573, 0.0012607111129909754, 0.0013605080312117934, 0.0014603049494326115, 0.0015601017512381077, 0.0016598987858742476, 0.0017596955876797438, 0.0018594925059005618, 0.00195928942412138, 0.002059086225926876, 0.002158883260563016, 0.002258680062368512, 0.002358477097004652, 0.0024582738988101482, 0.002558070933446288]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 5.0, 4.0, 12.0, 20.0, 21.0, 24.0, 51.0, 72.0, 106.0, 187.0, 365.0, 762.0, 1453.0, 2904.0, 6269.0, 13922.0, 32184.0, 79440.0, 211684.0, 412130.0, 171703.0, 65896.0, 26943.0, 11831.0, 5446.0, 2513.0, 1169.0, 615.0, 342.0, 182.0, 108.0, 69.0, 48.0, 29.0, 13.0, 12.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007778167724609375, -0.007522284984588623, -0.007266402244567871, -0.007010519504547119, -0.006754636764526367, -0.006498754024505615, -0.006242871284484863, -0.005986988544464111, -0.005731105804443359, -0.005475223064422607, -0.0052193403244018555, -0.0049634575843811035, -0.0047075748443603516, -0.0044516921043396, -0.004195809364318848, -0.003939926624298096, -0.0036840438842773438, -0.003428161144256592, -0.00317227840423584, -0.002916395664215088, -0.002660512924194336, -0.002404630184173584, -0.002148747444152832, -0.00189286470413208, -0.0016369819641113281, -0.0013810992240905762, -0.0011252164840698242, -0.0008693337440490723, -0.0006134510040283203, -0.00035756826400756836, -0.0001016855239868164, 0.00015419721603393555, 0.0004100799560546875, 0.0006659626960754395, 0.0009218454360961914, 0.0011777281761169434, 0.0014336109161376953, 0.0016894936561584473, 0.0019453763961791992, 0.002201259136199951, 0.002457141876220703, 0.002713024616241455, 0.002968907356262207, 0.003224790096282959, 0.003480672836303711, 0.003736555576324463, 0.003992438316345215, 0.004248321056365967, 0.004504203796386719, 0.004760086536407471, 0.005015969276428223, 0.005271852016448975, 0.0055277347564697266, 0.0057836174964904785, 0.0060395002365112305, 0.006295382976531982, 0.006551265716552734, 0.006807148456573486, 0.007063031196594238, 0.00731891393661499, 0.007574796676635742, 0.007830679416656494, 0.008086562156677246, 0.008342444896697998, 0.00859832763671875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 8.0, 7.0, 3.0, 12.0, 15.0, 24.0, 23.0, 27.0, 34.0, 49.0, 60.0, 48.0, 43.0, 50.0, 54.0, 70.0, 43.0, 48.0, 77.0, 47.0, 47.0, 36.0, 29.0, 29.0, 23.0, 28.0, 17.0, 19.0, 13.0, 13.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001979827880859375, -0.0019270479679107666, -0.0018742680549621582, -0.0018214881420135498, -0.0017687082290649414, -0.001715928316116333, -0.0016631484031677246, -0.0016103684902191162, -0.0015575885772705078, -0.0015048086643218994, -0.001452028751373291, -0.0013992488384246826, -0.0013464689254760742, -0.0012936890125274658, -0.0012409090995788574, -0.001188129186630249, -0.0011353492736816406, -0.0010825693607330322, -0.0010297894477844238, -0.0009770095348358154, -0.000924229621887207, -0.0008714497089385986, -0.0008186697959899902, -0.0007658898830413818, -0.0007131099700927734, -0.000660330057144165, -0.0006075501441955566, -0.0005547702312469482, -0.0005019903182983398, -0.00044921040534973145, -0.00039643049240112305, -0.00034365057945251465, -0.00029087066650390625, -0.00023809075355529785, -0.00018531084060668945, -0.00013253092765808105, -7.975101470947266e-05, -2.6971101760864258e-05, 2.580881118774414e-05, 7.858872413635254e-05, 0.00013136863708496094, 0.00018414855003356934, 0.00023692846298217773, 0.00028970837593078613, 0.00034248828887939453, 0.00039526820182800293, 0.00044804811477661133, 0.0005008280277252197, 0.0005536079406738281, 0.0006063878536224365, 0.0006591677665710449, 0.0007119476795196533, 0.0007647275924682617, 0.0008175075054168701, 0.0008702874183654785, 0.0009230673313140869, 0.0009758472442626953, 0.0010286271572113037, 0.0010814070701599121, 0.0011341869831085205, 0.001186966896057129, 0.0012397468090057373, 0.0012925267219543457, 0.001345306634902954, 0.0013980865478515625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 5.0, 12.0, 12.0, 22.0, 30.0, 74.0, 71.0, 93.0, 140.0, 181.0, 240.0, 357.0, 507.0, 812.0, 1189.0, 1770.0, 2529.0, 3957.0, 6546.0, 10462.0, 18158.0, 34849.0, 84386.0, 661550.0, 121895.0, 43838.0, 21617.0, 12210.0, 7353.0, 4684.0, 2858.0, 1875.0, 1371.0, 826.0, 644.0, 422.0, 293.0, 230.0, 138.0, 97.0, 71.0, 58.0, 27.0, 18.0, 19.0, 19.0, 8.0, 8.0, 13.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.007328033447265625, -0.007096469402313232, -0.00686490535736084, -0.006633341312408447, -0.006401777267456055, -0.006170213222503662, -0.0059386491775512695, -0.005707085132598877, -0.005475521087646484, -0.005243957042694092, -0.005012392997741699, -0.004780828952789307, -0.004549264907836914, -0.0043177008628845215, -0.004086136817932129, -0.0038545727729797363, -0.0036230087280273438, -0.003391444683074951, -0.0031598806381225586, -0.002928316593170166, -0.0026967525482177734, -0.002465188503265381, -0.0022336244583129883, -0.0020020604133605957, -0.0017704963684082031, -0.0015389323234558105, -0.001307368278503418, -0.0010758042335510254, -0.0008442401885986328, -0.0006126761436462402, -0.00038111209869384766, -0.00014954805374145508, 8.20159912109375e-05, 0.0003135800361633301, 0.0005451440811157227, 0.0007767081260681152, 0.0010082721710205078, 0.0012398362159729004, 0.001471400260925293, 0.0017029643058776855, 0.0019345283508300781, 0.0021660923957824707, 0.0023976564407348633, 0.002629220485687256, 0.0028607845306396484, 0.003092348575592041, 0.0033239126205444336, 0.003555476665496826, 0.0037870407104492188, 0.004018604755401611, 0.004250168800354004, 0.0044817328453063965, 0.004713296890258789, 0.004944860935211182, 0.005176424980163574, 0.005407989025115967, 0.005639553070068359, 0.005871117115020752, 0.0061026811599731445, 0.006334245204925537, 0.00656580924987793, 0.006797373294830322, 0.007028937339782715, 0.007260501384735107, 0.0074920654296875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 3.0, 6.0, 8.0, 6.0, 7.0, 11.0, 9.0, 26.0, 27.0, 14.0, 18.0, 21.0, 41.0, 35.0, 41.0, 41.0, 38.0, 50.0, 46.0, 53.0, 48.0, 48.0, 32.0, 34.0, 37.0, 37.0, 35.0, 33.0, 32.0, 28.0, 26.0, 12.0, 20.0, 16.0, 11.0, 14.0, 8.0, 11.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0009393692016601562, -0.0009109973907470703, -0.0008826255798339844, -0.0008542537689208984, -0.0008258819580078125, -0.0007975101470947266, -0.0007691383361816406, -0.0007407665252685547, -0.0007123947143554688, -0.0006840229034423828, -0.0006556510925292969, -0.0006272792816162109, -0.000598907470703125, -0.0005705356597900391, -0.0005421638488769531, -0.0005137920379638672, -0.00048542022705078125, -0.0004570484161376953, -0.0004286766052246094, -0.00040030479431152344, -0.0003719329833984375, -0.00034356117248535156, -0.0003151893615722656, -0.0002868175506591797, -0.00025844573974609375, -0.0002300739288330078, -0.00020170211791992188, -0.00017333030700683594, -0.00014495849609375, -0.00011658668518066406, -8.821487426757812e-05, -5.984306335449219e-05, -3.147125244140625e-05, -3.0994415283203125e-06, 2.5272369384765625e-05, 5.364418029785156e-05, 8.20159912109375e-05, 0.00011038780212402344, 0.00013875961303710938, 0.0001671314239501953, 0.00019550323486328125, 0.0002238750457763672, 0.0002522468566894531, 0.00028061866760253906, 0.000308990478515625, 0.00033736228942871094, 0.0003657341003417969, 0.0003941059112548828, 0.00042247772216796875, 0.0004508495330810547, 0.0004792213439941406, 0.0005075931549072266, 0.0005359649658203125, 0.0005643367767333984, 0.0005927085876464844, 0.0006210803985595703, 0.0006494522094726562, 0.0006778240203857422, 0.0007061958312988281, 0.0007345676422119141, 0.000762939453125, 0.0007913112640380859, 0.0008196830749511719, 0.0008480548858642578, 0.0008764266967773438]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 10.0, 12.0, 9.0, 18.0, 24.0, 41.0, 49.0, 62.0, 71.0, 95.0, 130.0, 254.0, 341.0, 585.0, 1011.0, 1709.0, 3551.0, 8567.0, 34488.0, 901917.0, 72233.0, 13358.0, 4588.0, 2212.0, 1192.0, 718.0, 415.0, 250.0, 186.0, 120.0, 85.0, 78.0, 45.0, 30.0, 21.0, 22.0, 16.0, 12.0, 7.0, 4.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013570785522460938, -0.0013155490159988403, -0.001274019479751587, -0.0012324899435043335, -0.00119096040725708, -0.0011494308710098267, -0.0011079013347625732, -0.0010663717985153198, -0.0010248422622680664, -0.000983312726020813, -0.0009417831897735596, -0.0009002536535263062, -0.0008587241172790527, -0.0008171945810317993, -0.0007756650447845459, -0.0007341355085372925, -0.0006926059722900391, -0.0006510764360427856, -0.0006095468997955322, -0.0005680173635482788, -0.0005264878273010254, -0.00048495829105377197, -0.00044342875480651855, -0.00040189921855926514, -0.0003603696823120117, -0.0003188401460647583, -0.0002773106098175049, -0.00023578107357025146, -0.00019425153732299805, -0.00015272200107574463, -0.00011119246482849121, -6.966292858123779e-05, -2.8133392333984375e-05, 1.3396143913269043e-05, 5.492568016052246e-05, 9.645521640777588e-05, 0.0001379847526550293, 0.00017951428890228271, 0.00022104382514953613, 0.00026257336139678955, 0.00030410289764404297, 0.0003456324338912964, 0.0003871619701385498, 0.0004286915063858032, 0.00047022104263305664, 0.0005117505788803101, 0.0005532801151275635, 0.0005948096513748169, 0.0006363391876220703, 0.0006778687238693237, 0.0007193982601165771, 0.0007609277963638306, 0.000802457332611084, 0.0008439868688583374, 0.0008855164051055908, 0.0009270459413528442, 0.0009685754776000977, 0.001010105013847351, 0.0010516345500946045, 0.001093164086341858, 0.0011346936225891113, 0.0011762231588363647, 0.0012177526950836182, 0.0012592822313308716, 0.001300811767578125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 8.0, 4.0, 5.0, 3.0, 5.0, 6.0, 9.0, 4.0, 13.0, 16.0, 7.0, 24.0, 10.0, 34.0, 19.0, 60.0, 88.0, 49.0, 163.0, 69.0, 112.0, 38.0, 65.0, 27.0, 33.0, 26.0, 7.0, 18.0, 10.0, 10.0, 4.0, 10.0, 10.0, 2.0, 4.0, 5.0, 8.0, 1.0, 2.0, 2.0, 7.0, 9.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5033950805664062e-06, -2.4102628231048584e-06, -2.3171305656433105e-06, -2.2239983081817627e-06, -2.130866050720215e-06, -2.037733793258667e-06, -1.944601535797119e-06, -1.8514692783355713e-06, -1.7583370208740234e-06, -1.6652047634124756e-06, -1.5720725059509277e-06, -1.4789402484893799e-06, -1.385807991027832e-06, -1.2926757335662842e-06, -1.1995434761047363e-06, -1.1064112186431885e-06, -1.0132789611816406e-06, -9.201467037200928e-07, -8.270144462585449e-07, -7.338821887969971e-07, -6.407499313354492e-07, -5.476176738739014e-07, -4.544854164123535e-07, -3.6135315895080566e-07, -2.682209014892578e-07, -1.7508864402770996e-07, -8.195638656616211e-08, 1.1175870895385742e-08, 1.043081283569336e-07, 1.9744038581848145e-07, 2.905726432800293e-07, 3.8370490074157715e-07, 4.76837158203125e-07, 5.699694156646729e-07, 6.631016731262207e-07, 7.562339305877686e-07, 8.493661880493164e-07, 9.424984455108643e-07, 1.0356307029724121e-06, 1.12876296043396e-06, 1.2218952178955078e-06, 1.3150274753570557e-06, 1.4081597328186035e-06, 1.5012919902801514e-06, 1.5944242477416992e-06, 1.687556505203247e-06, 1.780688762664795e-06, 1.8738210201263428e-06, 1.9669532775878906e-06, 2.0600855350494385e-06, 2.1532177925109863e-06, 2.246350049972534e-06, 2.339482307434082e-06, 2.43261456489563e-06, 2.5257468223571777e-06, 2.6188790798187256e-06, 2.7120113372802734e-06, 2.8051435947418213e-06, 2.898275852203369e-06, 2.991408109664917e-06, 3.084540367126465e-06, 3.1776726245880127e-06, 3.2708048820495605e-06, 3.3639371395111084e-06, 3.4570693969726562e-06]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 1.0, 6.0, 4.0, 7.0, 12.0, 24.0, 35.0, 74.0, 187.0, 492.0, 1351.0, 4807.0, 48126.0, 974409.0, 14757.0, 2713.0, 932.0, 359.0, 152.0, 49.0, 23.0, 7.0, 8.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0015592575073242188, -0.001509442925453186, -0.0014596283435821533, -0.0014098137617111206, -0.0013599991798400879, -0.0013101845979690552, -0.0012603700160980225, -0.0012105554342269897, -0.001160740852355957, -0.0011109262704849243, -0.0010611116886138916, -0.0010112971067428589, -0.0009614825248718262, -0.0009116679430007935, -0.0008618533611297607, -0.000812038779258728, -0.0007622241973876953, -0.0007124096155166626, -0.0006625950336456299, -0.0006127804517745972, -0.0005629658699035645, -0.0005131512880325317, -0.000463336706161499, -0.0004135221242904663, -0.0003637075424194336, -0.0003138929605484009, -0.00026407837867736816, -0.00021426379680633545, -0.00016444921493530273, -0.00011463463306427002, -6.48200511932373e-05, -1.500546932220459e-05, 3.4809112548828125e-05, 8.462369441986084e-05, 0.00013443827629089355, 0.00018425285816192627, 0.00023406744003295898, 0.0002838820219039917, 0.0003336966037750244, 0.00038351118564605713, 0.00043332576751708984, 0.00048314034938812256, 0.0005329549312591553, 0.000582769513130188, 0.0006325840950012207, 0.0006823986768722534, 0.0007322132587432861, 0.0007820278406143188, 0.0008318424224853516, 0.0008816570043563843, 0.000931471586227417, 0.0009812861680984497, 0.0010311007499694824, 0.0010809153318405151, 0.0011307299137115479, 0.0011805444955825806, 0.0012303590774536133, 0.001280173659324646, 0.0013299882411956787, 0.0013798028230667114, 0.0014296174049377441, 0.0014794319868087769, 0.0015292465686798096, 0.0015790611505508423, 0.001628875732421875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 12.0, 15.0, 13.0, 25.0, 31.0, 60.0, 101.0, 299.0, 196.0, 74.0, 38.0, 26.0, 20.0, 19.0, 11.0, 9.0, 6.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.630752563476562e-05, -8.350051939487457e-05, -8.069351315498352e-05, -7.788650691509247e-05, -7.507950067520142e-05, -7.227249443531036e-05, -6.946548819541931e-05, -6.665848195552826e-05, -6.385147571563721e-05, -6.104446947574615e-05, -5.82374632358551e-05, -5.543045699596405e-05, -5.2623450756073e-05, -4.9816444516181946e-05, -4.7009438276290894e-05, -4.420243203639984e-05, -4.139542579650879e-05, -3.858841955661774e-05, -3.5781413316726685e-05, -3.297440707683563e-05, -3.016740083694458e-05, -2.7360394597053528e-05, -2.4553388357162476e-05, -2.1746382117271423e-05, -1.893937587738037e-05, -1.613236963748932e-05, -1.3325363397598267e-05, -1.0518357157707214e-05, -7.711350917816162e-06, -4.90434467792511e-06, -2.0973384380340576e-06, 7.096678018569946e-07, 3.516674041748047e-06, 6.323680281639099e-06, 9.130686521530151e-06, 1.1937692761421204e-05, 1.4744699001312256e-05, 1.7551705241203308e-05, 2.035871148109436e-05, 2.3165717720985413e-05, 2.5972723960876465e-05, 2.8779730200767517e-05, 3.158673644065857e-05, 3.439374268054962e-05, 3.7200748920440674e-05, 4.0007755160331726e-05, 4.281476140022278e-05, 4.562176764011383e-05, 4.842877388000488e-05, 5.1235780119895935e-05, 5.404278635978699e-05, 5.684979259967804e-05, 5.965679883956909e-05, 6.246380507946014e-05, 6.52708113193512e-05, 6.807781755924225e-05, 7.08848237991333e-05, 7.369183003902435e-05, 7.64988362789154e-05, 7.930584251880646e-05, 8.211284875869751e-05, 8.491985499858856e-05, 8.772686123847961e-05, 9.053386747837067e-05, 9.334087371826172e-05]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 8.0, 24.0, 53.0, 107.0, 221.0, 269.0, 154.0, 57.0, 44.0, 23.0, 21.0, 8.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006544268224388361, -0.006399817764759064, -0.006255367770791054, -0.0061109173111617565, -0.005966467317193747, -0.005822016857564449, -0.005677566863596439, -0.005533116403967142, -0.005388665944337845, -0.005244215484708548, -0.005099765490740538, -0.00495531503111124, -0.0048108650371432304, -0.004666414577513933, -0.004521964117884636, -0.004377514123916626, -0.004233064129948616, -0.004088613670319319, -0.003944163676351309, -0.0037997132167220116, -0.003655262989923358, -0.0035108127631247044, -0.0033663625363260508, -0.003221912309527397, -0.0030774618498981, -0.0029330116230994463, -0.0027885613963007927, -0.0026441109366714954, -0.002499660709872842, -0.0023552104830741882, -0.0022107602562755346, -0.002066310029476881, -0.0019218595698475838, -0.0017774093430489302, -0.0016329589998349547, -0.0014885087730363011, -0.0013440584298223257, -0.001199608203023672, -0.0010551579762250185, -0.0009107076330110431, -0.0007662574062123895, -0.000621807121206075, -0.0004773568653035909, -0.00033290660940110683, -0.00018845632439479232, -4.40060393884778e-05, 0.0001004441874101758, 0.00024489453062415123, 0.00038934475742280483, 0.0005337950424291193, 0.0006782453274354339, 0.0008226955542340875, 0.000967145839240402, 0.0011115961242467165, 0.00125604635104537, 0.0014004966942593455, 0.0015449469210579991, 0.0016893971478566527, 0.0018338474910706282, 0.0019782977178692818, 0.0021227479446679354, 0.002267198171466589, 0.0024116486310958862, 0.00255609885789454, 0.0027005490846931934]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 4.0, 8.0, 9.0, 5.0, 10.0, 23.0, 25.0, 31.0, 22.0, 27.0, 43.0, 62.0, 49.0, 56.0, 66.0, 60.0, 48.0, 58.0, 63.0, 46.0, 46.0, 35.0, 37.0, 30.0, 30.0, 26.0, 17.0, 25.0, 20.0, 17.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019329448696225882, -0.0018824501894414425, -0.0018319555092602968, -0.001781460945494473, -0.0017309662653133273, -0.0016804715851321816, -0.0016299770213663578, -0.0015794823411852121, -0.0015289876610040665, -0.0014784929808229208, -0.0014279983006417751, -0.0013775037368759513, -0.0013270090566948056, -0.00127651437651366, -0.0012260198127478361, -0.0011755251325666904, -0.0011250304523855448, -0.0010745357722043991, -0.0010240410920232534, -0.0009735465282574296, -0.0009230518480762839, -0.0008725571678951383, -0.0008220625459216535, -0.0007715679239481688, -0.0007210732437670231, -0.0006705785635858774, -0.0006200839416123927, -0.0005695893196389079, -0.0005190946394577622, -0.00046859998838044703, -0.0004181053373031318, -0.0003676106862258166, -0.0003171161515638232, -0.000266621500486508, -0.0002161268494091928, -0.0001656321983318776, -0.00011513754725456238, -6.464289617724717e-05, -1.4148245099931955e-05, 3.6346405977383256e-05, 8.684105705469847e-05, 0.00013733570813201368, 0.0001878303592093289, 0.0002383250102866441, 0.0002888196613639593, 0.0003393143124412745, 0.00038980896351858974, 0.00044030361459590495, 0.0004907982656732202, 0.0005412929458543658, 0.0005917875678278506, 0.0006422821898013353, 0.000692776869982481, 0.0007432715501636267, 0.0007937661721371114, 0.0008442607941105962, 0.0008947554742917418, 0.0009452501544728875, 0.0009957447182387114, 0.001046239398419857, 0.0010967340786010027, 0.0011472287587821484, 0.001197723438963294, 0.0012482180027291179, 0.0012987126829102635]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 9.0, 17.0, 17.0, 23.0, 41.0, 43.0, 81.0, 154.0, 268.0, 618.0, 1639.0, 5025.0, 16359.0, 61732.0, 331580.0, 503496.0, 93783.0, 23173.0, 6783.0, 2148.0, 792.0, 346.0, 144.0, 88.0, 56.0, 39.0, 21.0, 23.0, 14.0, 13.0, 10.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.004352569580078125, -0.004179418087005615, -0.0040062665939331055, -0.0038331151008605957, -0.003659963607788086, -0.003486812114715576, -0.0033136606216430664, -0.0031405091285705566, -0.002967357635498047, -0.002794206142425537, -0.0026210546493530273, -0.0024479031562805176, -0.002274751663208008, -0.002101600170135498, -0.0019284486770629883, -0.0017552971839904785, -0.0015821456909179688, -0.001408994197845459, -0.0012358427047729492, -0.0010626912117004395, -0.0008895397186279297, -0.0007163882255554199, -0.0005432367324829102, -0.0003700852394104004, -0.00019693374633789062, -2.378225326538086e-05, 0.0001493692398071289, 0.00032252073287963867, 0.0004956722259521484, 0.0006688237190246582, 0.000841975212097168, 0.0010151267051696777, 0.0011882781982421875, 0.0013614296913146973, 0.001534581184387207, 0.0017077326774597168, 0.0018808841705322266, 0.0020540356636047363, 0.002227187156677246, 0.002400338649749756, 0.0025734901428222656, 0.0027466416358947754, 0.002919793128967285, 0.003092944622039795, 0.0032660961151123047, 0.0034392476081848145, 0.0036123991012573242, 0.003785550594329834, 0.003958702087402344, 0.0041318535804748535, 0.004305005073547363, 0.004478156566619873, 0.004651308059692383, 0.004824459552764893, 0.004997611045837402, 0.005170762538909912, 0.005343914031982422, 0.005517065525054932, 0.005690217018127441, 0.005863368511199951, 0.006036520004272461, 0.006209671497344971, 0.0063828229904174805, 0.00655597448348999, 0.0067291259765625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 7.0, 5.0, 14.0, 11.0, 14.0, 28.0, 31.0, 28.0, 42.0, 57.0, 71.0, 73.0, 75.0, 73.0, 80.0, 59.0, 65.0, 46.0, 46.0, 46.0, 33.0, 29.0, 23.0, 18.0, 11.0, 8.0, 9.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0013341903686523438, -0.0013035759329795837, -0.0012729614973068237, -0.0012423470616340637, -0.0012117326259613037, -0.0011811181902885437, -0.0011505037546157837, -0.0011198893189430237, -0.0010892748832702637, -0.0010586604475975037, -0.0010280460119247437, -0.0009974315762519836, -0.0009668171405792236, -0.0009362027049064636, -0.0009055882692337036, -0.0008749738335609436, -0.0008443593978881836, -0.0008137449622154236, -0.0007831305265426636, -0.0007525160908699036, -0.0007219016551971436, -0.0006912872195243835, -0.0006606727838516235, -0.0006300583481788635, -0.0005994439125061035, -0.0005688294768333435, -0.0005382150411605835, -0.0005076006054878235, -0.0004769861698150635, -0.00044637173414230347, -0.00041575729846954346, -0.00038514286279678345, -0.00035452842712402344, -0.00032391399145126343, -0.0002932995557785034, -0.0002626851201057434, -0.0002320706844329834, -0.0002014562487602234, -0.00017084181308746338, -0.00014022737741470337, -0.00010961294174194336, -7.899850606918335e-05, -4.838407039642334e-05, -1.776963472366333e-05, 1.284480094909668e-05, 4.345923662185669e-05, 7.40736722946167e-05, 0.00010468810796737671, 0.00013530254364013672, 0.00016591697931289673, 0.00019653141498565674, 0.00022714585065841675, 0.00025776028633117676, 0.00028837472200393677, 0.0003189891576766968, 0.0003496035933494568, 0.0003802180290222168, 0.0004108324646949768, 0.0004414469003677368, 0.0004720613360404968, 0.0005026757717132568, 0.0005332902073860168, 0.0005639046430587769, 0.0005945190787315369, 0.0006251335144042969]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 12.0, 8.0, 11.0, 17.0, 19.0, 21.0, 36.0, 35.0, 98.0, 143.0, 273.0, 644.0, 1631.0, 3690.0, 9974.0, 27548.0, 84414.0, 297085.0, 426613.0, 132564.0, 40209.0, 14387.0, 5334.0, 2098.0, 825.0, 393.0, 180.0, 95.0, 56.0, 35.0, 30.0, 20.0, 14.0, 8.0, 7.0, 8.0, 5.0, 1.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0], "bins": [-0.0033321380615234375, -0.0032425224781036377, -0.003152906894683838, -0.003063291311264038, -0.0029736757278442383, -0.0028840601444244385, -0.0027944445610046387, -0.002704828977584839, -0.002615213394165039, -0.0025255978107452393, -0.0024359822273254395, -0.0023463666439056396, -0.00225675106048584, -0.00216713547706604, -0.0020775198936462402, -0.0019879043102264404, -0.0018982887268066406, -0.0018086731433868408, -0.001719057559967041, -0.0016294419765472412, -0.0015398263931274414, -0.0014502108097076416, -0.0013605952262878418, -0.001270979642868042, -0.0011813640594482422, -0.0010917484760284424, -0.0010021328926086426, -0.0009125173091888428, -0.000822901725769043, -0.0007332861423492432, -0.0006436705589294434, -0.0005540549755096436, -0.00046443939208984375, -0.00037482380867004395, -0.00028520822525024414, -0.00019559264183044434, -0.00010597705841064453, -1.6361474990844727e-05, 7.325410842895508e-05, 0.00016286969184875488, 0.0002524852752685547, 0.0003421008586883545, 0.0004317164421081543, 0.0005213320255279541, 0.0006109476089477539, 0.0007005631923675537, 0.0007901787757873535, 0.0008797943592071533, 0.0009694099426269531, 0.001059025526046753, 0.0011486411094665527, 0.0012382566928863525, 0.0013278722763061523, 0.0014174878597259521, 0.001507103443145752, 0.0015967190265655518, 0.0016863346099853516, 0.0017759501934051514, 0.0018655657768249512, 0.001955181360244751, 0.0020447969436645508, 0.0021344125270843506, 0.0022240281105041504, 0.00231364369392395, 0.00240325927734375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 1.0, 5.0, 6.0, 11.0, 10.0, 10.0, 18.0, 18.0, 28.0, 23.0, 20.0, 32.0, 35.0, 47.0, 52.0, 43.0, 46.0, 54.0, 55.0, 47.0, 58.0, 32.0, 43.0, 34.0, 34.0, 29.0, 32.0, 34.0, 31.0, 19.0, 21.0, 19.0, 11.0, 11.0, 9.0, 10.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004646778106689453, -0.0004471801221370697, -0.0004296824336051941, -0.0004121847450733185, -0.00039468705654144287, -0.00037718936800956726, -0.00035969167947769165, -0.00034219399094581604, -0.00032469630241394043, -0.0003071986138820648, -0.0002897009253501892, -0.0002722032368183136, -0.000254705548286438, -0.00023720785975456238, -0.00021971017122268677, -0.00020221248269081116, -0.00018471479415893555, -0.00016721710562705994, -0.00014971941709518433, -0.00013222172856330872, -0.0001147240400314331, -9.72263514995575e-05, -7.972866296768188e-05, -6.223097443580627e-05, -4.4733285903930664e-05, -2.7235597372055054e-05, -9.737908840179443e-06, 7.759779691696167e-06, 2.5257468223571777e-05, 4.275515675544739e-05, 6.0252845287323e-05, 7.775053381919861e-05, 9.524822235107422e-05, 0.00011274591088294983, 0.00013024359941482544, 0.00014774128794670105, 0.00016523897647857666, 0.00018273666501045227, 0.00020023435354232788, 0.0002177320420742035, 0.0002352297306060791, 0.0002527274191379547, 0.0002702251076698303, 0.00028772279620170593, 0.00030522048473358154, 0.00032271817326545715, 0.00034021586179733276, 0.0003577135503292084, 0.000375211238861084, 0.0003927089273929596, 0.0004102066159248352, 0.0004277043044567108, 0.0004452019929885864, 0.00046269968152046204, 0.00048019737005233765, 0.0004976950585842133, 0.0005151927471160889, 0.0005326904356479645, 0.0005501881241798401, 0.0005676858127117157, 0.0005851835012435913, 0.0006026811897754669, 0.0006201788783073425, 0.0006376765668392181, 0.0006551742553710938]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 17.0, 17.0, 16.0, 37.0, 49.0, 53.0, 107.0, 149.0, 259.0, 429.0, 813.0, 1527.0, 3525.0, 8947.0, 30459.0, 243744.0, 683474.0, 52879.0, 12999.0, 4681.0, 1988.0, 973.0, 499.0, 328.0, 191.0, 108.0, 89.0, 59.0, 29.0, 31.0, 23.0, 10.0, 10.0, 10.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0001443624496459961, -0.00014037080109119415, -0.0001363791525363922, -0.00013238750398159027, -0.00012839585542678833, -0.0001244042068719864, -0.00012041255831718445, -0.00011642090976238251, -0.00011242926120758057, -0.00010843761265277863, -0.00010444596409797668, -0.00010045431554317474, -9.64626669883728e-05, -9.247101843357086e-05, -8.847936987876892e-05, -8.448772132396698e-05, -8.049607276916504e-05, -7.65044242143631e-05, -7.251277565956116e-05, -6.852112710475922e-05, -6.452947854995728e-05, -6.0537829995155334e-05, -5.6546181440353394e-05, -5.255453288555145e-05, -4.856288433074951e-05, -4.457123577594757e-05, -4.057958722114563e-05, -3.658793866634369e-05, -3.259629011154175e-05, -2.8604641556739807e-05, -2.4612993001937866e-05, -2.0621344447135925e-05, -1.6629695892333984e-05, -1.2638047337532043e-05, -8.646398782730103e-06, -4.654750227928162e-06, -6.631016731262207e-07, 3.3285468816757202e-06, 7.320195436477661e-06, 1.1311843991279602e-05, 1.5303492546081543e-05, 1.9295141100883484e-05, 2.3286789655685425e-05, 2.7278438210487366e-05, 3.127008676528931e-05, 3.526173532009125e-05, 3.925338387489319e-05, 4.324503242969513e-05, 4.723668098449707e-05, 5.122832953929901e-05, 5.521997809410095e-05, 5.921162664890289e-05, 6.320327520370483e-05, 6.719492375850677e-05, 7.118657231330872e-05, 7.517822086811066e-05, 7.91698694229126e-05, 8.316151797771454e-05, 8.715316653251648e-05, 9.114481508731842e-05, 9.513646364212036e-05, 9.91281121969223e-05, 0.00010311976075172424, 0.00010711140930652618, 0.00011110305786132812]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 9.0, 10.0, 21.0, 23.0, 20.0, 47.0, 87.0, 135.0, 197.0, 181.0, 92.0, 53.0, 36.0, 18.0, 11.0, 15.0, 5.0, 0.0, 5.0, 4.0, 5.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.424022674560547e-06, -5.2032992243766785e-06, -4.98257577419281e-06, -4.761852324008942e-06, -4.541128873825073e-06, -4.320405423641205e-06, -4.0996819734573364e-06, -3.878958523273468e-06, -3.6582350730895996e-06, -3.437511622905731e-06, -3.216788172721863e-06, -2.9960647225379944e-06, -2.775341272354126e-06, -2.5546178221702576e-06, -2.333894371986389e-06, -2.1131709218025208e-06, -1.8924474716186523e-06, -1.671724021434784e-06, -1.4510005712509155e-06, -1.2302771210670471e-06, -1.0095536708831787e-06, -7.888302206993103e-07, -5.681067705154419e-07, -3.473833203315735e-07, -1.2665987014770508e-07, 9.406358003616333e-08, 3.1478703022003174e-07, 5.355104804039001e-07, 7.562339305877686e-07, 9.76957380771637e-07, 1.1976808309555054e-06, 1.4184042811393738e-06, 1.6391277313232422e-06, 1.8598511815071106e-06, 2.080574631690979e-06, 2.3012980818748474e-06, 2.522021532058716e-06, 2.7427449822425842e-06, 2.9634684324264526e-06, 3.184191882610321e-06, 3.4049153327941895e-06, 3.625638782978058e-06, 3.846362233161926e-06, 4.067085683345795e-06, 4.287809133529663e-06, 4.5085325837135315e-06, 4.7292560338974e-06, 4.949979484081268e-06, 5.170702934265137e-06, 5.391426384449005e-06, 5.6121498346328735e-06, 5.832873284816742e-06, 6.05359673500061e-06, 6.274320185184479e-06, 6.495043635368347e-06, 6.7157670855522156e-06, 6.936490535736084e-06, 7.157213985919952e-06, 7.377937436103821e-06, 7.598660886287689e-06, 7.819384336471558e-06, 8.040107786655426e-06, 8.260831236839294e-06, 8.481554687023163e-06, 8.702278137207031e-06]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 5.0, 2.0, 3.0, 5.0, 8.0, 18.0, 27.0, 40.0, 62.0, 87.0, 151.0, 360.0, 719.0, 1612.0, 4611.0, 13695.0, 52474.0, 378965.0, 501463.0, 69241.0, 16208.0, 5232.0, 1857.0, 818.0, 419.0, 189.0, 107.0, 57.0, 37.0, 25.0, 21.0, 5.0, 12.0, 2.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.194280624389648e-05, -6.98314979672432e-05, -6.77201896905899e-05, -6.560888141393661e-05, -6.349757313728333e-05, -6.138626486063004e-05, -5.9274956583976746e-05, -5.7163648307323456e-05, -5.5052340030670166e-05, -5.2941031754016876e-05, -5.0829723477363586e-05, -4.87184152007103e-05, -4.660710692405701e-05, -4.449579864740372e-05, -4.238449037075043e-05, -4.027318209409714e-05, -3.816187381744385e-05, -3.605056554079056e-05, -3.393925726413727e-05, -3.182794898748398e-05, -2.971664071083069e-05, -2.76053324341774e-05, -2.549402415752411e-05, -2.338271588087082e-05, -2.127140760421753e-05, -1.916009932756424e-05, -1.704879105091095e-05, -1.493748277425766e-05, -1.282617449760437e-05, -1.071486622095108e-05, -8.60355794429779e-06, -6.492249667644501e-06, -4.380941390991211e-06, -2.269633114337921e-06, -1.5832483768463135e-07, 1.9529834389686584e-06, 4.064291715621948e-06, 6.175599992275238e-06, 8.286908268928528e-06, 1.0398216545581818e-05, 1.2509524822235107e-05, 1.4620833098888397e-05, 1.6732141375541687e-05, 1.8843449652194977e-05, 2.0954757928848267e-05, 2.3066066205501556e-05, 2.5177374482154846e-05, 2.7288682758808136e-05, 2.9399991035461426e-05, 3.1511299312114716e-05, 3.3622607588768005e-05, 3.5733915865421295e-05, 3.7845224142074585e-05, 3.9956532418727875e-05, 4.2067840695381165e-05, 4.4179148972034454e-05, 4.6290457248687744e-05, 4.8401765525341034e-05, 5.0513073801994324e-05, 5.2624382078647614e-05, 5.47356903553009e-05, 5.684699863195419e-05, 5.895830690860748e-05, 6.106961518526077e-05, 6.318092346191406e-05]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 3.0, 11.0, 7.0, 16.0, 11.0, 14.0, 19.0, 24.0, 25.0, 28.0, 54.0, 60.0, 68.0, 69.0, 74.0, 61.0, 59.0, 63.0, 57.0, 55.0, 36.0, 36.0, 28.0, 20.0, 20.0, 18.0, 14.0, 12.0, 8.0, 4.0, 5.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0728836059570312e-05, -1.0376796126365662e-05, -1.002475619316101e-05, -9.67271625995636e-06, -9.320676326751709e-06, -8.968636393547058e-06, -8.616596460342407e-06, -8.264556527137756e-06, -7.912516593933105e-06, -7.560476660728455e-06, -7.208436727523804e-06, -6.856396794319153e-06, -6.504356861114502e-06, -6.152316927909851e-06, -5.8002769947052e-06, -5.448237061500549e-06, -5.0961971282958984e-06, -4.7441571950912476e-06, -4.392117261886597e-06, -4.040077328681946e-06, -3.688037395477295e-06, -3.335997462272644e-06, -2.983957529067993e-06, -2.6319175958633423e-06, -2.2798776626586914e-06, -1.9278377294540405e-06, -1.5757977962493896e-06, -1.2237578630447388e-06, -8.717179298400879e-07, -5.19677996635437e-07, -1.6763806343078613e-07, 1.8440186977386475e-07, 5.364418029785156e-07, 8.884817361831665e-07, 1.2405216693878174e-06, 1.5925616025924683e-06, 1.944601535797119e-06, 2.29664146900177e-06, 2.648681402206421e-06, 3.0007213354110718e-06, 3.3527612686157227e-06, 3.7048012018203735e-06, 4.056841135025024e-06, 4.408881068229675e-06, 4.760921001434326e-06, 5.112960934638977e-06, 5.465000867843628e-06, 5.817040801048279e-06, 6.16908073425293e-06, 6.5211206674575806e-06, 6.8731606006622314e-06, 7.225200533866882e-06, 7.577240467071533e-06, 7.929280400276184e-06, 8.281320333480835e-06, 8.633360266685486e-06, 8.985400199890137e-06, 9.337440133094788e-06, 9.689480066299438e-06, 1.004151999950409e-05, 1.039355993270874e-05, 1.0745599865913391e-05, 1.1097639799118042e-05, 1.1449679732322693e-05, 1.1801719665527344e-05]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 4.0, 5.0, 5.0, 8.0, 16.0, 28.0, 39.0, 63.0, 134.0, 180.0, 194.0, 105.0, 80.0, 48.0, 29.0, 22.0, 15.0, 8.0, 9.0, 2.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0028877919539809227, -0.0028240089304745197, -0.0027602259069681168, -0.002696442883461714, -0.002632659859955311, -0.0025688770692795515, -0.0025050940457731485, -0.0024413110222667456, -0.0023775279987603426, -0.0023137449752539396, -0.0022499619517475367, -0.0021861789282411337, -0.0021223961375653744, -0.0020586131140589714, -0.0019948300905525684, -0.0019310470670461655, -0.0018672640435397625, -0.0018034810200333595, -0.0017396979965269566, -0.0016759150894358754, -0.0016121320659294724, -0.0015483490424230695, -0.0014845661353319883, -0.0014207831118255854, -0.0013570000883191824, -0.0012932170648127794, -0.0012294340413063765, -0.0011656511342152953, -0.0011018681107088923, -0.0010380850872024894, -0.0009743021219037473, -0.0009105191566050053, -0.0008467359002679586, -0.0007829528767615557, -0.0007191699114628136, -0.0006553869461640716, -0.0005916039226576686, -0.0005278208991512656, -0.00046403793385252357, -0.00040025493944995105, -0.00033647194504737854, -0.00027268895064480603, -0.00020890595624223351, -0.000145122961839661, -8.133996743708849e-05, -1.7556973034515977e-05, 4.6226021368056536e-05, 0.00011000901577062905, 0.00017379201017320156, 0.00023757500457577407, 0.0003013579989783466, 0.0003651409933809191, 0.0004289239877834916, 0.0004927070112898946, 0.0005564899765886366, 0.0006202729418873787, 0.0006840559653937817, 0.0007478389889001846, 0.0008116219541989267, 0.0008754049194976687, 0.0009391879430040717, 0.0010029709665104747, 0.0010667538736015558, 0.0011305368971079588, 0.0011943199206143618]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 8.0, 8.0, 4.0, 7.0, 12.0, 15.0, 17.0, 10.0, 16.0, 14.0, 14.0, 24.0, 34.0, 36.0, 25.0, 35.0, 47.0, 36.0, 29.0, 34.0, 35.0, 36.0, 44.0, 46.0, 41.0, 44.0, 30.0, 43.0, 36.0, 39.0, 24.0, 22.0, 17.0, 20.0, 16.0, 11.0, 10.0, 11.0, 6.0, 12.0, 5.0, 9.0, 11.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007161087123677135, -0.0006936354329809546, -0.0006711621535941958, -0.000648688874207437, -0.0006262155948206782, -0.0006037422572262585, -0.0005812689778394997, -0.0005587956984527409, -0.0005363224190659821, -0.0005138491396792233, -0.0004913758602924645, -0.00046890255180187523, -0.00044642927241511643, -0.0004239559930283576, -0.00040148268453776836, -0.00037900940515100956, -0.00035653612576425076, -0.00033406284637749195, -0.00031158956699073315, -0.0002891162585001439, -0.0002666429791133851, -0.0002441696997266263, -0.00022169640578795224, -0.0001992231118492782, -0.0001767498324625194, -0.0001542765530757606, -0.00013180325913708657, -0.00010932997247437015, -8.685668581165373e-05, -6.438339914893731e-05, -4.1910112486220896e-05, -1.9436818547546864e-05, 3.0364026315510273e-06, 2.5509689294267446e-05, 4.7982975956983864e-05, 7.045626261970028e-05, 9.29295492824167e-05, 0.00011540283594513312, 0.00013787612260784954, 0.00016034941654652357, 0.00018282269593328238, 0.00020529597532004118, 0.0002277692692587152, 0.00025024256319738925, 0.00027271584258414805, 0.00029518912197090685, 0.0003176624304614961, 0.0003401357098482549, 0.0003626089892350137, 0.00038508226862177253, 0.00040755554800853133, 0.0004300288564991206, 0.0004525021358858794, 0.0004749754152726382, 0.0004974487237632275, 0.0005199220031499863, 0.0005423952825367451, 0.0005648685619235039, 0.0005873418413102627, 0.0006098151206970215, 0.0006322884000837803, 0.0006547617376782, 0.0006772350170649588, 0.0006997082964517176, 0.0007221815758384764]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 11.0, 7.0, 9.0, 16.0, 26.0, 31.0, 45.0, 51.0, 84.0, 109.0, 135.0, 196.0, 298.0, 426.0, 593.0, 887.0, 1350.0, 2367.0, 5781.0, 26381.0, 285177.0, 3791944.0, 60088.0, 9788.0, 3348.0, 1751.0, 1075.0, 687.0, 503.0, 338.0, 207.0, 158.0, 113.0, 83.0, 62.0, 40.0, 38.0, 23.0, 24.0, 8.0, 11.0, 4.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.0012540817260742188, -0.0012220889329910278, -0.001190096139907837, -0.001158103346824646, -0.001126110553741455, -0.0010941177606582642, -0.0010621249675750732, -0.0010301321744918823, -0.0009981393814086914, -0.0009661465883255005, -0.0009341537952423096, -0.0009021610021591187, -0.0008701682090759277, -0.0008381754159927368, -0.0008061826229095459, -0.000774189829826355, -0.0007421970367431641, -0.0007102042436599731, -0.0006782114505767822, -0.0006462186574935913, -0.0006142258644104004, -0.0005822330713272095, -0.0005502402782440186, -0.0005182474851608276, -0.0004862546920776367, -0.0004542618989944458, -0.0004222691059112549, -0.00039027631282806396, -0.00035828351974487305, -0.00032629072666168213, -0.0002942979335784912, -0.0002623051404953003, -0.00023031234741210938, -0.00019831955432891846, -0.00016632676124572754, -0.00013433396816253662, -0.0001023411750793457, -7.034838199615479e-05, -3.835558891296387e-05, -6.362795829772949e-06, 2.562999725341797e-05, 5.762279033660889e-05, 8.96155834197998e-05, 0.00012160837650299072, 0.00015360116958618164, 0.00018559396266937256, 0.00021758675575256348, 0.0002495795488357544, 0.0002815723419189453, 0.00031356513500213623, 0.00034555792808532715, 0.00037755072116851807, 0.000409543514251709, 0.0004415363073348999, 0.0004735291004180908, 0.0005055218935012817, 0.0005375146865844727, 0.0005695074796676636, 0.0006015002727508545, 0.0006334930658340454, 0.0006654858589172363, 0.0006974786520004272, 0.0007294714450836182, 0.0007614642381668091, 0.00079345703125]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 10.0, 11.0, 23.0, 8.0, 13.0, 17.0, 25.0, 35.0, 34.0, 49.0, 32.0, 50.0, 41.0, 52.0, 41.0, 50.0, 58.0, 49.0, 50.0, 46.0, 46.0, 40.0, 36.0, 25.0, 29.0, 25.0, 17.0, 15.0, 14.0, 11.0, 7.0, 5.0, 7.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.000885009765625, -0.0008595138788223267, -0.0008340179920196533, -0.00080852210521698, -0.0007830262184143066, -0.0007575303316116333, -0.00073203444480896, -0.0007065385580062866, -0.0006810426712036133, -0.0006555467844009399, -0.0006300508975982666, -0.0006045550107955933, -0.0005790591239929199, -0.0005535632371902466, -0.0005280673503875732, -0.0005025714635848999, -0.00047707557678222656, -0.0004515796899795532, -0.0004260838031768799, -0.00040058791637420654, -0.0003750920295715332, -0.00034959614276885986, -0.0003241002559661865, -0.0002986043691635132, -0.00027310848236083984, -0.0002476125955581665, -0.00022211670875549316, -0.00019662082195281982, -0.00017112493515014648, -0.00014562904834747314, -0.0001201331615447998, -9.463727474212646e-05, -6.914138793945312e-05, -4.3645501136779785e-05, -1.8149614334106445e-05, 7.3462724685668945e-06, 3.2842159271240234e-05, 5.8338046073913574e-05, 8.383393287658691e-05, 0.00010932981967926025, 0.0001348257064819336, 0.00016032159328460693, 0.00018581748008728027, 0.0002113133668899536, 0.00023680925369262695, 0.0002623051404953003, 0.00028780102729797363, 0.00031329691410064697, 0.0003387928009033203, 0.00036428868770599365, 0.000389784574508667, 0.00041528046131134033, 0.00044077634811401367, 0.000466272234916687, 0.0004917681217193604, 0.0005172640085220337, 0.000542759895324707, 0.0005682557821273804, 0.0005937516689300537, 0.000619247555732727, 0.0006447434425354004, 0.0006702393293380737, 0.0006957352161407471, 0.0007212311029434204, 0.0007467269897460938]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 15.0, 26.0, 94.0, 242.0, 840.0, 6493.0, 4163088.0, 21234.0, 1707.0, 336.0, 121.0, 50.0, 21.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01215362548828125, -0.011868953704833984, -0.011584281921386719, -0.011299610137939453, -0.011014938354492188, -0.010730266571044922, -0.010445594787597656, -0.01016092300415039, -0.009876251220703125, -0.00959157943725586, -0.009306907653808594, -0.009022235870361328, -0.008737564086914062, -0.008452892303466797, -0.008168220520019531, -0.007883548736572266, -0.007598876953125, -0.007314205169677734, -0.007029533386230469, -0.006744861602783203, -0.0064601898193359375, -0.006175518035888672, -0.005890846252441406, -0.005606174468994141, -0.005321502685546875, -0.005036830902099609, -0.004752159118652344, -0.004467487335205078, -0.0041828155517578125, -0.003898143768310547, -0.0036134719848632812, -0.0033288002014160156, -0.00304412841796875, -0.0027594566345214844, -0.0024747848510742188, -0.002190113067626953, -0.0019054412841796875, -0.0016207695007324219, -0.0013360977172851562, -0.0010514259338378906, -0.000766754150390625, -0.0004820823669433594, -0.00019741058349609375, 8.726119995117188e-05, 0.0003719329833984375, 0.0006566047668457031, 0.0009412765502929688, 0.0012259483337402344, 0.0015106201171875, 0.0017952919006347656, 0.0020799636840820312, 0.002364635467529297, 0.0026493072509765625, 0.002933979034423828, 0.0032186508178710938, 0.0035033226013183594, 0.003787994384765625, 0.004072666168212891, 0.004357337951660156, 0.004642009735107422, 0.0049266815185546875, 0.005211353302001953, 0.005496025085449219, 0.005780696868896484, 0.00606536865234375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 2.0, 9.0, 5.0, 6.0, 14.0, 76.0, 539.0, 3199.0, 150.0, 37.0, 10.0, 9.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005550384521484375, -0.0005346089601516724, -0.0005141794681549072, -0.0004937499761581421, -0.00047332048416137695, -0.0004528909921646118, -0.0004324615001678467, -0.00041203200817108154, -0.0003916025161743164, -0.00037117302417755127, -0.00035074353218078613, -0.000330314040184021, -0.00030988454818725586, -0.0002894550561904907, -0.0002690255641937256, -0.00024859607219696045, -0.0002281665802001953, -0.00020773708820343018, -0.00018730759620666504, -0.0001668781042098999, -0.00014644861221313477, -0.00012601912021636963, -0.00010558962821960449, -8.516013622283936e-05, -6.473064422607422e-05, -4.430115222930908e-05, -2.3871660232543945e-05, -3.4421682357788086e-06, 1.6987323760986328e-05, 3.7416815757751465e-05, 5.78463077545166e-05, 7.827579975128174e-05, 9.870529174804688e-05, 0.00011913478374481201, 0.00013956427574157715, 0.00015999376773834229, 0.00018042325973510742, 0.00020085275173187256, 0.0002212822437286377, 0.00024171173572540283, 0.00026214122772216797, 0.0002825707197189331, 0.00030300021171569824, 0.0003234297037124634, 0.0003438591957092285, 0.00036428868770599365, 0.0003847181797027588, 0.0004051476716995239, 0.00042557716369628906, 0.0004460066556930542, 0.00046643614768981934, 0.00048686563968658447, 0.0005072951316833496, 0.0005277246236801147, 0.0005481541156768799, 0.000568583607673645, 0.0005890130996704102, 0.0006094425916671753, 0.0006298720836639404, 0.0006503015756607056, 0.0006707310676574707, 0.0006911605596542358, 0.000711590051651001, 0.0007320195436477661, 0.0007524490356445312]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 8.0, 5.0, 7.0, 13.0, 20.0, 31.0, 51.0, 77.0, 104.0, 178.0, 150.0, 111.0, 81.0, 53.0, 27.0, 13.0, 24.0, 7.0, 10.0, 8.0, 2.0, 8.0, 2.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0019750697538256645, -0.001929537858814001, -0.0018840059638023376, -0.0018384740687906742, -0.0017929421737790108, -0.0017474101623520255, -0.001701878267340362, -0.0016563463723286986, -0.0016108144773170352, -0.0015652825823053718, -0.0015197506872937083, -0.0014742187922820449, -0.0014286867808550596, -0.0013831548858433962, -0.0013376229908317327, -0.0012920910958200693, -0.0012465592008084059, -0.0012010273057967424, -0.001155495410785079, -0.0011099635157734156, -0.0010644316207617521, -0.0010188996093347669, -0.0009733677143231034, -0.00092783581931144, -0.0008823039242997766, -0.0008367720292881131, -0.0007912401342764497, -0.0007457081810571253, -0.0007001762860454619, -0.0006546443910337985, -0.0006091124378144741, -0.0005635805428028107, -0.0005180485895834863, -0.0004725166945718229, -0.000426984770456329, -0.0003814528463408351, -0.00033592095132917166, -0.0002903890563175082, -0.0002448571322020143, -0.00019932520808652043, -0.000153793313074857, -0.00010826140351127833, -6.272949394769967e-05, -1.7197584384121e-05, 2.8334325179457664e-05, 7.386623474303633e-05, 0.000119398144306615, 0.0001649300684221089, 0.00021046196343377233, 0.00025599385844543576, 0.00030152578256092966, 0.00034705770667642355, 0.000392589601688087, 0.0004381214966997504, 0.0004836534208152443, 0.0005291853449307382, 0.0005747172399424016, 0.0006202491349540651, 0.0006657810881733894, 0.0007113129831850529, 0.0007568448781967163, 0.0008023767732083797, 0.0008479086682200432, 0.0008934406214393675, 0.000938972516451031]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 9.0, 5.0, 8.0, 12.0, 17.0, 12.0, 19.0, 11.0, 20.0, 17.0, 22.0, 30.0, 32.0, 31.0, 38.0, 41.0, 35.0, 35.0, 34.0, 44.0, 45.0, 45.0, 40.0, 36.0, 46.0, 35.0, 37.0, 27.0, 14.0, 35.0, 24.0, 22.0, 20.0, 16.0, 11.0, 14.0, 7.0, 9.0, 6.0, 7.0, 8.0, 5.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005885913851670921, -0.0005695504951290786, -0.0005505095468834043, -0.0005314686568453908, -0.0005124277668073773, -0.0004933868767693639, -0.00047434595762751997, -0.00045530503848567605, -0.0004362641484476626, -0.00041722325840964913, -0.0003981823392678052, -0.0003791414201259613, -0.00036010053008794785, -0.0003410596400499344, -0.00032201872090809047, -0.00030297780176624656, -0.0002839369117282331, -0.00026489602169021964, -0.0002458551025483757, -0.00022681419795844704, -0.00020777329336851835, -0.00018873238877858967, -0.00016969148418866098, -0.0001506505795987323, -0.0001316096750088036, -0.00011256877041887492, -9.352786582894623e-05, -7.448696123901755e-05, -5.544605664908886e-05, -3.640515205916017e-05, -1.7364247469231486e-05, 1.6766571206972003e-06, 2.0717503502964973e-05, 3.975840809289366e-05, 5.879931268282235e-05, 7.784021727275103e-05, 9.688112186267972e-05, 0.0001159220264526084, 0.0001349629310425371, 0.00015400383563246578, 0.00017304474022239447, 0.00019208564481232315, 0.00021112654940225184, 0.00023016745399218053, 0.0002492083585821092, 0.00026824924862012267, 0.0002872901677619666, 0.0003063310869038105, 0.00032537197694182396, 0.0003444128669798374, 0.00036345378612168133, 0.00038249470526352525, 0.0004015355953015387, 0.00042057648533955216, 0.0004396174044813961, 0.00045865832362324, 0.00047769921366125345, 0.0004967401036992669, 0.0005157809937372804, 0.0005348219419829547, 0.0005538628320209682, 0.0005729037220589817, 0.000591944670304656, 0.0006109855603426695, 0.0006300264503806829]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 8.0, 8.0, 13.0, 24.0, 34.0, 56.0, 83.0, 95.0, 176.0, 245.0, 387.0, 645.0, 1118.0, 1867.0, 3346.0, 6129.0, 11654.0, 23428.0, 51090.0, 129846.0, 430531.0, 238824.0, 78952.0, 34348.0, 16309.0, 8502.0, 4502.0, 2553.0, 1463.0, 865.0, 503.0, 337.0, 208.0, 121.0, 88.0, 65.0, 45.0, 29.0, 15.0, 18.0, 5.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0024127960205078125, -0.0023391246795654297, -0.002265453338623047, -0.002191781997680664, -0.0021181106567382812, -0.0020444393157958984, -0.0019707679748535156, -0.0018970966339111328, -0.00182342529296875, -0.0017497539520263672, -0.0016760826110839844, -0.0016024112701416016, -0.0015287399291992188, -0.001455068588256836, -0.0013813972473144531, -0.0013077259063720703, -0.0012340545654296875, -0.0011603832244873047, -0.0010867118835449219, -0.001013040542602539, -0.0009393692016601562, -0.0008656978607177734, -0.0007920265197753906, -0.0007183551788330078, -0.000644683837890625, -0.0005710124969482422, -0.0004973411560058594, -0.00042366981506347656, -0.00034999847412109375, -0.00027632713317871094, -0.00020265579223632812, -0.0001289844512939453, -5.53131103515625e-05, 1.8358230590820312e-05, 9.202957153320312e-05, 0.00016570091247558594, 0.00023937225341796875, 0.00031304359436035156, 0.0003867149353027344, 0.0004603862762451172, 0.0005340576171875, 0.0006077289581298828, 0.0006814002990722656, 0.0007550716400146484, 0.0008287429809570312, 0.0009024143218994141, 0.0009760856628417969, 0.0010497570037841797, 0.0011234283447265625, 0.0011970996856689453, 0.0012707710266113281, 0.001344442367553711, 0.0014181137084960938, 0.0014917850494384766, 0.0015654563903808594, 0.0016391277313232422, 0.001712799072265625, 0.0017864704132080078, 0.0018601417541503906, 0.0019338130950927734, 0.0020074844360351562, 0.002081155776977539, 0.002154827117919922, 0.0022284984588623047, 0.0023021697998046875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 10.0, 8.0, 8.0, 3.0, 14.0, 20.0, 23.0, 19.0, 25.0, 32.0, 42.0, 39.0, 55.0, 44.0, 50.0, 44.0, 53.0, 67.0, 60.0, 54.0, 48.0, 44.0, 43.0, 35.0, 33.0, 27.0, 21.0, 22.0, 8.0, 9.0, 5.0, 13.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006403923034667969, -0.0006224364042282104, -0.000604480504989624, -0.0005865246057510376, -0.0005685687065124512, -0.0005506128072738647, -0.0005326569080352783, -0.0005147010087966919, -0.0004967451095581055, -0.00047878921031951904, -0.0004608333110809326, -0.0004428774118423462, -0.00042492151260375977, -0.00040696561336517334, -0.0003890097141265869, -0.0003710538148880005, -0.00035309791564941406, -0.00033514201641082764, -0.0003171861171722412, -0.0002992302179336548, -0.00028127431869506836, -0.00026331841945648193, -0.0002453625202178955, -0.00022740662097930908, -0.00020945072174072266, -0.00019149482250213623, -0.0001735389232635498, -0.00015558302402496338, -0.00013762712478637695, -0.00011967122554779053, -0.0001017153263092041, -8.375942707061768e-05, -6.580352783203125e-05, -4.7847628593444824e-05, -2.98917293548584e-05, -1.1935830116271973e-05, 6.020069122314453e-06, 2.397596836090088e-05, 4.1931867599487305e-05, 5.988776683807373e-05, 7.784366607666016e-05, 9.579956531524658e-05, 0.00011375546455383301, 0.00013171136379241943, 0.00014966726303100586, 0.00016762316226959229, 0.0001855790615081787, 0.00020353496074676514, 0.00022149085998535156, 0.000239446759223938, 0.0002574026584625244, 0.00027535855770111084, 0.00029331445693969727, 0.0003112703561782837, 0.0003292262554168701, 0.00034718215465545654, 0.00036513805389404297, 0.0003830939531326294, 0.0004010498523712158, 0.00041900575160980225, 0.00043696165084838867, 0.0004549175500869751, 0.0004728734493255615, 0.000490829348564148, 0.0005087852478027344]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 8.0, 12.0, 10.0, 22.0, 35.0, 36.0, 52.0, 100.0, 127.0, 169.0, 254.0, 401.0, 539.0, 745.0, 1074.0, 1625.0, 2479.0, 3943.0, 6109.0, 10553.0, 19880.0, 45720.0, 258694.0, 588560.0, 54419.0, 22273.0, 11484.0, 6704.0, 4109.0, 2775.0, 1749.0, 1210.0, 788.0, 506.0, 394.0, 297.0, 195.0, 126.0, 101.0, 67.0, 51.0, 50.0, 36.0, 28.0, 14.0, 11.0, 10.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0026531219482421875, -0.002567768096923828, -0.0024824142456054688, -0.0023970603942871094, -0.00231170654296875, -0.0022263526916503906, -0.0021409988403320312, -0.002055644989013672, -0.0019702911376953125, -0.0018849372863769531, -0.0017995834350585938, -0.0017142295837402344, -0.001628875732421875, -0.0015435218811035156, -0.0014581680297851562, -0.0013728141784667969, -0.0012874603271484375, -0.0012021064758300781, -0.0011167526245117188, -0.0010313987731933594, -0.000946044921875, -0.0008606910705566406, -0.0007753372192382812, -0.0006899833679199219, -0.0006046295166015625, -0.0005192756652832031, -0.00043392181396484375, -0.0003485679626464844, -0.000263214111328125, -0.00017786026000976562, -9.250640869140625e-05, -7.152557373046875e-06, 7.82012939453125e-05, 0.00016355514526367188, 0.00024890899658203125, 0.0003342628479003906, 0.00041961669921875, 0.0005049705505371094, 0.0005903244018554688, 0.0006756782531738281, 0.0007610321044921875, 0.0008463859558105469, 0.0009317398071289062, 0.0010170936584472656, 0.001102447509765625, 0.0011878013610839844, 0.0012731552124023438, 0.0013585090637207031, 0.0014438629150390625, 0.0015292167663574219, 0.0016145706176757812, 0.0016999244689941406, 0.0017852783203125, 0.0018706321716308594, 0.0019559860229492188, 0.002041339874267578, 0.0021266937255859375, 0.002212047576904297, 0.0022974014282226562, 0.0023827552795410156, 0.002468109130859375, 0.0025534629821777344, 0.0026388168334960938, 0.002724170684814453, 0.0028095245361328125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 9.0, 6.0, 1.0, 5.0, 1.0, 4.0, 11.0, 5.0, 9.0, 12.0, 10.0, 17.0, 23.0, 17.0, 11.0, 26.0, 22.0, 39.0, 30.0, 34.0, 36.0, 42.0, 35.0, 38.0, 44.0, 42.0, 30.0, 58.0, 51.0, 29.0, 48.0, 34.0, 26.0, 25.0, 31.0, 28.0, 21.0, 21.0, 12.0, 7.0, 9.0, 10.0, 10.0, 5.0, 4.0, 5.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00032520294189453125, -0.00031500309705734253, -0.0003048032522201538, -0.0002946034073829651, -0.00028440356254577637, -0.00027420371770858765, -0.0002640038728713989, -0.0002538040280342102, -0.00024360418319702148, -0.00023340433835983276, -0.00022320449352264404, -0.00021300464868545532, -0.0002028048038482666, -0.00019260495901107788, -0.00018240511417388916, -0.00017220526933670044, -0.00016200542449951172, -0.000151805579662323, -0.00014160573482513428, -0.00013140588998794556, -0.00012120604515075684, -0.00011100620031356812, -0.0001008063554763794, -9.060651063919067e-05, -8.040666580200195e-05, -7.020682096481323e-05, -6.000697612762451e-05, -4.980713129043579e-05, -3.960728645324707e-05, -2.940744161605835e-05, -1.920759677886963e-05, -9.007751941680908e-06, 1.1920928955078125e-06, 1.1391937732696533e-05, 2.1591782569885254e-05, 3.1791627407073975e-05, 4.1991472244262695e-05, 5.2191317081451416e-05, 6.239116191864014e-05, 7.259100675582886e-05, 8.279085159301758e-05, 9.29906964302063e-05, 0.00010319054126739502, 0.00011339038610458374, 0.00012359023094177246, 0.00013379007577896118, 0.0001439899206161499, 0.00015418976545333862, 0.00016438961029052734, 0.00017458945512771606, 0.00018478929996490479, 0.0001949891448020935, 0.00020518898963928223, 0.00021538883447647095, 0.00022558867931365967, 0.0002357885241508484, 0.0002459883689880371, 0.00025618821382522583, 0.00026638805866241455, 0.00027658790349960327, 0.000286787748336792, 0.0002969875931739807, 0.00030718743801116943, 0.00031738728284835815, 0.0003275871276855469]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 11.0, 7.0, 25.0, 15.0, 25.0, 29.0, 53.0, 50.0, 79.0, 93.0, 142.0, 233.0, 279.0, 435.0, 674.0, 1003.0, 1628.0, 2693.0, 5035.0, 10208.0, 27536.0, 755079.0, 196708.0, 24890.0, 9621.0, 4795.0, 2575.0, 1559.0, 991.0, 656.0, 373.0, 315.0, 225.0, 151.0, 84.0, 81.0, 56.0, 34.0, 32.0, 25.0, 18.0, 13.0, 6.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0025463104248046875, -0.0024552345275878906, -0.0023641586303710938, -0.002273082733154297, -0.0021820068359375, -0.002090930938720703, -0.0019998550415039062, -0.0019087791442871094, -0.0018177032470703125, -0.0017266273498535156, -0.0016355514526367188, -0.0015444755554199219, -0.001453399658203125, -0.0013623237609863281, -0.0012712478637695312, -0.0011801719665527344, -0.0010890960693359375, -0.0009980201721191406, -0.0009069442749023438, -0.0008158683776855469, -0.00072479248046875, -0.0006337165832519531, -0.0005426406860351562, -0.0004515647888183594, -0.0003604888916015625, -0.0002694129943847656, -0.00017833709716796875, -8.726119995117188e-05, 3.814697265625e-06, 9.489059448242188e-05, 0.00018596649169921875, 0.0002770423889160156, 0.0003681182861328125, 0.0004591941833496094, 0.0005502700805664062, 0.0006413459777832031, 0.000732421875, 0.0008234977722167969, 0.0009145736694335938, 0.0010056495666503906, 0.0010967254638671875, 0.0011878013610839844, 0.0012788772583007812, 0.0013699531555175781, 0.001461029052734375, 0.0015521049499511719, 0.0016431808471679688, 0.0017342567443847656, 0.0018253326416015625, 0.0019164085388183594, 0.0020074844360351562, 0.002098560333251953, 0.00218963623046875, 0.002280712127685547, 0.0023717880249023438, 0.0024628639221191406, 0.0025539398193359375, 0.0026450157165527344, 0.0027360916137695312, 0.002827167510986328, 0.002918243408203125, 0.003009319305419922, 0.0031003952026367188, 0.0031914710998535156, 0.0032825469970703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 2.0, 7.0, 13.0, 22.0, 35.0, 42.0, 78.0, 192.0, 291.0, 129.0, 70.0, 41.0, 15.0, 19.0, 12.0, 8.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5020370483398438e-05, -1.4345161616802216e-05, -1.3669952750205994e-05, -1.2994743883609772e-05, -1.231953501701355e-05, -1.1644326150417328e-05, -1.0969117283821106e-05, -1.0293908417224884e-05, -9.618699550628662e-06, -8.94349068403244e-06, -8.268281817436218e-06, -7.593072950839996e-06, -6.917864084243774e-06, -6.2426552176475525e-06, -5.5674463510513306e-06, -4.892237484455109e-06, -4.217028617858887e-06, -3.541819751262665e-06, -2.866610884666443e-06, -2.191402018070221e-06, -1.516193151473999e-06, -8.409842848777771e-07, -1.6577541828155518e-07, 5.094334483146667e-07, 1.1846423149108887e-06, 1.8598511815071106e-06, 2.5350600481033325e-06, 3.2102689146995544e-06, 3.885477781295776e-06, 4.560686647891998e-06, 5.23589551448822e-06, 5.911104381084442e-06, 6.586313247680664e-06, 7.261522114276886e-06, 7.936730980873108e-06, 8.61193984746933e-06, 9.287148714065552e-06, 9.962357580661774e-06, 1.0637566447257996e-05, 1.1312775313854218e-05, 1.198798418045044e-05, 1.2663193047046661e-05, 1.3338401913642883e-05, 1.4013610780239105e-05, 1.4688819646835327e-05, 1.536402851343155e-05, 1.603923738002777e-05, 1.6714446246623993e-05, 1.7389655113220215e-05, 1.8064863979816437e-05, 1.874007284641266e-05, 1.941528171300888e-05, 2.0090490579605103e-05, 2.0765699446201324e-05, 2.1440908312797546e-05, 2.211611717939377e-05, 2.279132604598999e-05, 2.3466534912586212e-05, 2.4141743779182434e-05, 2.4816952645778656e-05, 2.5492161512374878e-05, 2.61673703789711e-05, 2.6842579245567322e-05, 2.7517788112163544e-05, 2.8192996978759766e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 7.0, 7.0, 10.0, 12.0, 22.0, 23.0, 43.0, 87.0, 276.0, 998.0, 6810.0, 818519.0, 214367.0, 5986.0, 907.0, 285.0, 84.0, 41.0, 29.0, 14.0, 8.0, 10.0, 3.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00685882568359375, -0.006650805473327637, -0.0064427852630615234, -0.00623476505279541, -0.006026744842529297, -0.005818724632263184, -0.00561070442199707, -0.005402684211730957, -0.005194664001464844, -0.0049866437911987305, -0.004778623580932617, -0.004570603370666504, -0.004362583160400391, -0.004154562950134277, -0.003946542739868164, -0.0037385225296020508, -0.0035305023193359375, -0.0033224821090698242, -0.003114461898803711, -0.0029064416885375977, -0.0026984214782714844, -0.002490401268005371, -0.002282381057739258, -0.0020743608474731445, -0.0018663406372070312, -0.001658320426940918, -0.0014503002166748047, -0.0012422800064086914, -0.0010342597961425781, -0.0008262395858764648, -0.0006182193756103516, -0.0004101991653442383, -0.000202178955078125, 5.841255187988281e-06, 0.00021386146545410156, 0.00042188167572021484, 0.0006299018859863281, 0.0008379220962524414, 0.0010459423065185547, 0.001253962516784668, 0.0014619827270507812, 0.0016700029373168945, 0.0018780231475830078, 0.002086043357849121, 0.0022940635681152344, 0.0025020837783813477, 0.002710103988647461, 0.0029181241989135742, 0.0031261444091796875, 0.0033341646194458008, 0.003542184829711914, 0.0037502050399780273, 0.003958225250244141, 0.004166245460510254, 0.004374265670776367, 0.0045822858810424805, 0.004790306091308594, 0.004998326301574707, 0.00520634651184082, 0.005414366722106934, 0.005622386932373047, 0.00583040714263916, 0.0060384273529052734, 0.006246447563171387, 0.0064544677734375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 5.0, 7.0, 3.0, 13.0, 13.0, 19.0, 18.0, 17.0, 32.0, 39.0, 46.0, 550.0, 38.0, 41.0, 35.0, 28.0, 24.0, 19.0, 18.0, 11.0, 10.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003688335418701172, -0.0003567449748516083, -0.00034465640783309937, -0.00033256784081459045, -0.00032047927379608154, -0.00030839070677757263, -0.0002963021397590637, -0.0002842135727405548, -0.0002721250057220459, -0.000260036438703537, -0.0002479478716850281, -0.00023585930466651917, -0.00022377073764801025, -0.00021168217062950134, -0.00019959360361099243, -0.00018750503659248352, -0.0001754164695739746, -0.0001633279025554657, -0.0001512393355369568, -0.00013915076851844788, -0.00012706220149993896, -0.00011497363448143005, -0.00010288506746292114, -9.079650044441223e-05, -7.870793342590332e-05, -6.661936640739441e-05, -5.45307993888855e-05, -4.244223237037659e-05, -3.0353665351867676e-05, -1.8265098333358765e-05, -6.1765313148498535e-06, 5.912035703659058e-06, 1.800060272216797e-05, 3.008916974067688e-05, 4.217773675918579e-05, 5.42663037776947e-05, 6.635487079620361e-05, 7.844343781471252e-05, 9.053200483322144e-05, 0.00010262057185173035, 0.00011470913887023926, 0.00012679770588874817, 0.00013888627290725708, 0.000150974839925766, 0.0001630634069442749, 0.0001751519739627838, 0.00018724054098129272, 0.00019932910799980164, 0.00021141767501831055, 0.00022350624203681946, 0.00023559480905532837, 0.0002476833760738373, 0.0002597719430923462, 0.0002718605101108551, 0.000283949077129364, 0.0002960376441478729, 0.00030812621116638184, 0.00032021477818489075, 0.00033230334520339966, 0.00034439191222190857, 0.0003564804792404175, 0.0003685690462589264, 0.0003806576132774353, 0.0003927461802959442, 0.0004048347473144531]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 5.0, 7.0, 13.0, 6.0, 13.0, 29.0, 41.0, 65.0, 122.0, 175.0, 163.0, 90.0, 66.0, 52.0, 38.0, 26.0, 26.0, 10.0, 16.0, 4.0, 10.0, 6.0, 3.0, 4.0, 2.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009822493884712458, -0.00095309381140396, -0.0009239382343366742, -0.0008947826572693884, -0.0008656270802021027, -0.0008364715613424778, -0.000807315984275192, -0.0007781604072079062, -0.0007490048301406205, -0.0007198492530733347, -0.0006906936760060489, -0.0006615380989387631, -0.0006323825800791383, -0.0006032269448041916, -0.0005740714259445667, -0.000544915848877281, -0.0005157602718099952, -0.0004866046947427094, -0.0004574491176754236, -0.0004282935697119683, -0.0003991379926446825, -0.00036998241557739675, -0.00034082686761394143, -0.00031167129054665565, -0.0002825157134793699, -0.0002533601364120841, -0.00022420457389671355, -0.000195049011381343, -0.00016589343431405723, -0.00013673785724677145, -0.00010758229473140091, -7.842673221603036e-05, -4.927109694108367e-05, -2.0115527149755508e-05, 9.040042641572654e-06, 3.8195612432900816e-05, 6.735118222422898e-05, 9.650675929151475e-05, 0.0001256623218068853, 0.00015481788432225585, 0.00018397346138954163, 0.0002131290384568274, 0.00024228460097219795, 0.0002714401634875685, 0.0003005957405548543, 0.00032975131762214005, 0.00035890686558559537, 0.00038806244265288115, 0.0004172180197201669, 0.0004463735967874527, 0.0004755291738547385, 0.0005046847509220243, 0.0005338402697816491, 0.0005629959050565958, 0.0005921514239162207, 0.0006213070009835064, 0.0006504625780507922, 0.000679618155118078, 0.0007087737321853638, 0.0007379293092526495, 0.0007670848863199353, 0.0007962404051795602, 0.000825395982246846, 0.0008545515593141317, 0.0008837071363814175]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 7.0, 1.0, 7.0, 2.0, 3.0, 7.0, 5.0, 8.0, 8.0, 8.0, 15.0, 10.0, 14.0, 22.0, 16.0, 26.0, 32.0, 22.0, 23.0, 38.0, 47.0, 41.0, 28.0, 41.0, 31.0, 44.0, 41.0, 40.0, 41.0, 43.0, 34.0, 36.0, 33.0, 24.0, 32.0, 22.0, 27.0, 22.0, 19.0, 22.0, 13.0, 15.0, 4.0, 4.0, 7.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00038273248355835676, -0.00036986335180699825, -0.0003569941909518093, -0.0003441250592004508, -0.00033125592744909227, -0.0003183867665939033, -0.0003055176348425448, -0.0002926485030911863, -0.0002797793713398278, -0.00026691023958846927, -0.0002540410787332803, -0.0002411719469819218, -0.00022830281523056328, -0.00021543366892728955, -0.0002025645226240158, -0.0001896953908726573, -0.00017682623001746833, -0.0001639570837141946, -0.0001510879519628361, -0.00013821880565956235, -0.00012534967390820384, -0.0001124805276049301, -9.961138130165637e-05, -8.674224227434024e-05, -7.387310324702412e-05, -6.1003964219707996e-05, -4.8134821554413065e-05, -3.5265678889118135e-05, -2.2396539861802012e-05, -9.527400834485888e-06, 3.341745468787849e-06, 1.6210884496103972e-05, 2.9080052627250552e-05, 4.1949191654566675e-05, 5.4818334319861606e-05, 6.768747698515654e-05, 8.055661601247266e-05, 9.342575503978878e-05, 0.00010629490134306252, 0.00011916404037037864, 0.00013203317939769477, 0.0001449023257009685, 0.000157771457452327, 0.00017064060375560075, 0.0001835097500588745, 0.000196378881810233, 0.00020924802811350673, 0.00022211717441678047, 0.00023498630616813898, 0.0002478554379194975, 0.00026072459877468646, 0.00027359373052604496, 0.0002864628622774035, 0.00029933202313259244, 0.00031220115488395095, 0.00032507028663530946, 0.00033793941838666797, 0.0003508085501380265, 0.00036367771099321544, 0.00037654684274457395, 0.00038941597449593246, 0.0004022851353511214, 0.00041515426710247993, 0.00042802339885383844, 0.0004408925597090274]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 9.0, 4.0, 12.0, 7.0, 16.0, 19.0, 25.0, 50.0, 70.0, 100.0, 120.0, 220.0, 316.0, 460.0, 726.0, 1267.0, 2237.0, 4000.0, 7186.0, 14221.0, 30355.0, 68083.0, 186473.0, 416620.0, 186267.0, 68281.0, 30201.0, 14321.0, 7305.0, 3959.0, 2199.0, 1239.0, 752.0, 475.0, 311.0, 201.0, 142.0, 98.0, 59.0, 38.0, 37.0, 17.0, 17.0, 9.0, 5.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00103759765625, -0.0010035783052444458, -0.0009695589542388916, -0.0009355396032333374, -0.0009015202522277832, -0.000867500901222229, -0.0008334815502166748, -0.0007994621992111206, -0.0007654428482055664, -0.0007314234972000122, -0.000697404146194458, -0.0006633847951889038, -0.0006293654441833496, -0.0005953460931777954, -0.0005613267421722412, -0.000527307391166687, -0.0004932880401611328, -0.0004592686891555786, -0.0004252493381500244, -0.0003912299871444702, -0.000357210636138916, -0.0003231912851333618, -0.0002891719341278076, -0.0002551525831222534, -0.00022113323211669922, -0.00018711388111114502, -0.00015309453010559082, -0.00011907517910003662, -8.505582809448242e-05, -5.103647708892822e-05, -1.7017126083374023e-05, 1.7002224922180176e-05, 5.1021575927734375e-05, 8.504092693328857e-05, 0.00011906027793884277, 0.00015307962894439697, 0.00018709897994995117, 0.00022111833095550537, 0.00025513768196105957, 0.00028915703296661377, 0.00032317638397216797, 0.00035719573497772217, 0.00039121508598327637, 0.00042523443698883057, 0.00045925378799438477, 0.000493273138999939, 0.0005272924900054932, 0.0005613118410110474, 0.0005953311920166016, 0.0006293505430221558, 0.00066336989402771, 0.0006973892450332642, 0.0007314085960388184, 0.0007654279470443726, 0.0007994472980499268, 0.000833466649055481, 0.0008674860000610352, 0.0009015053510665894, 0.0009355247020721436, 0.0009695440530776978, 0.001003563404083252, 0.0010375827550888062, 0.0010716021060943604, 0.0011056214570999146, 0.0011396408081054688]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 8.0, 6.0, 19.0, 18.0, 19.0, 30.0, 30.0, 41.0, 40.0, 52.0, 50.0, 58.0, 66.0, 79.0, 64.0, 60.0, 61.0, 56.0, 40.0, 38.0, 42.0, 32.0, 21.0, 16.0, 9.0, 10.0, 9.0, 7.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032639503479003906, -0.00031721219420433044, -0.0003080293536186218, -0.0002988465130329132, -0.0002896636724472046, -0.00028048083186149597, -0.00027129799127578735, -0.00026211515069007874, -0.0002529323101043701, -0.0002437494695186615, -0.00023456662893295288, -0.00022538378834724426, -0.00021620094776153564, -0.00020701810717582703, -0.0001978352665901184, -0.0001886524260044098, -0.00017946958541870117, -0.00017028674483299255, -0.00016110390424728394, -0.00015192106366157532, -0.0001427382230758667, -0.00013355538249015808, -0.00012437254190444946, -0.00011518970131874084, -0.00010600686073303223, -9.682402014732361e-05, -8.764117956161499e-05, -7.845833897590637e-05, -6.927549839019775e-05, -6.0092657804489136e-05, -5.090981721878052e-05, -4.17269766330719e-05, -3.254413604736328e-05, -2.3361295461654663e-05, -1.4178454875946045e-05, -4.995614290237427e-06, 4.187226295471191e-06, 1.337006688117981e-05, 2.2552907466888428e-05, 3.1735748052597046e-05, 4.0918588638305664e-05, 5.010142922401428e-05, 5.92842698097229e-05, 6.846711039543152e-05, 7.764995098114014e-05, 8.683279156684875e-05, 9.601563215255737e-05, 0.00010519847273826599, 0.00011438131332397461, 0.00012356415390968323, 0.00013274699449539185, 0.00014192983508110046, 0.00015111267566680908, 0.0001602955162525177, 0.00016947835683822632, 0.00017866119742393494, 0.00018784403800964355, 0.00019702687859535217, 0.0002062097191810608, 0.0002153925597667694, 0.00022457540035247803, 0.00023375824093818665, 0.00024294108152389526, 0.0002521239221096039, 0.0002613067626953125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 6.0, 4.0, 5.0, 8.0, 14.0, 11.0, 21.0, 11.0, 11.0, 20.0, 20.0, 35.0, 48.0, 81.0, 172.0, 450.0, 1210.0, 3741.0, 12582.0, 44904.0, 195228.0, 579523.0, 156946.0, 37796.0, 10548.0, 3257.0, 1023.0, 406.0, 156.0, 75.0, 56.0, 36.0, 22.0, 24.0, 17.0, 20.0, 14.0, 15.0, 7.0, 11.0, 9.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0012845993041992188, -0.0012449920177459717, -0.0012053847312927246, -0.0011657774448394775, -0.0011261701583862305, -0.0010865628719329834, -0.0010469555854797363, -0.0010073482990264893, -0.0009677410125732422, -0.0009281337261199951, -0.000888526439666748, -0.000848919153213501, -0.0008093118667602539, -0.0007697045803070068, -0.0007300972938537598, -0.0006904900074005127, -0.0006508827209472656, -0.0006112754344940186, -0.0005716681480407715, -0.0005320608615875244, -0.0004924535751342773, -0.0004528462886810303, -0.0004132390022277832, -0.00037363171577453613, -0.00033402442932128906, -0.000294417142868042, -0.0002548098564147949, -0.00021520256996154785, -0.00017559528350830078, -0.0001359879970550537, -9.638071060180664e-05, -5.677342414855957e-05, -1.71661376953125e-05, 2.244114875793457e-05, 6.204843521118164e-05, 0.00010165572166442871, 0.00014126300811767578, 0.00018087029457092285, 0.00022047758102416992, 0.000260084867477417, 0.00029969215393066406, 0.00033929944038391113, 0.0003789067268371582, 0.0004185140132904053, 0.00045812129974365234, 0.0004977285861968994, 0.0005373358726501465, 0.0005769431591033936, 0.0006165504455566406, 0.0006561577320098877, 0.0006957650184631348, 0.0007353723049163818, 0.0007749795913696289, 0.000814586877822876, 0.000854194164276123, 0.0008938014507293701, 0.0009334087371826172, 0.0009730160236358643, 0.0010126233100891113, 0.0010522305965423584, 0.0010918378829956055, 0.0011314451694488525, 0.0011710524559020996, 0.0012106597423553467, 0.0012502670288085938]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 6.0, 10.0, 8.0, 9.0, 17.0, 8.0, 18.0, 22.0, 17.0, 22.0, 26.0, 27.0, 24.0, 36.0, 41.0, 31.0, 37.0, 41.0, 45.0, 48.0, 39.0, 34.0, 33.0, 44.0, 35.0, 33.0, 35.0, 33.0, 23.0, 24.0, 23.0, 23.0, 16.0, 27.0, 17.0, 12.0, 18.0, 6.0, 15.0, 3.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.00017249584197998047, -0.00016709975898265839, -0.0001617036759853363, -0.00015630759298801422, -0.00015091150999069214, -0.00014551542699337006, -0.00014011934399604797, -0.0001347232609987259, -0.0001293271780014038, -0.00012393109500408173, -0.00011853501200675964, -0.00011313892900943756, -0.00010774284601211548, -0.0001023467630147934, -9.695068001747131e-05, -9.155459702014923e-05, -8.615851402282715e-05, -8.076243102550507e-05, -7.536634802818298e-05, -6.99702650308609e-05, -6.457418203353882e-05, -5.9178099036216736e-05, -5.378201603889465e-05, -4.838593304157257e-05, -4.298985004425049e-05, -3.7593767046928406e-05, -3.219768404960632e-05, -2.680160105228424e-05, -2.1405518054962158e-05, -1.6009435057640076e-05, -1.0613352060317993e-05, -5.217269062995911e-06, 1.7881393432617188e-07, 5.574896931648254e-06, 1.0970979928970337e-05, 1.636706292629242e-05, 2.1763145923614502e-05, 2.7159228920936584e-05, 3.255531191825867e-05, 3.795139491558075e-05, 4.334747791290283e-05, 4.8743560910224915e-05, 5.4139643907547e-05, 5.953572690486908e-05, 6.493180990219116e-05, 7.032789289951324e-05, 7.572397589683533e-05, 8.112005889415741e-05, 8.651614189147949e-05, 9.191222488880157e-05, 9.730830788612366e-05, 0.00010270439088344574, 0.00010810047388076782, 0.0001134965568780899, 0.00011889263987541199, 0.00012428872287273407, 0.00012968480587005615, 0.00013508088886737823, 0.00014047697186470032, 0.0001458730548620224, 0.00015126913785934448, 0.00015666522085666656, 0.00016206130385398865, 0.00016745738685131073, 0.0001728534698486328]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 2.0, 6.0, 10.0, 18.0, 17.0, 26.0, 56.0, 81.0, 139.0, 297.0, 556.0, 1135.0, 2623.0, 7128.0, 28364.0, 452593.0, 511342.0, 31422.0, 7648.0, 2666.0, 1143.0, 576.0, 280.0, 153.0, 94.0, 66.0, 40.0, 20.0, 14.0, 13.0, 9.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2869319915771484e-05, -5.0838105380535126e-05, -4.880689084529877e-05, -4.677567631006241e-05, -4.474446177482605e-05, -4.271324723958969e-05, -4.068203270435333e-05, -3.8650818169116974e-05, -3.6619603633880615e-05, -3.4588389098644257e-05, -3.25571745634079e-05, -3.052596002817154e-05, -2.849474549293518e-05, -2.6463530957698822e-05, -2.4432316422462463e-05, -2.2401101887226105e-05, -2.0369887351989746e-05, -1.8338672816753387e-05, -1.630745828151703e-05, -1.427624374628067e-05, -1.2245029211044312e-05, -1.0213814675807953e-05, -8.182600140571594e-06, -6.151385605335236e-06, -4.120171070098877e-06, -2.0889565348625183e-06, -5.774199962615967e-08, 1.973472535610199e-06, 4.004687070846558e-06, 6.035901606082916e-06, 8.067116141319275e-06, 1.0098330676555634e-05, 1.2129545211791992e-05, 1.416075974702835e-05, 1.619197428226471e-05, 1.8223188817501068e-05, 2.0254403352737427e-05, 2.2285617887973785e-05, 2.4316832423210144e-05, 2.6348046958446503e-05, 2.837926149368286e-05, 3.041047602891922e-05, 3.244169056415558e-05, 3.447290509939194e-05, 3.6504119634628296e-05, 3.8535334169864655e-05, 4.056654870510101e-05, 4.259776324033737e-05, 4.462897777557373e-05, 4.666019231081009e-05, 4.869140684604645e-05, 5.0722621381282806e-05, 5.2753835916519165e-05, 5.4785050451755524e-05, 5.681626498699188e-05, 5.884747952222824e-05, 6.08786940574646e-05, 6.290990859270096e-05, 6.494112312793732e-05, 6.697233766317368e-05, 6.900355219841003e-05, 7.103476673364639e-05, 7.306598126888275e-05, 7.509719580411911e-05, 7.712841033935547e-05]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 6.0, 1.0, 4.0, 4.0, 3.0, 21.0, 6.0, 11.0, 21.0, 15.0, 22.0, 66.0, 55.0, 66.0, 127.0, 88.0, 151.0, 74.0, 49.0, 73.0, 27.0, 15.0, 39.0, 12.0, 6.0, 12.0, 8.0, 4.0, 8.0, 0.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.039836883544922e-06, -2.9588118195533752e-06, -2.8777867555618286e-06, -2.796761691570282e-06, -2.7157366275787354e-06, -2.6347115635871887e-06, -2.553686499595642e-06, -2.4726614356040955e-06, -2.391636371612549e-06, -2.310611307621002e-06, -2.2295862436294556e-06, -2.148561179637909e-06, -2.0675361156463623e-06, -1.9865110516548157e-06, -1.905485987663269e-06, -1.8244609236717224e-06, -1.7434358596801758e-06, -1.6624107956886292e-06, -1.5813857316970825e-06, -1.5003606677055359e-06, -1.4193356037139893e-06, -1.3383105397224426e-06, -1.257285475730896e-06, -1.1762604117393494e-06, -1.0952353477478027e-06, -1.014210283756256e-06, -9.331852197647095e-07, -8.521601557731628e-07, -7.711350917816162e-07, -6.901100277900696e-07, -6.09084963798523e-07, -5.280598998069763e-07, -4.470348358154297e-07, -3.6600977182388306e-07, -2.849847078323364e-07, -2.039596438407898e-07, -1.2293457984924316e-07, -4.190951585769653e-08, 3.91155481338501e-08, 1.2014061212539673e-07, 2.0116567611694336e-07, 2.8219074010849e-07, 3.632158041000366e-07, 4.4424086809158325e-07, 5.252659320831299e-07, 6.062909960746765e-07, 6.873160600662231e-07, 7.683411240577698e-07, 8.493661880493164e-07, 9.30391252040863e-07, 1.0114163160324097e-06, 1.0924413800239563e-06, 1.173466444015503e-06, 1.2544915080070496e-06, 1.3355165719985962e-06, 1.4165416359901428e-06, 1.4975666999816895e-06, 1.578591763973236e-06, 1.6596168279647827e-06, 1.7406418919563293e-06, 1.821666955947876e-06, 1.9026920199394226e-06, 1.9837170839309692e-06, 2.064742147922516e-06, 2.1457672119140625e-06]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 7.0, 5.0, 11.0, 21.0, 26.0, 41.0, 87.0, 168.0, 365.0, 1051.0, 2770.0, 9803.0, 47222.0, 574782.0, 364946.0, 34731.0, 8421.0, 2478.0, 863.0, 384.0, 142.0, 84.0, 49.0, 21.0, 16.0, 9.0, 13.0, 7.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.814697265625e-05, -3.702286630868912e-05, -3.5898759961128235e-05, -3.477465361356735e-05, -3.365054726600647e-05, -3.252644091844559e-05, -3.1402334570884705e-05, -3.0278228223323822e-05, -2.915412187576294e-05, -2.8030015528202057e-05, -2.6905909180641174e-05, -2.5781802833080292e-05, -2.465769648551941e-05, -2.3533590137958527e-05, -2.2409483790397644e-05, -2.128537744283676e-05, -2.016127109527588e-05, -1.9037164747714996e-05, -1.7913058400154114e-05, -1.678895205259323e-05, -1.566484570503235e-05, -1.4540739357471466e-05, -1.3416633009910583e-05, -1.2292526662349701e-05, -1.1168420314788818e-05, -1.0044313967227936e-05, -8.920207619667053e-06, -7.79610127210617e-06, -6.671994924545288e-06, -5.5478885769844055e-06, -4.423782229423523e-06, -3.2996758818626404e-06, -2.175569534301758e-06, -1.0514631867408752e-06, 7.264316082000732e-08, 1.1967495083808899e-06, 2.3208558559417725e-06, 3.444962203502655e-06, 4.569068551063538e-06, 5.69317489862442e-06, 6.817281246185303e-06, 7.941387593746185e-06, 9.065493941307068e-06, 1.018960028886795e-05, 1.1313706636428833e-05, 1.2437812983989716e-05, 1.3561919331550598e-05, 1.468602567911148e-05, 1.5810132026672363e-05, 1.6934238374233246e-05, 1.805834472179413e-05, 1.918245106935501e-05, 2.0306557416915894e-05, 2.1430663764476776e-05, 2.255477011203766e-05, 2.367887645959854e-05, 2.4802982807159424e-05, 2.5927089154720306e-05, 2.705119550228119e-05, 2.817530184984207e-05, 2.9299408197402954e-05, 3.0423514544963837e-05, 3.154762089252472e-05, 3.26717272400856e-05, 3.3795833587646484e-05]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 4.0, 2.0, 13.0, 10.0, 10.0, 15.0, 8.0, 28.0, 19.0, 34.0, 57.0, 36.0, 74.0, 55.0, 80.0, 63.0, 93.0, 60.0, 67.0, 61.0, 33.0, 40.0, 23.0, 25.0, 18.0, 14.0, 13.0, 7.0, 7.0, 6.0, 7.0, 0.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5299530029296875e-06, -4.377216100692749e-06, -4.2244791984558105e-06, -4.071742296218872e-06, -3.919005393981934e-06, -3.766268491744995e-06, -3.6135315895080566e-06, -3.460794687271118e-06, -3.3080577850341797e-06, -3.155320882797241e-06, -3.0025839805603027e-06, -2.8498470783233643e-06, -2.6971101760864258e-06, -2.5443732738494873e-06, -2.391636371612549e-06, -2.2388994693756104e-06, -2.086162567138672e-06, -1.9334256649017334e-06, -1.780688762664795e-06, -1.6279518604278564e-06, -1.475214958190918e-06, -1.3224780559539795e-06, -1.169741153717041e-06, -1.0170042514801025e-06, -8.642673492431641e-07, -7.115304470062256e-07, -5.587935447692871e-07, -4.0605664253234863e-07, -2.5331974029541016e-07, -1.0058283805847168e-07, 5.21540641784668e-08, 2.0489096641540527e-07, 3.5762786865234375e-07, 5.103647708892822e-07, 6.631016731262207e-07, 8.158385753631592e-07, 9.685754776000977e-07, 1.1213123798370361e-06, 1.2740492820739746e-06, 1.426786184310913e-06, 1.5795230865478516e-06, 1.73225998878479e-06, 1.8849968910217285e-06, 2.037733793258667e-06, 2.1904706954956055e-06, 2.343207597732544e-06, 2.4959444999694824e-06, 2.648681402206421e-06, 2.8014183044433594e-06, 2.954155206680298e-06, 3.1068921089172363e-06, 3.259629011154175e-06, 3.4123659133911133e-06, 3.5651028156280518e-06, 3.7178397178649902e-06, 3.870576620101929e-06, 4.023313522338867e-06, 4.176050424575806e-06, 4.328787326812744e-06, 4.481524229049683e-06, 4.634261131286621e-06, 4.7869980335235596e-06, 4.939734935760498e-06, 5.0924718379974365e-06, 5.245208740234375e-06]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 7.0, 12.0, 16.0, 21.0, 58.0, 95.0, 128.0, 178.0, 181.0, 97.0, 80.0, 37.0, 26.0, 16.0, 13.0, 12.0, 10.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0009259617072530091, -0.0009061835589818656, -0.0008864054689183831, -0.0008666273206472397, -0.0008468491723760962, -0.0008270710823126137, -0.0008072929340414703, -0.0007875148439779878, -0.0007677366957068443, -0.0007479585474357009, -0.0007281804573722184, -0.0007084023091010749, -0.0006886242190375924, -0.000668846070766449, -0.0006490679224953055, -0.0006292897742241621, -0.0006095116841606796, -0.0005897335358895361, -0.0005699554458260536, -0.0005501772975549102, -0.0005303991492837667, -0.0005106210592202842, -0.0004908429109491408, -0.0004710647917818278, -0.00045128667261451483, -0.00043150855344720185, -0.00041173043427988887, -0.00039195228600874543, -0.00037217416684143245, -0.00035239604767411947, -0.00033261789940297604, -0.00031283978023566306, -0.0002930616319645196, -0.00027328351279720664, -0.0002535053645260632, -0.00023372724535875022, -0.00021394912619143724, -0.00019417100702412426, -0.00017439287330489606, -0.00015461473958566785, -0.00013483662041835487, -0.00011505849397508428, -9.528036753181368e-05, -7.550224108854309e-05, -5.572411464527249e-05, -3.59459882020019e-05, -1.6167861758731306e-05, 3.6102719604969025e-06, 2.3388391127809882e-05, 4.3166517571080476e-05, 6.294464401435107e-05, 8.272277045762166e-05, 0.00010250089690089226, 0.00012227901606820524, 0.00014205714978743345, 0.00016183528350666165, 0.00018161340267397463, 0.0002013915218412876, 0.00022116965556051582, 0.00024094778927974403, 0.000260725908447057, 0.00028050402761437, 0.00030028214678168297, 0.0003200602950528264, 0.0003398384142201394]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 5.0, 7.0, 6.0, 5.0, 13.0, 13.0, 15.0, 16.0, 14.0, 23.0, 30.0, 39.0, 44.0, 31.0, 40.0, 36.0, 51.0, 52.0, 35.0, 52.0, 45.0, 57.0, 40.0, 43.0, 44.0, 41.0, 34.0, 32.0, 24.0, 26.0, 19.0, 14.0, 13.0, 8.0, 6.0, 7.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0003207006957381964, -0.00031171218142844737, -0.00030272366711869836, -0.00029373515280894935, -0.00028474663849920034, -0.00027575812418945134, -0.00026676960987970233, -0.0002577810955699533, -0.0002487925812602043, -0.0002398040669504553, -0.0002308155526407063, -0.0002218270383309573, -0.00021283852402120829, -0.00020385000971145928, -0.00019486149540171027, -0.00018587298109196126, -0.00017688445223029703, -0.00016789593792054802, -0.00015890742361079901, -0.00014991890930105, -0.000140930394991301, -0.000131941880681552, -0.00012295335181988776, -0.00011396484478609636, -0.00010497633047634736, -9.598781616659835e-05, -8.699930185684934e-05, -7.801078027114272e-05, -6.902226596139371e-05, -6.0033755289623514e-05, -5.10452373418957e-05, -4.205672303214669e-05, -3.3068208722397685e-05, -2.4079694412648678e-05, -1.5091178283910267e-05, -6.102662155171856e-06, 2.885852154577151e-06, 1.1874366464326158e-05, 2.0862884412053972e-05, 2.985139872180298e-05, 3.883991303155199e-05, 4.7828427341300994e-05, 5.681694165105e-05, 6.580546323675662e-05, 7.479397754650563e-05, 8.378249185625464e-05, 9.277100616600364e-05, 0.00010175952047575265, 0.00011074803478550166, 0.00011973654909525067, 0.00012872506340499967, 0.00013771357771474868, 0.0001467020920244977, 0.0001556906063342467, 0.00016467913519591093, 0.00017366764950565994, 0.00018265616381540895, 0.00019164467812515795, 0.00020063319243490696, 0.00020962170674465597, 0.00021861022105440497, 0.00022759873536415398, 0.000236587249673903, 0.000245575763983652, 0.000254564278293401]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 11.0, 4.0, 8.0, 13.0, 17.0, 18.0, 24.0, 30.0, 41.0, 68.0, 104.0, 120.0, 181.0, 281.0, 404.0, 679.0, 1196.0, 2483.0, 6631.0, 301587.0, 3860719.0, 12835.0, 3186.0, 1471.0, 759.0, 477.0, 308.0, 187.0, 112.0, 111.0, 53.0, 45.0, 27.0, 27.0, 14.0, 19.0, 9.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.00101470947265625, -0.000986635684967041, -0.000958561897277832, -0.000930488109588623, -0.0009024143218994141, -0.0008743405342102051, -0.0008462667465209961, -0.0008181929588317871, -0.0007901191711425781, -0.0007620453834533691, -0.0007339715957641602, -0.0007058978080749512, -0.0006778240203857422, -0.0006497502326965332, -0.0006216764450073242, -0.0005936026573181152, -0.0005655288696289062, -0.0005374550819396973, -0.0005093812942504883, -0.0004813075065612793, -0.0004532337188720703, -0.00042515993118286133, -0.00039708614349365234, -0.00036901235580444336, -0.0003409385681152344, -0.0003128647804260254, -0.0002847909927368164, -0.0002567172050476074, -0.00022864341735839844, -0.00020056962966918945, -0.00017249584197998047, -0.00014442205429077148, -0.0001163482666015625, -8.827447891235352e-05, -6.020069122314453e-05, -3.212690353393555e-05, -4.0531158447265625e-06, 2.4020671844482422e-05, 5.2094459533691406e-05, 8.016824722290039e-05, 0.00010824203491210938, 0.00013631582260131836, 0.00016438961029052734, 0.00019246339797973633, 0.0002205371856689453, 0.0002486109733581543, 0.0002766847610473633, 0.00030475854873657227, 0.00033283233642578125, 0.00036090612411499023, 0.0003889799118041992, 0.0004170536994934082, 0.0004451274871826172, 0.00047320127487182617, 0.0005012750625610352, 0.0005293488502502441, 0.0005574226379394531, 0.0005854964256286621, 0.0006135702133178711, 0.0006416440010070801, 0.0006697177886962891, 0.000697791576385498, 0.000725865364074707, 0.000753939151763916, 0.000782012939453125]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 4.0, 6.0, 3.0, 9.0, 6.0, 3.0, 13.0, 15.0, 15.0, 15.0, 25.0, 35.0, 33.0, 43.0, 42.0, 49.0, 27.0, 41.0, 51.0, 51.0, 53.0, 60.0, 46.0, 50.0, 45.0, 44.0, 40.0, 29.0, 27.0, 27.0, 22.0, 20.0, 12.0, 8.0, 8.0, 10.0, 2.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00025463104248046875, -0.0002471022307872772, -0.0002395734190940857, -0.00023204460740089417, -0.00022451579570770264, -0.0002169869840145111, -0.00020945817232131958, -0.00020192936062812805, -0.00019440054893493652, -0.000186871737241745, -0.00017934292554855347, -0.00017181411385536194, -0.0001642853021621704, -0.00015675649046897888, -0.00014922767877578735, -0.00014169886708259583, -0.0001341700553894043, -0.00012664124369621277, -0.00011911243200302124, -0.00011158362030982971, -0.00010405480861663818, -9.652599692344666e-05, -8.899718523025513e-05, -8.14683735370636e-05, -7.393956184387207e-05, -6.641075015068054e-05, -5.8881938457489014e-05, -5.1353126764297485e-05, -4.382431507110596e-05, -3.629550337791443e-05, -2.87666916847229e-05, -2.1237879991531372e-05, -1.3709068298339844e-05, -6.1802566051483154e-06, 1.3485550880432129e-06, 8.877366781234741e-06, 1.640617847442627e-05, 2.3934990167617798e-05, 3.1463801860809326e-05, 3.8992613554000854e-05, 4.652142524719238e-05, 5.405023694038391e-05, 6.157904863357544e-05, 6.910786032676697e-05, 7.66366720199585e-05, 8.416548371315002e-05, 9.169429540634155e-05, 9.922310709953308e-05, 0.00010675191879272461, 0.00011428073048591614, 0.00012180954217910767, 0.0001293383538722992, 0.00013686716556549072, 0.00014439597725868225, 0.00015192478895187378, 0.0001594536006450653, 0.00016698241233825684, 0.00017451122403144836, 0.0001820400357246399, 0.00018956884741783142, 0.00019709765911102295, 0.00020462647080421448, 0.000212155282497406, 0.00021968409419059753, 0.00022721290588378906]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 3.0, 14.0, 19.0, 68.0, 222.0, 777.0, 3629.0, 40508.0, 4135745.0, 10853.0, 1771.0, 469.0, 107.0, 46.0, 18.0, 8.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024566650390625, -0.002380579710006714, -0.0023044943809509277, -0.0022284090518951416, -0.0021523237228393555, -0.0020762383937835693, -0.002000153064727783, -0.001924067735671997, -0.001847982406616211, -0.0017718970775604248, -0.0016958117485046387, -0.0016197264194488525, -0.0015436410903930664, -0.0014675557613372803, -0.0013914704322814941, -0.001315385103225708, -0.0012392997741699219, -0.0011632144451141357, -0.0010871291160583496, -0.0010110437870025635, -0.0009349584579467773, -0.0008588731288909912, -0.0007827877998352051, -0.0007067024707794189, -0.0006306171417236328, -0.0005545318126678467, -0.00047844648361206055, -0.0004023611545562744, -0.0003262758255004883, -0.00025019049644470215, -0.00017410516738891602, -9.801983833312988e-05, -2.193450927734375e-05, 5.415081977844238e-05, 0.00013023614883422852, 0.00020632147789001465, 0.0002824068069458008, 0.0003584921360015869, 0.00043457746505737305, 0.0005106627941131592, 0.0005867481231689453, 0.0006628334522247314, 0.0007389187812805176, 0.0008150041103363037, 0.0008910894393920898, 0.000967174768447876, 0.0010432600975036621, 0.0011193454265594482, 0.0011954307556152344, 0.0012715160846710205, 0.0013476014137268066, 0.0014236867427825928, 0.001499772071838379, 0.001575857400894165, 0.0016519427299499512, 0.0017280280590057373, 0.0018041133880615234, 0.0018801987171173096, 0.0019562840461730957, 0.002032369375228882, 0.002108454704284668, 0.002184540033340454, 0.0022606253623962402, 0.0023367106914520264, 0.0024127960205078125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 15.0, 8.0, 19.0, 50.0, 135.0, 674.0, 2669.0, 333.0, 81.0, 31.0, 10.0, 9.0, 2.0, 4.0, 2.0, 4.0, 5.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018358230590820312, -0.00017787516117095947, -0.00017216801643371582, -0.00016646087169647217, -0.00016075372695922852, -0.00015504658222198486, -0.0001493394374847412, -0.00014363229274749756, -0.0001379251480102539, -0.00013221800327301025, -0.0001265108585357666, -0.00012080371379852295, -0.0001150965690612793, -0.00010938942432403564, -0.00010368227958679199, -9.797513484954834e-05, -9.226799011230469e-05, -8.656084537506104e-05, -8.085370063781738e-05, -7.514655590057373e-05, -6.943941116333008e-05, -6.373226642608643e-05, -5.8025121688842773e-05, -5.231797695159912e-05, -4.661083221435547e-05, -4.0903687477111816e-05, -3.5196542739868164e-05, -2.9489398002624512e-05, -2.378225326538086e-05, -1.8075108528137207e-05, -1.2367963790893555e-05, -6.660819053649902e-06, -9.5367431640625e-07, 4.753470420837402e-06, 1.0460615158081055e-05, 1.6167759895324707e-05, 2.187490463256836e-05, 2.7582049369812012e-05, 3.3289194107055664e-05, 3.8996338844299316e-05, 4.470348358154297e-05, 5.041062831878662e-05, 5.6117773056030273e-05, 6.182491779327393e-05, 6.753206253051758e-05, 7.323920726776123e-05, 7.894635200500488e-05, 8.465349674224854e-05, 9.036064147949219e-05, 9.606778621673584e-05, 0.00010177493095397949, 0.00010748207569122314, 0.0001131892204284668, 0.00011889636516571045, 0.0001246035099029541, 0.00013031065464019775, 0.0001360177993774414, 0.00014172494411468506, 0.0001474320888519287, 0.00015313923358917236, 0.00015884637832641602, 0.00016455352306365967, 0.00017026066780090332, 0.00017596781253814697, 0.00018167495727539062]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 2.0, 2.0, 6.0, 12.0, 11.0, 15.0, 15.0, 30.0, 46.0, 58.0, 89.0, 142.0, 170.0, 137.0, 88.0, 49.0, 39.0, 30.0, 16.0, 12.0, 14.0, 2.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005347136757336557, -0.0005218240548856556, -0.0005089343758299947, -0.0004960447549819946, -0.0004831551050301641, -0.0004702654550783336, -0.0004573758051265031, -0.0004444861551746726, -0.00043159653432667255, -0.00041870688437484205, -0.00040581723442301154, -0.0003929276135750115, -0.000380037963623181, -0.0003671483136713505, -0.00035425866371951997, -0.00034136901376768947, -0.00032847936381585896, -0.00031558971386402845, -0.00030270006391219795, -0.00028981041396036744, -0.0002769207931123674, -0.0002640311431605369, -0.0002511414932087064, -0.00023825184325687587, -0.0002253622078569606, -0.0002124725579051301, -0.0001995829225052148, -0.0001866932725533843, -0.0001738036226015538, -0.00016091398720163852, -0.000148024337249808, -0.00013513470184989274, -0.00012224505189806223, -0.00010935540922218934, -9.646576654631644e-05, -8.357611659448594e-05, -7.068647391861305e-05, -5.7796831242740154e-05, -4.490718129090965e-05, -3.2017538615036756e-05, -1.9127895939163864e-05, -6.238251444301568e-06, 6.651393050560728e-06, 1.9541039364412427e-05, 3.243068204028532e-05, 4.532032471615821e-05, 5.820997466798872e-05, 7.109961734386161e-05, 8.39892600197345e-05, 9.68789026956074e-05, 0.00010976854537148029, 0.0001226581953233108, 0.00013554783072322607, 0.00014843748067505658, 0.00016132713062688708, 0.0001742167805787176, 0.00018710641597863287, 0.00019999606593046337, 0.00021288570133037865, 0.00022577535128220916, 0.00023866500123403966, 0.00025155465118587017, 0.0002644442720338702, 0.0002773339219857007, 0.00029022357193753123]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 2.0, 4.0, 7.0, 4.0, 11.0, 12.0, 9.0, 21.0, 13.0, 26.0, 25.0, 17.0, 35.0, 30.0, 42.0, 29.0, 33.0, 46.0, 39.0, 45.0, 50.0, 36.0, 44.0, 50.0, 39.0, 38.0, 49.0, 36.0, 32.0, 24.0, 20.0, 23.0, 18.0, 17.0, 13.0, 14.0, 8.0, 13.0, 5.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018477697449270636, -0.00017835899780038744, -0.0001719410065561533, -0.00016552302986383438, -0.00015910505317151546, -0.00015268707647919655, -0.0001462690852349624, -0.0001398511085426435, -0.00013343313185032457, -0.00012701515515800565, -0.00012059717118972912, -0.0001141791872214526, -0.00010776121052913368, -0.00010134322656085715, -9.492524259258062e-05, -8.85072659002617e-05, -8.208928193198517e-05, -7.567129796370864e-05, -6.925332127138972e-05, -6.283533730311319e-05, -5.6417360610794276e-05, -4.9999376642517745e-05, -4.358139631222002e-05, -3.71634159819223e-05, -3.0745435651624575e-05, -2.4327455321326852e-05, -1.790947499102913e-05, -1.1491492841742001e-05, -5.073512511444278e-06, 1.344469637842849e-06, 7.762449968140572e-06, 1.4180430298438296e-05, 2.059841062873602e-05, 2.7016390959033743e-05, 3.3434371289331466e-05, 3.9852355257607996e-05, 4.627033194992691e-05, 5.268831591820344e-05, 5.910629624850117e-05, 6.552427657879889e-05, 7.19422532711178e-05, 7.836023723939434e-05, 8.477821393171325e-05, 9.119619789998978e-05, 9.76141745923087e-05, 0.00010403215856058523, 0.00011045014252886176, 0.00011686811922118068, 0.0001232860959134996, 0.0001297040726058185, 0.00013612206385005265, 0.00014254004054237157, 0.0001489580172346905, 0.00015537600847892463, 0.00016179398517124355, 0.00016821196186356246, 0.0001746299531077966, 0.00018104792980011553, 0.00018746592104434967, 0.0001938838977366686, 0.0002003018744289875, 0.00020671985112130642, 0.00021313784236554056, 0.00021955581905785948, 0.0002259737957501784]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 6.0, 6.0, 14.0, 22.0, 30.0, 36.0, 40.0, 54.0, 82.0, 108.0, 185.0, 233.0, 343.0, 571.0, 745.0, 1273.0, 2007.0, 3047.0, 5356.0, 10078.0, 19883.0, 44000.0, 116645.0, 382268.0, 295496.0, 91578.0, 36609.0, 16520.0, 8403.0, 4825.0, 2885.0, 1748.0, 1112.0, 739.0, 487.0, 299.0, 252.0, 180.0, 129.0, 82.0, 60.0, 27.0, 32.0, 19.0, 11.0, 8.0, 9.0, 4.0, 4.0, 2.0, 4.0, 2.0, 4.0], "bins": [-0.0006518363952636719, -0.0006331503391265869, -0.000614464282989502, -0.000595778226852417, -0.000577092170715332, -0.0005584061145782471, -0.0005397200584411621, -0.0005210340023040771, -0.0005023479461669922, -0.0004836618900299072, -0.00046497583389282227, -0.0004462897777557373, -0.00042760372161865234, -0.0004089176654815674, -0.0003902316093444824, -0.00037154555320739746, -0.0003528594970703125, -0.00033417344093322754, -0.0003154873847961426, -0.0002968013286590576, -0.00027811527252197266, -0.0002594292163848877, -0.00024074316024780273, -0.00022205710411071777, -0.0002033710479736328, -0.00018468499183654785, -0.0001659989356994629, -0.00014731287956237793, -0.00012862682342529297, -0.00010994076728820801, -9.125471115112305e-05, -7.256865501403809e-05, -5.3882598876953125e-05, -3.5196542739868164e-05, -1.6510486602783203e-05, 2.175569534301758e-06, 2.086162567138672e-05, 3.954768180847168e-05, 5.823373794555664e-05, 7.69197940826416e-05, 9.560585021972656e-05, 0.00011429190635681152, 0.00013297796249389648, 0.00015166401863098145, 0.0001703500747680664, 0.00018903613090515137, 0.00020772218704223633, 0.0002264082431793213, 0.00024509429931640625, 0.0002637803554534912, 0.00028246641159057617, 0.00030115246772766113, 0.0003198385238647461, 0.00033852458000183105, 0.000357210636138916, 0.000375896692276001, 0.00039458274841308594, 0.0004132688045501709, 0.00043195486068725586, 0.0004506409168243408, 0.0004693269729614258, 0.00048801302909851074, 0.0005066990852355957, 0.0005253851413726807, 0.0005440711975097656]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 9.0, 9.0, 7.0, 9.0, 8.0, 16.0, 15.0, 15.0, 21.0, 21.0, 29.0, 30.0, 29.0, 34.0, 45.0, 51.0, 51.0, 50.0, 34.0, 41.0, 40.0, 42.0, 36.0, 48.0, 41.0, 38.0, 37.0, 29.0, 33.0, 23.0, 28.0, 22.0, 9.0, 15.0, 5.0, 5.0, 9.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.000217437744140625, -0.00021149218082427979, -0.00020554661750793457, -0.00019960105419158936, -0.00019365549087524414, -0.00018770992755889893, -0.0001817643642425537, -0.0001758188009262085, -0.00016987323760986328, -0.00016392767429351807, -0.00015798211097717285, -0.00015203654766082764, -0.00014609098434448242, -0.0001401454210281372, -0.000134199857711792, -0.00012825429439544678, -0.00012230873107910156, -0.00011636316776275635, -0.00011041760444641113, -0.00010447204113006592, -9.85264778137207e-05, -9.258091449737549e-05, -8.663535118103027e-05, -8.068978786468506e-05, -7.474422454833984e-05, -6.879866123199463e-05, -6.285309791564941e-05, -5.69075345993042e-05, -5.0961971282958984e-05, -4.501640796661377e-05, -3.9070844650268555e-05, -3.312528133392334e-05, -2.7179718017578125e-05, -2.123415470123291e-05, -1.5288591384887695e-05, -9.34302806854248e-06, -3.3974647521972656e-06, 2.5480985641479492e-06, 8.493661880493164e-06, 1.4439225196838379e-05, 2.0384788513183594e-05, 2.633035182952881e-05, 3.2275915145874023e-05, 3.822147846221924e-05, 4.416704177856445e-05, 5.011260509490967e-05, 5.605816841125488e-05, 6.20037317276001e-05, 6.794929504394531e-05, 7.389485836029053e-05, 7.984042167663574e-05, 8.578598499298096e-05, 9.173154830932617e-05, 9.767711162567139e-05, 0.0001036226749420166, 0.00010956823825836182, 0.00011551380157470703, 0.00012145936489105225, 0.00012740492820739746, 0.00013335049152374268, 0.0001392960548400879, 0.0001452416181564331, 0.00015118718147277832, 0.00015713274478912354, 0.00016307830810546875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 2.0, 5.0, 2.0, 8.0, 17.0, 18.0, 31.0, 33.0, 31.0, 46.0, 70.0, 103.0, 134.0, 175.0, 224.0, 313.0, 387.0, 592.0, 798.0, 1187.0, 1776.0, 2807.0, 4614.0, 8592.0, 17069.0, 45166.0, 330660.0, 539014.0, 52534.0, 18708.0, 8978.0, 5043.0, 2991.0, 1949.0, 1281.0, 883.0, 638.0, 414.0, 330.0, 248.0, 190.0, 133.0, 106.0, 70.0, 55.0, 32.0, 20.0, 26.0, 16.0, 5.0, 13.0, 5.0, 7.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006833076477050781, -0.0006613060832023621, -0.000639304518699646, -0.0006173029541969299, -0.0005953013896942139, -0.0005732998251914978, -0.0005512982606887817, -0.0005292966961860657, -0.0005072951316833496, -0.00048529356718063354, -0.0004632920026779175, -0.0004412904381752014, -0.00041928887367248535, -0.0003972873091697693, -0.0003752857446670532, -0.00035328418016433716, -0.0003312826156616211, -0.00030928105115890503, -0.00028727948665618896, -0.0002652779221534729, -0.00024327635765075684, -0.00022127479314804077, -0.0001992732286453247, -0.00017727166414260864, -0.00015527009963989258, -0.00013326853513717651, -0.00011126697063446045, -8.926540613174438e-05, -6.726384162902832e-05, -4.5262277126312256e-05, -2.326071262359619e-05, -1.259148120880127e-06, 2.0742416381835938e-05, 4.2743980884552e-05, 6.474554538726807e-05, 8.674710988998413e-05, 0.0001087486743927002, 0.00013075023889541626, 0.00015275180339813232, 0.0001747533679008484, 0.00019675493240356445, 0.00021875649690628052, 0.00024075806140899658, 0.00026275962591171265, 0.0002847611904144287, 0.0003067627549171448, 0.00032876431941986084, 0.0003507658839225769, 0.00037276744842529297, 0.00039476901292800903, 0.0004167705774307251, 0.00043877214193344116, 0.0004607737064361572, 0.0004827752709388733, 0.0005047768354415894, 0.0005267783999443054, 0.0005487799644470215, 0.0005707815289497375, 0.0005927830934524536, 0.0006147846579551697, 0.0006367862224578857, 0.0006587877869606018, 0.0006807893514633179, 0.0007027909159660339, 0.00072479248046875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 13.0, 3.0, 11.0, 8.0, 6.0, 6.0, 13.0, 13.0, 10.0, 12.0, 22.0, 22.0, 27.0, 32.0, 36.0, 23.0, 27.0, 33.0, 40.0, 43.0, 48.0, 34.0, 36.0, 36.0, 37.0, 29.0, 31.0, 36.0, 37.0, 34.0, 27.0, 24.0, 25.0, 29.0, 16.0, 18.0, 10.0, 19.0, 11.0, 9.0, 13.0, 6.0, 5.0, 5.0, 8.0, 3.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00010335445404052734, -0.00010002404451370239, -9.669363498687744e-05, -9.336322546005249e-05, -9.003281593322754e-05, -8.670240640640259e-05, -8.337199687957764e-05, -8.004158735275269e-05, -7.671117782592773e-05, -7.338076829910278e-05, -7.005035877227783e-05, -6.671994924545288e-05, -6.338953971862793e-05, -6.005913019180298e-05, -5.672872066497803e-05, -5.3398311138153076e-05, -5.0067901611328125e-05, -4.6737492084503174e-05, -4.340708255767822e-05, -4.007667303085327e-05, -3.674626350402832e-05, -3.341585397720337e-05, -3.0085444450378418e-05, -2.6755034923553467e-05, -2.3424625396728516e-05, -2.0094215869903564e-05, -1.6763806343078613e-05, -1.3433396816253662e-05, -1.0102987289428711e-05, -6.77257776260376e-06, -3.4421682357788086e-06, -1.1175870895385742e-07, 3.2186508178710938e-06, 6.549060344696045e-06, 9.879469871520996e-06, 1.3209879398345947e-05, 1.65402889251709e-05, 1.987069845199585e-05, 2.32011079788208e-05, 2.6531517505645752e-05, 2.9861927032470703e-05, 3.3192336559295654e-05, 3.6522746086120605e-05, 3.985315561294556e-05, 4.318356513977051e-05, 4.651397466659546e-05, 4.984438419342041e-05, 5.317479372024536e-05, 5.650520324707031e-05, 5.9835612773895264e-05, 6.316602230072021e-05, 6.649643182754517e-05, 6.982684135437012e-05, 7.315725088119507e-05, 7.648766040802002e-05, 7.981806993484497e-05, 8.314847946166992e-05, 8.647888898849487e-05, 8.980929851531982e-05, 9.313970804214478e-05, 9.647011756896973e-05, 9.980052709579468e-05, 0.00010313093662261963, 0.00010646134614944458, 0.00010979175567626953]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 2.0, 8.0, 8.0, 4.0, 14.0, 16.0, 22.0, 31.0, 38.0, 54.0, 68.0, 99.0, 126.0, 164.0, 236.0, 340.0, 507.0, 715.0, 1170.0, 1852.0, 3375.0, 6895.0, 18369.0, 91192.0, 815002.0, 76185.0, 17021.0, 6397.0, 3214.0, 1808.0, 1140.0, 758.0, 501.0, 359.0, 239.0, 167.0, 124.0, 74.0, 59.0, 41.0, 41.0, 27.0, 20.0, 20.0, 12.0, 10.0, 3.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.0007023811340332031, -0.0006793215870857239, -0.0006562620401382446, -0.0006332024931907654, -0.0006101429462432861, -0.0005870833992958069, -0.0005640238523483276, -0.0005409643054008484, -0.0005179047584533691, -0.0004948452115058899, -0.00047178566455841064, -0.0004487261176109314, -0.00042566657066345215, -0.0004026070237159729, -0.00037954747676849365, -0.0003564879298210144, -0.00033342838287353516, -0.0003103688359260559, -0.00028730928897857666, -0.0002642497420310974, -0.00024119019508361816, -0.00021813064813613892, -0.00019507110118865967, -0.00017201155424118042, -0.00014895200729370117, -0.00012589246034622192, -0.00010283291339874268, -7.977336645126343e-05, -5.671381950378418e-05, -3.365427255630493e-05, -1.0594725608825684e-05, 1.2464821338653564e-05, 3.552436828613281e-05, 5.858391523361206e-05, 8.164346218109131e-05, 0.00010470300912857056, 0.0001277625560760498, 0.00015082210302352905, 0.0001738816499710083, 0.00019694119691848755, 0.0002200007438659668, 0.00024306029081344604, 0.0002661198377609253, 0.00028917938470840454, 0.0003122389316558838, 0.00033529847860336304, 0.0003583580255508423, 0.00038141757249832153, 0.0004044771194458008, 0.00042753666639328003, 0.0004505962133407593, 0.0004736557602882385, 0.0004967153072357178, 0.000519774854183197, 0.0005428344011306763, 0.0005658939480781555, 0.0005889534950256348, 0.000612013041973114, 0.0006350725889205933, 0.0006581321358680725, 0.0006811916828155518, 0.000704251229763031, 0.0007273107767105103, 0.0007503703236579895, 0.0007734298706054688]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 11.0, 5.0, 14.0, 13.0, 19.0, 16.0, 25.0, 28.0, 40.0, 32.0, 48.0, 50.0, 215.0, 135.0, 42.0, 51.0, 46.0, 48.0, 29.0, 28.0, 11.0, 19.0, 16.0, 14.0, 6.0, 5.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.288818359375e-05, -2.2231601178646088e-05, -2.1575018763542175e-05, -2.0918436348438263e-05, -2.026185393333435e-05, -1.9605271518230438e-05, -1.8948689103126526e-05, -1.8292106688022614e-05, -1.76355242729187e-05, -1.697894185781479e-05, -1.6322359442710876e-05, -1.5665777027606964e-05, -1.5009194612503052e-05, -1.435261219739914e-05, -1.3696029782295227e-05, -1.3039447367191315e-05, -1.2382864952087402e-05, -1.172628253698349e-05, -1.1069700121879578e-05, -1.0413117706775665e-05, -9.756535291671753e-06, -9.09995287656784e-06, -8.443370461463928e-06, -7.786788046360016e-06, -7.1302056312561035e-06, -6.473623216152191e-06, -5.817040801048279e-06, -5.1604583859443665e-06, -4.503875970840454e-06, -3.847293555736542e-06, -3.1907111406326294e-06, -2.534128725528717e-06, -1.8775463104248047e-06, -1.2209638953208923e-06, -5.6438148021698e-07, 9.220093488693237e-08, 7.487833499908447e-07, 1.405365765094757e-06, 2.0619481801986694e-06, 2.7185305953025818e-06, 3.375113010406494e-06, 4.0316954255104065e-06, 4.688277840614319e-06, 5.344860255718231e-06, 6.0014426708221436e-06, 6.658025085926056e-06, 7.314607501029968e-06, 7.97118991613388e-06, 8.627772331237793e-06, 9.284354746341705e-06, 9.940937161445618e-06, 1.059751957654953e-05, 1.1254101991653442e-05, 1.1910684406757355e-05, 1.2567266821861267e-05, 1.322384923696518e-05, 1.3880431652069092e-05, 1.4537014067173004e-05, 1.5193596482276917e-05, 1.585017889738083e-05, 1.650676131248474e-05, 1.7163343727588654e-05, 1.7819926142692566e-05, 1.8476508557796478e-05, 1.913309097290039e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 4.0, 6.0, 4.0, 5.0, 8.0, 8.0, 19.0, 38.0, 79.0, 229.0, 890.0, 5719.0, 680448.0, 354543.0, 5206.0, 906.0, 226.0, 95.0, 53.0, 20.0, 12.0, 8.0, 8.0, 4.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028629302978515625, -0.002787560224533081, -0.0027121901512145996, -0.002636820077896118, -0.0025614500045776367, -0.0024860799312591553, -0.002410709857940674, -0.0023353397846221924, -0.002259969711303711, -0.0021845996379852295, -0.002109229564666748, -0.0020338594913482666, -0.001958489418029785, -0.0018831193447113037, -0.0018077492713928223, -0.0017323791980743408, -0.0016570091247558594, -0.001581639051437378, -0.0015062689781188965, -0.001430898904800415, -0.0013555288314819336, -0.0012801587581634521, -0.0012047886848449707, -0.0011294186115264893, -0.0010540485382080078, -0.0009786784648895264, -0.0009033083915710449, -0.0008279383182525635, -0.000752568244934082, -0.0006771981716156006, -0.0006018280982971191, -0.0005264580249786377, -0.00045108795166015625, -0.0003757178783416748, -0.00030034780502319336, -0.00022497773170471191, -0.00014960765838623047, -7.423758506774902e-05, 1.1324882507324219e-06, 7.650256156921387e-05, 0.0001518726348876953, 0.00022724270820617676, 0.0003026127815246582, 0.00037798285484313965, 0.0004533529281616211, 0.0005287230014801025, 0.000604093074798584, 0.0006794631481170654, 0.0007548332214355469, 0.0008302032947540283, 0.0009055733680725098, 0.0009809434413909912, 0.0010563135147094727, 0.001131683588027954, 0.0012070536613464355, 0.001282423734664917, 0.0013577938079833984, 0.0014331638813018799, 0.0015085339546203613, 0.0015839040279388428, 0.0016592741012573242, 0.0017346441745758057, 0.0018100142478942871, 0.0018853843212127686, 0.00196075439453125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 4.0, 5.0, 12.0, 6.0, 18.0, 24.0, 30.0, 44.0, 69.0, 80.0, 131.0, 271.0, 87.0, 57.0, 39.0, 29.0, 22.0, 14.0, 11.0, 7.0, 4.0, 3.0, 3.0, 5.0, 3.0, 7.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.638071060180664e-05, -9.269360452890396e-05, -8.900649845600128e-05, -8.53193923830986e-05, -8.163228631019592e-05, -7.794518023729324e-05, -7.425807416439056e-05, -7.057096809148788e-05, -6.68838620185852e-05, -6.319675594568253e-05, -5.9509649872779846e-05, -5.582254379987717e-05, -5.213543772697449e-05, -4.844833165407181e-05, -4.476122558116913e-05, -4.107411950826645e-05, -3.738701343536377e-05, -3.369990736246109e-05, -3.001280128955841e-05, -2.632569521665573e-05, -2.2638589143753052e-05, -1.8951483070850372e-05, -1.5264376997947693e-05, -1.1577270925045013e-05, -7.890164852142334e-06, -4.2030587792396545e-06, -5.159527063369751e-07, 3.1711533665657043e-06, 6.858259439468384e-06, 1.0545365512371063e-05, 1.4232471585273743e-05, 1.7919577658176422e-05, 2.16066837310791e-05, 2.529378980398178e-05, 2.898089587688446e-05, 3.266800194978714e-05, 3.635510802268982e-05, 4.00422140955925e-05, 4.372932016849518e-05, 4.741642624139786e-05, 5.110353231430054e-05, 5.4790638387203217e-05, 5.8477744460105896e-05, 6.216485053300858e-05, 6.585195660591125e-05, 6.953906267881393e-05, 7.322616875171661e-05, 7.691327482461929e-05, 8.060038089752197e-05, 8.428748697042465e-05, 8.797459304332733e-05, 9.166169911623001e-05, 9.534880518913269e-05, 9.903591126203537e-05, 0.00010272301733493805, 0.00010641012340784073, 0.00011009722948074341, 0.00011378433555364609, 0.00011747144162654877, 0.00012115854769945145, 0.00012484565377235413, 0.0001285327598452568, 0.00013221986591815948, 0.00013590697199106216, 0.00013959407806396484]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 10.0, 15.0, 13.0, 27.0, 48.0, 51.0, 108.0, 163.0, 143.0, 89.0, 75.0, 59.0, 42.0, 24.0, 26.0, 18.0, 13.0, 17.0, 10.0, 6.0, 3.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003027108032256365, -0.00029292784165591, -0.00028314488008618355, -0.00027336194762028754, -0.00026357898605056107, -0.0002537960244808346, -0.00024401306291110814, -0.00023423010134138167, -0.00022444715432357043, -0.00021466419275384396, -0.00020488124573603272, -0.00019509828416630626, -0.0001853153225965798, -0.00017553237557876855, -0.00016574941400904208, -0.00015596646699123085, -0.00014618350542150438, -0.0001364005438517779, -0.00012661759683396667, -0.0001168346352642402, -0.00010705168097047135, -9.72687266767025e-05, -8.748576510697603e-05, -7.770281081320718e-05, -6.791985651943833e-05, -5.8136902225669473e-05, -4.835394429392181e-05, -3.857098636217415e-05, -2.87880320684053e-05, -1.9005077774636447e-05, -9.222119842888787e-06, 5.608380888588727e-07, 1.0343821486458182e-05, 2.012677759921644e-05, 2.9909733711974695e-05, 3.9692691643722355e-05, 4.947564593749121e-05, 5.925860023126006e-05, 6.904156180098653e-05, 7.882451609475538e-05, 8.860747038852423e-05, 9.839042468229309e-05, 0.00010817337897606194, 0.00011795634054578841, 0.00012773930211551487, 0.0001375222491333261, 0.00014730521070305258, 0.00015708815772086382, 0.00016687111929059029, 0.00017665408086031675, 0.000186437027878128, 0.00019621998944785446, 0.0002060029364656657, 0.00021578589803539217, 0.00022556885960511863, 0.0002353518211748451, 0.0002451347536407411, 0.0002549177152104676, 0.00026470067678019404, 0.00027448360924609005, 0.0002842665708158165, 0.000294049532385543, 0.00030383249395526946, 0.0003136154555249959, 0.0003233984170947224]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 5.0, 4.0, 4.0, 4.0, 5.0, 13.0, 11.0, 9.0, 19.0, 16.0, 24.0, 26.0, 25.0, 32.0, 24.0, 39.0, 36.0, 28.0, 47.0, 50.0, 50.0, 43.0, 41.0, 53.0, 51.0, 44.0, 36.0, 36.0, 26.0, 28.0, 35.0, 23.0, 15.0, 26.0, 11.0, 10.0, 11.0, 8.0, 14.0, 3.0, 9.0, 4.0, 2.0, 1.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015145477664191276, -0.0001459842169424519, -0.00014051365724299103, -0.00013504309754353017, -0.00012957252329215407, -0.0001241019635926932, -0.00011863140389323235, -0.00011316084419377148, -0.00010769028449431062, -0.00010221972479484975, -9.674916509538889e-05, -9.127859811997041e-05, -8.580803842050955e-05, -8.033747872104868e-05, -7.48669117456302e-05, -6.939635204616934e-05, -6.392579234670848e-05, -5.845523264724761e-05, -5.298466930980794e-05, -4.751410597236827e-05, -4.2043546272907406e-05, -3.657298657344654e-05, -3.110242323600687e-05, -2.56318598985672e-05, -2.0161300199106336e-05, -1.4690738680656068e-05, -9.2201771622058e-06, -3.749615643755533e-06, 1.7209458746947348e-06, 7.1915073931450024e-06, 1.266206891159527e-05, 1.813263224903494e-05, 2.3603206500411034e-05, 2.90737680188613e-05, 3.454432953731157e-05, 4.001489287475124e-05, 4.5485452574212104e-05, 5.095601227367297e-05, 5.642657561111264e-05, 6.189713894855231e-05, 6.736769864801317e-05, 7.283825834747404e-05, 7.83088180469349e-05, 8.377938502235338e-05, 8.924994472181424e-05, 9.472050442127511e-05, 0.00010019107139669359, 0.00010566163109615445, 0.00011113219079561532, 0.00011660275049507618, 0.00012207331019453704, 0.0001275438698939979, 0.00013301442959345877, 0.00013848500384483486, 0.00014395556354429573, 0.0001494261232437566, 0.00015489668294321746, 0.00016036724264267832, 0.00016583780234213918, 0.00017130836204160005, 0.00017677893629297614, 0.000182249495992437, 0.00018772005569189787, 0.00019319061539135873, 0.0001986611750908196]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 1.0, 4.0, 13.0, 11.0, 28.0, 37.0, 59.0, 78.0, 124.0, 181.0, 301.0, 444.0, 629.0, 954.0, 1622.0, 2480.0, 3927.0, 6584.0, 10822.0, 18921.0, 33726.0, 64246.0, 135818.0, 305454.0, 240643.0, 103152.0, 51127.0, 27742.0, 15598.0, 9012.0, 5600.0, 3309.0, 2119.0, 1280.0, 817.0, 537.0, 402.0, 243.0, 181.0, 105.0, 59.0, 60.0, 38.0, 25.0, 14.0, 9.0, 9.0, 5.0, 1.0, 5.0, 4.0], "bins": [-0.0004036426544189453, -0.00039268285036087036, -0.0003817230463027954, -0.00037076324224472046, -0.0003598034381866455, -0.00034884363412857056, -0.0003378838300704956, -0.00032692402601242065, -0.0003159642219543457, -0.00030500441789627075, -0.0002940446138381958, -0.00028308480978012085, -0.0002721250057220459, -0.00026116520166397095, -0.000250205397605896, -0.00023924559354782104, -0.0002282857894897461, -0.00021732598543167114, -0.0002063661813735962, -0.00019540637731552124, -0.0001844465732574463, -0.00017348676919937134, -0.0001625269651412964, -0.00015156716108322144, -0.00014060735702514648, -0.00012964755296707153, -0.00011868774890899658, -0.00010772794485092163, -9.676814079284668e-05, -8.580833673477173e-05, -7.484853267669678e-05, -6.388872861862183e-05, -5.2928924560546875e-05, -4.1969120502471924e-05, -3.100931644439697e-05, -2.004951238632202e-05, -9.08970832824707e-06, 1.8700957298278809e-06, 1.2829899787902832e-05, 2.3789703845977783e-05, 3.4749507904052734e-05, 4.5709311962127686e-05, 5.666911602020264e-05, 6.762892007827759e-05, 7.858872413635254e-05, 8.954852819442749e-05, 0.00010050833225250244, 0.00011146813631057739, 0.00012242794036865234, 0.0001333877444267273, 0.00014434754848480225, 0.0001553073525428772, 0.00016626715660095215, 0.0001772269606590271, 0.00018818676471710205, 0.000199146568775177, 0.00021010637283325195, 0.0002210661768913269, 0.00023202598094940186, 0.0002429857850074768, 0.00025394558906555176, 0.0002649053931236267, 0.00027586519718170166, 0.0002868250012397766, 0.00029778480529785156]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 4.0, 6.0, 4.0, 12.0, 21.0, 15.0, 17.0, 23.0, 34.0, 25.0, 32.0, 40.0, 45.0, 30.0, 48.0, 49.0, 47.0, 57.0, 45.0, 41.0, 54.0, 36.0, 40.0, 41.0, 28.0, 31.0, 22.0, 23.0, 26.0, 16.0, 16.0, 13.0, 13.0, 6.0, 5.0, 5.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.00010329484939575195, -0.00010046642273664474, -9.763799607753754e-05, -9.480956941843033e-05, -9.198114275932312e-05, -8.915271610021591e-05, -8.63242894411087e-05, -8.34958627820015e-05, -8.066743612289429e-05, -7.783900946378708e-05, -7.501058280467987e-05, -7.218215614557266e-05, -6.935372948646545e-05, -6.652530282735825e-05, -6.369687616825104e-05, -6.086844950914383e-05, -5.804002285003662e-05, -5.521159619092941e-05, -5.2383169531822205e-05, -4.9554742872714996e-05, -4.672631621360779e-05, -4.389788955450058e-05, -4.106946289539337e-05, -3.824103623628616e-05, -3.5412609577178955e-05, -3.258418291807175e-05, -2.975575625896454e-05, -2.692732959985733e-05, -2.4098902940750122e-05, -2.1270476281642914e-05, -1.8442049622535706e-05, -1.5613622963428497e-05, -1.2785196304321289e-05, -9.95676964521408e-06, -7.1283429861068726e-06, -4.299916326999664e-06, -1.471489667892456e-06, 1.3569369912147522e-06, 4.1853636503219604e-06, 7.013790309429169e-06, 9.842216968536377e-06, 1.2670643627643585e-05, 1.5499070286750793e-05, 1.8327496945858002e-05, 2.115592360496521e-05, 2.3984350264072418e-05, 2.6812776923179626e-05, 2.9641203582286835e-05, 3.246963024139404e-05, 3.529805690050125e-05, 3.812648355960846e-05, 4.095491021871567e-05, 4.3783336877822876e-05, 4.6611763536930084e-05, 4.944019019603729e-05, 5.22686168551445e-05, 5.509704351425171e-05, 5.792547017335892e-05, 6.0753896832466125e-05, 6.358232349157333e-05, 6.641075015068054e-05, 6.923917680978775e-05, 7.206760346889496e-05, 7.489603012800217e-05, 7.772445678710938e-05]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 5.0, 23.0, 18.0, 22.0, 36.0, 60.0, 78.0, 137.0, 232.0, 399.0, 676.0, 1211.0, 2116.0, 4123.0, 7952.0, 15599.0, 32882.0, 76374.0, 214568.0, 411919.0, 163261.0, 61387.0, 27357.0, 13368.0, 6681.0, 3530.0, 1969.0, 1059.0, 588.0, 340.0, 213.0, 126.0, 80.0, 54.0, 28.0, 25.0, 11.0, 15.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00030231475830078125, -0.00029202550649642944, -0.00028173625469207764, -0.00027144700288772583, -0.000261157751083374, -0.0002508684992790222, -0.0002405792474746704, -0.0002302899956703186, -0.0002200007438659668, -0.000209711492061615, -0.00019942224025726318, -0.00018913298845291138, -0.00017884373664855957, -0.00016855448484420776, -0.00015826523303985596, -0.00014797598123550415, -0.00013768672943115234, -0.00012739747762680054, -0.00011710822582244873, -0.00010681897401809692, -9.652972221374512e-05, -8.624047040939331e-05, -7.59512186050415e-05, -6.56619668006897e-05, -5.537271499633789e-05, -4.5083463191986084e-05, -3.479421138763428e-05, -2.450495958328247e-05, -1.4215707778930664e-05, -3.926455974578857e-06, 6.362795829772949e-06, 1.6652047634124756e-05, 2.6941299438476562e-05, 3.723055124282837e-05, 4.7519803047180176e-05, 5.780905485153198e-05, 6.809830665588379e-05, 7.83875584602356e-05, 8.86768102645874e-05, 9.896606206893921e-05, 0.00010925531387329102, 0.00011954456567764282, 0.00012983381748199463, 0.00014012306928634644, 0.00015041232109069824, 0.00016070157289505005, 0.00017099082469940186, 0.00018128007650375366, 0.00019156932830810547, 0.00020185858011245728, 0.00021214783191680908, 0.0002224370837211609, 0.0002327263355255127, 0.0002430155873298645, 0.0002533048391342163, 0.0002635940909385681, 0.0002738833427429199, 0.00028417259454727173, 0.00029446184635162354, 0.00030475109815597534, 0.00031504034996032715, 0.00032532960176467896, 0.00033561885356903076, 0.00034590810537338257, 0.0003561973571777344]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 7.0, 9.0, 13.0, 11.0, 21.0, 24.0, 22.0, 19.0, 21.0, 29.0, 38.0, 32.0, 48.0, 43.0, 58.0, 44.0, 40.0, 39.0, 48.0, 38.0, 33.0, 40.0, 37.0, 38.0, 30.0, 34.0, 28.0, 20.0, 17.0, 19.0, 18.0, 7.0, 18.0, 6.0, 15.0, 5.0, 9.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-8.153915405273438e-05, -7.914472371339798e-05, -7.675029337406158e-05, -7.435586303472519e-05, -7.19614326953888e-05, -6.95670023560524e-05, -6.7172572016716e-05, -6.477814167737961e-05, -6.238371133804321e-05, -5.998928099870682e-05, -5.759485065937042e-05, -5.520042032003403e-05, -5.280598998069763e-05, -5.0411559641361237e-05, -4.801712930202484e-05, -4.5622698962688446e-05, -4.322826862335205e-05, -4.0833838284015656e-05, -3.843940794467926e-05, -3.6044977605342865e-05, -3.365054726600647e-05, -3.1256116926670074e-05, -2.886168658733368e-05, -2.6467256247997284e-05, -2.407282590866089e-05, -2.1678395569324493e-05, -1.9283965229988098e-05, -1.6889534890651703e-05, -1.4495104551315308e-05, -1.2100674211978912e-05, -9.706243872642517e-06, -7.311813533306122e-06, -4.9173831939697266e-06, -2.5229528546333313e-06, -1.2852251529693604e-07, 2.2659078240394592e-06, 4.6603381633758545e-06, 7.05476850271225e-06, 9.449198842048645e-06, 1.184362918138504e-05, 1.4238059520721436e-05, 1.663248986005783e-05, 1.9026920199394226e-05, 2.142135053873062e-05, 2.3815780878067017e-05, 2.6210211217403412e-05, 2.8604641556739807e-05, 3.09990718960762e-05, 3.33935022354126e-05, 3.578793257474899e-05, 3.818236291408539e-05, 4.0576793253421783e-05, 4.297122359275818e-05, 4.5365653932094574e-05, 4.776008427143097e-05, 5.0154514610767365e-05, 5.254894495010376e-05, 5.4943375289440155e-05, 5.733780562877655e-05, 5.9732235968112946e-05, 6.212666630744934e-05, 6.452109664678574e-05, 6.691552698612213e-05, 6.930995732545853e-05, 7.170438766479492e-05]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 2.0, 11.0, 10.0, 16.0, 21.0, 35.0, 42.0, 57.0, 91.0, 149.0, 212.0, 342.0, 562.0, 852.0, 1717.0, 3289.0, 7363.0, 20394.0, 86592.0, 713619.0, 163849.0, 30385.0, 9925.0, 4112.0, 2032.0, 1088.0, 607.0, 391.0, 280.0, 146.0, 101.0, 85.0, 48.0, 39.0, 22.0, 14.0, 10.0, 13.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.1113624572753906e-05, -3.0160881578922272e-05, -2.9208138585090637e-05, -2.8255395591259003e-05, -2.7302652597427368e-05, -2.6349909603595734e-05, -2.53971666097641e-05, -2.4444423615932465e-05, -2.349168062210083e-05, -2.2538937628269196e-05, -2.158619463443756e-05, -2.0633451640605927e-05, -1.9680708646774292e-05, -1.8727965652942657e-05, -1.7775222659111023e-05, -1.682247966527939e-05, -1.5869736671447754e-05, -1.491699367761612e-05, -1.3964250683784485e-05, -1.301150768995285e-05, -1.2058764696121216e-05, -1.1106021702289581e-05, -1.0153278708457947e-05, -9.200535714626312e-06, -8.247792720794678e-06, -7.295049726963043e-06, -6.342306733131409e-06, -5.389563739299774e-06, -4.43682074546814e-06, -3.484077751636505e-06, -2.5313347578048706e-06, -1.578591763973236e-06, -6.258487701416016e-07, 3.2689422369003296e-07, 1.2796372175216675e-06, 2.232380211353302e-06, 3.1851232051849365e-06, 4.137866199016571e-06, 5.0906091928482056e-06, 6.04335218667984e-06, 6.996095180511475e-06, 7.948838174343109e-06, 8.901581168174744e-06, 9.854324162006378e-06, 1.0807067155838013e-05, 1.1759810149669647e-05, 1.2712553143501282e-05, 1.3665296137332916e-05, 1.461803913116455e-05, 1.5570782124996185e-05, 1.652352511882782e-05, 1.7476268112659454e-05, 1.842901110649109e-05, 1.9381754100322723e-05, 2.0334497094154358e-05, 2.1287240087985992e-05, 2.2239983081817627e-05, 2.319272607564926e-05, 2.4145469069480896e-05, 2.509821206331253e-05, 2.6050955057144165e-05, 2.70036980509758e-05, 2.7956441044807434e-05, 2.890918403863907e-05, 2.9861927032470703e-05]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 2.0, 9.0, 5.0, 7.0, 21.0, 14.0, 14.0, 22.0, 68.0, 37.0, 55.0, 70.0, 227.0, 107.0, 86.0, 53.0, 75.0, 20.0, 26.0, 27.0, 10.0, 15.0, 5.0, 10.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0265579223632812e-06, -1.9511207938194275e-06, -1.8756836652755737e-06, -1.80024653673172e-06, -1.7248094081878662e-06, -1.6493722796440125e-06, -1.5739351511001587e-06, -1.498498022556305e-06, -1.4230608940124512e-06, -1.3476237654685974e-06, -1.2721866369247437e-06, -1.1967495083808899e-06, -1.1213123798370361e-06, -1.0458752512931824e-06, -9.704381227493286e-07, -8.950009942054749e-07, -8.195638656616211e-07, -7.441267371177673e-07, -6.686896085739136e-07, -5.932524800300598e-07, -5.178153514862061e-07, -4.423782229423523e-07, -3.6694109439849854e-07, -2.915039658546448e-07, -2.1606683731079102e-07, -1.4062970876693726e-07, -6.51925802230835e-08, 1.0244548320770264e-08, 8.568167686462402e-08, 1.6111880540847778e-07, 2.3655593395233154e-07, 3.119930624961853e-07, 3.8743019104003906e-07, 4.628673195838928e-07, 5.383044481277466e-07, 6.137415766716003e-07, 6.891787052154541e-07, 7.646158337593079e-07, 8.400529623031616e-07, 9.154900908470154e-07, 9.909272193908691e-07, 1.066364347934723e-06, 1.1418014764785767e-06, 1.2172386050224304e-06, 1.2926757335662842e-06, 1.368112862110138e-06, 1.4435499906539917e-06, 1.5189871191978455e-06, 1.5944242477416992e-06, 1.669861376285553e-06, 1.7452985048294067e-06, 1.8207356333732605e-06, 1.8961727619171143e-06, 1.971609890460968e-06, 2.0470470190048218e-06, 2.1224841475486755e-06, 2.1979212760925293e-06, 2.273358404636383e-06, 2.348795533180237e-06, 2.4242326617240906e-06, 2.4996697902679443e-06, 2.575106918811798e-06, 2.650544047355652e-06, 2.7259811758995056e-06, 2.8014183044433594e-06]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 8.0, 13.0, 18.0, 21.0, 34.0, 60.0, 93.0, 175.0, 306.0, 673.0, 1658.0, 3665.0, 10422.0, 29523.0, 115551.0, 664953.0, 163173.0, 39560.0, 10778.0, 4285.0, 1932.0, 757.0, 383.0, 214.0, 97.0, 72.0, 45.0, 24.0, 24.0, 16.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.390146255493164e-05, -2.3282133042812347e-05, -2.2662803530693054e-05, -2.204347401857376e-05, -2.1424144506454468e-05, -2.0804814994335175e-05, -2.018548548221588e-05, -1.9566155970096588e-05, -1.8946826457977295e-05, -1.8327496945858002e-05, -1.770816743373871e-05, -1.7088837921619415e-05, -1.6469508409500122e-05, -1.585017889738083e-05, -1.5230849385261536e-05, -1.4611519873142242e-05, -1.399219036102295e-05, -1.3372860848903656e-05, -1.2753531336784363e-05, -1.213420182466507e-05, -1.1514872312545776e-05, -1.0895542800426483e-05, -1.027621328830719e-05, -9.656883776187897e-06, -9.037554264068604e-06, -8.41822475194931e-06, -7.798895239830017e-06, -7.179565727710724e-06, -6.560236215591431e-06, -5.9409067034721375e-06, -5.321577191352844e-06, -4.702247679233551e-06, -4.082918167114258e-06, -3.4635886549949646e-06, -2.8442591428756714e-06, -2.224929630756378e-06, -1.605600118637085e-06, -9.862706065177917e-07, -3.6694109439849854e-07, 2.523884177207947e-07, 8.717179298400879e-07, 1.491047441959381e-06, 2.1103769540786743e-06, 2.7297064661979675e-06, 3.3490359783172607e-06, 3.968365490436554e-06, 4.587695002555847e-06, 5.20702451467514e-06, 5.826354026794434e-06, 6.445683538913727e-06, 7.06501305103302e-06, 7.684342563152313e-06, 8.303672075271606e-06, 8.9230015873909e-06, 9.542331099510193e-06, 1.0161660611629486e-05, 1.078099012374878e-05, 1.1400319635868073e-05, 1.2019649147987366e-05, 1.2638978660106659e-05, 1.3258308172225952e-05, 1.3877637684345245e-05, 1.4496967196464539e-05, 1.5116296708583832e-05, 1.5735626220703125e-05]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 7.0, 9.0, 11.0, 4.0, 18.0, 20.0, 18.0, 30.0, 30.0, 78.0, 54.0, 59.0, 73.0, 128.0, 77.0, 68.0, 61.0, 65.0, 49.0, 36.0, 24.0, 23.0, 21.0, 6.0, 6.0, 8.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4570693969726562e-06, -3.323890268802643e-06, -3.1907111406326294e-06, -3.057532012462616e-06, -2.9243528842926025e-06, -2.791173756122589e-06, -2.6579946279525757e-06, -2.5248154997825623e-06, -2.391636371612549e-06, -2.2584572434425354e-06, -2.125278115272522e-06, -1.9920989871025085e-06, -1.8589198589324951e-06, -1.7257407307624817e-06, -1.5925616025924683e-06, -1.4593824744224548e-06, -1.3262033462524414e-06, -1.193024218082428e-06, -1.0598450899124146e-06, -9.266659617424011e-07, -7.934868335723877e-07, -6.603077054023743e-07, -5.271285772323608e-07, -3.939494490623474e-07, -2.60770320892334e-07, -1.2759119272232056e-07, 5.587935447692871e-09, 1.387670636177063e-07, 2.7194619178771973e-07, 4.0512531995773315e-07, 5.383044481277466e-07, 6.7148357629776e-07, 8.046627044677734e-07, 9.378418326377869e-07, 1.0710209608078003e-06, 1.2042000889778137e-06, 1.3373792171478271e-06, 1.4705583453178406e-06, 1.603737473487854e-06, 1.7369166016578674e-06, 1.8700957298278809e-06, 2.0032748579978943e-06, 2.1364539861679077e-06, 2.269633114337921e-06, 2.4028122425079346e-06, 2.535991370677948e-06, 2.6691704988479614e-06, 2.802349627017975e-06, 2.9355287551879883e-06, 3.0687078833580017e-06, 3.201887011528015e-06, 3.3350661396980286e-06, 3.468245267868042e-06, 3.6014243960380554e-06, 3.734603524208069e-06, 3.867782652378082e-06, 4.000961780548096e-06, 4.134140908718109e-06, 4.2673200368881226e-06, 4.400499165058136e-06, 4.533678293228149e-06, 4.666857421398163e-06, 4.800036549568176e-06, 4.93321567773819e-06, 5.066394805908203e-06]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 7.0, 10.0, 7.0, 18.0, 15.0, 16.0, 33.0, 34.0, 40.0, 72.0, 103.0, 116.0, 132.0, 112.0, 65.0, 46.0, 31.0, 35.0, 25.0, 22.0, 15.0, 9.0, 11.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017374464368913323, -0.00016832290566526353, -0.0001629011530894786, -0.00015747941506560892, -0.00015205767704173923, -0.0001466359244659543, -0.0001412141864420846, -0.00013579244841821492, -0.00013037069584243, -0.0001249489578185603, -0.00011952720524277538, -0.00011410546721890569, -0.00010868372191907838, -0.00010326197661925107, -9.784023859538138e-05, -9.241849329555407e-05, -8.699674799572676e-05, -8.157500269589946e-05, -7.615325739607215e-05, -7.073151937220246e-05, -6.530977407237515e-05, -5.988802877254784e-05, -5.446628711069934e-05, -4.904454544885084e-05, -4.362280014902353e-05, -3.8201054849196225e-05, -3.2779313187347725e-05, -2.735756970650982e-05, -2.1935826225671917e-05, -1.6514082744834013e-05, -1.109233926399611e-05, -5.670597602147609e-06, -2.4885230232030153e-07, 5.172891178517602e-06, 1.0594634659355506e-05, 1.601637814019341e-05, 2.1438121621031314e-05, 2.6859865101869218e-05, 3.228160858270712e-05, 3.770335024455562e-05, 4.312509554438293e-05, 4.854684084421024e-05, 5.396858250605874e-05, 5.939032416790724e-05, 6.481206946773455e-05, 7.023381476756185e-05, 7.565555279143155e-05, 8.107729809125885e-05, 8.649904339108616e-05, 9.192078869091347e-05, 9.734253399074078e-05, 0.00010276427201461047, 0.00010818601731443778, 0.00011360776261426508, 0.00011902950063813478, 0.00012445123866200447, 0.0001298729912377894, 0.00013529472926165909, 0.000140716481837444, 0.0001461382198613137, 0.00015155997243709862, 0.00015698171046096832, 0.000162403448484838, 0.00016782520106062293, 0.00017324693908449262]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 6.0, 13.0, 8.0, 9.0, 15.0, 13.0, 22.0, 17.0, 17.0, 25.0, 26.0, 45.0, 38.0, 34.0, 46.0, 42.0, 42.0, 39.0, 54.0, 51.0, 39.0, 40.0, 41.0, 39.0, 34.0, 23.0, 33.0, 39.0, 30.0, 18.0, 14.0, 10.0, 15.0, 12.0, 12.0, 10.0, 4.0, 2.0, 6.0, 0.0, 7.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.07458272902295e-05, -7.754982652841136e-05, -7.43538184906356e-05, -7.115781772881746e-05, -6.796181696699932e-05, -6.476581620518118e-05, -6.156980816740543e-05, -5.8373807405587286e-05, -5.517780300579034e-05, -5.198179860599339e-05, -4.878579784417525e-05, -4.55897934443783e-05, -4.2393789044581354e-05, -3.919778828276321e-05, -3.6001783882966265e-05, -3.280577948316932e-05, -2.9609778721351177e-05, -2.6413776140543632e-05, -2.3217773559736088e-05, -2.002176915993914e-05, -1.6825766579131596e-05, -1.3629763998324051e-05, -1.0433759598527104e-05, -7.237757017719559e-06, -4.041754436912015e-06, -8.457514013571199e-07, 2.3502516341977753e-06, 5.546255124500021e-06, 8.742257705307566e-06, 1.193826028611511e-05, 1.5134264685912058e-05, 1.8330267266719602e-05, 2.1526269847527146e-05, 2.472227242833469e-05, 2.7918275009142235e-05, 3.111427940893918e-05, 3.4310280170757324e-05, 3.750628457055427e-05, 4.070228897035122e-05, 4.389828973216936e-05, 4.709429413196631e-05, 5.0290298531763256e-05, 5.3486299293581396e-05, 5.6682303693378344e-05, 5.987830809317529e-05, 6.307430885499343e-05, 6.627030961681157e-05, 6.946631765458733e-05, 7.266231841640547e-05, 7.585831917822361e-05, 7.905432721599936e-05, 8.22503279778175e-05, 8.544632873963565e-05, 8.86423367774114e-05, 9.183833753922954e-05, 9.503433830104768e-05, 9.823034633882344e-05, 0.00010142634710064158, 0.00010462235513841733, 0.00010781835590023547, 0.00011101435666205361, 0.00011421035742387176, 0.00011740636546164751, 0.00012060236622346565, 0.0001237983669852838]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 12.0, 17.0, 20.0, 28.0, 59.0, 72.0, 95.0, 128.0, 204.0, 288.0, 396.0, 622.0, 839.0, 1194.0, 1822.0, 2851.0, 4331.0, 7068.0, 12434.0, 24885.0, 65010.0, 3550140.0, 435322.0, 40632.0, 18712.0, 10041.0, 5858.0, 3740.0, 2384.0, 1540.0, 1019.0, 709.0, 525.0, 383.0, 229.0, 173.0, 132.0, 101.0, 65.0, 64.0, 37.0, 24.0, 19.0, 12.0, 18.0, 8.0, 6.0, 9.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0002989768981933594, -0.0002892687916755676, -0.0002795606851577759, -0.00026985257863998413, -0.0002601444721221924, -0.00025043636560440063, -0.0002407282590866089, -0.00023102015256881714, -0.0002213120460510254, -0.00021160393953323364, -0.0002018958330154419, -0.00019218772649765015, -0.0001824796199798584, -0.00017277151346206665, -0.0001630634069442749, -0.00015335530042648315, -0.0001436471939086914, -0.00013393908739089966, -0.0001242309808731079, -0.00011452287435531616, -0.00010481476783752441, -9.510666131973267e-05, -8.539855480194092e-05, -7.569044828414917e-05, -6.598234176635742e-05, -5.6274235248565674e-05, -4.6566128730773926e-05, -3.685802221298218e-05, -2.714991569519043e-05, -1.744180917739868e-05, -7.733702659606934e-06, 1.9744038581848145e-06, 1.1682510375976562e-05, 2.139061689376831e-05, 3.109872341156006e-05, 4.080682992935181e-05, 5.0514936447143555e-05, 6.02230429649353e-05, 6.993114948272705e-05, 7.96392560005188e-05, 8.934736251831055e-05, 9.90554690361023e-05, 0.00010876357555389404, 0.00011847168207168579, 0.00012817978858947754, 0.0001378878951072693, 0.00014759600162506104, 0.00015730410814285278, 0.00016701221466064453, 0.00017672032117843628, 0.00018642842769622803, 0.00019613653421401978, 0.00020584464073181152, 0.00021555274724960327, 0.00022526085376739502, 0.00023496896028518677, 0.0002446770668029785, 0.00025438517332077026, 0.000264093279838562, 0.00027380138635635376, 0.0002835094928741455, 0.00029321759939193726, 0.000302925705909729, 0.00031263381242752075, 0.0003223419189453125]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 3.0, 7.0, 5.0, 5.0, 4.0, 10.0, 7.0, 16.0, 14.0, 19.0, 19.0, 19.0, 16.0, 27.0, 43.0, 29.0, 28.0, 38.0, 52.0, 32.0, 54.0, 44.0, 39.0, 42.0, 41.0, 48.0, 35.0, 37.0, 39.0, 29.0, 44.0, 25.0, 15.0, 23.0, 21.0, 9.0, 19.0, 14.0, 8.0, 3.0, 5.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.46574592590332e-05, -5.285535007715225e-05, -5.10532408952713e-05, -4.925113171339035e-05, -4.74490225315094e-05, -4.564691334962845e-05, -4.38448041677475e-05, -4.204269498586655e-05, -4.0240585803985596e-05, -3.8438476622104645e-05, -3.6636367440223694e-05, -3.483425825834274e-05, -3.303214907646179e-05, -3.123003989458084e-05, -2.942793071269989e-05, -2.762582153081894e-05, -2.5823712348937988e-05, -2.4021603167057037e-05, -2.2219493985176086e-05, -2.0417384803295135e-05, -1.8615275621414185e-05, -1.6813166439533234e-05, -1.5011057257652283e-05, -1.3208948075771332e-05, -1.1406838893890381e-05, -9.60472971200943e-06, -7.802620530128479e-06, -6.000511348247528e-06, -4.198402166366577e-06, -2.3962929844856262e-06, -5.941838026046753e-07, 1.2079253792762756e-06, 3.0100345611572266e-06, 4.8121437430381775e-06, 6.614252924919128e-06, 8.41636210680008e-06, 1.021847128868103e-05, 1.2020580470561981e-05, 1.3822689652442932e-05, 1.5624798834323883e-05, 1.7426908016204834e-05, 1.9229017198085785e-05, 2.1031126379966736e-05, 2.2833235561847687e-05, 2.4635344743728638e-05, 2.643745392560959e-05, 2.823956310749054e-05, 3.004167228937149e-05, 3.184378147125244e-05, 3.364589065313339e-05, 3.544799983501434e-05, 3.7250109016895294e-05, 3.9052218198776245e-05, 4.0854327380657196e-05, 4.265643656253815e-05, 4.44585457444191e-05, 4.626065492630005e-05, 4.8062764108181e-05, 4.986487329006195e-05, 5.16669824719429e-05, 5.346909165382385e-05, 5.5271200835704803e-05, 5.7073310017585754e-05, 5.8875419199466705e-05, 6.0677528381347656e-05]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 12.0, 24.0, 26.0, 44.0, 49.0, 111.0, 157.0, 247.0, 410.0, 643.0, 1128.0, 1969.0, 3604.0, 6805.0, 13726.0, 30617.0, 88858.0, 2545451.0, 1360177.0, 83116.0, 28991.0, 13354.0, 6411.0, 3571.0, 1944.0, 1125.0, 587.0, 403.0, 240.0, 155.0, 103.0, 71.0, 47.0, 35.0, 16.0, 14.0, 8.0, 4.0, 5.0, 7.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0003306865692138672, -0.00032123178243637085, -0.0003117769956588745, -0.0003023222088813782, -0.00029286742210388184, -0.0002834126353263855, -0.00027395784854888916, -0.0002645030617713928, -0.0002550482749938965, -0.00024559348821640015, -0.0002361387014389038, -0.00022668391466140747, -0.00021722912788391113, -0.0002077743411064148, -0.00019831955432891846, -0.00018886476755142212, -0.00017940998077392578, -0.00016995519399642944, -0.0001605004072189331, -0.00015104562044143677, -0.00014159083366394043, -0.0001321360468864441, -0.00012268126010894775, -0.00011322647333145142, -0.00010377168655395508, -9.431689977645874e-05, -8.48621129989624e-05, -7.540732622146606e-05, -6.595253944396973e-05, -5.649775266647339e-05, -4.704296588897705e-05, -3.758817911148071e-05, -2.8133392333984375e-05, -1.8678605556488037e-05, -9.2238187789917e-06, 2.3096799850463867e-07, 9.685754776000977e-06, 1.9140541553497314e-05, 2.8595328330993652e-05, 3.805011510848999e-05, 4.750490188598633e-05, 5.6959688663482666e-05, 6.6414475440979e-05, 7.586926221847534e-05, 8.532404899597168e-05, 9.477883577346802e-05, 0.00010423362255096436, 0.0001136884093284607, 0.00012314319610595703, 0.00013259798288345337, 0.0001420527696609497, 0.00015150755643844604, 0.00016096234321594238, 0.00017041712999343872, 0.00017987191677093506, 0.0001893267035484314, 0.00019878149032592773, 0.00020823627710342407, 0.0002176910638809204, 0.00022714585065841675, 0.00023660063743591309, 0.0002460554242134094, 0.00025551021099090576, 0.0002649649977684021, 0.00027441978454589844]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 7.0, 10.0, 5.0, 12.0, 14.0, 21.0, 13.0, 21.0, 25.0, 42.0, 40.0, 67.0, 142.0, 389.0, 1822.0, 896.0, 225.0, 106.0, 46.0, 43.0, 21.0, 22.0, 16.0, 13.0, 13.0, 12.0, 4.0, 7.0, 6.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.602836608886719e-05, -5.385745316743851e-05, -5.168654024600983e-05, -4.9515627324581146e-05, -4.7344714403152466e-05, -4.5173801481723785e-05, -4.3002888560295105e-05, -4.0831975638866425e-05, -3.8661062717437744e-05, -3.6490149796009064e-05, -3.431923687458038e-05, -3.21483239531517e-05, -2.9977411031723022e-05, -2.7806498110294342e-05, -2.563558518886566e-05, -2.346467226743698e-05, -2.12937593460083e-05, -1.912284642457962e-05, -1.695193350315094e-05, -1.478102058172226e-05, -1.2610107660293579e-05, -1.0439194738864899e-05, -8.268281817436218e-06, -6.097368896007538e-06, -3.926455974578857e-06, -1.755543053150177e-06, 4.153698682785034e-07, 2.586282789707184e-06, 4.757195711135864e-06, 6.928108632564545e-06, 9.099021553993225e-06, 1.1269934475421906e-05, 1.3440847396850586e-05, 1.5611760318279266e-05, 1.7782673239707947e-05, 1.9953586161136627e-05, 2.2124499082565308e-05, 2.4295412003993988e-05, 2.646632492542267e-05, 2.863723784685135e-05, 3.080815076828003e-05, 3.297906368970871e-05, 3.514997661113739e-05, 3.732088953256607e-05, 3.949180245399475e-05, 4.166271537542343e-05, 4.383362829685211e-05, 4.600454121828079e-05, 4.817545413970947e-05, 5.034636706113815e-05, 5.2517279982566833e-05, 5.4688192903995514e-05, 5.6859105825424194e-05, 5.9030018746852875e-05, 6.120093166828156e-05, 6.337184458971024e-05, 6.554275751113892e-05, 6.77136704325676e-05, 6.988458335399628e-05, 7.205549627542496e-05, 7.422640919685364e-05, 7.639732211828232e-05, 7.8568235039711e-05, 8.073914796113968e-05, 8.291006088256836e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 3.0, 10.0, 7.0, 7.0, 13.0, 18.0, 22.0, 35.0, 47.0, 60.0, 65.0, 102.0, 162.0, 118.0, 91.0, 68.0, 51.0, 34.0, 26.0, 12.0, 15.0, 7.0, 8.0, 10.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011004980478901416, -0.00010574657062534243, -0.0001014433364616707, -9.714010957395658e-05, -9.283687541028485e-05, -8.853364124661312e-05, -8.4230414358899e-05, -7.992718019522727e-05, -7.562394603155553e-05, -7.13207118678838e-05, -6.701747770421207e-05, -6.271425081649795e-05, -5.841101665282622e-05, -5.410778248915449e-05, -4.980455196346156e-05, -4.550132143776864e-05, -4.1198087274096906e-05, -3.6894853110425174e-05, -3.259162258473225e-05, -2.828839024004992e-05, -2.3985157895367593e-05, -1.9681925550685264e-05, -1.5378693206002936e-05, -1.1075460861320607e-05, -6.772228516638279e-06, -2.4689961719559506e-06, 1.8342361727263778e-06, 6.137468517408706e-06, 1.0440700862091035e-05, 1.4743933206773363e-05, 1.904716555145569e-05, 2.335039789613802e-05, 2.7653644792735577e-05, 3.195687895640731e-05, 3.6260109482100233e-05, 4.056334000779316e-05, 4.486657417146489e-05, 4.916980833513662e-05, 5.347303886082955e-05, 5.777626938652247e-05, 6.20795035501942e-05, 6.638273771386594e-05, 7.068597187753767e-05, 7.498919876525179e-05, 7.929243292892352e-05, 8.359566709259525e-05, 8.789889398030937e-05, 9.22021281439811e-05, 9.650536230765283e-05, 0.00010080859647132456, 0.0001051118306349963, 0.00010941505752271041, 0.00011371829168638214, 0.00011802152585005388, 0.000122324752737768, 0.00012662798690143973, 0.00013093122106511146, 0.0001352344552287832, 0.00013953768939245492, 0.00014384092355612665, 0.00014814414316788316, 0.0001524473773315549, 0.00015675061149522662, 0.00016105384565889835, 0.00016535707982257009]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 7.0, 6.0, 10.0, 13.0, 16.0, 15.0, 27.0, 23.0, 27.0, 34.0, 35.0, 42.0, 35.0, 37.0, 38.0, 40.0, 33.0, 55.0, 39.0, 51.0, 41.0, 51.0, 45.0, 37.0, 41.0, 46.0, 29.0, 19.0, 14.0, 22.0, 15.0, 14.0, 14.0, 6.0, 5.0, 8.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.697717228438705e-05, -7.449855911545455e-05, -7.201994594652206e-05, -6.954133277758956e-05, -6.706271960865706e-05, -6.458409916376695e-05, -6.210548599483445e-05, -5.9626872825901955e-05, -5.714825965696946e-05, -5.466964648803696e-05, -5.219103331910446e-05, -4.971241651219316e-05, -4.723380334326066e-05, -4.475519017432816e-05, -4.227657336741686e-05, -3.979796019848436e-05, -3.7319347029551864e-05, -3.4840733860619366e-05, -3.236212069168687e-05, -2.9883503884775564e-05, -2.7404890715843067e-05, -2.492627754691057e-05, -2.2447662558988668e-05, -1.9969047571066767e-05, -1.749043440213427e-05, -1.501182032370707e-05, -1.2533206245279871e-05, -1.0054592166852672e-05, -7.575978088425472e-06, -5.097364009998273e-06, -2.618749931571074e-06, -1.4013494364917278e-07, 2.338485501240939e-06, 4.817099579668138e-06, 7.2957136580953375e-06, 9.774327736522537e-06, 1.2252941814949736e-05, 1.4731555893376935e-05, 1.7210169971804135e-05, 1.9688784959726036e-05, 2.2167398128658533e-05, 2.464601129759103e-05, 2.712462628551293e-05, 2.9603241273434833e-05, 3.208185444236733e-05, 3.456046761129983e-05, 3.703908441821113e-05, 3.951769758714363e-05, 4.199631075607613e-05, 4.4474923925008625e-05, 4.695353709394112e-05, 4.943215390085243e-05, 5.1910767069784924e-05, 5.438938023871742e-05, 5.6867997045628726e-05, 5.9346610214561224e-05, 6.182522338349372e-05, 6.430383655242622e-05, 6.678244972135872e-05, 6.926106289029121e-05, 7.173967605922371e-05, 7.421829650411382e-05, 7.669690967304632e-05, 7.917552284197882e-05, 8.165413601091132e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 10.0, 6.0, 17.0, 14.0, 17.0, 27.0, 49.0, 64.0, 86.0, 115.0, 179.0, 270.0, 429.0, 656.0, 1074.0, 1971.0, 3940.0, 8771.0, 22860.0, 70492.0, 286424.0, 478120.0, 115039.0, 34031.0, 12492.0, 5403.0, 2483.0, 1309.0, 765.0, 452.0, 300.0, 197.0, 146.0, 86.0, 80.0, 48.0, 29.0, 27.0, 27.0, 19.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00021135807037353516, -0.00020479224622249603, -0.0001982264220714569, -0.00019166059792041779, -0.00018509477376937866, -0.00017852894961833954, -0.00017196312546730042, -0.0001653973013162613, -0.00015883147716522217, -0.00015226565301418304, -0.00014569982886314392, -0.0001391340047121048, -0.00013256818056106567, -0.00012600235641002655, -0.00011943653225898743, -0.0001128707081079483, -0.00010630488395690918, -9.973905980587006e-05, -9.317323565483093e-05, -8.660741150379181e-05, -8.004158735275269e-05, -7.347576320171356e-05, -6.690993905067444e-05, -6.0344114899635315e-05, -5.377829074859619e-05, -4.721246659755707e-05, -4.0646642446517944e-05, -3.408081829547882e-05, -2.7514994144439697e-05, -2.0949169993400574e-05, -1.438334584236145e-05, -7.817521691322327e-06, -1.2516975402832031e-06, 5.31412661075592e-06, 1.1879950761795044e-05, 1.8445774912834167e-05, 2.501159906387329e-05, 3.1577423214912415e-05, 3.814324736595154e-05, 4.470907151699066e-05, 5.1274895668029785e-05, 5.784071981906891e-05, 6.440654397010803e-05, 7.097236812114716e-05, 7.753819227218628e-05, 8.41040164232254e-05, 9.066984057426453e-05, 9.723566472530365e-05, 0.00010380148887634277, 0.0001103673130273819, 0.00011693313717842102, 0.00012349896132946014, 0.00013006478548049927, 0.0001366306096315384, 0.00014319643378257751, 0.00014976225793361664, 0.00015632808208465576, 0.00016289390623569489, 0.000169459730386734, 0.00017602555453777313, 0.00018259137868881226, 0.00018915720283985138, 0.0001957230269908905, 0.00020228885114192963, 0.00020885467529296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 7.0, 6.0, 5.0, 18.0, 17.0, 13.0, 22.0, 38.0, 40.0, 32.0, 39.0, 41.0, 37.0, 46.0, 42.0, 51.0, 51.0, 35.0, 39.0, 65.0, 42.0, 42.0, 35.0, 33.0, 42.0, 43.0, 22.0, 21.0, 13.0, 16.0, 7.0, 9.0, 7.0, 4.0, 7.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.14199447631836e-05, -7.885042577981949e-05, -7.628090679645538e-05, -7.371138781309128e-05, -7.114186882972717e-05, -6.857234984636307e-05, -6.600283086299896e-05, -6.343331187963486e-05, -6.086379289627075e-05, -5.829427391290665e-05, -5.572475492954254e-05, -5.3155235946178436e-05, -5.058571696281433e-05, -4.8016197979450226e-05, -4.544667899608612e-05, -4.2877160012722015e-05, -4.030764102935791e-05, -3.7738122045993805e-05, -3.51686030626297e-05, -3.2599084079265594e-05, -3.002956509590149e-05, -2.7460046112537384e-05, -2.489052712917328e-05, -2.2321008145809174e-05, -1.975148916244507e-05, -1.7181970179080963e-05, -1.4612451195716858e-05, -1.2042932212352753e-05, -9.473413228988647e-06, -6.903894245624542e-06, -4.334375262260437e-06, -1.7648562788963318e-06, 8.046627044677734e-07, 3.3741816878318787e-06, 5.943700671195984e-06, 8.513219654560089e-06, 1.1082738637924194e-05, 1.36522576212883e-05, 1.6221776604652405e-05, 1.879129558801651e-05, 2.1360814571380615e-05, 2.393033355474472e-05, 2.6499852538108826e-05, 2.906937152147293e-05, 3.1638890504837036e-05, 3.420840948820114e-05, 3.6777928471565247e-05, 3.934744745492935e-05, 4.191696643829346e-05, 4.448648542165756e-05, 4.705600440502167e-05, 4.962552338838577e-05, 5.219504237174988e-05, 5.476456135511398e-05, 5.733408033847809e-05, 5.9903599321842194e-05, 6.24731183052063e-05, 6.50426372885704e-05, 6.761215627193451e-05, 7.018167525529861e-05, 7.275119423866272e-05, 7.532071322202682e-05, 7.789023220539093e-05, 8.045975118875504e-05, 8.302927017211914e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 5.0, 1.0, 5.0, 11.0, 13.0, 18.0, 18.0, 33.0, 43.0, 67.0, 75.0, 115.0, 139.0, 173.0, 236.0, 336.0, 550.0, 828.0, 1385.0, 2876.0, 7572.0, 31440.0, 501385.0, 456302.0, 30374.0, 7630.0, 2814.0, 1446.0, 846.0, 505.0, 376.0, 250.0, 161.0, 126.0, 91.0, 75.0, 67.0, 44.0, 29.0, 16.0, 19.0, 13.0, 12.0, 8.0, 8.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0003409385681152344, -0.000330604612827301, -0.0003202706575393677, -0.0003099367022514343, -0.000299602746963501, -0.0002892687916755676, -0.0002789348363876343, -0.00026860088109970093, -0.0002582669258117676, -0.00024793297052383423, -0.00023759901523590088, -0.00022726505994796753, -0.00021693110466003418, -0.00020659714937210083, -0.00019626319408416748, -0.00018592923879623413, -0.00017559528350830078, -0.00016526132822036743, -0.00015492737293243408, -0.00014459341764450073, -0.00013425946235656738, -0.00012392550706863403, -0.00011359155178070068, -0.00010325759649276733, -9.292364120483398e-05, -8.258968591690063e-05, -7.225573062896729e-05, -6.192177534103394e-05, -5.1587820053100586e-05, -4.1253864765167236e-05, -3.091990947723389e-05, -2.0585954189300537e-05, -1.0251998901367188e-05, 8.195638656616211e-08, 1.0415911674499512e-05, 2.074986696243286e-05, 3.108382225036621e-05, 4.141777753829956e-05, 5.175173282623291e-05, 6.208568811416626e-05, 7.241964340209961e-05, 8.275359869003296e-05, 9.308755397796631e-05, 0.00010342150926589966, 0.00011375546455383301, 0.00012408941984176636, 0.0001344233751296997, 0.00014475733041763306, 0.0001550912857055664, 0.00016542524099349976, 0.0001757591962814331, 0.00018609315156936646, 0.0001964271068572998, 0.00020676106214523315, 0.0002170950174331665, 0.00022742897272109985, 0.0002377629280090332, 0.00024809688329696655, 0.0002584308385848999, 0.00026876479387283325, 0.0002790987491607666, 0.00028943270444869995, 0.0002997666597366333, 0.00031010061502456665, 0.0003204345703125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 5.0, 3.0, 4.0, 6.0, 5.0, 10.0, 13.0, 18.0, 13.0, 19.0, 14.0, 22.0, 24.0, 33.0, 32.0, 23.0, 43.0, 39.0, 46.0, 52.0, 40.0, 52.0, 36.0, 45.0, 42.0, 32.0, 40.0, 31.0, 31.0, 25.0, 24.0, 21.0, 19.0, 17.0, 21.0, 18.0, 16.0, 21.0, 14.0, 3.0, 5.0, 7.0, 6.0, 5.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.3272972106933594e-05, -4.187319427728653e-05, -4.0473416447639465e-05, -3.90736386179924e-05, -3.767386078834534e-05, -3.627408295869827e-05, -3.487430512905121e-05, -3.3474527299404144e-05, -3.207474946975708e-05, -3.0674971640110016e-05, -2.927519381046295e-05, -2.7875415980815887e-05, -2.6475638151168823e-05, -2.507586032152176e-05, -2.3676082491874695e-05, -2.227630466222763e-05, -2.0876526832580566e-05, -1.9476749002933502e-05, -1.8076971173286438e-05, -1.6677193343639374e-05, -1.527741551399231e-05, -1.3877637684345245e-05, -1.2477859854698181e-05, -1.1078082025051117e-05, -9.678304195404053e-06, -8.278526365756989e-06, -6.878748536109924e-06, -5.47897070646286e-06, -4.079192876815796e-06, -2.6794150471687317e-06, -1.2796372175216675e-06, 1.2014061212539673e-07, 1.519918441772461e-06, 2.919696271419525e-06, 4.319474101066589e-06, 5.7192519307136536e-06, 7.119029760360718e-06, 8.518807590007782e-06, 9.918585419654846e-06, 1.131836324930191e-05, 1.2718141078948975e-05, 1.4117918908596039e-05, 1.5517696738243103e-05, 1.6917474567890167e-05, 1.831725239753723e-05, 1.9717030227184296e-05, 2.111680805683136e-05, 2.2516585886478424e-05, 2.3916363716125488e-05, 2.5316141545772552e-05, 2.6715919375419617e-05, 2.811569720506668e-05, 2.9515475034713745e-05, 3.091525286436081e-05, 3.2315030694007874e-05, 3.371480852365494e-05, 3.5114586353302e-05, 3.6514364182949066e-05, 3.791414201259613e-05, 3.9313919842243195e-05, 4.071369767189026e-05, 4.211347550153732e-05, 4.351325333118439e-05, 4.491303116083145e-05, 4.6312808990478516e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 3.0, 13.0, 6.0, 21.0, 20.0, 26.0, 42.0, 76.0, 85.0, 84.0, 142.0, 167.0, 215.0, 292.0, 430.0, 578.0, 867.0, 1332.0, 1877.0, 2964.0, 4726.0, 7873.0, 14461.0, 30102.0, 83411.0, 701087.0, 120138.0, 36517.0, 16671.0, 8796.0, 5457.0, 3222.0, 2122.0, 1369.0, 943.0, 609.0, 437.0, 370.0, 269.0, 184.0, 130.0, 92.0, 67.0, 55.0, 48.0, 35.0, 31.0, 16.0, 15.0, 14.0, 6.0, 10.0, 8.0, 5.0, 9.0, 1.0, 6.0], "bins": [-4.088878631591797e-05, -3.9635226130485535e-05, -3.83816659450531e-05, -3.7128105759620667e-05, -3.587454557418823e-05, -3.46209853887558e-05, -3.3367425203323364e-05, -3.211386501789093e-05, -3.0860304832458496e-05, -2.9606744647026062e-05, -2.8353184461593628e-05, -2.7099624276161194e-05, -2.584606409072876e-05, -2.4592503905296326e-05, -2.333894371986389e-05, -2.2085383534431458e-05, -2.0831823348999023e-05, -1.957826316356659e-05, -1.8324702978134155e-05, -1.707114279270172e-05, -1.5817582607269287e-05, -1.4564022421836853e-05, -1.3310462236404419e-05, -1.2056902050971985e-05, -1.080334186553955e-05, -9.549781680107117e-06, -8.296221494674683e-06, -7.0426613092422485e-06, -5.7891011238098145e-06, -4.53554093837738e-06, -3.2819807529449463e-06, -2.028420567512512e-06, -7.748603820800781e-07, 4.78699803352356e-07, 1.73225998878479e-06, 2.985820174217224e-06, 4.239380359649658e-06, 5.492940545082092e-06, 6.746500730514526e-06, 8.00006091594696e-06, 9.253621101379395e-06, 1.0507181286811829e-05, 1.1760741472244263e-05, 1.3014301657676697e-05, 1.4267861843109131e-05, 1.5521422028541565e-05, 1.6774982213974e-05, 1.8028542399406433e-05, 1.9282102584838867e-05, 2.05356627702713e-05, 2.1789222955703735e-05, 2.304278314113617e-05, 2.4296343326568604e-05, 2.5549903512001038e-05, 2.680346369743347e-05, 2.8057023882865906e-05, 2.931058406829834e-05, 3.0564144253730774e-05, 3.181770443916321e-05, 3.307126462459564e-05, 3.4324824810028076e-05, 3.557838499546051e-05, 3.6831945180892944e-05, 3.808550536632538e-05, 3.933906555175781e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 3.0, 6.0, 9.0, 14.0, 8.0, 13.0, 13.0, 18.0, 26.0, 18.0, 30.0, 34.0, 34.0, 37.0, 33.0, 57.0, 81.0, 116.0, 66.0, 52.0, 42.0, 33.0, 25.0, 24.0, 18.0, 32.0, 21.0, 14.0, 15.0, 13.0, 12.0, 12.0, 10.0, 8.0, 6.0, 3.0, 4.0, 2.0, 8.0, 8.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.9669532775878906e-06, -1.9073486328125e-06, -1.8477439880371094e-06, -1.7881393432617188e-06, -1.7285346984863281e-06, -1.6689300537109375e-06, -1.6093254089355469e-06, -1.5497207641601562e-06, -1.4901161193847656e-06, -1.430511474609375e-06, -1.3709068298339844e-06, -1.3113021850585938e-06, -1.2516975402832031e-06, -1.1920928955078125e-06, -1.1324882507324219e-06, -1.0728836059570312e-06, -1.0132789611816406e-06, -9.5367431640625e-07, -8.940696716308594e-07, -8.344650268554688e-07, -7.748603820800781e-07, -7.152557373046875e-07, -6.556510925292969e-07, -5.960464477539062e-07, -5.364418029785156e-07, -4.76837158203125e-07, -4.172325134277344e-07, -3.5762786865234375e-07, -2.980232238769531e-07, -2.384185791015625e-07, -1.7881393432617188e-07, -1.1920928955078125e-07, -5.960464477539063e-08, 0.0, 5.960464477539063e-08, 1.1920928955078125e-07, 1.7881393432617188e-07, 2.384185791015625e-07, 2.980232238769531e-07, 3.5762786865234375e-07, 4.172325134277344e-07, 4.76837158203125e-07, 5.364418029785156e-07, 5.960464477539062e-07, 6.556510925292969e-07, 7.152557373046875e-07, 7.748603820800781e-07, 8.344650268554688e-07, 8.940696716308594e-07, 9.5367431640625e-07, 1.0132789611816406e-06, 1.0728836059570312e-06, 1.1324882507324219e-06, 1.1920928955078125e-06, 1.2516975402832031e-06, 1.3113021850585938e-06, 1.3709068298339844e-06, 1.430511474609375e-06, 1.4901161193847656e-06, 1.5497207641601562e-06, 1.6093254089355469e-06, 1.6689300537109375e-06, 1.7285346984863281e-06, 1.7881393432617188e-06, 1.8477439880371094e-06]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 9.0, 6.0, 12.0, 18.0, 33.0, 38.0, 67.0, 103.0, 154.0, 243.0, 358.0, 584.0, 938.0, 1748.0, 2898.0, 5085.0, 10242.0, 20935.0, 50170.0, 188102.0, 611796.0, 91071.0, 32579.0, 14963.0, 7085.0, 3842.0, 2238.0, 1250.0, 727.0, 423.0, 300.0, 168.0, 115.0, 84.0, 65.0, 41.0, 27.0, 11.0, 11.0, 6.0, 9.0, 2.0, 3.0, 5.0, 0.0, 2.0, 1.0], "bins": [-5.173683166503906e-05, -5.0348229706287384e-05, -4.8959627747535706e-05, -4.757102578878403e-05, -4.618242383003235e-05, -4.479382187128067e-05, -4.340521991252899e-05, -4.201661795377731e-05, -4.0628015995025635e-05, -3.9239414036273956e-05, -3.785081207752228e-05, -3.64622101187706e-05, -3.507360816001892e-05, -3.368500620126724e-05, -3.2296404242515564e-05, -3.0907802283763885e-05, -2.9519200325012207e-05, -2.813059836626053e-05, -2.674199640750885e-05, -2.535339444875717e-05, -2.3964792490005493e-05, -2.2576190531253815e-05, -2.1187588572502136e-05, -1.9798986613750458e-05, -1.841038465499878e-05, -1.70217826962471e-05, -1.5633180737495422e-05, -1.4244578778743744e-05, -1.2855976819992065e-05, -1.1467374861240387e-05, -1.0078772902488708e-05, -8.69017094373703e-06, -7.3015689849853516e-06, -5.912967026233673e-06, -4.524365067481995e-06, -3.135763108730316e-06, -1.7471611499786377e-06, -3.5855919122695923e-07, 1.0300427675247192e-06, 2.4186447262763977e-06, 3.807246685028076e-06, 5.195848643779755e-06, 6.584450602531433e-06, 7.973052561283112e-06, 9.36165452003479e-06, 1.0750256478786469e-05, 1.2138858437538147e-05, 1.3527460396289825e-05, 1.4916062355041504e-05, 1.6304664313793182e-05, 1.769326627254486e-05, 1.908186823129654e-05, 2.0470470190048218e-05, 2.1859072148799896e-05, 2.3247674107551575e-05, 2.4636276066303253e-05, 2.602487802505493e-05, 2.741347998380661e-05, 2.880208194255829e-05, 3.0190683901309967e-05, 3.1579285860061646e-05, 3.2967887818813324e-05, 3.4356489777565e-05, 3.574509173631668e-05, 3.713369369506836e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 3.0, 4.0, 6.0, 9.0, 5.0, 13.0, 12.0, 17.0, 17.0, 21.0, 24.0, 22.0, 40.0, 43.0, 51.0, 58.0, 133.0, 125.0, 115.0, 59.0, 37.0, 44.0, 24.0, 22.0, 15.0, 15.0, 15.0, 7.0, 12.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-06, -9.211711585521698e-06, -8.886680006980896e-06, -8.561648428440094e-06, -8.236616849899292e-06, -7.91158527135849e-06, -7.586553692817688e-06, -7.261522114276886e-06, -6.936490535736084e-06, -6.611458957195282e-06, -6.28642737865448e-06, -5.961395800113678e-06, -5.636364221572876e-06, -5.311332643032074e-06, -4.986301064491272e-06, -4.66126948595047e-06, -4.336237907409668e-06, -4.011206328868866e-06, -3.686174750328064e-06, -3.361143171787262e-06, -3.03611159324646e-06, -2.711080014705658e-06, -2.386048436164856e-06, -2.061016857624054e-06, -1.735985279083252e-06, -1.41095370054245e-06, -1.085922122001648e-06, -7.60890543460846e-07, -4.3585896492004395e-07, -1.1082738637924194e-07, 2.1420419216156006e-07, 5.392357707023621e-07, 8.642673492431641e-07, 1.189298927783966e-06, 1.514330506324768e-06, 1.83936208486557e-06, 2.164393663406372e-06, 2.489425241947174e-06, 2.814456820487976e-06, 3.139488399028778e-06, 3.46451997756958e-06, 3.789551556110382e-06, 4.114583134651184e-06, 4.439614713191986e-06, 4.764646291732788e-06, 5.08967787027359e-06, 5.414709448814392e-06, 5.739741027355194e-06, 6.064772605895996e-06, 6.389804184436798e-06, 6.7148357629776e-06, 7.039867341518402e-06, 7.364898920059204e-06, 7.689930498600006e-06, 8.014962077140808e-06, 8.33999365568161e-06, 8.665025234222412e-06, 8.990056812763214e-06, 9.315088391304016e-06, 9.640119969844818e-06, 9.96515154838562e-06, 1.0290183126926422e-05, 1.0615214705467224e-05, 1.0940246284008026e-05, 1.1265277862548828e-05]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 11.0, 7.0, 10.0, 7.0, 15.0, 28.0, 26.0, 34.0, 60.0, 77.0, 145.0, 160.0, 123.0, 90.0, 50.0, 38.0, 31.0, 26.0, 18.0, 10.0, 13.0, 8.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011092721251770854, -0.0001067316989065148, -0.00010253618529532105, -9.83406716841273e-05, -9.414515807293355e-05, -8.994964446173981e-05, -8.575413085054606e-05, -8.155861723935232e-05, -7.736310362815857e-05, -7.316759001696482e-05, -6.897207640577108e-05, -6.477656279457733e-05, -6.0581049183383584e-05, -5.638553557218984e-05, -5.219002196099609e-05, -4.7994508349802345e-05, -4.37989947386086e-05, -3.960348112741485e-05, -3.5407967516221106e-05, -3.121245390502736e-05, -2.7016940293833613e-05, -2.2821426682639867e-05, -1.862591307144612e-05, -1.4430399460252374e-05, -1.0234885849058628e-05, -6.039372237864882e-06, -1.8438586266711354e-06, 2.351654984522611e-06, 6.547168595716357e-06, 1.0742682206910104e-05, 1.493819581810385e-05, 1.9133709429297596e-05, 2.3329208488576114e-05, 2.752472209976986e-05, 3.172023571096361e-05, 3.591574932215735e-05, 4.01112629333511e-05, 4.4306776544544846e-05, 4.850229015573859e-05, 5.269780376693234e-05, 5.6893317378126085e-05, 6.108883098931983e-05, 6.528434460051358e-05, 6.947985821170732e-05, 7.367537182290107e-05, 7.787088543409482e-05, 8.206639904528856e-05, 8.626191265648231e-05, 9.045742626767606e-05, 9.46529398788698e-05, 9.884845349006355e-05, 0.0001030439671012573, 0.00010723948071245104, 0.00011143499432364479, 0.00011563050793483853, 0.00011982602154603228, 0.00012402153515722603, 0.00012821704149246216, 0.00013241256237961352, 0.00013660808326676488, 0.000140803589602001, 0.00014499909593723714, 0.0001491946168243885, 0.00015339013771153986, 0.000157585644046776]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 8.0, 5.0, 9.0, 8.0, 15.0, 17.0, 22.0, 19.0, 23.0, 35.0, 33.0, 37.0, 46.0, 35.0, 34.0, 43.0, 44.0, 34.0, 42.0, 53.0, 41.0, 54.0, 48.0, 41.0, 45.0, 35.0, 36.0, 18.0, 24.0, 19.0, 15.0, 16.0, 15.0, 9.0, 5.0, 6.0, 7.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.012996502453461e-05, -6.782536365790293e-05, -6.552076229127124e-05, -6.321616820059717e-05, -6.091156683396548e-05, -5.8606965467333794e-05, -5.630236410070211e-05, -5.399776273407042e-05, -5.169316500541754e-05, -4.9388563638785854e-05, -4.7083965910132974e-05, -4.477936454350129e-05, -4.24747631768696e-05, -4.017016544821672e-05, -3.7865564081585035e-05, -3.5560966352932155e-05, -3.325636498630047e-05, -3.095176361966878e-05, -2.8647165891015902e-05, -2.6342564524384215e-05, -2.4037964976741932e-05, -2.173336542909965e-05, -1.9428764062467963e-05, -1.712416451482568e-05, -1.4819564967183396e-05, -1.2514965419541113e-05, -1.0210364962404128e-05, -7.905764505267143e-06, -5.60116495762486e-06, -3.296565409982577e-06, -9.91964952845592e-07, 1.3126355042913929e-06, 3.617235051933676e-06, 5.92183505432331e-06, 8.226435056712944e-06, 1.0531035513849929e-05, 1.2835635061492212e-05, 1.5140234609134495e-05, 1.7444835975766182e-05, 1.9749435523408465e-05, 2.2054035071050748e-05, 2.435863461869303e-05, 2.6663234166335315e-05, 2.8967835532967e-05, 3.127243689959869e-05, 3.357703462825157e-05, 3.5881635994883254e-05, 3.8186233723536134e-05, 4.049083509016782e-05, 4.279543645679951e-05, 4.510003418545239e-05, 4.7404635552084073e-05, 4.970923328073695e-05, 5.201383464736864e-05, 5.4318436014000326e-05, 5.662303738063201e-05, 5.892763510928489e-05, 6.123223283793777e-05, 6.353683420456946e-05, 6.584143557120115e-05, 6.814603693783283e-05, 7.045063830446452e-05, 7.275523239513859e-05, 7.505983376177028e-05, 7.736443512840196e-05]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 8.0, 11.0, 14.0, 22.0, 25.0, 34.0, 56.0, 74.0, 114.0, 176.0, 209.0, 352.0, 557.0, 785.0, 1305.0, 2018.0, 3349.0, 5579.0, 9672.0, 17128.0, 31879.0, 61986.0, 136720.0, 329436.0, 243040.0, 97965.0, 47813.0, 24704.0, 13533.0, 7854.0, 4501.0, 2766.0, 1705.0, 1070.0, 687.0, 444.0, 294.0, 203.0, 144.0, 89.0, 79.0, 40.0, 39.0, 29.0, 17.0, 8.0, 11.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0001742839813232422, -0.0001691281795501709, -0.0001639723777770996, -0.00015881657600402832, -0.00015366077423095703, -0.00014850497245788574, -0.00014334917068481445, -0.00013819336891174316, -0.00013303756713867188, -0.00012788176536560059, -0.0001227259635925293, -0.00011757016181945801, -0.00011241436004638672, -0.00010725855827331543, -0.00010210275650024414, -9.694695472717285e-05, -9.179115295410156e-05, -8.663535118103027e-05, -8.147954940795898e-05, -7.63237476348877e-05, -7.11679458618164e-05, -6.601214408874512e-05, -6.085634231567383e-05, -5.570054054260254e-05, -5.054473876953125e-05, -4.538893699645996e-05, -4.023313522338867e-05, -3.507733345031738e-05, -2.9921531677246094e-05, -2.4765729904174805e-05, -1.9609928131103516e-05, -1.4454126358032227e-05, -9.298324584960938e-06, -4.1425228118896484e-06, 1.0132789611816406e-06, 6.16908073425293e-06, 1.1324882507324219e-05, 1.6480684280395508e-05, 2.1636486053466797e-05, 2.6792287826538086e-05, 3.1948089599609375e-05, 3.7103891372680664e-05, 4.225969314575195e-05, 4.741549491882324e-05, 5.257129669189453e-05, 5.772709846496582e-05, 6.288290023803711e-05, 6.80387020111084e-05, 7.319450378417969e-05, 7.835030555725098e-05, 8.350610733032227e-05, 8.866190910339355e-05, 9.381771087646484e-05, 9.897351264953613e-05, 0.00010412931442260742, 0.00010928511619567871, 0.00011444091796875, 0.00011959671974182129, 0.00012475252151489258, 0.00012990832328796387, 0.00013506412506103516, 0.00014021992683410645, 0.00014537572860717773, 0.00015053153038024902, 0.0001556873321533203]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 5.0, 4.0, 9.0, 11.0, 18.0, 15.0, 29.0, 24.0, 37.0, 32.0, 43.0, 48.0, 51.0, 41.0, 44.0, 55.0, 66.0, 51.0, 46.0, 44.0, 65.0, 43.0, 39.0, 38.0, 27.0, 14.0, 25.0, 18.0, 13.0, 11.0, 10.0, 6.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.26173210144043e-05, -4.121754318475723e-05, -3.981776535511017e-05, -3.8417987525463104e-05, -3.701820969581604e-05, -3.5618431866168976e-05, -3.421865403652191e-05, -3.281887620687485e-05, -3.141909837722778e-05, -3.001932054758072e-05, -2.8619542717933655e-05, -2.721976488828659e-05, -2.5819987058639526e-05, -2.4420209228992462e-05, -2.3020431399345398e-05, -2.1620653569698334e-05, -2.022087574005127e-05, -1.8821097910404205e-05, -1.742132008075714e-05, -1.6021542251110077e-05, -1.4621764421463013e-05, -1.3221986591815948e-05, -1.1822208762168884e-05, -1.042243093252182e-05, -9.022653102874756e-06, -7.622875273227692e-06, -6.2230974435806274e-06, -4.823319613933563e-06, -3.423541784286499e-06, -2.023763954639435e-06, -6.239861249923706e-07, 7.757917046546936e-07, 2.175569534301758e-06, 3.575347363948822e-06, 4.975125193595886e-06, 6.3749030232429504e-06, 7.774680852890015e-06, 9.174458682537079e-06, 1.0574236512184143e-05, 1.1974014341831207e-05, 1.3373792171478271e-05, 1.4773570001125336e-05, 1.61733478307724e-05, 1.7573125660419464e-05, 1.897290349006653e-05, 2.0372681319713593e-05, 2.1772459149360657e-05, 2.317223697900772e-05, 2.4572014808654785e-05, 2.597179263830185e-05, 2.7371570467948914e-05, 2.8771348297595978e-05, 3.0171126127243042e-05, 3.1570903956890106e-05, 3.297068178653717e-05, 3.4370459616184235e-05, 3.57702374458313e-05, 3.717001527547836e-05, 3.856979310512543e-05, 3.996957093477249e-05, 4.1369348764419556e-05, 4.276912659406662e-05, 4.4168904423713684e-05, 4.556868225336075e-05, 4.696846008300781e-05]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 4.0, 7.0, 19.0, 11.0, 34.0, 43.0, 59.0, 101.0, 119.0, 260.0, 336.0, 528.0, 844.0, 1326.0, 2109.0, 3376.0, 5397.0, 9040.0, 15521.0, 25707.0, 45783.0, 86733.0, 193623.0, 324722.0, 161179.0, 73999.0, 40029.0, 23090.0, 13521.0, 8178.0, 4795.0, 2980.0, 1765.0, 1161.0, 778.0, 457.0, 286.0, 206.0, 125.0, 87.0, 66.0, 36.0, 38.0, 27.0, 4.0, 10.0, 14.0, 5.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00011259317398071289, -0.00010900571942329407, -0.00010541826486587524, -0.00010183081030845642, -9.82433557510376e-05, -9.465590119361877e-05, -9.106844663619995e-05, -8.748099207878113e-05, -8.38935375213623e-05, -8.030608296394348e-05, -7.671862840652466e-05, -7.313117384910583e-05, -6.954371929168701e-05, -6.595626473426819e-05, -6.236881017684937e-05, -5.878135561943054e-05, -5.519390106201172e-05, -5.1606446504592896e-05, -4.801899194717407e-05, -4.443153738975525e-05, -4.0844082832336426e-05, -3.72566282749176e-05, -3.366917371749878e-05, -3.0081719160079956e-05, -2.6494264602661133e-05, -2.290681004524231e-05, -1.9319355487823486e-05, -1.5731900930404663e-05, -1.214444637298584e-05, -8.556991815567017e-06, -4.969537258148193e-06, -1.3820827007293701e-06, 2.205371856689453e-06, 5.792826414108276e-06, 9.3802809715271e-06, 1.2967735528945923e-05, 1.6555190086364746e-05, 2.014264464378357e-05, 2.3730099201202393e-05, 2.7317553758621216e-05, 3.090500831604004e-05, 3.449246287345886e-05, 3.8079917430877686e-05, 4.166737198829651e-05, 4.525482654571533e-05, 4.8842281103134155e-05, 5.242973566055298e-05, 5.60171902179718e-05, 5.9604644775390625e-05, 6.319209933280945e-05, 6.677955389022827e-05, 7.03670084476471e-05, 7.395446300506592e-05, 7.754191756248474e-05, 8.112937211990356e-05, 8.471682667732239e-05, 8.830428123474121e-05, 9.189173579216003e-05, 9.547919034957886e-05, 9.906664490699768e-05, 0.0001026540994644165, 0.00010624155402183533, 0.00010982900857925415, 0.00011341646313667297, 0.0001170039176940918]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 10.0, 5.0, 8.0, 9.0, 18.0, 18.0, 15.0, 22.0, 24.0, 24.0, 25.0, 26.0, 29.0, 24.0, 30.0, 39.0, 40.0, 37.0, 47.0, 37.0, 45.0, 43.0, 45.0, 60.0, 46.0, 36.0, 33.0, 38.0, 33.0, 20.0, 22.0, 14.0, 15.0, 17.0, 10.0, 11.0, 10.0, 7.0, 3.0, 4.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.808736801147461e-05, -3.6928802728652954e-05, -3.57702374458313e-05, -3.4611672163009644e-05, -3.345310688018799e-05, -3.229454159736633e-05, -3.113597631454468e-05, -2.9977411031723022e-05, -2.8818845748901367e-05, -2.7660280466079712e-05, -2.6501715183258057e-05, -2.53431499004364e-05, -2.4184584617614746e-05, -2.302601933479309e-05, -2.1867454051971436e-05, -2.070888876914978e-05, -1.9550323486328125e-05, -1.839175820350647e-05, -1.7233192920684814e-05, -1.607462763786316e-05, -1.4916062355041504e-05, -1.3757497072219849e-05, -1.2598931789398193e-05, -1.1440366506576538e-05, -1.0281801223754883e-05, -9.123235940933228e-06, -7.964670658111572e-06, -6.806105375289917e-06, -5.647540092468262e-06, -4.4889748096466064e-06, -3.330409526824951e-06, -2.171844244003296e-06, -1.0132789611816406e-06, 1.4528632164001465e-07, 1.30385160446167e-06, 2.462416887283325e-06, 3.6209821701049805e-06, 4.779547452926636e-06, 5.938112735748291e-06, 7.096678018569946e-06, 8.255243301391602e-06, 9.413808584213257e-06, 1.0572373867034912e-05, 1.1730939149856567e-05, 1.2889504432678223e-05, 1.4048069715499878e-05, 1.5206634998321533e-05, 1.636520028114319e-05, 1.7523765563964844e-05, 1.86823308467865e-05, 1.9840896129608154e-05, 2.099946141242981e-05, 2.2158026695251465e-05, 2.331659197807312e-05, 2.4475157260894775e-05, 2.563372254371643e-05, 2.6792287826538086e-05, 2.795085310935974e-05, 2.9109418392181396e-05, 3.0267983675003052e-05, 3.142654895782471e-05, 3.258511424064636e-05, 3.374367952346802e-05, 3.490224480628967e-05, 3.606081008911133e-05]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 5.0, 2.0, 5.0, 5.0, 15.0, 12.0, 17.0, 23.0, 44.0, 66.0, 61.0, 112.0, 164.0, 233.0, 365.0, 560.0, 1098.0, 1807.0, 3561.0, 8160.0, 30034.0, 176563.0, 729292.0, 67145.0, 17344.0, 5551.0, 2639.0, 1380.0, 868.0, 453.0, 309.0, 223.0, 140.0, 76.0, 60.0, 37.0, 35.0, 27.0, 22.0, 15.0, 8.0, 5.0, 8.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6689300537109375e-05, -1.6137957572937012e-05, -1.558661460876465e-05, -1.5035271644592285e-05, -1.4483928680419922e-05, -1.3932585716247559e-05, -1.3381242752075195e-05, -1.2829899787902832e-05, -1.2278556823730469e-05, -1.1727213859558105e-05, -1.1175870895385742e-05, -1.0624527931213379e-05, -1.0073184967041016e-05, -9.521842002868652e-06, -8.970499038696289e-06, -8.419156074523926e-06, -7.867813110351562e-06, -7.316470146179199e-06, -6.765127182006836e-06, -6.213784217834473e-06, -5.662441253662109e-06, -5.111098289489746e-06, -4.559755325317383e-06, -4.0084123611450195e-06, -3.4570693969726562e-06, -2.905726432800293e-06, -2.3543834686279297e-06, -1.8030405044555664e-06, -1.2516975402832031e-06, -7.003545761108398e-07, -1.4901161193847656e-07, 4.023313522338867e-07, 9.5367431640625e-07, 1.5050172805786133e-06, 2.0563602447509766e-06, 2.60770320892334e-06, 3.159046173095703e-06, 3.7103891372680664e-06, 4.26173210144043e-06, 4.813075065612793e-06, 5.364418029785156e-06, 5.9157609939575195e-06, 6.467103958129883e-06, 7.018446922302246e-06, 7.569789886474609e-06, 8.121132850646973e-06, 8.672475814819336e-06, 9.2238187789917e-06, 9.775161743164062e-06, 1.0326504707336426e-05, 1.0877847671508789e-05, 1.1429190635681152e-05, 1.1980533599853516e-05, 1.2531876564025879e-05, 1.3083219528198242e-05, 1.3634562492370605e-05, 1.4185905456542969e-05, 1.4737248420715332e-05, 1.5288591384887695e-05, 1.583993434906006e-05, 1.6391277313232422e-05, 1.6942620277404785e-05, 1.749396324157715e-05, 1.8045306205749512e-05, 1.8596649169921875e-05]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 7.0, 0.0, 6.0, 0.0, 14.0, 16.0, 0.0, 22.0, 65.0, 0.0, 109.0, 165.0, 0.0, 192.0, 0.0, 163.0, 113.0, 0.0, 48.0, 32.0, 0.0, 17.0, 11.0, 0.0, 10.0, 5.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.430511474609375e-06, -1.3923272490501404e-06, -1.3541430234909058e-06, -1.3159587979316711e-06, -1.2777745723724365e-06, -1.239590346813202e-06, -1.2014061212539673e-06, -1.1632218956947327e-06, -1.125037670135498e-06, -1.0868534445762634e-06, -1.0486692190170288e-06, -1.0104849934577942e-06, -9.723007678985596e-07, -9.34116542339325e-07, -8.959323167800903e-07, -8.577480912208557e-07, -8.195638656616211e-07, -7.813796401023865e-07, -7.431954145431519e-07, -7.050111889839172e-07, -6.668269634246826e-07, -6.28642737865448e-07, -5.904585123062134e-07, -5.522742867469788e-07, -5.140900611877441e-07, -4.759058356285095e-07, -4.377216100692749e-07, -3.995373845100403e-07, -3.6135315895080566e-07, -3.2316893339157104e-07, -2.849847078323364e-07, -2.468004822731018e-07, -2.086162567138672e-07, -1.7043203115463257e-07, -1.3224780559539795e-07, -9.406358003616333e-08, -5.587935447692871e-08, -1.7695128917694092e-08, 2.0489096641540527e-08, 5.8673322200775146e-08, 9.685754776000977e-08, 1.3504177331924438e-07, 1.73225998878479e-07, 2.1141022443771362e-07, 2.4959444999694824e-07, 2.8777867555618286e-07, 3.259629011154175e-07, 3.641471266746521e-07, 4.023313522338867e-07, 4.4051557779312134e-07, 4.78699803352356e-07, 5.168840289115906e-07, 5.550682544708252e-07, 5.932524800300598e-07, 6.314367055892944e-07, 6.69620931148529e-07, 7.078051567077637e-07, 7.459893822669983e-07, 7.841736078262329e-07, 8.223578333854675e-07, 8.605420589447021e-07, 8.987262845039368e-07, 9.369105100631714e-07, 9.75094735622406e-07, 1.0132789611816406e-06]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 10.0, 10.0, 16.0, 16.0, 22.0, 31.0, 45.0, 64.0, 37.0, 72.0, 132.0, 142.0, 232.0, 308.0, 450.0, 638.0, 872.0, 1261.0, 1989.0, 3162.0, 5183.0, 9341.0, 18852.0, 45546.0, 77272.0, 492126.0, 271450.0, 66017.0, 24405.0, 11580.0, 6276.0, 3753.0, 2283.0, 1494.0, 1007.0, 699.0, 474.0, 359.0, 245.0, 192.0, 89.0, 89.0, 76.0, 53.0, 43.0, 39.0, 29.0, 19.0, 13.0, 15.0, 7.0, 8.0, 2.0, 3.0, 5.0, 3.0, 1.0], "bins": [-5.7220458984375e-06, -5.54695725440979e-06, -5.37186861038208e-06, -5.19677996635437e-06, -5.02169132232666e-06, -4.84660267829895e-06, -4.67151403427124e-06, -4.49642539024353e-06, -4.32133674621582e-06, -4.14624810218811e-06, -3.9711594581604e-06, -3.7960708141326904e-06, -3.6209821701049805e-06, -3.4458935260772705e-06, -3.2708048820495605e-06, -3.0957162380218506e-06, -2.9206275939941406e-06, -2.7455389499664307e-06, -2.5704503059387207e-06, -2.3953616619110107e-06, -2.2202730178833008e-06, -2.045184373855591e-06, -1.8700957298278809e-06, -1.695007085800171e-06, -1.519918441772461e-06, -1.344829797744751e-06, -1.169741153717041e-06, -9.94652509689331e-07, -8.195638656616211e-07, -6.444752216339111e-07, -4.6938657760620117e-07, -2.942979335784912e-07, -1.1920928955078125e-07, 5.587935447692871e-08, 2.3096799850463867e-07, 4.0605664253234863e-07, 5.811452865600586e-07, 7.562339305877686e-07, 9.313225746154785e-07, 1.1064112186431885e-06, 1.2814998626708984e-06, 1.4565885066986084e-06, 1.6316771507263184e-06, 1.8067657947540283e-06, 1.9818544387817383e-06, 2.1569430828094482e-06, 2.332031726837158e-06, 2.507120370864868e-06, 2.682209014892578e-06, 2.857297658920288e-06, 3.032386302947998e-06, 3.207474946975708e-06, 3.382563591003418e-06, 3.557652235031128e-06, 3.732740879058838e-06, 3.907829523086548e-06, 4.082918167114258e-06, 4.258006811141968e-06, 4.433095455169678e-06, 4.608184099197388e-06, 4.783272743225098e-06, 4.958361387252808e-06, 5.133450031280518e-06, 5.3085386753082275e-06, 5.4836273193359375e-06]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 8.0, 6.0, 3.0, 5.0, 13.0, 19.0, 15.0, 21.0, 39.0, 51.0, 67.0, 77.0, 102.0, 113.0, 97.0, 88.0, 76.0, 49.0, 37.0, 21.0, 19.0, 18.0, 10.0, 10.0, 2.0, 6.0, 3.0, 1.0, 7.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8477439880371094e-06, -1.7872080206871033e-06, -1.7266720533370972e-06, -1.666136085987091e-06, -1.605600118637085e-06, -1.5450641512870789e-06, -1.4845281839370728e-06, -1.4239922165870667e-06, -1.3634562492370605e-06, -1.3029202818870544e-06, -1.2423843145370483e-06, -1.1818483471870422e-06, -1.1213123798370361e-06, -1.06077641248703e-06, -1.000240445137024e-06, -9.397044777870178e-07, -8.791685104370117e-07, -8.186325430870056e-07, -7.580965757369995e-07, -6.975606083869934e-07, -6.370246410369873e-07, -5.764886736869812e-07, -5.159527063369751e-07, -4.55416738986969e-07, -3.948807716369629e-07, -3.343448042869568e-07, -2.738088369369507e-07, -2.1327286958694458e-07, -1.5273690223693848e-07, -9.220093488693237e-08, -3.166496753692627e-08, 2.8870999813079834e-08, 8.940696716308594e-08, 1.4994293451309204e-07, 2.1047890186309814e-07, 2.7101486921310425e-07, 3.3155083656311035e-07, 3.9208680391311646e-07, 4.5262277126312256e-07, 5.131587386131287e-07, 5.736947059631348e-07, 6.342306733131409e-07, 6.94766640663147e-07, 7.553026080131531e-07, 8.158385753631592e-07, 8.763745427131653e-07, 9.369105100631714e-07, 9.974464774131775e-07, 1.0579824447631836e-06, 1.1185184121131897e-06, 1.1790543794631958e-06, 1.239590346813202e-06, 1.300126314163208e-06, 1.3606622815132141e-06, 1.4211982488632202e-06, 1.4817342162132263e-06, 1.5422701835632324e-06, 1.6028061509132385e-06, 1.6633421182632446e-06, 1.7238780856132507e-06, 1.7844140529632568e-06, 1.844950020313263e-06, 1.905485987663269e-06, 1.966021955013275e-06, 2.0265579223632812e-06]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 2.0, 2.0, 6.0, 9.0, 9.0, 15.0, 14.0, 12.0, 17.0, 24.0, 31.0, 35.0, 40.0, 49.0, 100.0, 107.0, 127.0, 100.0, 64.0, 40.0, 46.0, 33.0, 29.0, 19.0, 8.0, 9.0, 13.0, 12.0, 5.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.968936602585018e-05, -5.776734906248748e-05, -5.5845335737103596e-05, -5.39233187737409e-05, -5.2001305448357016e-05, -5.007928848499432e-05, -4.815727152163163e-05, -4.623525819624774e-05, -4.4313244870863855e-05, -4.239122790750116e-05, -4.0469214582117274e-05, -3.854719761875458e-05, -3.6625184293370694e-05, -3.4703167330008e-05, -3.2781150366645306e-05, -3.085913704126142e-05, -2.8937120077898726e-05, -2.7015104933525436e-05, -2.5093089789152145e-05, -2.317107282578945e-05, -2.1249059500405565e-05, -1.932704253704287e-05, -1.740502739266958e-05, -1.548301224829629e-05, -1.3560997103923e-05, -1.163898195954971e-05, -9.71696681517642e-06, -7.794950761308428e-06, -5.872935616935138e-06, -3.950920472561847e-06, -2.0289044186938554e-06, -1.0688927432056516e-07, 1.815125870052725e-06, 3.7371412417996908e-06, 5.6591566135466564e-06, 7.5811722126672976e-06, 9.503187357040588e-06, 1.1425202501413878e-05, 1.334721855528187e-05, 1.526923369965516e-05, 1.719124884402845e-05, 1.911326398840174e-05, 2.103527913277503e-05, 2.295729427714832e-05, 2.4879311240511015e-05, 2.6801324565894902e-05, 2.8723341529257596e-05, 3.064535849262029e-05, 3.2567371818004176e-05, 3.448938878136687e-05, 3.6411402106750757e-05, 3.833341907011345e-05, 4.025543239549734e-05, 4.217744935886003e-05, 4.409946268424392e-05, 4.602147964760661e-05, 4.7943496610969305e-05, 4.9865513574332e-05, 5.1787526899715886e-05, 5.370954386307858e-05, 5.5631557188462466e-05, 5.755357415182516e-05, 5.9475591115187854e-05, 6.139760080259293e-05, 6.331961776595563e-05]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 6.0, 4.0, 6.0, 11.0, 6.0, 6.0, 2.0, 11.0, 12.0, 12.0, 25.0, 17.0, 24.0, 36.0, 31.0, 27.0, 39.0, 51.0, 40.0, 44.0, 48.0, 43.0, 45.0, 29.0, 40.0, 34.0, 43.0, 45.0, 35.0, 30.0, 29.0, 23.0, 25.0, 21.0, 22.0, 18.0, 13.0, 10.0, 16.0, 7.0, 4.0, 3.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.544032708508894e-05, -4.411777263158001e-05, -4.279521817807108e-05, -4.147266736254096e-05, -4.015011290903203e-05, -3.8827558455523103e-05, -3.7505004002014175e-05, -3.618244954850525e-05, -3.4859898732975125e-05, -3.35373442794662e-05, -3.221478982595727e-05, -3.089223901042715e-05, -2.956968455691822e-05, -2.824713010340929e-05, -2.6924575649900362e-05, -2.5602021196391433e-05, -2.4279466742882505e-05, -2.2956912289373577e-05, -2.1634359654854052e-05, -2.0311805201345123e-05, -1.89892525668256e-05, -1.766669811331667e-05, -1.634414365980774e-05, -1.5021590115793515e-05, -1.3699036571779288e-05, -1.2376483027765062e-05, -1.1053929483750835e-05, -9.731375030241907e-06, -8.40882148622768e-06, -7.086267942213453e-06, -5.763713488704525e-06, -4.441159944690298e-06, -3.1186027626972646e-06, -1.7960489913093625e-06, -4.734952199214604e-07, 8.490587788401172e-07, 2.171612322854344e-06, 3.4941658668685704e-06, 4.816720320377499e-06, 6.1392738643917255e-06, 7.461827408405952e-06, 8.784380952420179e-06, 1.0106934496434405e-05, 1.1429488949943334e-05, 1.275204249395756e-05, 1.4074596037971787e-05, 1.5397150491480716e-05, 1.671970312600024e-05, 1.804225757950917e-05, 1.9364812033018097e-05, 2.0687364667537622e-05, 2.200991912104655e-05, 2.3332471755566075e-05, 2.4655026209075004e-05, 2.5977580662583932e-05, 2.730013511609286e-05, 2.8622687750612386e-05, 2.9945242204121314e-05, 3.126779483864084e-05, 3.259034929214977e-05, 3.3912903745658696e-05, 3.523545456118882e-05, 3.655801265267655e-05, 3.7880563468206674e-05, 3.92031179217156e-05]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 8.0, 13.0, 20.0, 20.0, 27.0, 22.0, 40.0, 75.0, 76.0, 95.0, 115.0, 197.0, 261.0, 334.0, 442.0, 615.0, 775.0, 1079.0, 1477.0, 2253.0, 3174.0, 5089.0, 8694.0, 16897.0, 74143.0, 3763421.0, 263688.0, 21706.0, 10663.0, 5892.0, 3912.0, 2496.0, 1687.0, 1247.0, 1014.0, 677.0, 466.0, 409.0, 296.0, 193.0, 136.0, 132.0, 97.0, 49.0, 41.0, 35.0, 22.0, 20.0, 9.0, 12.0, 6.0, 3.0, 4.0, 5.0, 6.0, 1.0], "bins": [-0.00011926889419555664, -0.00011572428047657013, -0.00011217966675758362, -0.00010863505303859711, -0.0001050904393196106, -0.00010154582560062408, -9.800121188163757e-05, -9.445659816265106e-05, -9.091198444366455e-05, -8.736737072467804e-05, -8.382275700569153e-05, -8.027814328670502e-05, -7.67335295677185e-05, -7.3188915848732e-05, -6.964430212974548e-05, -6.609968841075897e-05, -6.255507469177246e-05, -5.901046097278595e-05, -5.546584725379944e-05, -5.192123353481293e-05, -4.8376619815826416e-05, -4.4832006096839905e-05, -4.1287392377853394e-05, -3.774277865886688e-05, -3.419816493988037e-05, -3.065355122089386e-05, -2.710893750190735e-05, -2.3564323782920837e-05, -2.0019710063934326e-05, -1.6475096344947815e-05, -1.2930482625961304e-05, -9.385868906974792e-06, -5.841255187988281e-06, -2.29664146900177e-06, 1.2479722499847412e-06, 4.7925859689712524e-06, 8.337199687957764e-06, 1.1881813406944275e-05, 1.5426427125930786e-05, 1.8971040844917297e-05, 2.251565456390381e-05, 2.606026828289032e-05, 2.960488200187683e-05, 3.314949572086334e-05, 3.6694109439849854e-05, 4.0238723158836365e-05, 4.3783336877822876e-05, 4.732795059680939e-05, 5.08725643157959e-05, 5.441717803478241e-05, 5.796179175376892e-05, 6.150640547275543e-05, 6.505101919174194e-05, 6.859563291072845e-05, 7.214024662971497e-05, 7.568486034870148e-05, 7.922947406768799e-05, 8.27740877866745e-05, 8.631870150566101e-05, 8.986331522464752e-05, 9.340792894363403e-05, 9.695254266262054e-05, 0.00010049715638160706, 0.00010404177010059357, 0.00010758638381958008]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 9.0, 4.0, 8.0, 10.0, 4.0, 5.0, 13.0, 10.0, 19.0, 17.0, 21.0, 18.0, 24.0, 32.0, 31.0, 39.0, 46.0, 34.0, 43.0, 43.0, 40.0, 49.0, 30.0, 33.0, 39.0, 50.0, 40.0, 33.0, 34.0, 33.0, 25.0, 21.0, 22.0, 23.0, 13.0, 15.0, 11.0, 10.0, 17.0, 16.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-2.580881118774414e-05, -2.5044195353984833e-05, -2.4279579520225525e-05, -2.3514963686466217e-05, -2.275034785270691e-05, -2.19857320189476e-05, -2.1221116185188293e-05, -2.0456500351428986e-05, -1.9691884517669678e-05, -1.892726868391037e-05, -1.8162652850151062e-05, -1.7398037016391754e-05, -1.6633421182632446e-05, -1.586880534887314e-05, -1.510418951511383e-05, -1.4339573681354523e-05, -1.3574957847595215e-05, -1.2810342013835907e-05, -1.2045726180076599e-05, -1.1281110346317291e-05, -1.0516494512557983e-05, -9.751878678798676e-06, -8.987262845039368e-06, -8.22264701128006e-06, -7.458031177520752e-06, -6.693415343761444e-06, -5.928799510002136e-06, -5.164183676242828e-06, -4.3995678424835205e-06, -3.6349520087242126e-06, -2.8703361749649048e-06, -2.105720341205597e-06, -1.341104507446289e-06, -5.764886736869812e-07, 1.8812716007232666e-07, 9.527429938316345e-07, 1.7173588275909424e-06, 2.4819746613502502e-06, 3.246590495109558e-06, 4.011206328868866e-06, 4.775822162628174e-06, 5.540437996387482e-06, 6.3050538301467896e-06, 7.069669663906097e-06, 7.834285497665405e-06, 8.598901331424713e-06, 9.363517165184021e-06, 1.0128132998943329e-05, 1.0892748832702637e-05, 1.1657364666461945e-05, 1.2421980500221252e-05, 1.318659633398056e-05, 1.3951212167739868e-05, 1.4715828001499176e-05, 1.5480443835258484e-05, 1.6245059669017792e-05, 1.70096755027771e-05, 1.7774291336536407e-05, 1.8538907170295715e-05, 1.9303523004055023e-05, 2.006813883781433e-05, 2.083275467157364e-05, 2.1597370505332947e-05, 2.2361986339092255e-05, 2.3126602172851562e-05]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 4.0, 5.0, 6.0, 14.0, 26.0, 30.0, 44.0, 89.0, 131.0, 235.0, 447.0, 1002.0, 1838.0, 4146.0, 9212.0, 25044.0, 104931.0, 3778242.0, 212266.0, 34599.0, 11958.0, 5170.0, 2292.0, 1221.0, 584.0, 335.0, 173.0, 101.0, 44.0, 27.0, 31.0, 12.0, 5.0, 8.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015246868133544922, -0.0001474916934967041, -0.00014251470565795898, -0.00013753771781921387, -0.00013256072998046875, -0.00012758374214172363, -0.00012260675430297852, -0.0001176297664642334, -0.00011265277862548828, -0.00010767579078674316, -0.00010269880294799805, -9.772181510925293e-05, -9.274482727050781e-05, -8.77678394317627e-05, -8.279085159301758e-05, -7.781386375427246e-05, -7.283687591552734e-05, -6.785988807678223e-05, -6.288290023803711e-05, -5.790591239929199e-05, -5.2928924560546875e-05, -4.795193672180176e-05, -4.297494888305664e-05, -3.7997961044311523e-05, -3.3020973205566406e-05, -2.804398536682129e-05, -2.3066997528076172e-05, -1.8090009689331055e-05, -1.3113021850585938e-05, -8.13603401184082e-06, -3.159046173095703e-06, 1.817941665649414e-06, 6.794929504394531e-06, 1.1771917343139648e-05, 1.6748905181884766e-05, 2.1725893020629883e-05, 2.6702880859375e-05, 3.167986869812012e-05, 3.6656856536865234e-05, 4.163384437561035e-05, 4.661083221435547e-05, 5.1587820053100586e-05, 5.65648078918457e-05, 6.154179573059082e-05, 6.651878356933594e-05, 7.149577140808105e-05, 7.647275924682617e-05, 8.144974708557129e-05, 8.64267349243164e-05, 9.140372276306152e-05, 9.638071060180664e-05, 0.00010135769844055176, 0.00010633468627929688, 0.00011131167411804199, 0.00011628866195678711, 0.00012126564979553223, 0.00012624263763427734, 0.00013121962547302246, 0.00013619661331176758, 0.0001411736011505127, 0.0001461505889892578, 0.00015112757682800293, 0.00015610456466674805, 0.00016108155250549316, 0.00016605854034423828]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 4.0, 5.0, 6.0, 10.0, 9.0, 13.0, 11.0, 16.0, 21.0, 33.0, 44.0, 101.0, 265.0, 826.0, 1735.0, 490.0, 180.0, 70.0, 47.0, 32.0, 30.0, 21.0, 17.0, 9.0, 14.0, 9.0, 11.0, 6.0, 8.0, 2.0, 5.0, 6.0, 3.0, 1.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6047229766845703e-05, -2.52649188041687e-05, -2.44826078414917e-05, -2.3700296878814697e-05, -2.2917985916137695e-05, -2.2135674953460693e-05, -2.135336399078369e-05, -2.057105302810669e-05, -1.9788742065429688e-05, -1.9006431102752686e-05, -1.8224120140075684e-05, -1.744180917739868e-05, -1.665949821472168e-05, -1.5877187252044678e-05, -1.5094876289367676e-05, -1.4312565326690674e-05, -1.3530254364013672e-05, -1.274794340133667e-05, -1.1965632438659668e-05, -1.1183321475982666e-05, -1.0401010513305664e-05, -9.618699550628662e-06, -8.83638858795166e-06, -8.054077625274658e-06, -7.271766662597656e-06, -6.489455699920654e-06, -5.707144737243652e-06, -4.92483377456665e-06, -4.1425228118896484e-06, -3.3602118492126465e-06, -2.5779008865356445e-06, -1.7955899238586426e-06, -1.0132789611816406e-06, -2.3096799850463867e-07, 5.513429641723633e-07, 1.3336539268493652e-06, 2.115964889526367e-06, 2.898275852203369e-06, 3.680586814880371e-06, 4.462897777557373e-06, 5.245208740234375e-06, 6.027519702911377e-06, 6.809830665588379e-06, 7.592141628265381e-06, 8.374452590942383e-06, 9.156763553619385e-06, 9.939074516296387e-06, 1.0721385478973389e-05, 1.150369644165039e-05, 1.2286007404327393e-05, 1.3068318367004395e-05, 1.3850629329681396e-05, 1.4632940292358398e-05, 1.54152512550354e-05, 1.6197562217712402e-05, 1.6979873180389404e-05, 1.7762184143066406e-05, 1.8544495105743408e-05, 1.932680606842041e-05, 2.0109117031097412e-05, 2.0891427993774414e-05, 2.1673738956451416e-05, 2.2456049919128418e-05, 2.323836088180542e-05, 2.4020671844482422e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0, 6.0, 7.0, 6.0, 8.0, 15.0, 25.0, 28.0, 38.0, 41.0, 64.0, 80.0, 160.0, 157.0, 109.0, 69.0, 53.0, 38.0, 25.0, 20.0, 12.0, 11.0, 9.0, 2.0, 1.0, 2.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.573209975613281e-05, -6.395512900780886e-05, -6.217815825948492e-05, -6.040119114913978e-05, -5.862422040081583e-05, -5.684725329047069e-05, -5.507028254214674e-05, -5.3293311793822795e-05, -5.151634104549885e-05, -4.97393702971749e-05, -4.796240318682976e-05, -4.6185432438505813e-05, -4.4408461690181866e-05, -4.2631494579836726e-05, -4.085452383151278e-05, -3.907755308318883e-05, -3.730058597284369e-05, -3.5523615224519745e-05, -3.3746648114174604e-05, -3.196967736585066e-05, -3.019270661752671e-05, -2.8415737688192166e-05, -2.6638768758857623e-05, -2.4861798010533676e-05, -2.3084829081199132e-05, -2.1307860151864588e-05, -1.953088940354064e-05, -1.7753920474206097e-05, -1.5976951544871554e-05, -1.4199980796547607e-05, -1.2423011867213063e-05, -1.0646042028383818e-05, -8.869068551575765e-06, -7.09209871274652e-06, -5.315129328664625e-06, -3.5381599445827305e-06, -1.7611901057534851e-06, 1.5779733075760305e-08, 1.792748662410304e-06, 3.5697185012395494e-06, 5.346688340068795e-06, 7.12365817889804e-06, 8.900628017727286e-06, 1.067759694706183e-05, 1.2454566785891075e-05, 1.423153662472032e-05, 1.6008505554054864e-05, 1.7785474483389407e-05, 1.9562445231713355e-05, 2.1339414161047898e-05, 2.3116384909371845e-05, 2.489335383870639e-05, 2.6670324587030336e-05, 2.844729351636488e-05, 3.0224262445699424e-05, 3.200123319402337e-05, 3.377820394234732e-05, 3.5555174690671265e-05, 3.7332141801016405e-05, 3.910911254934035e-05, 4.08860832976643e-05, 4.266305040800944e-05, 4.444002115633339e-05, 4.6216991904657334e-05, 4.7993959015002474e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 10.0, 9.0, 16.0, 15.0, 16.0, 13.0, 12.0, 27.0, 30.0, 21.0, 28.0, 38.0, 33.0, 30.0, 36.0, 51.0, 44.0, 33.0, 37.0, 29.0, 38.0, 44.0, 35.0, 32.0, 37.0, 30.0, 30.0, 19.0, 25.0, 25.0, 23.0, 19.0, 19.0, 12.0, 9.0, 12.0, 7.0, 8.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.827235948643647e-05, -2.7422167477197945e-05, -2.6571977286948822e-05, -2.5721785277710296e-05, -2.4871595087461174e-05, -2.4021403078222647e-05, -2.317121106898412e-05, -2.2321020878735e-05, -2.1470828869496472e-05, -2.0620636860257946e-05, -1.9770446670008823e-05, -1.8920254660770297e-05, -1.8070064470521174e-05, -1.7219872461282648e-05, -1.6369682271033525e-05, -1.5519490261795e-05, -1.4669299162051175e-05, -1.381910806230735e-05, -1.2968916962563526e-05, -1.2118725862819701e-05, -1.1268533853581175e-05, -1.041834275383735e-05, -9.568151654093526e-06, -8.717959644855e-06, -7.867769454605877e-06, -7.017578354862053e-06, -6.167386800370878e-06, -5.317195700627053e-06, -4.467004146135878e-06, -3.6168130463920534e-06, -2.766621946648229e-06, -1.9164303921570536e-06, -1.0662388376658782e-06, -2.160475673917972e-07, 6.341437028822838e-07, 1.484334916312946e-06, 2.334526243430446e-06, 3.184717570547946e-06, 4.03490867029177e-06, 4.885100224782946e-06, 5.73529132452677e-06, 6.5854824242705945e-06, 7.43567397876177e-06, 8.285865078505594e-06, 9.136056178249419e-06, 9.986248187487945e-06, 1.0836438377737068e-05, 1.1686630386975594e-05, 1.2536821486719418e-05, 1.3387012586463243e-05, 1.4237203686207067e-05, 1.5087394785950892e-05, 1.5937586795189418e-05, 1.678777698543854e-05, 1.7637968994677067e-05, 1.8488161003915593e-05, 1.9338351194164716e-05, 2.0188543203403242e-05, 2.1038733393652365e-05, 2.188892540289089e-05, 2.2739115593140014e-05, 2.358930760237854e-05, 2.4439497792627662e-05, 2.528968980186619e-05, 2.6139881811104715e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [5.0, 5.0, 4.0, 6.0, 4.0, 15.0, 9.0, 29.0, 24.0, 42.0, 65.0, 80.0, 98.0, 145.0, 211.0, 282.0, 426.0, 555.0, 822.0, 1082.0, 1568.0, 2379.0, 3322.0, 4920.0, 7070.0, 11825.0, 17152.0, 27066.0, 44565.0, 76825.0, 142774.0, 270283.0, 188826.0, 96821.0, 54730.0, 32951.0, 20644.0, 13119.0, 9230.0, 5731.0, 3886.0, 2651.0, 1782.0, 1308.0, 903.0, 680.0, 474.0, 340.0, 224.0, 174.0, 117.0, 93.0, 59.0, 57.0, 29.0, 23.0, 23.0, 12.0, 9.0, 11.0, 3.0, 3.0, 1.0, 4.0], "bins": [-2.849102020263672e-05, -2.7592293918132782e-05, -2.6693567633628845e-05, -2.579484134912491e-05, -2.489611506462097e-05, -2.3997388780117035e-05, -2.3098662495613098e-05, -2.219993621110916e-05, -2.1301209926605225e-05, -2.0402483642101288e-05, -1.950375735759735e-05, -1.8605031073093414e-05, -1.7706304788589478e-05, -1.680757850408554e-05, -1.5908852219581604e-05, -1.5010125935077667e-05, -1.411139965057373e-05, -1.3212673366069794e-05, -1.2313947081565857e-05, -1.141522079706192e-05, -1.0516494512557983e-05, -9.617768228054047e-06, -8.71904194355011e-06, -7.820315659046173e-06, -6.921589374542236e-06, -6.0228630900382996e-06, -5.124136805534363e-06, -4.225410521030426e-06, -3.3266842365264893e-06, -2.4279579520225525e-06, -1.5292316675186157e-06, -6.30505383014679e-07, 2.682209014892578e-07, 1.1669471859931946e-06, 2.0656734704971313e-06, 2.964399755001068e-06, 3.863126039505005e-06, 4.761852324008942e-06, 5.660578608512878e-06, 6.559304893016815e-06, 7.458031177520752e-06, 8.356757462024689e-06, 9.255483746528625e-06, 1.0154210031032562e-05, 1.1052936315536499e-05, 1.1951662600040436e-05, 1.2850388884544373e-05, 1.374911516904831e-05, 1.4647841453552246e-05, 1.5546567738056183e-05, 1.644529402256012e-05, 1.7344020307064056e-05, 1.8242746591567993e-05, 1.914147287607193e-05, 2.0040199160575867e-05, 2.0938925445079803e-05, 2.183765172958374e-05, 2.2736378014087677e-05, 2.3635104298591614e-05, 2.453383058309555e-05, 2.5432556867599487e-05, 2.6331283152103424e-05, 2.723000943660736e-05, 2.8128735721111298e-05, 2.9027462005615234e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 11.0, 12.0, 18.0, 7.0, 13.0, 12.0, 20.0, 29.0, 20.0, 27.0, 29.0, 26.0, 34.0, 49.0, 35.0, 40.0, 40.0, 42.0, 30.0, 44.0, 41.0, 44.0, 38.0, 34.0, 37.0, 28.0, 30.0, 23.0, 18.0, 29.0, 14.0, 19.0, 17.0, 11.0, 13.0, 12.0, 6.0, 6.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.9027462005615234e-05, -2.815108746290207e-05, -2.7274712920188904e-05, -2.639833837747574e-05, -2.5521963834762573e-05, -2.4645589292049408e-05, -2.3769214749336243e-05, -2.2892840206623077e-05, -2.2016465663909912e-05, -2.1140091121196747e-05, -2.026371657848358e-05, -1.9387342035770416e-05, -1.851096749305725e-05, -1.7634592950344086e-05, -1.675821840763092e-05, -1.5881843864917755e-05, -1.500546932220459e-05, -1.4129094779491425e-05, -1.325272023677826e-05, -1.2376345694065094e-05, -1.1499971151351929e-05, -1.0623596608638763e-05, -9.747222065925598e-06, -8.870847523212433e-06, -7.994472980499268e-06, -7.118098437786102e-06, -6.241723895072937e-06, -5.365349352359772e-06, -4.4889748096466064e-06, -3.612600266933441e-06, -2.736225724220276e-06, -1.8598511815071106e-06, -9.834766387939453e-07, -1.0710209608078003e-07, 7.692724466323853e-07, 1.6456469893455505e-06, 2.522021532058716e-06, 3.398396074771881e-06, 4.274770617485046e-06, 5.151145160198212e-06, 6.027519702911377e-06, 6.903894245624542e-06, 7.780268788337708e-06, 8.656643331050873e-06, 9.533017873764038e-06, 1.0409392416477203e-05, 1.1285766959190369e-05, 1.2162141501903534e-05, 1.30385160446167e-05, 1.3914890587329865e-05, 1.479126513004303e-05, 1.5667639672756195e-05, 1.654401421546936e-05, 1.7420388758182526e-05, 1.829676330089569e-05, 1.9173137843608856e-05, 2.004951238632202e-05, 2.0925886929035187e-05, 2.1802261471748352e-05, 2.2678636014461517e-05, 2.3555010557174683e-05, 2.4431385099887848e-05, 2.5307759642601013e-05, 2.618413418531418e-05, 2.7060508728027344e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 8.0, 12.0, 15.0, 14.0, 25.0, 34.0, 41.0, 69.0, 81.0, 143.0, 168.0, 239.0, 399.0, 589.0, 871.0, 1379.0, 2086.0, 3532.0, 5383.0, 9140.0, 17093.0, 29870.0, 67726.0, 180035.0, 468082.0, 144658.0, 53322.0, 27322.0, 13962.0, 8381.0, 5283.0, 2913.0, 1890.0, 1259.0, 763.0, 589.0, 375.0, 229.0, 183.0, 117.0, 88.0, 52.0, 34.0, 33.0, 21.0, 12.0, 17.0, 3.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.743171691894531e-05, -3.6275945603847504e-05, -3.5120174288749695e-05, -3.3964402973651886e-05, -3.280863165855408e-05, -3.165286034345627e-05, -3.049708902835846e-05, -2.934131771326065e-05, -2.8185546398162842e-05, -2.7029775083065033e-05, -2.5874003767967224e-05, -2.4718232452869415e-05, -2.3562461137771606e-05, -2.2406689822673798e-05, -2.125091850757599e-05, -2.009514719247818e-05, -1.893937587738037e-05, -1.7783604562282562e-05, -1.6627833247184753e-05, -1.5472061932086945e-05, -1.4316290616989136e-05, -1.3160519301891327e-05, -1.2004747986793518e-05, -1.084897667169571e-05, -9.6932053565979e-06, -8.537434041500092e-06, -7.381662726402283e-06, -6.225891411304474e-06, -5.070120096206665e-06, -3.914348781108856e-06, -2.7585774660110474e-06, -1.6028061509132385e-06, -4.470348358154297e-07, 7.087364792823792e-07, 1.864507794380188e-06, 3.020279109477997e-06, 4.176050424575806e-06, 5.3318217396736145e-06, 6.487593054771423e-06, 7.643364369869232e-06, 8.799135684967041e-06, 9.95490700006485e-06, 1.1110678315162659e-05, 1.2266449630260468e-05, 1.3422220945358276e-05, 1.4577992260456085e-05, 1.5733763575553894e-05, 1.6889534890651703e-05, 1.8045306205749512e-05, 1.920107752084732e-05, 2.035684883594513e-05, 2.1512620151042938e-05, 2.2668391466140747e-05, 2.3824162781238556e-05, 2.4979934096336365e-05, 2.6135705411434174e-05, 2.7291476726531982e-05, 2.844724804162979e-05, 2.96030193567276e-05, 3.075879067182541e-05, 3.191456198692322e-05, 3.3070333302021027e-05, 3.4226104617118835e-05, 3.5381875932216644e-05, 3.653764724731445e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 10.0, 4.0, 14.0, 7.0, 10.0, 12.0, 19.0, 21.0, 37.0, 27.0, 30.0, 22.0, 29.0, 39.0, 35.0, 49.0, 34.0, 21.0, 25.0, 55.0, 38.0, 37.0, 32.0, 36.0, 36.0, 31.0, 44.0, 38.0, 21.0, 25.0, 33.0, 13.0, 23.0, 22.0, 12.0, 6.0, 5.0, 12.0, 9.0, 6.0, 5.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.8775463104248047e-05, -1.8221326172351837e-05, -1.7667189240455627e-05, -1.7113052308559418e-05, -1.6558915376663208e-05, -1.6004778444766998e-05, -1.545064151287079e-05, -1.4896504580974579e-05, -1.4342367649078369e-05, -1.378823071718216e-05, -1.323409378528595e-05, -1.267995685338974e-05, -1.212581992149353e-05, -1.157168298959732e-05, -1.101754605770111e-05, -1.0463409125804901e-05, -9.909272193908691e-06, -9.355135262012482e-06, -8.800998330116272e-06, -8.246861398220062e-06, -7.692724466323853e-06, -7.138587534427643e-06, -6.584450602531433e-06, -6.030313670635223e-06, -5.476176738739014e-06, -4.922039806842804e-06, -4.367902874946594e-06, -3.8137659430503845e-06, -3.259629011154175e-06, -2.705492079257965e-06, -2.1513551473617554e-06, -1.5972182154655457e-06, -1.043081283569336e-06, -4.889443516731262e-07, 6.51925802230835e-08, 6.193295121192932e-07, 1.173466444015503e-06, 1.7276033759117126e-06, 2.2817403078079224e-06, 2.835877239704132e-06, 3.390014171600342e-06, 3.9441511034965515e-06, 4.498288035392761e-06, 5.052424967288971e-06, 5.606561899185181e-06, 6.16069883108139e-06, 6.7148357629776e-06, 7.26897269487381e-06, 7.82310962677002e-06, 8.37724655866623e-06, 8.931383490562439e-06, 9.485520422458649e-06, 1.0039657354354858e-05, 1.0593794286251068e-05, 1.1147931218147278e-05, 1.1702068150043488e-05, 1.2256205081939697e-05, 1.2810342013835907e-05, 1.3364478945732117e-05, 1.3918615877628326e-05, 1.4472752809524536e-05, 1.5026889741420746e-05, 1.5581026673316956e-05, 1.6135163605213165e-05, 1.6689300537109375e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 5.0, 11.0, 7.0, 18.0, 23.0, 49.0, 78.0, 36.0, 66.0, 140.0, 195.0, 288.0, 344.0, 572.0, 955.0, 1451.0, 2598.0, 3198.0, 11019.0, 43401.0, 885082.0, 72029.0, 12723.0, 6459.0, 3046.0, 1612.0, 1064.0, 493.0, 586.0, 337.0, 225.0, 111.0, 69.0, 54.0, 55.0, 50.0, 39.0, 12.0, 11.0, 10.0, 9.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-7.3909759521484375e-06, -7.164664566516876e-06, -6.938353180885315e-06, -6.712041795253754e-06, -6.485730409622192e-06, -6.259419023990631e-06, -6.03310763835907e-06, -5.8067962527275085e-06, -5.580484867095947e-06, -5.354173481464386e-06, -5.127862095832825e-06, -4.9015507102012634e-06, -4.675239324569702e-06, -4.448927938938141e-06, -4.22261655330658e-06, -3.996305167675018e-06, -3.769993782043457e-06, -3.5436823964118958e-06, -3.3173710107803345e-06, -3.091059625148773e-06, -2.864748239517212e-06, -2.6384368538856506e-06, -2.4121254682540894e-06, -2.185814082622528e-06, -1.959502696990967e-06, -1.7331913113594055e-06, -1.5068799257278442e-06, -1.280568540096283e-06, -1.0542571544647217e-06, -8.279457688331604e-07, -6.016343832015991e-07, -3.7532299757003784e-07, -1.4901161193847656e-07, 7.729977369308472e-08, 3.03611159324646e-07, 5.299225449562073e-07, 7.562339305877686e-07, 9.825453162193298e-07, 1.2088567018508911e-06, 1.4351680874824524e-06, 1.6614794731140137e-06, 1.887790858745575e-06, 2.1141022443771362e-06, 2.3404136300086975e-06, 2.566725015640259e-06, 2.79303640127182e-06, 3.0193477869033813e-06, 3.2456591725349426e-06, 3.471970558166504e-06, 3.698281943798065e-06, 3.9245933294296265e-06, 4.150904715061188e-06, 4.377216100692749e-06, 4.60352748632431e-06, 4.829838871955872e-06, 5.056150257587433e-06, 5.282461643218994e-06, 5.508773028850555e-06, 5.735084414482117e-06, 5.961395800113678e-06, 6.187707185745239e-06, 6.4140185713768005e-06, 6.640329957008362e-06, 6.866641342639923e-06, 7.092952728271484e-06]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 9.0, 0.0, 2.0, 8.0, 13.0, 0.0, 9.0, 7.0, 0.0, 7.0, 3.0, 26.0, 0.0, 10.0, 77.0, 0.0, 57.0, 551.0, 61.0, 0.0, 90.0, 8.0, 22.0, 0.0, 5.0, 4.0, 0.0, 7.0, 4.0, 9.0, 0.0, 13.0, 3.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.430511474609375e-06, -1.387670636177063e-06, -1.344829797744751e-06, -1.301988959312439e-06, -1.259148120880127e-06, -1.216307282447815e-06, -1.173466444015503e-06, -1.130625605583191e-06, -1.087784767150879e-06, -1.044943928718567e-06, -1.0021030902862549e-06, -9.592622518539429e-07, -9.164214134216309e-07, -8.735805749893188e-07, -8.307397365570068e-07, -7.878988981246948e-07, -7.450580596923828e-07, -7.022172212600708e-07, -6.593763828277588e-07, -6.165355443954468e-07, -5.736947059631348e-07, -5.308538675308228e-07, -4.880130290985107e-07, -4.4517219066619873e-07, -4.023313522338867e-07, -3.594905138015747e-07, -3.166496753692627e-07, -2.738088369369507e-07, -2.3096799850463867e-07, -1.8812716007232666e-07, -1.4528632164001465e-07, -1.0244548320770264e-07, -5.960464477539063e-08, -1.6763806343078613e-08, 2.60770320892334e-08, 6.891787052154541e-08, 1.1175870895385742e-07, 1.5459954738616943e-07, 1.9744038581848145e-07, 2.4028122425079346e-07, 2.8312206268310547e-07, 3.259629011154175e-07, 3.688037395477295e-07, 4.116445779800415e-07, 4.544854164123535e-07, 4.973262548446655e-07, 5.401670932769775e-07, 5.830079317092896e-07, 6.258487701416016e-07, 6.686896085739136e-07, 7.115304470062256e-07, 7.543712854385376e-07, 7.972121238708496e-07, 8.400529623031616e-07, 8.828938007354736e-07, 9.257346391677856e-07, 9.685754776000977e-07, 1.0114163160324097e-06, 1.0542571544647217e-06, 1.0970979928970337e-06, 1.1399388313293457e-06, 1.1827796697616577e-06, 1.2256205081939697e-06, 1.2684613466262817e-06, 1.3113021850585938e-06]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 7.0, 10.0, 25.0, 29.0, 44.0, 89.0, 120.0, 258.0, 384.0, 865.0, 1432.0, 4104.0, 7722.0, 29382.0, 237553.0, 688821.0, 55128.0, 12144.0, 5948.0, 1977.0, 1224.0, 503.0, 358.0, 144.0, 99.0, 64.0, 37.0, 24.0, 19.0, 11.0, 3.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.000301361083984e-06, -8.72928649187088e-06, -8.458271622657776e-06, -8.187256753444672e-06, -7.916241884231567e-06, -7.645227015018463e-06, -7.374212145805359e-06, -7.103197276592255e-06, -6.83218240737915e-06, -6.561167538166046e-06, -6.290152668952942e-06, -6.019137799739838e-06, -5.748122930526733e-06, -5.477108061313629e-06, -5.206093192100525e-06, -4.935078322887421e-06, -4.664063453674316e-06, -4.393048584461212e-06, -4.122033715248108e-06, -3.851018846035004e-06, -3.5800039768218994e-06, -3.308989107608795e-06, -3.037974238395691e-06, -2.7669593691825867e-06, -2.4959444999694824e-06, -2.224929630756378e-06, -1.953914761543274e-06, -1.6828998923301697e-06, -1.4118850231170654e-06, -1.1408701539039612e-06, -8.698552846908569e-07, -5.988404154777527e-07, -3.2782554626464844e-07, -5.681067705154419e-08, 2.1420419216156006e-07, 4.852190613746643e-07, 7.562339305877686e-07, 1.0272487998008728e-06, 1.298263669013977e-06, 1.5692785382270813e-06, 1.8402934074401855e-06, 2.11130827665329e-06, 2.382323145866394e-06, 2.6533380150794983e-06, 2.9243528842926025e-06, 3.1953677535057068e-06, 3.466382622718811e-06, 3.7373974919319153e-06, 4.0084123611450195e-06, 4.279427230358124e-06, 4.550442099571228e-06, 4.821456968784332e-06, 5.0924718379974365e-06, 5.363486707210541e-06, 5.634501576423645e-06, 5.905516445636749e-06, 6.1765313148498535e-06, 6.447546184062958e-06, 6.718561053276062e-06, 6.989575922489166e-06, 7.2605907917022705e-06, 7.531605660915375e-06, 7.802620530128479e-06, 8.073635399341583e-06, 8.344650268554688e-06]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 9.0, 6.0, 0.0, 6.0, 11.0, 8.0, 0.0, 18.0, 30.0, 21.0, 0.0, 51.0, 70.0, 127.0, 0.0, 310.0, 123.0, 64.0, 0.0, 39.0, 38.0, 14.0, 0.0, 9.0, 16.0, 6.0, 0.0, 12.0, 2.0, 6.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.430511474609375e-06, -1.385807991027832e-06, -1.341104507446289e-06, -1.296401023864746e-06, -1.2516975402832031e-06, -1.2069940567016602e-06, -1.1622905731201172e-06, -1.1175870895385742e-06, -1.0728836059570312e-06, -1.0281801223754883e-06, -9.834766387939453e-07, -9.387731552124023e-07, -8.940696716308594e-07, -8.493661880493164e-07, -8.046627044677734e-07, -7.599592208862305e-07, -7.152557373046875e-07, -6.705522537231445e-07, -6.258487701416016e-07, -5.811452865600586e-07, -5.364418029785156e-07, -4.917383193969727e-07, -4.470348358154297e-07, -4.023313522338867e-07, -3.5762786865234375e-07, -3.129243850708008e-07, -2.682209014892578e-07, -2.2351741790771484e-07, -1.7881393432617188e-07, -1.341104507446289e-07, -8.940696716308594e-08, -4.470348358154297e-08, 0.0, 4.470348358154297e-08, 8.940696716308594e-08, 1.341104507446289e-07, 1.7881393432617188e-07, 2.2351741790771484e-07, 2.682209014892578e-07, 3.129243850708008e-07, 3.5762786865234375e-07, 4.023313522338867e-07, 4.470348358154297e-07, 4.917383193969727e-07, 5.364418029785156e-07, 5.811452865600586e-07, 6.258487701416016e-07, 6.705522537231445e-07, 7.152557373046875e-07, 7.599592208862305e-07, 8.046627044677734e-07, 8.493661880493164e-07, 8.940696716308594e-07, 9.387731552124023e-07, 9.834766387939453e-07, 1.0281801223754883e-06, 1.0728836059570312e-06, 1.1175870895385742e-06, 1.1622905731201172e-06, 1.2069940567016602e-06, 1.2516975402832031e-06, 1.296401023864746e-06, 1.341104507446289e-06, 1.385807991027832e-06, 1.430511474609375e-06]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 2.0, 4.0, 8.0, 4.0, 10.0, 10.0, 15.0, 27.0, 27.0, 41.0, 45.0, 62.0, 112.0, 149.0, 152.0, 98.0, 60.0, 43.0, 32.0, 26.0, 17.0, 13.0, 12.0, 5.0, 8.0, 2.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.306580326054245e-05, -6.143443897599354e-05, -5.980306741548702e-05, -5.8171699492959306e-05, -5.654033157043159e-05, -5.4908963647903875e-05, -5.327759572537616e-05, -5.164623144082725e-05, -5.001485988032073e-05, -4.838349195779301e-05, -4.67521240352653e-05, -4.512075611273758e-05, -4.3489388190209866e-05, -4.185802026768215e-05, -4.0226652345154434e-05, -3.8595288060605526e-05, -3.696392013807781e-05, -3.5332552215550095e-05, -3.370118429302238e-05, -3.2069816370494664e-05, -3.0438448447966948e-05, -2.8807080525439233e-05, -2.717571442190092e-05, -2.5544346499373205e-05, -2.391297857684549e-05, -2.2281610654317774e-05, -2.065024273179006e-05, -1.9018876628251746e-05, -1.738750870572403e-05, -1.5756140783196315e-05, -1.41247728606686e-05, -1.2493404938140884e-05, -1.0862040653591976e-05, -9.23067273106426e-06, -7.599305263283895e-06, -5.967937795503531e-06, -4.336569872975815e-06, -2.7052019504480995e-06, -1.0738349374150857e-06, 5.575329851126298e-07, 2.1889009076403454e-06, 3.820268830168061e-06, 5.451636297948426e-06, 7.08300376572879e-06, 8.714371688256506e-06, 1.0345739610784221e-05, 1.1977106623817235e-05, 1.360847454634495e-05, 1.5239842468872666e-05, 1.6871210391400382e-05, 1.8502578313928097e-05, 2.0133946236455813e-05, 2.176531415898353e-05, 2.3396682081511244e-05, 2.5028048185049556e-05, 2.6659416107577272e-05, 2.8290784030104987e-05, 2.9922151952632703e-05, 3.1553518056171015e-05, 3.318488597869873e-05, 3.4816253901226446e-05, 3.644762182375416e-05, 3.807898974628188e-05, 3.971035766880959e-05, 4.134172559133731e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 9.0, 8.0, 9.0, 9.0, 16.0, 16.0, 13.0, 10.0, 18.0, 25.0, 32.0, 22.0, 27.0, 33.0, 36.0, 26.0, 37.0, 54.0, 37.0, 36.0, 39.0, 28.0, 37.0, 41.0, 40.0, 28.0, 40.0, 32.0, 24.0, 28.0, 23.0, 22.0, 19.0, 27.0, 14.0, 14.0, 11.0, 10.0, 8.0, 8.0, 7.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-2.6595669623930007e-05, -2.579747342679184e-05, -2.4999275410664268e-05, -2.42010792135261e-05, -2.340288119739853e-05, -2.260468500026036e-05, -2.1806488803122193e-05, -2.100829078699462e-05, -2.0210094589856453e-05, -1.9411898392718285e-05, -1.8613700376590714e-05, -1.7815504179452546e-05, -1.7017307982314378e-05, -1.6219109966186807e-05, -1.542091376904864e-05, -1.4622716662415769e-05, -1.38245195557829e-05, -1.302632244915003e-05, -1.222812534251716e-05, -1.1429929145378992e-05, -1.0631732038746122e-05, -9.833534932113253e-06, -9.035338734975085e-06, -8.237141628342215e-06, -7.438944521709345e-06, -6.640747415076476e-06, -5.842550763190957e-06, -5.044354111305438e-06, -4.246157004672568e-06, -3.4479598980396986e-06, -2.64976324615418e-06, -1.851566594268661e-06, -1.0533713066251948e-06, -2.551744273660006e-07, 5.430224518931936e-07, 1.341219331152388e-06, 2.139416210411582e-06, 2.937613317044452e-06, 3.7358099689299706e-06, 4.5340066208154894e-06, 5.332203727448359e-06, 6.130400834081229e-06, 6.928597485966748e-06, 7.726794137852266e-06, 8.524991244485136e-06, 9.323188351118006e-06, 1.0121384548256174e-05, 1.0919581654889043e-05, 1.1717778761521913e-05, 1.2515975868154783e-05, 1.3314172974787652e-05, 1.411236917192582e-05, 1.491056627855869e-05, 1.570876338519156e-05, 1.6506959582329728e-05, 1.7305155779467896e-05, 1.8103353795595467e-05, 1.8901549992733635e-05, 1.9699748008861206e-05, 2.0497944205999374e-05, 2.1296142222126946e-05, 2.2094338419265114e-05, 2.289253461640328e-05, 2.3690732632530853e-05, 2.448892882966902e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 13.0, 25.0, 25.0, 50.0, 62.0, 100.0, 142.0, 208.0, 344.0, 522.0, 722.0, 1209.0, 1778.0, 2825.0, 4397.0, 7240.0, 11469.0, 18885.0, 33723.0, 59878.0, 126576.0, 296953.0, 253528.0, 101474.0, 51868.0, 29544.0, 16885.0, 10528.0, 6214.0, 4024.0, 2641.0, 1608.0, 1084.0, 670.0, 470.0, 311.0, 181.0, 133.0, 71.0, 49.0, 44.0, 22.0, 18.0, 11.0, 8.0, 4.0, 3.0, 4.0, 4.0, 2.0], "bins": [-6.717443466186523e-05, -6.530247628688812e-05, -6.343051791191101e-05, -6.15585595369339e-05, -5.968660116195679e-05, -5.7814642786979675e-05, -5.5942684412002563e-05, -5.407072603702545e-05, -5.219876766204834e-05, -5.032680928707123e-05, -4.8454850912094116e-05, -4.6582892537117004e-05, -4.471093416213989e-05, -4.283897578716278e-05, -4.096701741218567e-05, -3.909505903720856e-05, -3.7223100662231445e-05, -3.5351142287254333e-05, -3.347918391227722e-05, -3.160722553730011e-05, -2.9735267162322998e-05, -2.7863308787345886e-05, -2.5991350412368774e-05, -2.4119392037391663e-05, -2.224743366241455e-05, -2.037547528743744e-05, -1.8503516912460327e-05, -1.6631558537483215e-05, -1.4759600162506104e-05, -1.2887641787528992e-05, -1.101568341255188e-05, -9.143725037574768e-06, -7.271766662597656e-06, -5.3998082876205444e-06, -3.5278499126434326e-06, -1.6558915376663208e-06, 2.1606683731079102e-07, 2.088025212287903e-06, 3.959983587265015e-06, 5.8319419622421265e-06, 7.703900337219238e-06, 9.57585871219635e-06, 1.1447817087173462e-05, 1.3319775462150574e-05, 1.5191733837127686e-05, 1.7063692212104797e-05, 1.893565058708191e-05, 2.080760896205902e-05, 2.2679567337036133e-05, 2.4551525712013245e-05, 2.6423484086990356e-05, 2.8295442461967468e-05, 3.016740083694458e-05, 3.203935921192169e-05, 3.3911317586898804e-05, 3.5783275961875916e-05, 3.765523433685303e-05, 3.952719271183014e-05, 4.139915108680725e-05, 4.327110946178436e-05, 4.5143067836761475e-05, 4.7015026211738586e-05, 4.88869845867157e-05, 5.075894296169281e-05, 5.263090133666992e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 8.0, 9.0, 6.0, 5.0, 10.0, 11.0, 21.0, 23.0, 21.0, 19.0, 26.0, 37.0, 34.0, 39.0, 51.0, 52.0, 50.0, 55.0, 52.0, 45.0, 51.0, 48.0, 50.0, 34.0, 27.0, 35.0, 38.0, 23.0, 27.0, 16.0, 20.0, 13.0, 8.0, 10.0, 5.0, 6.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.9788742065429688e-05, -1.9244849681854248e-05, -1.870095729827881e-05, -1.815706491470337e-05, -1.761317253112793e-05, -1.706928014755249e-05, -1.652538776397705e-05, -1.598149538040161e-05, -1.5437602996826172e-05, -1.4893710613250732e-05, -1.4349818229675293e-05, -1.3805925846099854e-05, -1.3262033462524414e-05, -1.2718141078948975e-05, -1.2174248695373535e-05, -1.1630356311798096e-05, -1.1086463928222656e-05, -1.0542571544647217e-05, -9.998679161071777e-06, -9.454786777496338e-06, -8.910894393920898e-06, -8.367002010345459e-06, -7.82310962677002e-06, -7.27921724319458e-06, -6.735324859619141e-06, -6.191432476043701e-06, -5.647540092468262e-06, -5.103647708892822e-06, -4.559755325317383e-06, -4.015862941741943e-06, -3.471970558166504e-06, -2.9280781745910645e-06, -2.384185791015625e-06, -1.8402934074401855e-06, -1.296401023864746e-06, -7.525086402893066e-07, -2.086162567138672e-07, 3.3527612686157227e-07, 8.791685104370117e-07, 1.4230608940124512e-06, 1.9669532775878906e-06, 2.51084566116333e-06, 3.0547380447387695e-06, 3.598630428314209e-06, 4.1425228118896484e-06, 4.686415195465088e-06, 5.230307579040527e-06, 5.774199962615967e-06, 6.318092346191406e-06, 6.861984729766846e-06, 7.405877113342285e-06, 7.949769496917725e-06, 8.493661880493164e-06, 9.037554264068604e-06, 9.581446647644043e-06, 1.0125339031219482e-05, 1.0669231414794922e-05, 1.1213123798370361e-05, 1.17570161819458e-05, 1.230090856552124e-05, 1.284480094909668e-05, 1.3388693332672119e-05, 1.3932585716247559e-05, 1.4476478099822998e-05, 1.5020370483398438e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 6.0, 8.0, 4.0, 12.0, 16.0, 24.0, 12.0, 43.0, 57.0, 122.0, 182.0, 346.0, 679.0, 1462.0, 2714.0, 5529.0, 11882.0, 24628.0, 58052.0, 153337.0, 441678.0, 214028.0, 73552.0, 31847.0, 14580.0, 6860.0, 3378.0, 1721.0, 830.0, 386.0, 209.0, 140.0, 81.0, 45.0, 26.0, 23.0, 16.0, 10.0, 13.0, 4.0, 5.0, 2.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.300210952758789e-05, -6.087683141231537e-05, -5.875155329704285e-05, -5.6626275181770325e-05, -5.45009970664978e-05, -5.237571895122528e-05, -5.025044083595276e-05, -4.812516272068024e-05, -4.5999884605407715e-05, -4.387460649013519e-05, -4.174932837486267e-05, -3.962405025959015e-05, -3.749877214431763e-05, -3.5373494029045105e-05, -3.324821591377258e-05, -3.112293779850006e-05, -2.899765968322754e-05, -2.6872381567955017e-05, -2.4747103452682495e-05, -2.2621825337409973e-05, -2.049654722213745e-05, -1.837126910686493e-05, -1.6245990991592407e-05, -1.4120712876319885e-05, -1.1995434761047363e-05, -9.870156645774841e-06, -7.74487853050232e-06, -5.619600415229797e-06, -3.4943222999572754e-06, -1.3690441846847534e-06, 7.562339305877686e-07, 2.8815120458602905e-06, 5.0067901611328125e-06, 7.1320682764053345e-06, 9.257346391677856e-06, 1.1382624506950378e-05, 1.35079026222229e-05, 1.5633180737495422e-05, 1.7758458852767944e-05, 1.9883736968040466e-05, 2.2009015083312988e-05, 2.413429319858551e-05, 2.6259571313858032e-05, 2.8384849429130554e-05, 3.0510127544403076e-05, 3.26354056596756e-05, 3.476068377494812e-05, 3.688596189022064e-05, 3.9011240005493164e-05, 4.1136518120765686e-05, 4.326179623603821e-05, 4.538707435131073e-05, 4.751235246658325e-05, 4.9637630581855774e-05, 5.1762908697128296e-05, 5.388818681240082e-05, 5.601346492767334e-05, 5.813874304294586e-05, 6.0264021158218384e-05, 6.23892992734909e-05, 6.451457738876343e-05, 6.663985550403595e-05, 6.876513361930847e-05, 7.0890411734581e-05, 7.301568984985352e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 3.0, 7.0, 6.0, 4.0, 11.0, 17.0, 16.0, 14.0, 15.0, 31.0, 13.0, 25.0, 29.0, 27.0, 35.0, 37.0, 37.0, 35.0, 34.0, 55.0, 63.0, 38.0, 41.0, 43.0, 37.0, 41.0, 38.0, 26.0, 43.0, 27.0, 31.0, 21.0, 11.0, 21.0, 12.0, 16.0, 9.0, 11.0, 5.0, 5.0, 7.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.537799835205078e-05, -1.4923512935638428e-05, -1.4469027519226074e-05, -1.401454210281372e-05, -1.3560056686401367e-05, -1.3105571269989014e-05, -1.265108585357666e-05, -1.2196600437164307e-05, -1.1742115020751953e-05, -1.12876296043396e-05, -1.0833144187927246e-05, -1.0378658771514893e-05, -9.924173355102539e-06, -9.469687938690186e-06, -9.015202522277832e-06, -8.560717105865479e-06, -8.106231689453125e-06, -7.651746273040771e-06, -7.197260856628418e-06, -6.7427754402160645e-06, -6.288290023803711e-06, -5.833804607391357e-06, -5.379319190979004e-06, -4.92483377456665e-06, -4.470348358154297e-06, -4.015862941741943e-06, -3.56137752532959e-06, -3.1068921089172363e-06, -2.652406692504883e-06, -2.1979212760925293e-06, -1.7434358596801758e-06, -1.2889504432678223e-06, -8.344650268554688e-07, -3.7997961044311523e-07, 7.450580596923828e-08, 5.289912223815918e-07, 9.834766387939453e-07, 1.4379620552062988e-06, 1.8924474716186523e-06, 2.346932888031006e-06, 2.8014183044433594e-06, 3.255903720855713e-06, 3.7103891372680664e-06, 4.16487455368042e-06, 4.6193599700927734e-06, 5.073845386505127e-06, 5.5283308029174805e-06, 5.982816219329834e-06, 6.4373016357421875e-06, 6.891787052154541e-06, 7.3462724685668945e-06, 7.800757884979248e-06, 8.255243301391602e-06, 8.709728717803955e-06, 9.164214134216309e-06, 9.618699550628662e-06, 1.0073184967041016e-05, 1.0527670383453369e-05, 1.0982155799865723e-05, 1.1436641216278076e-05, 1.189112663269043e-05, 1.2345612049102783e-05, 1.2800097465515137e-05, 1.325458288192749e-05, 1.3709068298339844e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 8.0, 10.0, 12.0, 14.0, 17.0, 26.0, 37.0, 61.0, 88.0, 127.0, 208.0, 294.0, 489.0, 819.0, 1418.0, 2836.0, 6183.0, 17381.0, 70263.0, 847867.0, 70431.0, 17306.0, 6270.0, 2721.0, 1440.0, 790.0, 505.0, 314.0, 204.0, 128.0, 94.0, 60.0, 41.0, 22.0, 21.0, 18.0, 9.0, 9.0, 7.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.933906555175781e-06, -3.812834620475769e-06, -3.691762685775757e-06, -3.5706907510757446e-06, -3.4496188163757324e-06, -3.3285468816757202e-06, -3.207474946975708e-06, -3.086403012275696e-06, -2.9653310775756836e-06, -2.8442591428756714e-06, -2.723187208175659e-06, -2.602115273475647e-06, -2.4810433387756348e-06, -2.3599714040756226e-06, -2.2388994693756104e-06, -2.117827534675598e-06, -1.996755599975586e-06, -1.8756836652755737e-06, -1.7546117305755615e-06, -1.6335397958755493e-06, -1.5124678611755371e-06, -1.391395926475525e-06, -1.2703239917755127e-06, -1.1492520570755005e-06, -1.0281801223754883e-06, -9.071081876754761e-07, -7.860362529754639e-07, -6.649643182754517e-07, -5.438923835754395e-07, -4.2282044887542725e-07, -3.0174851417541504e-07, -1.8067657947540283e-07, -5.960464477539063e-08, 6.146728992462158e-08, 1.825392246246338e-07, 3.03611159324646e-07, 4.246830940246582e-07, 5.457550287246704e-07, 6.668269634246826e-07, 7.878988981246948e-07, 9.08970832824707e-07, 1.0300427675247192e-06, 1.1511147022247314e-06, 1.2721866369247437e-06, 1.3932585716247559e-06, 1.514330506324768e-06, 1.6354024410247803e-06, 1.7564743757247925e-06, 1.8775463104248047e-06, 1.998618245124817e-06, 2.119690179824829e-06, 2.2407621145248413e-06, 2.3618340492248535e-06, 2.4829059839248657e-06, 2.603977918624878e-06, 2.72504985332489e-06, 2.8461217880249023e-06, 2.9671937227249146e-06, 3.0882656574249268e-06, 3.209337592124939e-06, 3.330409526824951e-06, 3.4514814615249634e-06, 3.5725533962249756e-06, 3.693625330924988e-06, 3.814697265625e-06]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 51.0, 0.0, 0.0, 0.0, 0.0, 129.0, 0.0, 0.0, 0.0, 0.0, 604.0, 0.0, 0.0, 0.0, 0.0, 138.0, 0.0, 0.0, 0.0, 0.0, 46.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.4552067518234253e-07, -3.334134817123413e-07, -3.213062882423401e-07, -3.0919909477233887e-07, -2.9709190130233765e-07, -2.849847078323364e-07, -2.728775143623352e-07, -2.60770320892334e-07, -2.4866312742233276e-07, -2.3655593395233154e-07, -2.2444874048233032e-07, -2.123415470123291e-07, -2.0023435354232788e-07, -1.8812716007232666e-07, -1.7601996660232544e-07, -1.6391277313232422e-07, -1.51805579662323e-07, -1.3969838619232178e-07, -1.2759119272232056e-07, -1.1548399925231934e-07, -1.0337680578231812e-07, -9.12696123123169e-08, -7.916241884231567e-08, -6.705522537231445e-08, -5.494803190231323e-08, -4.284083843231201e-08, -3.073364496231079e-08, -1.862645149230957e-08, -6.51925802230835e-09, 5.587935447692871e-09, 1.7695128917694092e-08, 2.9802322387695312e-08, 4.190951585769653e-08, 5.4016709327697754e-08, 6.612390279769897e-08, 7.82310962677002e-08, 9.033828973770142e-08, 1.0244548320770264e-07, 1.1455267667770386e-07, 1.2665987014770508e-07, 1.387670636177063e-07, 1.5087425708770752e-07, 1.6298145055770874e-07, 1.7508864402770996e-07, 1.8719583749771118e-07, 1.993030309677124e-07, 2.1141022443771362e-07, 2.2351741790771484e-07, 2.3562461137771606e-07, 2.477318048477173e-07, 2.598389983177185e-07, 2.7194619178771973e-07, 2.8405338525772095e-07, 2.9616057872772217e-07, 3.082677721977234e-07, 3.203749656677246e-07, 3.3248215913772583e-07, 3.4458935260772705e-07, 3.5669654607772827e-07, 3.688037395477295e-07, 3.809109330177307e-07, 3.9301812648773193e-07, 4.0512531995773315e-07, 4.172325134277344e-07]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 10.0, 0.0, 2.0, 2.0, 1.0, 36.0, 13.0, 18.0, 39.0, 73.0, 193.0, 201.0, 381.0, 729.0, 1367.0, 3218.0, 5854.0, 13862.0, 41166.0, 145427.0, 622997.0, 145671.0, 41410.0, 13733.0, 5885.0, 3279.0, 1291.0, 759.0, 388.0, 200.0, 173.0, 69.0, 38.0, 22.0, 8.0, 32.0, 5.0, 1.0, 0.0, 1.0, 7.0, 0.0, 0.0, 0.0, 1.0, 7.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.086162567138672e-06, -2.0256265997886658e-06, -1.9650906324386597e-06, -1.9045546650886536e-06, -1.8440186977386475e-06, -1.7834827303886414e-06, -1.7229467630386353e-06, -1.6624107956886292e-06, -1.601874828338623e-06, -1.541338860988617e-06, -1.4808028936386108e-06, -1.4202669262886047e-06, -1.3597309589385986e-06, -1.2991949915885925e-06, -1.2386590242385864e-06, -1.1781230568885803e-06, -1.1175870895385742e-06, -1.0570511221885681e-06, -9.96515154838562e-07, -9.359791874885559e-07, -8.754432201385498e-07, -8.149072527885437e-07, -7.543712854385376e-07, -6.938353180885315e-07, -6.332993507385254e-07, -5.727633833885193e-07, -5.122274160385132e-07, -4.516914486885071e-07, -3.91155481338501e-07, -3.3061951398849487e-07, -2.7008354663848877e-07, -2.0954757928848267e-07, -1.4901161193847656e-07, -8.847564458847046e-08, -2.7939677238464355e-08, 3.259629011154175e-08, 9.313225746154785e-08, 1.5366822481155396e-07, 2.1420419216156006e-07, 2.7474015951156616e-07, 3.3527612686157227e-07, 3.9581209421157837e-07, 4.5634806156158447e-07, 5.168840289115906e-07, 5.774199962615967e-07, 6.379559636116028e-07, 6.984919309616089e-07, 7.59027898311615e-07, 8.195638656616211e-07, 8.800998330116272e-07, 9.406358003616333e-07, 1.0011717677116394e-06, 1.0617077350616455e-06, 1.1222437024116516e-06, 1.1827796697616577e-06, 1.2433156371116638e-06, 1.30385160446167e-06, 1.364387571811676e-06, 1.4249235391616821e-06, 1.4854595065116882e-06, 1.5459954738616943e-06, 1.6065314412117004e-06, 1.6670674085617065e-06, 1.7276033759117126e-06, 1.7881393432617188e-06]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 26.0, 0.0, 0.0, 0.0, 0.0, 64.0, 0.0, 0.0, 0.0, 0.0, 209.0, 0.0, 0.0, 0.0, 0.0, 382.0, 0.0, 0.0, 0.0, 0.0, 205.0, 0.0, 0.0, 0.0, 0.0, 77.0, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.4552067518234253e-07, -3.334134817123413e-07, -3.213062882423401e-07, -3.0919909477233887e-07, -2.9709190130233765e-07, -2.849847078323364e-07, -2.728775143623352e-07, -2.60770320892334e-07, -2.4866312742233276e-07, -2.3655593395233154e-07, -2.2444874048233032e-07, -2.123415470123291e-07, -2.0023435354232788e-07, -1.8812716007232666e-07, -1.7601996660232544e-07, -1.6391277313232422e-07, -1.51805579662323e-07, -1.3969838619232178e-07, -1.2759119272232056e-07, -1.1548399925231934e-07, -1.0337680578231812e-07, -9.12696123123169e-08, -7.916241884231567e-08, -6.705522537231445e-08, -5.494803190231323e-08, -4.284083843231201e-08, -3.073364496231079e-08, -1.862645149230957e-08, -6.51925802230835e-09, 5.587935447692871e-09, 1.7695128917694092e-08, 2.9802322387695312e-08, 4.190951585769653e-08, 5.4016709327697754e-08, 6.612390279769897e-08, 7.82310962677002e-08, 9.033828973770142e-08, 1.0244548320770264e-07, 1.1455267667770386e-07, 1.2665987014770508e-07, 1.387670636177063e-07, 1.5087425708770752e-07, 1.6298145055770874e-07, 1.7508864402770996e-07, 1.8719583749771118e-07, 1.993030309677124e-07, 2.1141022443771362e-07, 2.2351741790771484e-07, 2.3562461137771606e-07, 2.477318048477173e-07, 2.598389983177185e-07, 2.7194619178771973e-07, 2.8405338525772095e-07, 2.9616057872772217e-07, 3.082677721977234e-07, 3.203749656677246e-07, 3.3248215913772583e-07, 3.4458935260772705e-07, 3.5669654607772827e-07, 3.688037395477295e-07, 3.809109330177307e-07, 3.9301812648773193e-07, 4.0512531995773315e-07, 4.172325134277344e-07]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 6.0, 4.0, 9.0, 8.0, 12.0, 11.0, 17.0, 20.0, 31.0, 31.0, 48.0, 50.0, 90.0, 130.0, 154.0, 100.0, 83.0, 58.0, 29.0, 22.0, 24.0, 10.0, 9.0, 11.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.926261004176922e-05, -2.822054193529766e-05, -2.71784738288261e-05, -2.613640572235454e-05, -2.5094337615882978e-05, -2.4052269509411417e-05, -2.3010201402939856e-05, -2.1968133296468295e-05, -2.0926065189996734e-05, -1.9883997083525173e-05, -1.8841928977053612e-05, -1.779986087058205e-05, -1.675779276411049e-05, -1.571572465763893e-05, -1.4673656551167369e-05, -1.3631588444695808e-05, -1.2589520338224247e-05, -1.1547452231752686e-05, -1.0505384125281125e-05, -9.463316018809564e-06, -8.421247912338004e-06, -7.379179805866443e-06, -6.337111699394882e-06, -5.295043592923321e-06, -4.25297548645176e-06, -3.210907379980199e-06, -2.168839273508638e-06, -1.1267711670370772e-06, -8.470306056551635e-08, 9.573650459060445e-07, 1.9994331523776054e-06, 3.0415012588491663e-06, 4.083573003299534e-06, 5.125641109771095e-06, 6.167709216242656e-06, 7.209777322714217e-06, 8.251845429185778e-06, 9.293913535657339e-06, 1.03359816421289e-05, 1.137804974860046e-05, 1.2420117855072021e-05, 1.3462185961543582e-05, 1.4504254068015143e-05, 1.5546322174486704e-05, 1.6588390280958265e-05, 1.7630458387429826e-05, 1.8672526493901387e-05, 1.9714594600372948e-05, 2.075666270684451e-05, 2.179873081331607e-05, 2.284079891978763e-05, 2.388286702625919e-05, 2.4924935132730752e-05, 2.5967003239202313e-05, 2.7009071345673874e-05, 2.8051139452145435e-05, 2.9093207558616996e-05, 3.0135275665088557e-05, 3.117734377156012e-05, 3.2219410059042275e-05, 3.326147998450324e-05, 3.4303549909964204e-05, 3.534561619744636e-05, 3.638768248492852e-05, 3.742975241038948e-05]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 5.0, 16.0, 15.0, 13.0, 7.0, 18.0, 15.0, 13.0, 21.0, 36.0, 35.0, 38.0, 34.0, 35.0, 40.0, 31.0, 35.0, 41.0, 34.0, 39.0, 51.0, 36.0, 50.0, 45.0, 36.0, 34.0, 35.0, 28.0, 28.0, 20.0, 21.0, 20.0, 11.0, 12.0, 15.0, 7.0, 5.0, 4.0, 4.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.004855195991695e-05, -1.941248592629563e-05, -1.8776421711663716e-05, -1.8140355678042397e-05, -1.7504291463410482e-05, -1.6868225429789163e-05, -1.6232159396167845e-05, -1.559609518153593e-05, -1.496002914791461e-05, -1.4323964023787994e-05, -1.3687898899661377e-05, -1.3051832866040058e-05, -1.2415767741913442e-05, -1.1779702617786825e-05, -1.1143636584165506e-05, -1.050757146003889e-05, -9.871506335912272e-06, -9.235441211785655e-06, -8.599376087659039e-06, -7.96331005403772e-06, -7.327244929911103e-06, -6.691179805784486e-06, -6.0551142269105185e-06, -5.419048648036551e-06, -4.782983523909934e-06, -4.146918399783317e-06, -3.5108528209093492e-06, -2.874787469409057e-06, -2.2387221179087646e-06, -1.6026567664084723e-06, -9.6659141490818e-07, -3.3052583603421226e-07, 3.055392880924046e-07, 9.416046395926969e-07, 1.5776699910929892e-06, 2.2137353425932815e-06, 2.849800694093574e-06, 3.485866045593866e-06, 4.1219313970941585e-06, 4.757996975968126e-06, 5.394062100094743e-06, 6.03012722422136e-06, 6.666192803095328e-06, 7.3022583819692954e-06, 7.938323506095912e-06, 8.57438863022253e-06, 9.210454663843848e-06, 9.846519787970465e-06, 1.0482584912097082e-05, 1.1118650036223698e-05, 1.1754715160350315e-05, 1.2390781193971634e-05, 1.302684631809825e-05, 1.3662911442224868e-05, 1.4298977475846186e-05, 1.4935042599972803e-05, 1.557110772409942e-05, 1.620717375772074e-05, 1.6843237972352654e-05, 1.7479304005973972e-05, 1.811537003959529e-05, 1.8751434254227206e-05, 1.9387500287848525e-05, 2.0023566321469843e-05, 2.065963053610176e-05]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 10.0, 6.0, 8.0, 12.0, 8.0, 18.0, 21.0, 29.0, 43.0, 41.0, 62.0, 74.0, 125.0, 179.0, 267.0, 418.0, 652.0, 1100.0, 1933.0, 3833.0, 9683.0, 3982631.0, 178316.0, 7321.0, 3165.0, 1716.0, 933.0, 583.0, 343.0, 211.0, 139.0, 116.0, 55.0, 59.0, 48.0, 34.0, 13.0, 22.0, 16.0, 12.0, 6.0, 8.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00011992454528808594, -0.00011627562344074249, -0.00011262670159339905, -0.0001089777797460556, -0.00010532885789871216, -0.00010167993605136871, -9.803101420402527e-05, -9.438209235668182e-05, -9.073317050933838e-05, -8.708424866199493e-05, -8.343532681465149e-05, -7.978640496730804e-05, -7.61374831199646e-05, -7.248856127262115e-05, -6.883963942527771e-05, -6.519071757793427e-05, -6.154179573059082e-05, -5.7892873883247375e-05, -5.424395203590393e-05, -5.0595030188560486e-05, -4.694610834121704e-05, -4.3297186493873596e-05, -3.964826464653015e-05, -3.5999342799186707e-05, -3.235042095184326e-05, -2.8701499104499817e-05, -2.5052577257156372e-05, -2.1403655409812927e-05, -1.7754733562469482e-05, -1.4105811715126038e-05, -1.0456889867782593e-05, -6.807968020439148e-06, -3.159046173095703e-06, 4.898756742477417e-07, 4.1387975215911865e-06, 7.787719368934631e-06, 1.1436641216278076e-05, 1.5085563063621521e-05, 1.8734484910964966e-05, 2.238340675830841e-05, 2.6032328605651855e-05, 2.96812504529953e-05, 3.3330172300338745e-05, 3.697909414768219e-05, 4.0628015995025635e-05, 4.427693784236908e-05, 4.7925859689712524e-05, 5.157478153705597e-05, 5.5223703384399414e-05, 5.887262523174286e-05, 6.25215470790863e-05, 6.617046892642975e-05, 6.98193907737732e-05, 7.346831262111664e-05, 7.711723446846008e-05, 8.076615631580353e-05, 8.441507816314697e-05, 8.806400001049042e-05, 9.171292185783386e-05, 9.536184370517731e-05, 9.901076555252075e-05, 0.0001026596873998642, 0.00010630860924720764, 0.00010995753109455109, 0.00011360645294189453]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 8.0, 4.0, 7.0, 7.0, 7.0, 15.0, 9.0, 10.0, 15.0, 15.0, 20.0, 17.0, 29.0, 36.0, 30.0, 45.0, 34.0, 37.0, 40.0, 37.0, 22.0, 44.0, 40.0, 49.0, 47.0, 35.0, 47.0, 39.0, 29.0, 38.0, 28.0, 28.0, 18.0, 20.0, 24.0, 11.0, 9.0, 15.0, 11.0, 9.0, 5.0, 3.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.245737075805664e-05, -1.2077391147613525e-05, -1.169741153717041e-05, -1.1317431926727295e-05, -1.093745231628418e-05, -1.0557472705841064e-05, -1.017749309539795e-05, -9.797513484954834e-06, -9.417533874511719e-06, -9.037554264068604e-06, -8.657574653625488e-06, -8.277595043182373e-06, -7.897615432739258e-06, -7.517635822296143e-06, -7.137656211853027e-06, -6.757676601409912e-06, -6.377696990966797e-06, -5.997717380523682e-06, -5.617737770080566e-06, -5.237758159637451e-06, -4.857778549194336e-06, -4.477798938751221e-06, -4.0978193283081055e-06, -3.7178397178649902e-06, -3.337860107421875e-06, -2.9578804969787598e-06, -2.5779008865356445e-06, -2.1979212760925293e-06, -1.817941665649414e-06, -1.4379620552062988e-06, -1.0579824447631836e-06, -6.780028343200684e-07, -2.980232238769531e-07, 8.195638656616211e-08, 4.6193599700927734e-07, 8.419156074523926e-07, 1.2218952178955078e-06, 1.601874828338623e-06, 1.9818544387817383e-06, 2.3618340492248535e-06, 2.7418136596679688e-06, 3.121793270111084e-06, 3.5017728805541992e-06, 3.8817524909973145e-06, 4.26173210144043e-06, 4.641711711883545e-06, 5.02169132232666e-06, 5.401670932769775e-06, 5.781650543212891e-06, 6.161630153656006e-06, 6.541609764099121e-06, 6.921589374542236e-06, 7.3015689849853516e-06, 7.681548595428467e-06, 8.061528205871582e-06, 8.441507816314697e-06, 8.821487426757812e-06, 9.201467037200928e-06, 9.581446647644043e-06, 9.961426258087158e-06, 1.0341405868530273e-05, 1.0721385478973389e-05, 1.1101365089416504e-05, 1.1481344699859619e-05, 1.1861324310302734e-05]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 8.0, 8.0, 17.0, 34.0, 75.0, 162.0, 383.0, 884.0, 2569.0, 10431.0, 276910.0, 3882220.0, 15250.0, 3372.0, 1140.0, 437.0, 187.0, 101.0, 36.0, 23.0, 13.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012922286987304688, -0.0001254342496395111, -0.00012164562940597534, -0.00011785700917243958, -0.00011406838893890381, -0.00011027976870536804, -0.00010649114847183228, -0.00010270252823829651, -9.891390800476074e-05, -9.512528777122498e-05, -9.133666753768921e-05, -8.754804730415344e-05, -8.375942707061768e-05, -7.997080683708191e-05, -7.618218660354614e-05, -7.239356637001038e-05, -6.860494613647461e-05, -6.481632590293884e-05, -6.1027705669403076e-05, -5.723908543586731e-05, -5.345046520233154e-05, -4.9661844968795776e-05, -4.587322473526001e-05, -4.208460450172424e-05, -3.8295984268188477e-05, -3.450736403465271e-05, -3.071874380111694e-05, -2.6930123567581177e-05, -2.314150333404541e-05, -1.9352883100509644e-05, -1.5564262866973877e-05, -1.177564263343811e-05, -7.987022399902344e-06, -4.198402166366577e-06, -4.0978193283081055e-07, 3.378838300704956e-06, 7.167458534240723e-06, 1.095607876777649e-05, 1.4744699001312256e-05, 1.8533319234848022e-05, 2.232193946838379e-05, 2.6110559701919556e-05, 2.9899179935455322e-05, 3.368780016899109e-05, 3.7476420402526855e-05, 4.126504063606262e-05, 4.505366086959839e-05, 4.8842281103134155e-05, 5.263090133666992e-05, 5.641952157020569e-05, 6.0208141803741455e-05, 6.399676203727722e-05, 6.778538227081299e-05, 7.157400250434875e-05, 7.536262273788452e-05, 7.915124297142029e-05, 8.293986320495605e-05, 8.672848343849182e-05, 9.051710367202759e-05, 9.430572390556335e-05, 9.809434413909912e-05, 0.00010188296437263489, 0.00010567158460617065, 0.00010946020483970642, 0.00011324882507324219]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 4.0, 8.0, 5.0, 8.0, 17.0, 33.0, 78.0, 256.0, 2631.0, 726.0, 174.0, 39.0, 16.0, 21.0, 9.0, 10.0, 6.0, 3.0, 5.0, 0.0, 6.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1801719665527344e-05, -1.1391937732696533e-05, -1.0982155799865723e-05, -1.0572373867034912e-05, -1.0162591934204102e-05, -9.752810001373291e-06, -9.34302806854248e-06, -8.93324613571167e-06, -8.52346420288086e-06, -8.113682270050049e-06, -7.703900337219238e-06, -7.294118404388428e-06, -6.884336471557617e-06, -6.474554538726807e-06, -6.064772605895996e-06, -5.6549906730651855e-06, -5.245208740234375e-06, -4.8354268074035645e-06, -4.425644874572754e-06, -4.015862941741943e-06, -3.606081008911133e-06, -3.1962990760803223e-06, -2.7865171432495117e-06, -2.376735210418701e-06, -1.9669532775878906e-06, -1.55717134475708e-06, -1.1473894119262695e-06, -7.37607479095459e-07, -3.2782554626464844e-07, 8.195638656616211e-08, 4.917383193969727e-07, 9.015202522277832e-07, 1.3113021850585938e-06, 1.7210841178894043e-06, 2.130866050720215e-06, 2.5406479835510254e-06, 2.950429916381836e-06, 3.3602118492126465e-06, 3.769993782043457e-06, 4.179775714874268e-06, 4.589557647705078e-06, 4.999339580535889e-06, 5.409121513366699e-06, 5.81890344619751e-06, 6.22868537902832e-06, 6.638467311859131e-06, 7.048249244689941e-06, 7.458031177520752e-06, 7.867813110351562e-06, 8.277595043182373e-06, 8.687376976013184e-06, 9.097158908843994e-06, 9.506940841674805e-06, 9.916722774505615e-06, 1.0326504707336426e-05, 1.0736286640167236e-05, 1.1146068572998047e-05, 1.1555850505828857e-05, 1.1965632438659668e-05, 1.2375414371490479e-05, 1.2785196304321289e-05, 1.31949782371521e-05, 1.360476016998291e-05, 1.401454210281372e-05, 1.4424324035644531e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 7.0, 3.0, 10.0, 16.0, 13.0, 20.0, 21.0, 28.0, 39.0, 64.0, 93.0, 141.0, 166.0, 119.0, 70.0, 52.0, 26.0, 25.0, 19.0, 19.0, 12.0, 6.0, 5.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1945454136584885e-05, -2.119522832799703e-05, -2.044500070041977e-05, -1.9694774891831912e-05, -1.8944547264254652e-05, -1.8194321455666795e-05, -1.7444093828089535e-05, -1.669386801950168e-05, -1.5943642210913822e-05, -1.5193415492831264e-05, -1.4443188774748705e-05, -1.3692962966160849e-05, -1.294273624807829e-05, -1.2192509529995732e-05, -1.1442282811913174e-05, -1.0692056093830615e-05, -9.941829375748057e-06, -9.191602657665499e-06, -8.44137593958294e-06, -7.691149221500382e-06, -6.940923412912525e-06, -6.190696694829967e-06, -5.4404699767474085e-06, -4.690243713412201e-06, -3.940016995329643e-06, -3.1897905046207597e-06, -2.439564013911877e-06, -1.6893372958293185e-06, -9.391108051204355e-07, -1.8888431441155262e-07, 5.613424036710057e-07, 1.3115686670062132e-06, 2.0617953850887716e-06, 2.8120218757976545e-06, 3.5622483665065374e-06, 4.312475084589096e-06, 5.062701347924303e-06, 5.812928066006862e-06, 6.56315478408942e-06, 7.3133810474246275e-06, 8.063607310759835e-06, 8.813834028842393e-06, 9.564060746924952e-06, 1.0314286555512808e-05, 1.1064513273595367e-05, 1.1814739991677925e-05, 1.2564966709760483e-05, 1.3315193427843042e-05, 1.40654201459256e-05, 1.4815646864008158e-05, 1.5565872672596015e-05, 1.6316100300173275e-05, 1.7066326108761132e-05, 1.7816553736338392e-05, 1.856677954492625e-05, 1.9317005353514105e-05, 2.0067232981091365e-05, 2.0817458789679222e-05, 2.1567686417256482e-05, 2.231791222584434e-05, 2.30681398534216e-05, 2.3818365662009455e-05, 2.4568591470597312e-05, 2.5318819098174572e-05, 2.606904490676243e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 5.0, 12.0, 9.0, 12.0, 12.0, 7.0, 12.0, 16.0, 16.0, 22.0, 43.0, 30.0, 25.0, 32.0, 36.0, 25.0, 55.0, 33.0, 55.0, 45.0, 43.0, 39.0, 46.0, 43.0, 55.0, 44.0, 37.0, 30.0, 42.0, 21.0, 25.0, 22.0, 8.0, 7.0, 8.0, 9.0, 12.0, 5.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3787667739961762e-05, -1.3351617781154346e-05, -1.2915566912852228e-05, -1.2479516954044811e-05, -1.2043466995237395e-05, -1.1607417036429979e-05, -1.1171366168127861e-05, -1.0735316209320445e-05, -1.0299265341018327e-05, -9.86321538221091e-06, -9.427164513908792e-06, -8.991114555101376e-06, -8.55506459629396e-06, -8.119013727991842e-06, -7.682963769184425e-06, -7.246913810377009e-06, -6.810863851569593e-06, -6.374813438014826e-06, -5.9387634792074095e-06, -5.502713065652642e-06, -5.066663106845226e-06, -4.630612693290459e-06, -4.194562279735692e-06, -3.7585120935546e-06, -3.3224619073735084e-06, -2.8864117211924167e-06, -2.450361535011325e-06, -2.014311121456558e-06, -1.5782609352754662e-06, -1.1422107490943745e-06, -7.061603355396073e-07, -2.7011014935851563e-07, 1.659391273278743e-07, 6.019893703523849e-07, 1.0380396133768954e-06, 1.4740899132448249e-06, 1.9101400994259166e-06, 2.3461902856070083e-06, 2.7822406991617754e-06, 3.218290885342867e-06, 3.654341071523959e-06, 4.090391485078726e-06, 4.526441443886142e-06, 4.962491857440909e-06, 5.3985422709956765e-06, 5.834592229803093e-06, 6.27064264335786e-06, 6.706693056912627e-06, 7.142743015720043e-06, 7.5787934292748105e-06, 8.014843842829578e-06, 8.450893801636994e-06, 8.88694376044441e-06, 9.322993719251826e-06, 9.759044587553944e-06, 1.019509454636136e-05, 1.0631145414663479e-05, 1.1067195373470895e-05, 1.1503246241773013e-05, 1.193929620058043e-05, 1.2375346159387846e-05, 1.2811397027689964e-05, 1.324744698649738e-05, 1.3683496945304796e-05, 1.4119546904112212e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 1.0, 4.0, 12.0, 16.0, 19.0, 43.0, 46.0, 69.0, 108.0, 159.0, 192.0, 361.0, 574.0, 864.0, 1559.0, 2488.0, 3595.0, 6419.0, 11284.0, 17422.0, 34936.0, 67054.0, 120952.0, 327098.0, 241521.0, 92031.0, 53225.0, 28479.0, 14586.0, 9549.0, 5448.0, 2964.0, 2056.0, 1218.0, 756.0, 498.0, 321.0, 176.0, 153.0, 97.0, 57.0, 52.0, 34.0, 25.0, 15.0, 12.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6450881958007812e-05, -1.5933997929096222e-05, -1.541711390018463e-05, -1.490022987127304e-05, -1.438334584236145e-05, -1.386646181344986e-05, -1.3349577784538269e-05, -1.2832693755626678e-05, -1.2315809726715088e-05, -1.1798925697803497e-05, -1.1282041668891907e-05, -1.0765157639980316e-05, -1.0248273611068726e-05, -9.731389582157135e-06, -9.214505553245544e-06, -8.697621524333954e-06, -8.180737495422363e-06, -7.663853466510773e-06, -7.146969437599182e-06, -6.6300854086875916e-06, -6.113201379776001e-06, -5.59631735086441e-06, -5.07943332195282e-06, -4.562549293041229e-06, -4.045665264129639e-06, -3.528781235218048e-06, -3.0118972063064575e-06, -2.495013177394867e-06, -1.9781291484832764e-06, -1.4612451195716858e-06, -9.443610906600952e-07, -4.2747706174850464e-07, 8.940696716308594e-08, 6.062909960746765e-07, 1.123175024986267e-06, 1.6400590538978577e-06, 2.1569430828094482e-06, 2.673827111721039e-06, 3.1907111406326294e-06, 3.70759516954422e-06, 4.2244791984558105e-06, 4.741363227367401e-06, 5.258247256278992e-06, 5.775131285190582e-06, 6.292015314102173e-06, 6.8088993430137634e-06, 7.325783371925354e-06, 7.842667400836945e-06, 8.359551429748535e-06, 8.876435458660126e-06, 9.393319487571716e-06, 9.910203516483307e-06, 1.0427087545394897e-05, 1.0943971574306488e-05, 1.1460855603218079e-05, 1.197773963212967e-05, 1.249462366104126e-05, 1.301150768995285e-05, 1.3528391718864441e-05, 1.4045275747776031e-05, 1.4562159776687622e-05, 1.5079043805599213e-05, 1.5595927834510803e-05, 1.6112811863422394e-05, 1.6629695892333984e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 7.0, 7.0, 10.0, 10.0, 14.0, 15.0, 15.0, 15.0, 17.0, 24.0, 29.0, 31.0, 29.0, 33.0, 21.0, 46.0, 44.0, 49.0, 58.0, 44.0, 41.0, 36.0, 37.0, 50.0, 40.0, 41.0, 36.0, 30.0, 33.0, 34.0, 22.0, 17.0, 18.0, 13.0, 7.0, 6.0, 2.0, 7.0, 5.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4126300811767578e-05, -1.3704411685466766e-05, -1.3282522559165955e-05, -1.2860633432865143e-05, -1.2438744306564331e-05, -1.201685518026352e-05, -1.1594966053962708e-05, -1.1173076927661896e-05, -1.0751187801361084e-05, -1.0329298675060272e-05, -9.90740954875946e-06, -9.485520422458649e-06, -9.063631296157837e-06, -8.641742169857025e-06, -8.219853043556213e-06, -7.797963917255402e-06, -7.37607479095459e-06, -6.954185664653778e-06, -6.532296538352966e-06, -6.1104074120521545e-06, -5.688518285751343e-06, -5.266629159450531e-06, -4.844740033149719e-06, -4.4228509068489075e-06, -4.000961780548096e-06, -3.579072654247284e-06, -3.157183527946472e-06, -2.7352944016456604e-06, -2.3134052753448486e-06, -1.8915161490440369e-06, -1.469627022743225e-06, -1.0477378964424133e-06, -6.258487701416016e-07, -2.039596438407898e-07, 2.1792948246002197e-07, 6.398186087608337e-07, 1.0617077350616455e-06, 1.4835968613624573e-06, 1.905485987663269e-06, 2.327375113964081e-06, 2.7492642402648926e-06, 3.1711533665657043e-06, 3.593042492866516e-06, 4.014931619167328e-06, 4.43682074546814e-06, 4.858709871768951e-06, 5.280598998069763e-06, 5.702488124370575e-06, 6.124377250671387e-06, 6.5462663769721985e-06, 6.96815550327301e-06, 7.390044629573822e-06, 7.811933755874634e-06, 8.233822882175446e-06, 8.655712008476257e-06, 9.077601134777069e-06, 9.499490261077881e-06, 9.921379387378693e-06, 1.0343268513679504e-05, 1.0765157639980316e-05, 1.1187046766281128e-05, 1.160893589258194e-05, 1.2030825018882751e-05, 1.2452714145183563e-05, 1.2874603271484375e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 10.0, 19.0, 19.0, 28.0, 46.0, 57.0, 94.0, 124.0, 201.0, 276.0, 382.0, 614.0, 1044.0, 1365.0, 2298.0, 3794.0, 6188.0, 12572.0, 21785.0, 44469.0, 113916.0, 576196.0, 159743.0, 48683.0, 23607.0, 12549.0, 6906.0, 4566.0, 2394.0, 1579.0, 985.0, 639.0, 485.0, 302.0, 192.0, 121.0, 94.0, 71.0, 43.0, 28.0, 19.0, 14.0, 15.0, 6.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.8417835235595703e-05, -1.7869286239147186e-05, -1.732073724269867e-05, -1.6772188246250153e-05, -1.6223639249801636e-05, -1.567509025335312e-05, -1.5126541256904602e-05, -1.4577992260456085e-05, -1.4029443264007568e-05, -1.3480894267559052e-05, -1.2932345271110535e-05, -1.2383796274662018e-05, -1.1835247278213501e-05, -1.1286698281764984e-05, -1.0738149285316467e-05, -1.018960028886795e-05, -9.641051292419434e-06, -9.092502295970917e-06, -8.5439532995224e-06, -7.995404303073883e-06, -7.446855306625366e-06, -6.898306310176849e-06, -6.3497573137283325e-06, -5.801208317279816e-06, -5.252659320831299e-06, -4.704110324382782e-06, -4.155561327934265e-06, -3.6070123314857483e-06, -3.0584633350372314e-06, -2.5099143385887146e-06, -1.9613653421401978e-06, -1.412816345691681e-06, -8.642673492431641e-07, -3.157183527946472e-07, 2.3283064365386963e-07, 7.813796401023865e-07, 1.3299286365509033e-06, 1.8784776329994202e-06, 2.427026629447937e-06, 2.975575625896454e-06, 3.5241246223449707e-06, 4.0726736187934875e-06, 4.621222615242004e-06, 5.169771611690521e-06, 5.718320608139038e-06, 6.266869604587555e-06, 6.815418601036072e-06, 7.363967597484589e-06, 7.912516593933105e-06, 8.461065590381622e-06, 9.00961458683014e-06, 9.558163583278656e-06, 1.0106712579727173e-05, 1.065526157617569e-05, 1.1203810572624207e-05, 1.1752359569072723e-05, 1.230090856552124e-05, 1.2849457561969757e-05, 1.3398006558418274e-05, 1.394655555486679e-05, 1.4495104551315308e-05, 1.5043653547763824e-05, 1.559220254421234e-05, 1.6140751540660858e-05, 1.6689300537109375e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 5.0, 3.0, 8.0, 6.0, 17.0, 12.0, 24.0, 18.0, 21.0, 23.0, 36.0, 37.0, 48.0, 28.0, 34.0, 32.0, 22.0, 27.0, 213.0, 32.0, 27.0, 20.0, 26.0, 22.0, 46.0, 35.0, 29.0, 32.0, 24.0, 18.0, 13.0, 15.0, 13.0, 8.0, 6.0, 8.0, 4.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.033348083496094e-06, -6.8033114075660706e-06, -6.573274731636047e-06, -6.343238055706024e-06, -6.113201379776001e-06, -5.883164703845978e-06, -5.653128027915955e-06, -5.423091351985931e-06, -5.193054676055908e-06, -4.963018000125885e-06, -4.732981324195862e-06, -4.502944648265839e-06, -4.2729079723358154e-06, -4.042871296405792e-06, -3.812834620475769e-06, -3.582797944545746e-06, -3.3527612686157227e-06, -3.1227245926856995e-06, -2.8926879167556763e-06, -2.662651240825653e-06, -2.43261456489563e-06, -2.2025778889656067e-06, -1.9725412130355835e-06, -1.7425045371055603e-06, -1.5124678611755371e-06, -1.282431185245514e-06, -1.0523945093154907e-06, -8.223578333854675e-07, -5.923211574554443e-07, -3.6228448152542114e-07, -1.3224780559539795e-07, 9.778887033462524e-08, 3.2782554626464844e-07, 5.578622221946716e-07, 7.878988981246948e-07, 1.017935574054718e-06, 1.2479722499847412e-06, 1.4780089259147644e-06, 1.7080456018447876e-06, 1.938082277774811e-06, 2.168118953704834e-06, 2.398155629634857e-06, 2.6281923055648804e-06, 2.8582289814949036e-06, 3.0882656574249268e-06, 3.31830233335495e-06, 3.548339009284973e-06, 3.7783756852149963e-06, 4.0084123611450195e-06, 4.238449037075043e-06, 4.468485713005066e-06, 4.698522388935089e-06, 4.928559064865112e-06, 5.1585957407951355e-06, 5.388632416725159e-06, 5.618669092655182e-06, 5.848705768585205e-06, 6.078742444515228e-06, 6.3087791204452515e-06, 6.538815796375275e-06, 6.768852472305298e-06, 6.998889148235321e-06, 7.228925824165344e-06, 7.4589625000953674e-06, 7.68899917602539e-06]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 11.0, 13.0, 16.0, 24.0, 29.0, 40.0, 47.0, 79.0, 138.0, 191.0, 122.0, 74.0, 55.0, 42.0, 26.0, 19.0, 14.0, 8.0, 9.0, 8.0, 7.0, 5.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4054797904682346e-05, -2.3334176148637198e-05, -2.261355439259205e-05, -2.1892932636546902e-05, -2.117230906151235e-05, -2.0451687305467203e-05, -1.9731065549422055e-05, -1.9010443793376908e-05, -1.828982203733176e-05, -1.7569200281286612e-05, -1.6848578525241464e-05, -1.6127956769196317e-05, -1.540733501315117e-05, -1.468671234761132e-05, -1.396608968207147e-05, -1.3245467926026322e-05, -1.2524846169981174e-05, -1.1804224413936026e-05, -1.1083602657890879e-05, -1.0362979992351029e-05, -9.642358236305881e-06, -8.921736480260734e-06, -8.201113814720884e-06, -7.480492058675736e-06, -6.759870302630588e-06, -6.039248546585441e-06, -5.318626335792942e-06, -4.598004125000443e-06, -3.8773823689552955e-06, -3.1567603855364723e-06, -2.436138402117649e-06, -1.7155161913251504e-06, -9.948944352800027e-07, -2.7427245186117943e-07, 4.463495315576438e-07, 1.166971514976467e-06, 1.8875934983952902e-06, 2.6082154818141134e-06, 3.3288374652329367e-06, 4.049459676025435e-06, 4.770081432070583e-06, 5.490703188115731e-06, 6.2113253989082295e-06, 6.931947609700728e-06, 7.652569365745876e-06, 8.373191121791024e-06, 9.093813787330873e-06, 9.814435543376021e-06, 1.0535057299421169e-05, 1.1255679055466317e-05, 1.1976300811511464e-05, 1.2696923477051314e-05, 1.3417545233096462e-05, 1.413816698914161e-05, 1.4858789654681459e-05, 1.5579411410726607e-05, 1.6300033166771755e-05, 1.7020654922816902e-05, 1.774127667886205e-05, 1.8461898434907198e-05, 1.9182520190952346e-05, 1.9903143765986897e-05, 2.0623765522032045e-05, 2.1344387278077193e-05, 2.206500903412234e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 8.0, 13.0, 9.0, 11.0, 13.0, 11.0, 13.0, 14.0, 21.0, 29.0, 42.0, 30.0, 24.0, 30.0, 34.0, 43.0, 45.0, 35.0, 63.0, 39.0, 38.0, 52.0, 40.0, 47.0, 47.0, 42.0, 35.0, 33.0, 32.0, 21.0, 22.0, 17.0, 8.0, 8.0, 8.0, 7.0, 10.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2866780707554426e-05, -1.2464290193747729e-05, -1.206179877044633e-05, -1.1659307347144932e-05, -1.1256816833338235e-05, -1.0854326319531538e-05, -1.0451834896230139e-05, -1.004934347292874e-05, -9.646852959122043e-06, -9.244362445315346e-06, -8.841871022013947e-06, -8.439379598712549e-06, -8.036889084905852e-06, -7.634398571099155e-06, -7.231907147797756e-06, -6.829416179243708e-06, -6.42692521068966e-06, -6.024434242135612e-06, -5.6219432735815644e-06, -5.2194523050275166e-06, -4.816961336473469e-06, -4.414470367919421e-06, -4.011979399365373e-06, -3.609488430811325e-06, -3.2069974622572772e-06, -2.8045064937032294e-06, -2.4020155251491815e-06, -1.9995245565951336e-06, -1.5970335880410857e-06, -1.1945426194870379e-06, -7.9205165093299e-07, -3.8956068237894215e-07, 1.2931195669807494e-08, 4.1542216422385536e-07, 8.179131327779032e-07, 1.220404101331951e-06, 1.622895069885999e-06, 2.025386038440047e-06, 2.4278770069940947e-06, 2.8303679755481426e-06, 3.2328589441021904e-06, 3.6353499126562383e-06, 4.037840881210286e-06, 4.440331849764334e-06, 4.842822818318382e-06, 5.24531378687243e-06, 5.647804755426478e-06, 6.0502957239805255e-06, 6.452786692534573e-06, 6.855277661088621e-06, 7.257768629642669e-06, 7.660259143449366e-06, 8.062750566750765e-06, 8.465241990052164e-06, 8.86773250385886e-06, 9.270223017665558e-06, 9.672714440966956e-06, 1.0075205864268355e-05, 1.0477696378075052e-05, 1.0880186891881749e-05, 1.1282678315183148e-05, 1.1685169738484547e-05, 1.2087660252291244e-05, 1.249015076609794e-05, 1.289264218939934e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 7.0, 3.0, 14.0, 13.0, 27.0, 38.0, 45.0, 86.0, 124.0, 210.0, 264.0, 408.0, 715.0, 1142.0, 2023.0, 3048.0, 4859.0, 9362.0, 15760.0, 31424.0, 60543.0, 154576.0, 387648.0, 208867.0, 83555.0, 36871.0, 20429.0, 10447.0, 6390.0, 3681.0, 2242.0, 1412.0, 853.0, 574.0, 302.0, 199.0, 141.0, 83.0, 63.0, 33.0, 23.0, 21.0, 8.0, 6.0, 5.0, 8.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0994415283203125e-05, -3.0015595257282257e-05, -2.903677523136139e-05, -2.805795520544052e-05, -2.7079135179519653e-05, -2.6100315153598785e-05, -2.5121495127677917e-05, -2.414267510175705e-05, -2.316385507583618e-05, -2.2185035049915314e-05, -2.1206215023994446e-05, -2.0227394998073578e-05, -1.924857497215271e-05, -1.8269754946231842e-05, -1.7290934920310974e-05, -1.6312114894390106e-05, -1.5333294868469238e-05, -1.435447484254837e-05, -1.3375654816627502e-05, -1.2396834790706635e-05, -1.1418014764785767e-05, -1.0439194738864899e-05, -9.46037471294403e-06, -8.481554687023163e-06, -7.502734661102295e-06, -6.523914635181427e-06, -5.545094609260559e-06, -4.566274583339691e-06, -3.5874545574188232e-06, -2.6086345314979553e-06, -1.6298145055770874e-06, -6.509944796562195e-07, 3.2782554626464844e-07, 1.3066455721855164e-06, 2.2854655981063843e-06, 3.264285624027252e-06, 4.24310564994812e-06, 5.221925675868988e-06, 6.200745701789856e-06, 7.179565727710724e-06, 8.158385753631592e-06, 9.13720577955246e-06, 1.0116025805473328e-05, 1.1094845831394196e-05, 1.2073665857315063e-05, 1.3052485883235931e-05, 1.40313059091568e-05, 1.5010125935077667e-05, 1.5988945960998535e-05, 1.6967765986919403e-05, 1.794658601284027e-05, 1.892540603876114e-05, 1.9904226064682007e-05, 2.0883046090602875e-05, 2.1861866116523743e-05, 2.284068614244461e-05, 2.381950616836548e-05, 2.4798326194286346e-05, 2.5777146220207214e-05, 2.6755966246128082e-05, 2.773478627204895e-05, 2.8713606297969818e-05, 2.9692426323890686e-05, 3.0671246349811554e-05, 3.165006637573242e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 5.0, 6.0, 4.0, 7.0, 18.0, 9.0, 9.0, 10.0, 19.0, 19.0, 29.0, 30.0, 41.0, 33.0, 48.0, 52.0, 46.0, 51.0, 53.0, 35.0, 49.0, 44.0, 46.0, 49.0, 46.0, 36.0, 46.0, 25.0, 27.0, 21.0, 21.0, 27.0, 10.0, 9.0, 7.0, 5.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3909759521484375e-06, -7.154420018196106e-06, -6.917864084243774e-06, -6.681308150291443e-06, -6.444752216339111e-06, -6.20819628238678e-06, -5.971640348434448e-06, -5.735084414482117e-06, -5.498528480529785e-06, -5.261972546577454e-06, -5.025416612625122e-06, -4.7888606786727905e-06, -4.552304744720459e-06, -4.3157488107681274e-06, -4.079192876815796e-06, -3.842636942863464e-06, -3.606081008911133e-06, -3.3695250749588013e-06, -3.1329691410064697e-06, -2.896413207054138e-06, -2.6598572731018066e-06, -2.423301339149475e-06, -2.1867454051971436e-06, -1.950189471244812e-06, -1.7136335372924805e-06, -1.477077603340149e-06, -1.2405216693878174e-06, -1.0039657354354858e-06, -7.674098014831543e-07, -5.308538675308228e-07, -2.942979335784912e-07, -5.774199962615967e-08, 1.7881393432617188e-07, 4.153698682785034e-07, 6.51925802230835e-07, 8.884817361831665e-07, 1.125037670135498e-06, 1.3615936040878296e-06, 1.5981495380401611e-06, 1.8347054719924927e-06, 2.0712614059448242e-06, 2.3078173398971558e-06, 2.5443732738494873e-06, 2.780929207801819e-06, 3.0174851417541504e-06, 3.254041075706482e-06, 3.4905970096588135e-06, 3.727152943611145e-06, 3.9637088775634766e-06, 4.200264811515808e-06, 4.43682074546814e-06, 4.673376679420471e-06, 4.909932613372803e-06, 5.146488547325134e-06, 5.383044481277466e-06, 5.619600415229797e-06, 5.856156349182129e-06, 6.0927122831344604e-06, 6.329268217086792e-06, 6.5658241510391235e-06, 6.802380084991455e-06, 7.038936018943787e-06, 7.275491952896118e-06, 7.51204788684845e-06, 7.748603820800781e-06]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 7.0, 13.0, 7.0, 9.0, 16.0, 25.0, 45.0, 34.0, 72.0, 104.0, 136.0, 253.0, 406.0, 688.0, 1255.0, 2081.0, 3793.0, 6940.0, 12663.0, 24175.0, 43844.0, 103760.0, 304396.0, 330606.0, 111362.0, 49003.0, 24175.0, 12642.0, 6945.0, 3835.0, 2144.0, 1229.0, 730.0, 407.0, 255.0, 160.0, 99.0, 75.0, 40.0, 41.0, 31.0, 18.0, 8.0, 6.0, 6.0, 7.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0], "bins": [-2.6166439056396484e-05, -2.53971666097641e-05, -2.4627894163131714e-05, -2.385862171649933e-05, -2.3089349269866943e-05, -2.2320076823234558e-05, -2.1550804376602173e-05, -2.0781531929969788e-05, -2.0012259483337402e-05, -1.9242987036705017e-05, -1.8473714590072632e-05, -1.7704442143440247e-05, -1.693516969680786e-05, -1.6165897250175476e-05, -1.539662480354309e-05, -1.4627352356910706e-05, -1.385807991027832e-05, -1.3088807463645935e-05, -1.231953501701355e-05, -1.1550262570381165e-05, -1.078099012374878e-05, -1.0011717677116394e-05, -9.242445230484009e-06, -8.473172783851624e-06, -7.703900337219238e-06, -6.934627890586853e-06, -6.165355443954468e-06, -5.3960829973220825e-06, -4.626810550689697e-06, -3.857538104057312e-06, -3.0882656574249268e-06, -2.3189932107925415e-06, -1.5497207641601562e-06, -7.80448317527771e-07, -1.1175870895385742e-08, 7.580965757369995e-07, 1.5273690223693848e-06, 2.29664146900177e-06, 3.0659139156341553e-06, 3.8351863622665405e-06, 4.604458808898926e-06, 5.373731255531311e-06, 6.143003702163696e-06, 6.9122761487960815e-06, 7.681548595428467e-06, 8.450821042060852e-06, 9.220093488693237e-06, 9.989365935325623e-06, 1.0758638381958008e-05, 1.1527910828590393e-05, 1.2297183275222778e-05, 1.3066455721855164e-05, 1.3835728168487549e-05, 1.4605000615119934e-05, 1.537427306175232e-05, 1.6143545508384705e-05, 1.691281795501709e-05, 1.7682090401649475e-05, 1.845136284828186e-05, 1.9220635294914246e-05, 1.998990774154663e-05, 2.0759180188179016e-05, 2.15284526348114e-05, 2.2297725081443787e-05, 2.3066997528076172e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 11.0, 12.0, 11.0, 15.0, 11.0, 22.0, 19.0, 21.0, 12.0, 21.0, 36.0, 31.0, 30.0, 41.0, 48.0, 54.0, 30.0, 36.0, 46.0, 39.0, 46.0, 50.0, 33.0, 37.0, 31.0, 36.0, 24.0, 29.0, 21.0, 24.0, 18.0, 18.0, 15.0, 11.0, 14.0, 7.0, 12.0, 10.0, 1.0, 3.0, 6.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4836273193359375e-06, -5.301088094711304e-06, -5.11854887008667e-06, -4.936009645462036e-06, -4.753470420837402e-06, -4.5709311962127686e-06, -4.388391971588135e-06, -4.205852746963501e-06, -4.023313522338867e-06, -3.840774297714233e-06, -3.6582350730895996e-06, -3.475695848464966e-06, -3.293156623840332e-06, -3.1106173992156982e-06, -2.9280781745910645e-06, -2.7455389499664307e-06, -2.562999725341797e-06, -2.380460500717163e-06, -2.1979212760925293e-06, -2.0153820514678955e-06, -1.8328428268432617e-06, -1.650303602218628e-06, -1.4677643775939941e-06, -1.2852251529693604e-06, -1.1026859283447266e-06, -9.201467037200928e-07, -7.37607479095459e-07, -5.550682544708252e-07, -3.725290298461914e-07, -1.8998980522155762e-07, -7.450580596923828e-09, 1.7508864402770996e-07, 3.5762786865234375e-07, 5.401670932769775e-07, 7.227063179016113e-07, 9.052455425262451e-07, 1.087784767150879e-06, 1.2703239917755127e-06, 1.4528632164001465e-06, 1.6354024410247803e-06, 1.817941665649414e-06, 2.000480890274048e-06, 2.1830201148986816e-06, 2.3655593395233154e-06, 2.5480985641479492e-06, 2.730637788772583e-06, 2.913177013397217e-06, 3.0957162380218506e-06, 3.2782554626464844e-06, 3.460794687271118e-06, 3.643333911895752e-06, 3.825873136520386e-06, 4.0084123611450195e-06, 4.190951585769653e-06, 4.373490810394287e-06, 4.556030035018921e-06, 4.738569259643555e-06, 4.9211084842681885e-06, 5.103647708892822e-06, 5.286186933517456e-06, 5.46872615814209e-06, 5.651265382766724e-06, 5.833804607391357e-06, 6.016343832015991e-06, 6.198883056640625e-06]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 5.0, 7.0, 9.0, 15.0, 15.0, 19.0, 23.0, 25.0, 41.0, 72.0, 189.0, 185.0, 255.0, 398.0, 730.0, 1349.0, 2650.0, 5385.0, 84824.0, 856232.0, 68846.0, 15849.0, 5531.0, 2596.0, 1346.0, 718.0, 653.0, 152.0, 122.0, 80.0, 65.0, 33.0, 41.0, 17.0, 39.0, 12.0, 10.0, 7.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.2649765014648438e-06, -2.1979212760925293e-06, -2.130866050720215e-06, -2.0638108253479004e-06, -1.996755599975586e-06, -1.9297003746032715e-06, -1.862645149230957e-06, -1.7955899238586426e-06, -1.7285346984863281e-06, -1.6614794731140137e-06, -1.5944242477416992e-06, -1.5273690223693848e-06, -1.4603137969970703e-06, -1.3932585716247559e-06, -1.3262033462524414e-06, -1.259148120880127e-06, -1.1920928955078125e-06, -1.125037670135498e-06, -1.0579824447631836e-06, -9.909272193908691e-07, -9.238719940185547e-07, -8.568167686462402e-07, -7.897615432739258e-07, -7.227063179016113e-07, -6.556510925292969e-07, -5.885958671569824e-07, -5.21540641784668e-07, -4.544854164123535e-07, -3.8743019104003906e-07, -3.203749656677246e-07, -2.5331974029541016e-07, -1.862645149230957e-07, -1.1920928955078125e-07, -5.21540641784668e-08, 1.4901161193847656e-08, 8.195638656616211e-08, 1.4901161193847656e-07, 2.1606683731079102e-07, 2.8312206268310547e-07, 3.501772880554199e-07, 4.172325134277344e-07, 4.842877388000488e-07, 5.513429641723633e-07, 6.183981895446777e-07, 6.854534149169922e-07, 7.525086402893066e-07, 8.195638656616211e-07, 8.866190910339355e-07, 9.5367431640625e-07, 1.0207295417785645e-06, 1.087784767150879e-06, 1.1548399925231934e-06, 1.2218952178955078e-06, 1.2889504432678223e-06, 1.3560056686401367e-06, 1.4230608940124512e-06, 1.4901161193847656e-06, 1.55717134475708e-06, 1.6242265701293945e-06, 1.691281795501709e-06, 1.7583370208740234e-06, 1.8253922462463379e-06, 1.8924474716186523e-06, 1.959502696990967e-06, 2.0265579223632812e-06]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 0.0, 959.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.647299647331238e-07, -4.5262277126312256e-07, -4.4051557779312134e-07, -4.284083843231201e-07, -4.163011908531189e-07, -4.041939973831177e-07, -3.9208680391311646e-07, -3.7997961044311523e-07, -3.67872416973114e-07, -3.557652235031128e-07, -3.4365803003311157e-07, -3.3155083656311035e-07, -3.1944364309310913e-07, -3.073364496231079e-07, -2.952292561531067e-07, -2.8312206268310547e-07, -2.7101486921310425e-07, -2.5890767574310303e-07, -2.468004822731018e-07, -2.3469328880310059e-07, -2.2258609533309937e-07, -2.1047890186309814e-07, -1.9837170839309692e-07, -1.862645149230957e-07, -1.7415732145309448e-07, -1.6205012798309326e-07, -1.4994293451309204e-07, -1.3783574104309082e-07, -1.257285475730896e-07, -1.1362135410308838e-07, -1.0151416063308716e-07, -8.940696716308594e-08, -7.729977369308472e-08, -6.51925802230835e-08, -5.3085386753082275e-08, -4.0978193283081055e-08, -2.8870999813079834e-08, -1.6763806343078613e-08, -4.6566128730773926e-09, 7.450580596923828e-09, 1.955777406692505e-08, 3.166496753692627e-08, 4.377216100692749e-08, 5.587935447692871e-08, 6.798654794692993e-08, 8.009374141693115e-08, 9.220093488693237e-08, 1.043081283569336e-07, 1.1641532182693481e-07, 1.2852251529693604e-07, 1.4062970876693726e-07, 1.5273690223693848e-07, 1.648440957069397e-07, 1.7695128917694092e-07, 1.8905848264694214e-07, 2.0116567611694336e-07, 2.1327286958694458e-07, 2.253800630569458e-07, 2.3748725652694702e-07, 2.4959444999694824e-07, 2.6170164346694946e-07, 2.738088369369507e-07, 2.859160304069519e-07, 2.980232238769531e-07]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 9.0, 17.0, 14.0, 29.0, 66.0, 49.0, 82.0, 150.0, 355.0, 1136.0, 2063.0, 0.0, 12893.0, 60839.0, 892913.0, 61015.0, 12968.0, 2084.0, 1076.0, 355.0, 148.0, 96.0, 53.0, 51.0, 28.0, 16.0, 18.0, 0.0, 13.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9073486328125e-06, -1.8514692783355713e-06, -1.7955899238586426e-06, -1.7397105693817139e-06, -1.6838312149047852e-06, -1.6279518604278564e-06, -1.5720725059509277e-06, -1.516193151473999e-06, -1.4603137969970703e-06, -1.4044344425201416e-06, -1.3485550880432129e-06, -1.2926757335662842e-06, -1.2367963790893555e-06, -1.1809170246124268e-06, -1.125037670135498e-06, -1.0691583156585693e-06, -1.0132789611816406e-06, -9.57399606704712e-07, -9.015202522277832e-07, -8.456408977508545e-07, -7.897615432739258e-07, -7.338821887969971e-07, -6.780028343200684e-07, -6.221234798431396e-07, -5.662441253662109e-07, -5.103647708892822e-07, -4.544854164123535e-07, -3.986060619354248e-07, -3.427267074584961e-07, -2.868473529815674e-07, -2.3096799850463867e-07, -1.7508864402770996e-07, -1.1920928955078125e-07, -6.332993507385254e-08, -7.450580596923828e-09, 4.842877388000488e-08, 1.043081283569336e-07, 1.601874828338623e-07, 2.1606683731079102e-07, 2.7194619178771973e-07, 3.2782554626464844e-07, 3.8370490074157715e-07, 4.3958425521850586e-07, 4.954636096954346e-07, 5.513429641723633e-07, 6.07222318649292e-07, 6.631016731262207e-07, 7.189810276031494e-07, 7.748603820800781e-07, 8.307397365570068e-07, 8.866190910339355e-07, 9.424984455108643e-07, 9.98377799987793e-07, 1.0542571544647217e-06, 1.1101365089416504e-06, 1.166015863418579e-06, 1.2218952178955078e-06, 1.2777745723724365e-06, 1.3336539268493652e-06, 1.389533281326294e-06, 1.4454126358032227e-06, 1.5012919902801514e-06, 1.55717134475708e-06, 1.6130506992340088e-06, 1.6689300537109375e-06]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 113.0, 0.0, 0.0, 0.0, 0.0, 751.0, 0.0, 0.0, 0.0, 0.0, 124.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.4552067518234253e-07, -3.334134817123413e-07, -3.213062882423401e-07, -3.0919909477233887e-07, -2.9709190130233765e-07, -2.849847078323364e-07, -2.728775143623352e-07, -2.60770320892334e-07, -2.4866312742233276e-07, -2.3655593395233154e-07, -2.2444874048233032e-07, -2.123415470123291e-07, -2.0023435354232788e-07, -1.8812716007232666e-07, -1.7601996660232544e-07, -1.6391277313232422e-07, -1.51805579662323e-07, -1.3969838619232178e-07, -1.2759119272232056e-07, -1.1548399925231934e-07, -1.0337680578231812e-07, -9.12696123123169e-08, -7.916241884231567e-08, -6.705522537231445e-08, -5.494803190231323e-08, -4.284083843231201e-08, -3.073364496231079e-08, -1.862645149230957e-08, -6.51925802230835e-09, 5.587935447692871e-09, 1.7695128917694092e-08, 2.9802322387695312e-08, 4.190951585769653e-08, 5.4016709327697754e-08, 6.612390279769897e-08, 7.82310962677002e-08, 9.033828973770142e-08, 1.0244548320770264e-07, 1.1455267667770386e-07, 1.2665987014770508e-07, 1.387670636177063e-07, 1.5087425708770752e-07, 1.6298145055770874e-07, 1.7508864402770996e-07, 1.8719583749771118e-07, 1.993030309677124e-07, 2.1141022443771362e-07, 2.2351741790771484e-07, 2.3562461137771606e-07, 2.477318048477173e-07, 2.598389983177185e-07, 2.7194619178771973e-07, 2.8405338525772095e-07, 2.9616057872772217e-07, 3.082677721977234e-07, 3.203749656677246e-07, 3.3248215913772583e-07, 3.4458935260772705e-07, 3.5669654607772827e-07, 3.688037395477295e-07, 3.809109330177307e-07, 3.9301812648773193e-07, 4.0512531995773315e-07, 4.172325134277344e-07]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 10.0, 8.0, 10.0, 9.0, 11.0, 12.0, 16.0, 18.0, 20.0, 29.0, 41.0, 59.0, 85.0, 104.0, 146.0, 107.0, 80.0, 39.0, 44.0, 34.0, 27.0, 16.0, 22.0, 7.0, 10.0, 10.0, 4.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0208670573774725e-05, -9.873107046587393e-06, -9.537542609905358e-06, -9.201979082718026e-06, -8.866415555530693e-06, -8.530852028343361e-06, -8.195287591661327e-06, -7.859724064473994e-06, -7.5241605372866616e-06, -7.188596555351978e-06, -6.853033028164646e-06, -6.517469046229962e-06, -6.18190551904263e-06, -5.846341537107946e-06, -5.510777555173263e-06, -5.1752140279859304e-06, -4.839650046051247e-06, -4.504086064116564e-06, -4.168522536929231e-06, -3.832958554994548e-06, -3.4973950278072152e-06, -3.161831045872532e-06, -2.826267291311524e-06, -2.490703536750516e-06, -2.155139782189508e-06, -1.8195760276285e-06, -1.484012273067492e-06, -1.1484484048196464e-06, -8.128846502586384e-07, -4.773208956976305e-07, -1.417570274497848e-07, 1.9380672711122315e-07, 5.293704816722311e-07, 8.649342362332391e-07, 1.200497990794247e-06, 1.5360618590420927e-06, 1.8716256136031006e-06, 2.2071894818509463e-06, 2.5427532364119543e-06, 2.8783169909729622e-06, 3.21388074553397e-06, 3.549444500094978e-06, 3.8850084820296615e-06, 4.220572009216994e-06, 4.5561359911516774e-06, 4.89169951833901e-06, 5.227263500273693e-06, 5.562827027461026e-06, 5.898391009395709e-06, 6.233954991330393e-06, 6.569518518517725e-06, 6.9050825004524086e-06, 7.240646027639741e-06, 7.5762100095744245e-06, 7.911773536761757e-06, 8.247337973443791e-06, 8.582901500631124e-06, 8.918465027818456e-06, 9.25402946450049e-06, 9.589592991687823e-06, 9.925156518875156e-06, 1.0260720046062488e-05, 1.0596284482744522e-05, 1.0931848009931855e-05, 1.1267411537119187e-05]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 7.0, 8.0, 8.0, 13.0, 7.0, 23.0, 25.0, 22.0, 21.0, 27.0, 38.0, 38.0, 29.0, 49.0, 68.0, 49.0, 51.0, 58.0, 37.0, 54.0, 43.0, 50.0, 40.0, 41.0, 30.0, 40.0, 21.0, 21.0, 10.0, 23.0, 12.0, 13.0, 11.0, 4.0, 2.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.670879080658779e-06, -9.391658750246279e-06, -9.11243841983378e-06, -8.83321808942128e-06, -8.55399775900878e-06, -8.27477742859628e-06, -7.995557098183781e-06, -7.716336767771281e-06, -7.437116437358782e-06, -7.157896106946282e-06, -6.8786757765337825e-06, -6.599455446121283e-06, -6.320235115708783e-06, -6.041014785296284e-06, -5.761794454883784e-06, -5.4825741244712844e-06, -5.203353339311434e-06, -4.924133008898934e-06, -4.644912678486435e-06, -4.365692348073935e-06, -4.0864720176614355e-06, -3.807251687248936e-06, -3.528031129462761e-06, -3.2488107990502613e-06, -2.9695904686377617e-06, -2.690370138225262e-06, -2.4111498078127624e-06, -2.1319292500265874e-06, -1.8527090333009255e-06, -1.573488702888426e-06, -1.2942682587890886e-06, -1.015047928376589e-06, -7.358275979640894e-07, -4.5660723912988033e-07, -1.773868802956713e-07, 1.0183350696024718e-07, 3.810538373727468e-07, 6.602741677852464e-07, 9.394946118845837e-07, 1.2187149422970833e-06, 1.497935272709583e-06, 1.7771556031220825e-06, 2.056375933534582e-06, 2.335596491320757e-06, 2.614816821733257e-06, 2.8940371521457564e-06, 3.173257482558256e-06, 3.4524778129707556e-06, 3.7316981433832552e-06, 4.010918473795755e-06, 4.2901388042082544e-06, 4.569359134620754e-06, 4.848579465033254e-06, 5.127799795445753e-06, 5.407020580605604e-06, 5.686240911018103e-06, 5.965461241430603e-06, 6.2446815718431026e-06, 6.523901902255602e-06, 6.803122232668102e-06, 7.082342563080601e-06, 7.361562893493101e-06, 7.6407832239056e-06, 7.9200035543181e-06, 8.1992238847306e-06]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 9.0, 5.0, 11.0, 9.0, 12.0, 18.0, 17.0, 29.0, 28.0, 36.0, 80.0, 105.0, 231.0, 473.0, 1147.0, 3247.0, 11701.0, 4085518.0, 80800.0, 7047.0, 2060.0, 863.0, 349.0, 184.0, 88.0, 58.0, 39.0, 25.0, 20.0, 24.0, 10.0, 16.0, 9.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16312026977539e-05, -5.986075848340988e-05, -5.809031426906586e-05, -5.631987005472183e-05, -5.454942584037781e-05, -5.277898162603378e-05, -5.100853741168976e-05, -4.9238093197345734e-05, -4.746764898300171e-05, -4.5697204768657684e-05, -4.392676055431366e-05, -4.2156316339969635e-05, -4.038587212562561e-05, -3.8615427911281586e-05, -3.684498369693756e-05, -3.5074539482593536e-05, -3.330409526824951e-05, -3.153365105390549e-05, -2.9763206839561462e-05, -2.7992762625217438e-05, -2.6222318410873413e-05, -2.445187419652939e-05, -2.2681429982185364e-05, -2.091098576784134e-05, -1.9140541553497314e-05, -1.737009733915329e-05, -1.5599653124809265e-05, -1.382920891046524e-05, -1.2058764696121216e-05, -1.0288320481777191e-05, -8.517876267433167e-06, -6.747432053089142e-06, -4.976987838745117e-06, -3.2065436244010925e-06, -1.4360994100570679e-06, 3.343448042869568e-07, 2.1047890186309814e-06, 3.875233232975006e-06, 5.645677447319031e-06, 7.416121661663055e-06, 9.18656587600708e-06, 1.0957010090351105e-05, 1.272745430469513e-05, 1.4497898519039154e-05, 1.626834273338318e-05, 1.8038786947727203e-05, 1.9809231162071228e-05, 2.1579675376415253e-05, 2.3350119590759277e-05, 2.5120563805103302e-05, 2.6891008019447327e-05, 2.866145223379135e-05, 3.0431896448135376e-05, 3.22023406624794e-05, 3.3972784876823425e-05, 3.574322909116745e-05, 3.7513673305511475e-05, 3.92841175198555e-05, 4.1054561734199524e-05, 4.282500594854355e-05, 4.459545016288757e-05, 4.63658943772316e-05, 4.813633859157562e-05, 4.990678280591965e-05, 5.167722702026367e-05]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 4.0, 11.0, 11.0, 7.0, 13.0, 17.0, 16.0, 24.0, 32.0, 24.0, 34.0, 34.0, 45.0, 44.0, 35.0, 64.0, 54.0, 60.0, 52.0, 47.0, 55.0, 51.0, 39.0, 36.0, 30.0, 26.0, 26.0, 17.0, 24.0, 18.0, 11.0, 14.0, 9.0, 6.0, 5.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9604644775390625e-06, -5.7872384786605835e-06, -5.6140124797821045e-06, -5.4407864809036255e-06, -5.2675604820251465e-06, -5.0943344831466675e-06, -4.9211084842681885e-06, -4.7478824853897095e-06, -4.5746564865112305e-06, -4.4014304876327515e-06, -4.2282044887542725e-06, -4.0549784898757935e-06, -3.8817524909973145e-06, -3.7085264921188354e-06, -3.5353004932403564e-06, -3.3620744943618774e-06, -3.1888484954833984e-06, -3.0156224966049194e-06, -2.8423964977264404e-06, -2.6691704988479614e-06, -2.4959444999694824e-06, -2.3227185010910034e-06, -2.1494925022125244e-06, -1.9762665033340454e-06, -1.8030405044555664e-06, -1.6298145055770874e-06, -1.4565885066986084e-06, -1.2833625078201294e-06, -1.1101365089416504e-06, -9.369105100631714e-07, -7.636845111846924e-07, -5.904585123062134e-07, -4.172325134277344e-07, -2.4400651454925537e-07, -7.078051567077637e-08, 1.0244548320770264e-07, 2.7567148208618164e-07, 4.4889748096466064e-07, 6.221234798431396e-07, 7.953494787216187e-07, 9.685754776000977e-07, 1.1418014764785767e-06, 1.3150274753570557e-06, 1.4882534742355347e-06, 1.6614794731140137e-06, 1.8347054719924927e-06, 2.0079314708709717e-06, 2.1811574697494507e-06, 2.3543834686279297e-06, 2.5276094675064087e-06, 2.7008354663848877e-06, 2.8740614652633667e-06, 3.0472874641418457e-06, 3.2205134630203247e-06, 3.3937394618988037e-06, 3.5669654607772827e-06, 3.7401914596557617e-06, 3.913417458534241e-06, 4.08664345741272e-06, 4.259869456291199e-06, 4.433095455169678e-06, 4.606321454048157e-06, 4.779547452926636e-06, 4.952773451805115e-06, 5.125999450683594e-06]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 8.0, 4.0, 10.0, 22.0, 40.0, 45.0, 98.0, 197.0, 399.0, 1052.0, 2779.0, 9480.0, 61877.0, 4066022.0, 40325.0, 7817.0, 2327.0, 916.0, 400.0, 189.0, 118.0, 57.0, 40.0, 19.0, 18.0, 9.0, 5.0, 5.0, 0.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2378902435302734e-05, -4.114769399166107e-05, -3.991648554801941e-05, -3.8685277104377747e-05, -3.7454068660736084e-05, -3.622286021709442e-05, -3.499165177345276e-05, -3.3760443329811096e-05, -3.2529234886169434e-05, -3.129802644252777e-05, -3.006681799888611e-05, -2.8835609555244446e-05, -2.7604401111602783e-05, -2.637319266796112e-05, -2.5141984224319458e-05, -2.3910775780677795e-05, -2.2679567337036133e-05, -2.144835889339447e-05, -2.0217150449752808e-05, -1.8985942006111145e-05, -1.7754733562469482e-05, -1.652352511882782e-05, -1.5292316675186157e-05, -1.4061108231544495e-05, -1.2829899787902832e-05, -1.159869134426117e-05, -1.0367482900619507e-05, -9.136274456977844e-06, -7.905066013336182e-06, -6.673857569694519e-06, -5.4426491260528564e-06, -4.211440682411194e-06, -2.9802322387695312e-06, -1.7490237951278687e-06, -5.178153514862061e-07, 7.133930921554565e-07, 1.944601535797119e-06, 3.1758099794387817e-06, 4.407018423080444e-06, 5.638226866722107e-06, 6.8694353103637695e-06, 8.100643754005432e-06, 9.331852197647095e-06, 1.0563060641288757e-05, 1.179426908493042e-05, 1.3025477528572083e-05, 1.4256685972213745e-05, 1.5487894415855408e-05, 1.671910285949707e-05, 1.7950311303138733e-05, 1.9181519746780396e-05, 2.0412728190422058e-05, 2.164393663406372e-05, 2.2875145077705383e-05, 2.4106353521347046e-05, 2.533756196498871e-05, 2.656877040863037e-05, 2.7799978852272034e-05, 2.9031187295913696e-05, 3.026239573955536e-05, 3.149360418319702e-05, 3.2724812626838684e-05, 3.395602107048035e-05, 3.518722951412201e-05, 3.641843795776367e-05]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 6.0, 5.0, 10.0, 9.0, 6.0, 13.0, 1.0, 23.0, 36.0, 101.0, 415.0, 2477.0, 740.0, 135.0, 37.0, 13.0, 8.0, 13.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.947185516357422e-06, -4.780478775501251e-06, -4.6137720346450806e-06, -4.44706529378891e-06, -4.280358552932739e-06, -4.113651812076569e-06, -3.946945071220398e-06, -3.7802383303642273e-06, -3.6135315895080566e-06, -3.446824848651886e-06, -3.2801181077957153e-06, -3.1134113669395447e-06, -2.946704626083374e-06, -2.7799978852272034e-06, -2.6132911443710327e-06, -2.446584403514862e-06, -2.2798776626586914e-06, -2.1131709218025208e-06, -1.94646418094635e-06, -1.7797574400901794e-06, -1.6130506992340088e-06, -1.4463439583778381e-06, -1.2796372175216675e-06, -1.1129304766654968e-06, -9.462237358093262e-07, -7.795169949531555e-07, -6.128102540969849e-07, -4.461035132408142e-07, -2.7939677238464355e-07, -1.126900315284729e-07, 5.4016709327697754e-08, 2.207234501838684e-07, 3.8743019104003906e-07, 5.541369318962097e-07, 7.208436727523804e-07, 8.87550413608551e-07, 1.0542571544647217e-06, 1.2209638953208923e-06, 1.387670636177063e-06, 1.5543773770332336e-06, 1.7210841178894043e-06, 1.887790858745575e-06, 2.0544975996017456e-06, 2.2212043404579163e-06, 2.387911081314087e-06, 2.5546178221702576e-06, 2.7213245630264282e-06, 2.888031303882599e-06, 3.0547380447387695e-06, 3.22144478559494e-06, 3.388151526451111e-06, 3.5548582673072815e-06, 3.721565008163452e-06, 3.888271749019623e-06, 4.0549784898757935e-06, 4.221685230731964e-06, 4.388391971588135e-06, 4.555098712444305e-06, 4.721805453300476e-06, 4.888512194156647e-06, 5.055218935012817e-06, 5.221925675868988e-06, 5.388632416725159e-06, 5.555339157581329e-06, 5.7220458984375e-06]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 6.0, 12.0, 11.0, 17.0, 14.0, 20.0, 33.0, 29.0, 40.0, 58.0, 92.0, 157.0, 131.0, 103.0, 70.0, 57.0, 32.0, 27.0, 14.0, 13.0, 6.0, 16.0, 11.0, 10.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.14581676927628e-06, -5.901014446862973e-06, -5.656212124449667e-06, -5.41140980203636e-06, -5.166607934370404e-06, -4.9218056119570974e-06, -4.677003289543791e-06, -4.432200967130484e-06, -4.187399099464528e-06, -3.942596777051222e-06, -3.6977946820115903e-06, -3.4529923595982837e-06, -3.2081902645586524e-06, -2.9633879421453457e-06, -2.718585619732039e-06, -2.4737832973187324e-06, -2.2289809749054257e-06, -1.984178652492119e-06, -1.7393765574524878e-06, -1.494574235039181e-06, -1.2497720263127121e-06, -1.0049698175862432e-06, -7.601674951729365e-07, -5.153652864464675e-07, -2.7056307771999855e-07, -2.5760840571820154e-08, 2.1904139657635824e-07, 4.6384366214624606e-07, 7.08645870872715e-07, 9.53448079599184e-07, 1.1982504020124907e-06, 1.4430526107389596e-06, 1.6878548194654286e-06, 1.9326571418787353e-06, 2.1774592369183665e-06, 2.422261559331673e-06, 2.6670636543713044e-06, 2.911865976784611e-06, 3.156668299197918e-06, 3.4014706216112245e-06, 3.6462727166508557e-06, 3.891074811690487e-06, 4.135877134103794e-06, 4.3806794565171e-06, 4.625481778930407e-06, 4.870284101343714e-06, 5.11508642375702e-06, 5.359888291422976e-06, 5.604690613836283e-06, 5.8494929362495895e-06, 6.094295258662896e-06, 6.339097126328852e-06, 6.583899448742159e-06, 6.828701771155465e-06, 7.073504093568772e-06, 7.318306415982079e-06, 7.5631087383953854e-06, 7.807911060808692e-06, 8.052713383221999e-06, 8.297515705635305e-06, 8.542318028048612e-06, 8.787119440967217e-06, 9.031922672875226e-06, 9.27672408579383e-06, 9.521526408207137e-06]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 6.0, 6.0, 11.0, 10.0, 8.0, 15.0, 22.0, 19.0, 29.0, 28.0, 22.0, 47.0, 37.0, 52.0, 26.0, 47.0, 54.0, 51.0, 61.0, 59.0, 49.0, 57.0, 40.0, 40.0, 27.0, 40.0, 21.0, 30.0, 16.0, 22.0, 14.0, 11.0, 13.0, 7.0, 9.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.093946805980522e-06, -6.906579983478878e-06, -6.719213615724584e-06, -6.5318472479702905e-06, -6.344480425468646e-06, -6.1571136029670015e-06, -5.969747235212708e-06, -5.782380867458414e-06, -5.59501404495677e-06, -5.407647222455125e-06, -5.220280854700832e-06, -5.032914486946538e-06, -4.845547664444894e-06, -4.658180841943249e-06, -4.4708144741889555e-06, -4.283448106434662e-06, -4.096081283933017e-06, -3.908714461431373e-06, -3.7213480936770793e-06, -3.5339814985491103e-06, -3.346614903421141e-06, -3.159248308293172e-06, -2.971881713165203e-06, -2.784515118037234e-06, -2.597148522909265e-06, -2.409781927781296e-06, -2.222415332653327e-06, -2.035048737525358e-06, -1.8476821423973888e-06, -1.6603155472694198e-06, -1.4729489521414507e-06, -1.2855823570134817e-06, -1.0982157618855126e-06, -9.108491667575436e-07, -7.234825716295745e-07, -5.361159765016055e-07, -3.487493813736364e-07, -1.6138278624566738e-07, 2.5983808882301673e-08, 2.1335040401027072e-07, 4.0071699913823977e-07, 5.880835942662088e-07, 7.754501893941779e-07, 9.62816784522147e-07, 1.150183379650116e-06, 1.337549974778085e-06, 1.524916569906054e-06, 1.7122831650340231e-06, 1.8996497601619922e-06, 2.087016355289961e-06, 2.2743829504179303e-06, 2.4617495455458993e-06, 2.6491161406738684e-06, 2.8364827358018374e-06, 3.0238493309298065e-06, 3.2112159260577755e-06, 3.3985825211857446e-06, 3.5859491163137136e-06, 3.7733157114416827e-06, 3.960682079195976e-06, 4.148048901697621e-06, 4.335415724199265e-06, 4.522782091953559e-06, 4.7101484597078525e-06, 4.897515282209497e-06]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 3.0, 6.0, 13.0, 13.0, 13.0, 25.0, 48.0, 45.0, 86.0, 127.0, 195.0, 495.0, 677.0, 1098.0, 1855.0, 4461.0, 6117.0, 10189.0, 16957.0, 29039.0, 77469.0, 130054.0, 309530.0, 236125.0, 100700.0, 63228.0, 24187.0, 14444.0, 8606.0, 6205.0, 2558.0, 1583.0, 907.0, 547.0, 418.0, 188.0, 120.0, 75.0, 58.0, 27.0, 24.0, 13.0, 6.0, 8.0, 2.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.7220458984375e-06, -5.5301934480667114e-06, -5.338340997695923e-06, -5.146488547325134e-06, -4.954636096954346e-06, -4.762783646583557e-06, -4.5709311962127686e-06, -4.37907874584198e-06, -4.187226295471191e-06, -3.995373845100403e-06, -3.8035213947296143e-06, -3.6116689443588257e-06, -3.419816493988037e-06, -3.2279640436172485e-06, -3.03611159324646e-06, -2.8442591428756714e-06, -2.652406692504883e-06, -2.4605542421340942e-06, -2.2687017917633057e-06, -2.076849341392517e-06, -1.8849968910217285e-06, -1.69314444065094e-06, -1.5012919902801514e-06, -1.3094395399093628e-06, -1.1175870895385742e-06, -9.257346391677856e-07, -7.338821887969971e-07, -5.420297384262085e-07, -3.501772880554199e-07, -1.5832483768463135e-07, 3.3527612686157227e-08, 2.253800630569458e-07, 4.172325134277344e-07, 6.09084963798523e-07, 8.009374141693115e-07, 9.927898645401e-07, 1.1846423149108887e-06, 1.3764947652816772e-06, 1.5683472156524658e-06, 1.7601996660232544e-06, 1.952052116394043e-06, 2.1439045667648315e-06, 2.33575701713562e-06, 2.5276094675064087e-06, 2.7194619178771973e-06, 2.911314368247986e-06, 3.1031668186187744e-06, 3.295019268989563e-06, 3.4868717193603516e-06, 3.67872416973114e-06, 3.870576620101929e-06, 4.062429070472717e-06, 4.254281520843506e-06, 4.4461339712142944e-06, 4.637986421585083e-06, 4.829838871955872e-06, 5.02169132232666e-06, 5.213543772697449e-06, 5.405396223068237e-06, 5.597248673439026e-06, 5.7891011238098145e-06, 5.980953574180603e-06, 6.172806024551392e-06, 6.36465847492218e-06, 6.556510925292969e-06]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 11.0, 6.0, 5.0, 11.0, 7.0, 17.0, 18.0, 18.0, 20.0, 27.0, 31.0, 29.0, 40.0, 39.0, 42.0, 47.0, 42.0, 77.0, 55.0, 63.0, 51.0, 33.0, 46.0, 37.0, 40.0, 30.0, 32.0, 29.0, 25.0, 18.0, 13.0, 19.0, 10.0, 8.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.794929504394531e-06, -6.60773366689682e-06, -6.420537829399109e-06, -6.233341991901398e-06, -6.0461461544036865e-06, -5.858950316905975e-06, -5.671754479408264e-06, -5.484558641910553e-06, -5.297362804412842e-06, -5.110166966915131e-06, -4.9229711294174194e-06, -4.735775291919708e-06, -4.548579454421997e-06, -4.361383616924286e-06, -4.174187779426575e-06, -3.9869919419288635e-06, -3.7997961044311523e-06, -3.612600266933441e-06, -3.42540442943573e-06, -3.238208591938019e-06, -3.0510127544403076e-06, -2.8638169169425964e-06, -2.6766210794448853e-06, -2.489425241947174e-06, -2.302229404449463e-06, -2.1150335669517517e-06, -1.9278377294540405e-06, -1.7406418919563293e-06, -1.5534460544586182e-06, -1.366250216960907e-06, -1.1790543794631958e-06, -9.918585419654846e-07, -8.046627044677734e-07, -6.174668669700623e-07, -4.302710294723511e-07, -2.430751919746399e-07, -5.587935447692871e-08, 1.3131648302078247e-07, 3.1851232051849365e-07, 5.057081580162048e-07, 6.92903995513916e-07, 8.800998330116272e-07, 1.0672956705093384e-06, 1.2544915080070496e-06, 1.4416873455047607e-06, 1.628883183002472e-06, 1.816079020500183e-06, 2.0032748579978943e-06, 2.1904706954956055e-06, 2.3776665329933167e-06, 2.564862370491028e-06, 2.752058207988739e-06, 2.93925404548645e-06, 3.1264498829841614e-06, 3.3136457204818726e-06, 3.5008415579795837e-06, 3.688037395477295e-06, 3.875233232975006e-06, 4.062429070472717e-06, 4.2496249079704285e-06, 4.43682074546814e-06, 4.624016582965851e-06, 4.811212420463562e-06, 4.998408257961273e-06, 5.185604095458984e-06]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 5.0, 9.0, 15.0, 12.0, 35.0, 58.0, 94.0, 175.0, 238.0, 513.0, 725.0, 1446.0, 2078.0, 3106.0, 7841.0, 14226.0, 71822.0, 904720.0, 23161.0, 7847.0, 3981.0, 2781.0, 1386.0, 990.0, 492.0, 334.0, 152.0, 125.0, 79.0, 46.0, 25.0, 6.0, 9.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.119510650634766e-06, -8.795410394668579e-06, -8.471310138702393e-06, -8.147209882736206e-06, -7.82310962677002e-06, -7.499009370803833e-06, -7.1749091148376465e-06, -6.85080885887146e-06, -6.5267086029052734e-06, -6.202608346939087e-06, -5.8785080909729e-06, -5.554407835006714e-06, -5.230307579040527e-06, -4.906207323074341e-06, -4.582107067108154e-06, -4.258006811141968e-06, -3.933906555175781e-06, -3.6098062992095947e-06, -3.285706043243408e-06, -2.9616057872772217e-06, -2.637505531311035e-06, -2.3134052753448486e-06, -1.989305019378662e-06, -1.6652047634124756e-06, -1.341104507446289e-06, -1.0170042514801025e-06, -6.92903995513916e-07, -3.688037395477295e-07, -4.470348358154297e-08, 2.7939677238464355e-07, 6.034970283508301e-07, 9.275972843170166e-07, 1.2516975402832031e-06, 1.5757977962493896e-06, 1.8998980522155762e-06, 2.2239983081817627e-06, 2.5480985641479492e-06, 2.8721988201141357e-06, 3.1962990760803223e-06, 3.520399332046509e-06, 3.844499588012695e-06, 4.168599843978882e-06, 4.492700099945068e-06, 4.816800355911255e-06, 5.140900611877441e-06, 5.465000867843628e-06, 5.7891011238098145e-06, 6.113201379776001e-06, 6.4373016357421875e-06, 6.761401891708374e-06, 7.0855021476745605e-06, 7.409602403640747e-06, 7.733702659606934e-06, 8.05780291557312e-06, 8.381903171539307e-06, 8.706003427505493e-06, 9.03010368347168e-06, 9.354203939437866e-06, 9.678304195404053e-06, 1.000240445137024e-05, 1.0326504707336426e-05, 1.0650604963302612e-05, 1.0974705219268799e-05, 1.1298805475234985e-05, 1.1622905731201172e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 7.0, 2.0, 3.0, 6.0, 5.0, 1.0, 7.0, 2.0, 1.0, 5.0, 7.0, 4.0, 6.0, 5.0, 15.0, 8.0, 7.0, 22.0, 767.0, 15.0, 14.0, 7.0, 6.0, 10.0, 7.0, 6.0, 6.0, 3.0, 0.0, 2.0, 5.0, 2.0, 9.0, 1.0, 2.0, 14.0, 3.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.0994415283203125e-06, -3.0193477869033813e-06, -2.93925404548645e-06, -2.859160304069519e-06, -2.779066562652588e-06, -2.6989728212356567e-06, -2.6188790798187256e-06, -2.5387853384017944e-06, -2.4586915969848633e-06, -2.378597855567932e-06, -2.298504114151001e-06, -2.21841037273407e-06, -2.1383166313171387e-06, -2.0582228899002075e-06, -1.9781291484832764e-06, -1.8980354070663452e-06, -1.817941665649414e-06, -1.737847924232483e-06, -1.6577541828155518e-06, -1.5776604413986206e-06, -1.4975666999816895e-06, -1.4174729585647583e-06, -1.3373792171478271e-06, -1.257285475730896e-06, -1.1771917343139648e-06, -1.0970979928970337e-06, -1.0170042514801025e-06, -9.369105100631714e-07, -8.568167686462402e-07, -7.767230272293091e-07, -6.966292858123779e-07, -6.165355443954468e-07, -5.364418029785156e-07, -4.5634806156158447e-07, -3.762543201446533e-07, -2.9616057872772217e-07, -2.1606683731079102e-07, -1.3597309589385986e-07, -5.587935447692871e-08, 2.421438694000244e-08, 1.043081283569336e-07, 1.8440186977386475e-07, 2.644956111907959e-07, 3.4458935260772705e-07, 4.246830940246582e-07, 5.047768354415894e-07, 5.848705768585205e-07, 6.649643182754517e-07, 7.450580596923828e-07, 8.25151801109314e-07, 9.052455425262451e-07, 9.853392839431763e-07, 1.0654330253601074e-06, 1.1455267667770386e-06, 1.2256205081939697e-06, 1.3057142496109009e-06, 1.385807991027832e-06, 1.4659017324447632e-06, 1.5459954738616943e-06, 1.6260892152786255e-06, 1.7061829566955566e-06, 1.7862766981124878e-06, 1.866370439529419e-06, 1.94646418094635e-06, 2.0265579223632812e-06]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 32.0, 0.0, 0.0, 37.0, 0.0, 0.0, 0.0, 217.0, 0.0, 0.0, 605.0, 0.0, 0.0, 1676.0, 0.0, 0.0, 0.0, 4661.0, 0.0, 0.0, 1034066.0, 0.0, 0.0, 4678.0, 0.0, 0.0, 0.0, 1699.0, 0.0, 0.0, 661.0, 0.0, 0.0, 0.0, 184.0, 0.0, 0.0, 24.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -3.995373845100403e-07, -3.818422555923462e-07, -3.641471266746521e-07, -3.46451997756958e-07, -3.287568688392639e-07, -3.110617399215698e-07, -2.9336661100387573e-07, -2.7567148208618164e-07, -2.5797635316848755e-07, -2.4028122425079346e-07, -2.2258609533309937e-07, -2.0489096641540527e-07, -1.8719583749771118e-07, -1.695007085800171e-07, -1.51805579662323e-07, -1.341104507446289e-07, -1.1641532182693481e-07, -9.872019290924072e-08, -8.102506399154663e-08, -6.332993507385254e-08, -4.563480615615845e-08, -2.7939677238464355e-08, -1.0244548320770264e-08, 7.450580596923828e-09, 2.514570951461792e-08, 4.284083843231201e-08, 6.05359673500061e-08, 7.82310962677002e-08, 9.592622518539429e-08, 1.1362135410308838e-07, 1.3131648302078247e-07, 1.4901161193847656e-07, 1.6670674085617065e-07, 1.8440186977386475e-07, 2.0209699869155884e-07, 2.1979212760925293e-07, 2.3748725652694702e-07, 2.551823854446411e-07, 2.728775143623352e-07, 2.905726432800293e-07, 3.082677721977234e-07, 3.259629011154175e-07, 3.4365803003311157e-07, 3.6135315895080566e-07, 3.7904828786849976e-07, 3.9674341678619385e-07, 4.1443854570388794e-07, 4.3213367462158203e-07, 4.498288035392761e-07, 4.675239324569702e-07, 4.852190613746643e-07, 5.029141902923584e-07, 5.206093192100525e-07, 5.383044481277466e-07, 5.559995770454407e-07, 5.736947059631348e-07, 5.913898348808289e-07, 6.09084963798523e-07, 6.26780092716217e-07, 6.444752216339111e-07, 6.621703505516052e-07, 6.798654794692993e-07, 6.975606083869934e-07, 7.152557373046875e-07]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 988.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0], "bins": [-1.1920928955078125e-07, -1.1641532182693481e-07, -1.1362135410308838e-07, -1.1082738637924194e-07, -1.0803341865539551e-07, -1.0523945093154907e-07, -1.0244548320770264e-07, -9.96515154838562e-08, -9.685754776000977e-08, -9.406358003616333e-08, -9.12696123123169e-08, -8.847564458847046e-08, -8.568167686462402e-08, -8.288770914077759e-08, -8.009374141693115e-08, -7.729977369308472e-08, -7.450580596923828e-08, -7.171183824539185e-08, -6.891787052154541e-08, -6.612390279769897e-08, -6.332993507385254e-08, -6.05359673500061e-08, -5.774199962615967e-08, -5.494803190231323e-08, -5.21540641784668e-08, -4.936009645462036e-08, -4.6566128730773926e-08, -4.377216100692749e-08, -4.0978193283081055e-08, -3.818422555923462e-08, -3.5390257835388184e-08, -3.259629011154175e-08, -2.9802322387695312e-08, -2.7008354663848877e-08, -2.421438694000244e-08, -2.1420419216156006e-08, -1.862645149230957e-08, -1.5832483768463135e-08, -1.30385160446167e-08, -1.0244548320770264e-08, -7.450580596923828e-09, -4.6566128730773926e-09, -1.862645149230957e-09, 9.313225746154785e-10, 3.725290298461914e-09, 6.51925802230835e-09, 9.313225746154785e-09, 1.210719347000122e-08, 1.4901161193847656e-08, 1.7695128917694092e-08, 2.0489096641540527e-08, 2.3283064365386963e-08, 2.60770320892334e-08, 2.8870999813079834e-08, 3.166496753692627e-08, 3.4458935260772705e-08, 3.725290298461914e-08, 4.0046870708465576e-08, 4.284083843231201e-08, 4.563480615615845e-08, 4.842877388000488e-08, 5.122274160385132e-08, 5.4016709327697754e-08, 5.681067705154419e-08, 5.960464477539063e-08]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 56.0, 0.0, 156.0, 0.0, 420.0, 0.0, 2170.0, 0.0, 8160.0, 0.0, 0.0, 1026664.0, 0.0, 8064.0, 0.0, 2144.0, 0.0, 456.0, 0.0, 168.0, 0.0, 52.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-8.940696716308594e-07, -8.66129994392395e-07, -8.381903171539307e-07, -8.102506399154663e-07, -7.82310962677002e-07, -7.543712854385376e-07, -7.264316082000732e-07, -6.984919309616089e-07, -6.705522537231445e-07, -6.426125764846802e-07, -6.146728992462158e-07, -5.867332220077515e-07, -5.587935447692871e-07, -5.308538675308228e-07, -5.029141902923584e-07, -4.7497451305389404e-07, -4.470348358154297e-07, -4.1909515857696533e-07, -3.91155481338501e-07, -3.632158041000366e-07, -3.3527612686157227e-07, -3.073364496231079e-07, -2.7939677238464355e-07, -2.514570951461792e-07, -2.2351741790771484e-07, -1.955777406692505e-07, -1.6763806343078613e-07, -1.3969838619232178e-07, -1.1175870895385742e-07, -8.381903171539307e-08, -5.587935447692871e-08, -2.7939677238464355e-08, 0.0, 2.7939677238464355e-08, 5.587935447692871e-08, 8.381903171539307e-08, 1.1175870895385742e-07, 1.3969838619232178e-07, 1.6763806343078613e-07, 1.955777406692505e-07, 2.2351741790771484e-07, 2.514570951461792e-07, 2.7939677238464355e-07, 3.073364496231079e-07, 3.3527612686157227e-07, 3.632158041000366e-07, 3.91155481338501e-07, 4.1909515857696533e-07, 4.470348358154297e-07, 4.7497451305389404e-07, 5.029141902923584e-07, 5.308538675308228e-07, 5.587935447692871e-07, 5.867332220077515e-07, 6.146728992462158e-07, 6.426125764846802e-07, 6.705522537231445e-07, 6.984919309616089e-07, 7.264316082000732e-07, 7.543712854385376e-07, 7.82310962677002e-07, 8.102506399154663e-07, 8.381903171539307e-07, 8.66129994392395e-07, 8.940696716308594e-07]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 988.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 10.0, 5.0, 6.0, 9.0, 12.0, 10.0, 13.0, 22.0, 31.0, 33.0, 33.0, 49.0, 65.0, 107.0, 149.0, 114.0, 91.0, 54.0, 39.0, 27.0, 24.0, 21.0, 19.0, 8.0, 11.0, 5.0, 4.0, 10.0, 3.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5850737226137426e-06, -5.367738594941329e-06, -5.150403012521565e-06, -4.933067884849152e-06, -4.715732302429387e-06, -4.498397174756974e-06, -4.28106159233721e-06, -4.063726464664796e-06, -3.846391336992383e-06, -3.629055981946294e-06, -3.4117206269002054e-06, -3.194385499227792e-06, -2.9770499168080278e-06, -2.7597147891356144e-06, -2.5423794340895256e-06, -2.325044079043437e-06, -2.1077084966236725e-06, -1.8903731415775837e-06, -1.673037786531495e-06, -1.4557025451722438e-06, -1.238367190126155e-06, -1.0210318350800662e-06, -8.036965937208151e-07, -5.863612386747263e-07, -3.6902588362863753e-07, -1.5169055700425815e-07, 6.564476962012122e-08, 2.8298006782279117e-07, 5.0031542286888e-07, 7.176507779149688e-07, 9.349860192742199e-07, 1.1523213743203087e-06, 1.3696562746190466e-06, 1.5869916296651354e-06, 1.8043269847112242e-06, 2.0216621123836376e-06, 2.238997694803402e-06, 2.456332822475815e-06, 2.673668177521904e-06, 2.891003532567993e-06, 3.1083388876140816e-06, 3.3256742426601704e-06, 3.5430095977062592e-06, 3.760344952752348e-06, 3.977680080424761e-06, 4.195015662844526e-06, 4.412350790516939e-06, 4.629686372936703e-06, 4.847021500609117e-06, 5.06435662828153e-06, 5.281692210701294e-06, 5.499027338373708e-06, 5.716362920793472e-06, 5.933698048465885e-06, 6.1510336308856495e-06, 6.368368758558063e-06, 6.585703886230476e-06, 6.8030390139028896e-06, 7.020374596322654e-06, 7.237709723995067e-06, 7.4550453064148314e-06, 7.672380888834596e-06, 7.889715561759658e-06, 8.107051144179422e-06, 8.324386726599187e-06]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 6.0, 6.0, 12.0, 10.0, 9.0, 13.0, 23.0, 17.0, 31.0, 28.0, 22.0, 48.0, 37.0, 50.0, 27.0, 46.0, 54.0, 51.0, 60.0, 61.0, 50.0, 54.0, 40.0, 39.0, 31.0, 38.0, 21.0, 31.0, 15.0, 21.0, 15.0, 11.0, 13.0, 7.0, 9.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.890638815093553e-06, -6.708891305606812e-06, -6.527144250867423e-06, -6.345396741380682e-06, -6.163649231893942e-06, -5.981902177154552e-06, -5.800154667667812e-06, -5.618407158181071e-06, -5.436660103441682e-06, -5.254912593954941e-06, -5.073165539215552e-06, -4.891418029728811e-06, -4.709670974989422e-06, -4.527923465502681e-06, -4.346175956015941e-06, -4.164428901276551e-06, -3.982681391789811e-06, -3.8009341096767457e-06, -3.6191868275636807e-06, -3.4374393180769403e-06, -3.2556920359638752e-06, -3.0739447538508102e-06, -2.8921972443640698e-06, -2.7104499622510048e-06, -2.5287026801379398e-06, -2.3469553980248747e-06, -2.1652081159118097e-06, -1.9834606064250693e-06, -1.8017133243120043e-06, -1.6199660421989392e-06, -1.4382186463990365e-06, -1.2564712505991338e-06, -1.0747239684860688e-06, -8.929766295295849e-07, -7.11229290573101e-07, -5.294819516166172e-07, -3.477346126601333e-07, -1.659872737036494e-07, 1.5760065252834465e-08, 1.975074610527372e-07, 3.792547431658022e-07, 5.610020821222861e-07, 7.4274942107877e-07, 9.244967600352538e-07, 1.1062440989917377e-06, 1.2879913811048027e-06, 1.4697387769047054e-06, 1.6514861727046082e-06, 1.8332334548176732e-06, 2.014980736930738e-06, 2.1967280190438032e-06, 2.3784755285305437e-06, 2.5602228106436087e-06, 2.7419700927566737e-06, 2.923717602243414e-06, 3.105464884356479e-06, 3.287212166469544e-06, 3.468959448582609e-06, 3.650706730695674e-06, 3.832454240182415e-06, 4.014201294921804e-06, 4.195948804408545e-06, 4.377696313895285e-06, 4.559443368634675e-06, 4.741190878121415e-06]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 1.0, 6.0, 7.0, 13.0, 21.0, 18.0, 39.0, 51.0, 78.0, 106.0, 193.0, 335.0, 623.0, 1525.0, 3425.0, 6717.0, 16037.0, 34481.0, 100858.0, 394747.0, 324445.0, 100948.0, 36836.0, 14089.0, 6952.0, 3150.0, 1268.0, 746.0, 319.0, 193.0, 120.0, 52.0, 45.0, 29.0, 26.0, 19.0, 17.0, 4.0, 3.0, 10.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.722574234008789e-05, -1.665111631155014e-05, -1.607649028301239e-05, -1.550186425447464e-05, -1.492723822593689e-05, -1.435261219739914e-05, -1.377798616886139e-05, -1.3203360140323639e-05, -1.2628734111785889e-05, -1.2054108083248138e-05, -1.1479482054710388e-05, -1.0904856026172638e-05, -1.0330229997634888e-05, -9.755603969097137e-06, -9.180977940559387e-06, -8.606351912021637e-06, -8.031725883483887e-06, -7.4570998549461365e-06, -6.882473826408386e-06, -6.307847797870636e-06, -5.733221769332886e-06, -5.1585957407951355e-06, -4.583969712257385e-06, -4.009343683719635e-06, -3.4347176551818848e-06, -2.8600916266441345e-06, -2.2854655981063843e-06, -1.710839569568634e-06, -1.1362135410308838e-06, -5.615875124931335e-07, 1.30385160446167e-08, 5.876645445823669e-07, 1.1622905731201172e-06, 1.7369166016578674e-06, 2.3115426301956177e-06, 2.886168658733368e-06, 3.460794687271118e-06, 4.035420715808868e-06, 4.610046744346619e-06, 5.184672772884369e-06, 5.759298801422119e-06, 6.333924829959869e-06, 6.90855085849762e-06, 7.48317688703537e-06, 8.05780291557312e-06, 8.63242894411087e-06, 9.20705497264862e-06, 9.781681001186371e-06, 1.0356307029724121e-05, 1.0930933058261871e-05, 1.1505559086799622e-05, 1.2080185115337372e-05, 1.2654811143875122e-05, 1.3229437172412872e-05, 1.3804063200950623e-05, 1.4378689229488373e-05, 1.4953315258026123e-05, 1.5527941286563873e-05, 1.6102567315101624e-05, 1.6677193343639374e-05, 1.7251819372177124e-05, 1.7826445400714874e-05, 1.8401071429252625e-05, 1.8975697457790375e-05, 1.9550323486328125e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 10.0, 13.0, 22.0, 15.0, 24.0, 23.0, 33.0, 72.0, 33.0, 70.0, 47.0, 73.0, 59.0, 70.0, 82.0, 62.0, 70.0, 47.0, 51.0, 24.0, 30.0, 19.0, 19.0, 17.0, 8.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.470348358154297e-06, -4.325062036514282e-06, -4.179775714874268e-06, -4.034489393234253e-06, -3.889203071594238e-06, -3.7439167499542236e-06, -3.598630428314209e-06, -3.4533441066741943e-06, -3.3080577850341797e-06, -3.162771463394165e-06, -3.0174851417541504e-06, -2.8721988201141357e-06, -2.726912498474121e-06, -2.5816261768341064e-06, -2.436339855194092e-06, -2.291053533554077e-06, -2.1457672119140625e-06, -2.000480890274048e-06, -1.8551945686340332e-06, -1.7099082469940186e-06, -1.564621925354004e-06, -1.4193356037139893e-06, -1.2740492820739746e-06, -1.12876296043396e-06, -9.834766387939453e-07, -8.381903171539307e-07, -6.92903995513916e-07, -5.476176738739014e-07, -4.023313522338867e-07, -2.5704503059387207e-07, -1.1175870895385742e-07, 3.3527612686157227e-08, 1.7881393432617188e-07, 3.241002559661865e-07, 4.6938657760620117e-07, 6.146728992462158e-07, 7.599592208862305e-07, 9.052455425262451e-07, 1.0505318641662598e-06, 1.1958181858062744e-06, 1.341104507446289e-06, 1.4863908290863037e-06, 1.6316771507263184e-06, 1.776963472366333e-06, 1.9222497940063477e-06, 2.0675361156463623e-06, 2.212822437286377e-06, 2.3581087589263916e-06, 2.5033950805664062e-06, 2.648681402206421e-06, 2.7939677238464355e-06, 2.93925404548645e-06, 3.084540367126465e-06, 3.2298266887664795e-06, 3.375113010406494e-06, 3.520399332046509e-06, 3.6656856536865234e-06, 3.810971975326538e-06, 3.956258296966553e-06, 4.101544618606567e-06, 4.246830940246582e-06, 4.392117261886597e-06, 4.537403583526611e-06, 4.682689905166626e-06, 4.827976226806641e-06]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 8.0, 6.0, 5.0, 14.0, 15.0, 18.0, 31.0, 28.0, 47.0, 70.0, 96.0, 132.0, 220.0, 414.0, 629.0, 1460.0, 2972.0, 5565.0, 14721.0, 38922.0, 92911.0, 409259.0, 342807.0, 80001.0, 34230.0, 13303.0, 5088.0, 2749.0, 1252.0, 600.0, 392.0, 213.0, 109.0, 96.0, 55.0, 25.0, 23.0, 26.0, 9.0, 11.0, 8.0, 3.0, 1.0, 1.0, 7.0, 1.0, 0.0, 3.0], "bins": [-1.7344951629638672e-05, -1.6887672245502472e-05, -1.6430392861366272e-05, -1.5973113477230072e-05, -1.5515834093093872e-05, -1.5058554708957672e-05, -1.4601275324821472e-05, -1.4143995940685272e-05, -1.3686716556549072e-05, -1.3229437172412872e-05, -1.2772157788276672e-05, -1.2314878404140472e-05, -1.1857599020004272e-05, -1.1400319635868073e-05, -1.0943040251731873e-05, -1.0485760867595673e-05, -1.0028481483459473e-05, -9.571202099323273e-06, -9.113922715187073e-06, -8.656643331050873e-06, -8.199363946914673e-06, -7.742084562778473e-06, -7.284805178642273e-06, -6.827525794506073e-06, -6.370246410369873e-06, -5.912967026233673e-06, -5.455687642097473e-06, -4.998408257961273e-06, -4.541128873825073e-06, -4.083849489688873e-06, -3.6265701055526733e-06, -3.1692907214164734e-06, -2.7120113372802734e-06, -2.2547319531440735e-06, -1.7974525690078735e-06, -1.3401731848716736e-06, -8.828938007354736e-07, -4.256144165992737e-07, 3.166496753692627e-08, 4.889443516731262e-07, 9.462237358093262e-07, 1.4035031199455261e-06, 1.860782504081726e-06, 2.318061888217926e-06, 2.775341272354126e-06, 3.232620656490326e-06, 3.689900040626526e-06, 4.147179424762726e-06, 4.604458808898926e-06, 5.061738193035126e-06, 5.519017577171326e-06, 5.976296961307526e-06, 6.433576345443726e-06, 6.8908557295799255e-06, 7.3481351137161255e-06, 7.805414497852325e-06, 8.262693881988525e-06, 8.719973266124725e-06, 9.177252650260925e-06, 9.634532034397125e-06, 1.0091811418533325e-05, 1.0549090802669525e-05, 1.1006370186805725e-05, 1.1463649570941925e-05, 1.1920928955078125e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 9.0, 4.0, 8.0, 5.0, 18.0, 18.0, 33.0, 18.0, 39.0, 29.0, 48.0, 24.0, 45.0, 40.0, 55.0, 33.0, 70.0, 26.0, 81.0, 33.0, 50.0, 22.0, 63.0, 59.0, 21.0, 20.0, 17.0, 26.0, 8.0, 29.0, 2.0, 11.0, 7.0, 8.0, 5.0, 8.0, 1.0, 1.0, 2.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3245811462402344e-06, -2.234242856502533e-06, -2.1439045667648315e-06, -2.05356627702713e-06, -1.9632279872894287e-06, -1.8728896975517273e-06, -1.7825514078140259e-06, -1.6922131180763245e-06, -1.601874828338623e-06, -1.5115365386009216e-06, -1.4211982488632202e-06, -1.3308599591255188e-06, -1.2405216693878174e-06, -1.150183379650116e-06, -1.0598450899124146e-06, -9.695068001747131e-07, -8.791685104370117e-07, -7.888302206993103e-07, -6.984919309616089e-07, -6.081536412239075e-07, -5.178153514862061e-07, -4.2747706174850464e-07, -3.371387720108032e-07, -2.468004822731018e-07, -1.564621925354004e-07, -6.612390279769897e-08, 2.421438694000244e-08, 1.1455267667770386e-07, 2.0489096641540527e-07, 2.952292561531067e-07, 3.855675458908081e-07, 4.759058356285095e-07, 5.662441253662109e-07, 6.565824151039124e-07, 7.469207048416138e-07, 8.372589945793152e-07, 9.275972843170166e-07, 1.017935574054718e-06, 1.1082738637924194e-06, 1.1986121535301208e-06, 1.2889504432678223e-06, 1.3792887330055237e-06, 1.469627022743225e-06, 1.5599653124809265e-06, 1.650303602218628e-06, 1.7406418919563293e-06, 1.8309801816940308e-06, 1.921318471431732e-06, 2.0116567611694336e-06, 2.101995050907135e-06, 2.1923333406448364e-06, 2.282671630382538e-06, 2.3730099201202393e-06, 2.4633482098579407e-06, 2.553686499595642e-06, 2.6440247893333435e-06, 2.734363079071045e-06, 2.8247013688087463e-06, 2.9150396585464478e-06, 3.005377948284149e-06, 3.0957162380218506e-06, 3.186054527759552e-06, 3.2763928174972534e-06, 3.366731107234955e-06, 3.4570693969726562e-06]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 3.0, 0.0, 0.0, 13.0, 0.0, 0.0, 21.0, 0.0, 67.0, 0.0, 0.0, 152.0, 0.0, 0.0, 481.0, 0.0, 1760.0, 0.0, 0.0, 14603.0, 0.0, 0.0, 1014392.0, 0.0, 14531.0, 0.0, 0.0, 1821.0, 0.0, 0.0, 467.0, 0.0, 151.0, 0.0, 0.0, 58.0, 0.0, 0.0, 18.0, 0.0, 22.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.152557373046875e-07, -6.92903995513916e-07, -6.705522537231445e-07, -6.48200511932373e-07, -6.258487701416016e-07, -6.034970283508301e-07, -5.811452865600586e-07, -5.587935447692871e-07, -5.364418029785156e-07, -5.140900611877441e-07, -4.917383193969727e-07, -4.6938657760620117e-07, -4.470348358154297e-07, -4.246830940246582e-07, -4.023313522338867e-07, -3.7997961044311523e-07, -3.5762786865234375e-07, -3.3527612686157227e-07, -3.129243850708008e-07, -2.905726432800293e-07, -2.682209014892578e-07, -2.4586915969848633e-07, -2.2351741790771484e-07, -2.0116567611694336e-07, -1.7881393432617188e-07, -1.564621925354004e-07, -1.341104507446289e-07, -1.1175870895385742e-07, -8.940696716308594e-08, -6.705522537231445e-08, -4.470348358154297e-08, -2.2351741790771484e-08, 0.0, 2.2351741790771484e-08, 4.470348358154297e-08, 6.705522537231445e-08, 8.940696716308594e-08, 1.1175870895385742e-07, 1.341104507446289e-07, 1.564621925354004e-07, 1.7881393432617188e-07, 2.0116567611694336e-07, 2.2351741790771484e-07, 2.4586915969848633e-07, 2.682209014892578e-07, 2.905726432800293e-07, 3.129243850708008e-07, 3.3527612686157227e-07, 3.5762786865234375e-07, 3.7997961044311523e-07, 4.023313522338867e-07, 4.246830940246582e-07, 4.470348358154297e-07, 4.6938657760620117e-07, 4.917383193969727e-07, 5.140900611877441e-07, 5.364418029785156e-07, 5.587935447692871e-07, 5.811452865600586e-07, 6.034970283508301e-07, 6.258487701416016e-07, 6.48200511932373e-07, 6.705522537231445e-07, 6.92903995513916e-07, 7.152557373046875e-07]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 34.0, 0.0, 0.0, 0.0, 88.0, 0.0, 0.0, 0.0, 0.0, 1596.0, 0.0, 0.0, 0.0, 8415.0, 0.0, 0.0, 0.0, 1028291.0, 0.0, 0.0, 0.0, 8353.0, 0.0, 0.0, 0.0, 0.0, 1599.0, 0.0, 0.0, 0.0, 118.0, 0.0, 0.0, 0.0, 37.0, 0.0, 0.0, 0.0, 22.0], "bins": [-5.960464477539062e-07, -5.820766091346741e-07, -5.681067705154419e-07, -5.541369318962097e-07, -5.401670932769775e-07, -5.261972546577454e-07, -5.122274160385132e-07, -4.98257577419281e-07, -4.842877388000488e-07, -4.7031790018081665e-07, -4.5634806156158447e-07, -4.423782229423523e-07, -4.284083843231201e-07, -4.1443854570388794e-07, -4.0046870708465576e-07, -3.864988684654236e-07, -3.725290298461914e-07, -3.5855919122695923e-07, -3.4458935260772705e-07, -3.3061951398849487e-07, -3.166496753692627e-07, -3.026798367500305e-07, -2.8870999813079834e-07, -2.7474015951156616e-07, -2.60770320892334e-07, -2.468004822731018e-07, -2.3283064365386963e-07, -2.1886080503463745e-07, -2.0489096641540527e-07, -1.909211277961731e-07, -1.7695128917694092e-07, -1.6298145055770874e-07, -1.4901161193847656e-07, -1.3504177331924438e-07, -1.210719347000122e-07, -1.0710209608078003e-07, -9.313225746154785e-08, -7.916241884231567e-08, -6.51925802230835e-08, -5.122274160385132e-08, -3.725290298461914e-08, -2.3283064365386963e-08, -9.313225746154785e-09, 4.6566128730773926e-09, 1.862645149230957e-08, 3.259629011154175e-08, 4.6566128730773926e-08, 6.05359673500061e-08, 7.450580596923828e-08, 8.847564458847046e-08, 1.0244548320770264e-07, 1.1641532182693481e-07, 1.30385160446167e-07, 1.4435499906539917e-07, 1.5832483768463135e-07, 1.7229467630386353e-07, 1.862645149230957e-07, 2.0023435354232788e-07, 2.1420419216156006e-07, 2.2817403078079224e-07, 2.421438694000244e-07, 2.561137080192566e-07, 2.7008354663848877e-07, 2.8405338525772095e-07, 2.980232238769531e-07]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [21.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 987.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539063e-08, -5.681067705154419e-08, -5.4016709327697754e-08, -5.122274160385132e-08, -4.842877388000488e-08, -4.563480615615845e-08, -4.284083843231201e-08, -4.0046870708465576e-08, -3.725290298461914e-08, -3.4458935260772705e-08, -3.166496753692627e-08, -2.8870999813079834e-08, -2.60770320892334e-08, -2.3283064365386963e-08, -2.0489096641540527e-08, -1.7695128917694092e-08, -1.4901161193847656e-08, -1.210719347000122e-08, -9.313225746154785e-09, -6.51925802230835e-09, -3.725290298461914e-09, -9.313225746154785e-10, 1.862645149230957e-09, 4.6566128730773926e-09, 7.450580596923828e-09, 1.0244548320770264e-08, 1.30385160446167e-08, 1.5832483768463135e-08, 1.862645149230957e-08, 2.1420419216156006e-08, 2.421438694000244e-08, 2.7008354663848877e-08, 2.9802322387695312e-08, 3.259629011154175e-08, 3.5390257835388184e-08, 3.818422555923462e-08, 4.0978193283081055e-08, 4.377216100692749e-08, 4.6566128730773926e-08, 4.936009645462036e-08, 5.21540641784668e-08, 5.494803190231323e-08, 5.774199962615967e-08, 6.05359673500061e-08, 6.332993507385254e-08, 6.612390279769897e-08, 6.891787052154541e-08, 7.171183824539185e-08, 7.450580596923828e-08, 7.729977369308472e-08, 8.009374141693115e-08, 8.288770914077759e-08, 8.568167686462402e-08, 8.847564458847046e-08, 9.12696123123169e-08, 9.406358003616333e-08, 9.685754776000977e-08, 9.96515154838562e-08, 1.0244548320770264e-07, 1.0523945093154907e-07, 1.0803341865539551e-07, 1.1082738637924194e-07, 1.1362135410308838e-07, 1.1641532182693481e-07, 1.1920928955078125e-07]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 10.0, 7.0, 18.0, 33.0, 49.0, 79.0, 106.0, 219.0, 189.0, 101.0, 60.0, 37.0, 24.0, 18.0, 17.0, 8.0, 4.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.801245490350993e-06, -6.538930847455049e-06, -6.2766162045591045e-06, -6.014301106915809e-06, -5.751986464019865e-06, -5.48967182112392e-06, -5.227357178227976e-06, -4.9650425353320315e-06, -4.702727892436087e-06, -4.440413249540143e-06, -4.178098606644198e-06, -3.915783963748254e-06, -3.6534688661049586e-06, -3.391154223209014e-06, -3.1288395803130697e-06, -2.8665249374171253e-06, -2.60420983977383e-06, -2.3418951968778856e-06, -2.0795803266082658e-06, -1.8172656837123213e-06, -1.5549509271295392e-06, -1.292636170546757e-06, -1.0303215276508126e-06, -7.680067710680305e-07, -5.056920144852484e-07, -2.4337728632417566e-07, 1.893744183689705e-08, 2.8125214157626033e-07, 5.435668981590425e-07, 8.058816547418246e-07, 1.068196297637769e-06, 1.3305110542205512e-06, 1.5928262655506842e-06, 1.8551410221334663e-06, 2.1174557787162485e-06, 2.379770421612193e-06, 2.6420852918818127e-06, 2.904399934777757e-06, 3.1667145776737016e-06, 3.429029220569646e-06, 3.691344090839266e-06, 3.953658961108886e-06, 4.21597360400483e-06, 4.4782882469007745e-06, 4.740602889796719e-06, 5.002917532692663e-06, 5.265232175588608e-06, 5.527547273231903e-06, 5.7898619161278475e-06, 6.052176559023792e-06, 6.314491201919736e-06, 6.576806299563032e-06, 6.839120942458976e-06, 7.1014355853549205e-06, 7.363750228250865e-06, 7.626064871146809e-06, 7.888379514042754e-06, 8.150694156938698e-06, 8.413008799834643e-06, 8.675323442730587e-06, 8.937638085626531e-06, 9.199953638017178e-06, 9.462268280913122e-06, 9.724582923809066e-06, 9.98689756670501e-06]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 13.0, 4.0, 13.0, 8.0, 14.0, 18.0, 29.0, 33.0, 34.0, 42.0, 46.0, 49.0, 46.0, 47.0, 42.0, 51.0, 61.0, 47.0, 47.0, 38.0, 47.0, 50.0, 39.0, 36.0, 28.0, 22.0, 10.0, 24.0, 19.0, 11.0, 7.0, 9.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.047038146381965e-06, -3.921922143490519e-06, -3.796806140599074e-06, -3.6716903650813038e-06, -3.5465743621898582e-06, -3.4214583592984127e-06, -3.2963425837806426e-06, -3.171226580889197e-06, -3.0461105779977515e-06, -2.920994575106306e-06, -2.7958785722148605e-06, -2.6707627966970904e-06, -2.545646793805645e-06, -2.4205307909141993e-06, -2.2954150153964292e-06, -2.1702990125049837e-06, -2.045183009613538e-06, -1.9200670067220926e-06, -1.7949511175174848e-06, -1.669835228312877e-06, -1.5447192254214315e-06, -1.419603222529986e-06, -1.2944873333253781e-06, -1.1693714441207703e-06, -1.0442554412293248e-06, -9.191394951812981e-07, -7.940235491332714e-07, -6.689076030852448e-07, -5.437916570372181e-07, -4.1867571098919143e-07, -2.9355976494116476e-07, -1.6844381889313809e-07, -4.3327872845111415e-08, 8.178807320291526e-08, 2.0690401925094193e-07, 3.320199652989686e-07, 4.5713591134699527e-07, 5.822518573950219e-07, 7.073678034430486e-07, 8.324837494910753e-07, 9.57599695539102e-07, 1.0827156984305475e-06, 1.2078315876351553e-06, 1.3329474768397631e-06, 1.4580634797312086e-06, 1.5831794826226542e-06, 1.708295371827262e-06, 1.8334112610318698e-06, 1.9585272639233153e-06, 2.083643266814761e-06, 2.2087592697062064e-06, 2.3338750452239765e-06, 2.458991048115422e-06, 2.5841070510068676e-06, 2.7092228265246376e-06, 2.834338829416083e-06, 2.9594548323075287e-06, 3.0845708351989742e-06, 3.2096868380904198e-06, 3.33480261360819e-06, 3.4599186164996354e-06, 3.585034619391081e-06, 3.710150394908851e-06, 3.8352663978002965e-06, 3.960382400691742e-06]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 2.0, 7.0, 7.0, 12.0, 13.0, 25.0, 35.0, 38.0, 44.0, 50.0, 77.0, 120.0, 151.0, 189.0, 254.0, 351.0, 481.0, 726.0, 913.0, 1391.0, 2258.0, 3692.0, 7273.0, 92362.0, 3975325.0, 89633.0, 7700.0, 3759.0, 2218.0, 1509.0, 974.0, 690.0, 534.0, 371.0, 295.0, 172.0, 158.0, 115.0, 86.0, 67.0, 48.0, 34.0, 30.0, 25.0, 18.0, 13.0, 10.0, 7.0, 3.0, 4.0, 5.0, 2.0, 3.0, 6.0], "bins": [-1.0251998901367188e-05, -9.953975677490234e-06, -9.655952453613281e-06, -9.357929229736328e-06, -9.059906005859375e-06, -8.761882781982422e-06, -8.463859558105469e-06, -8.165836334228516e-06, -7.867813110351562e-06, -7.569789886474609e-06, -7.271766662597656e-06, -6.973743438720703e-06, -6.67572021484375e-06, -6.377696990966797e-06, -6.079673767089844e-06, -5.781650543212891e-06, -5.4836273193359375e-06, -5.185604095458984e-06, -4.887580871582031e-06, -4.589557647705078e-06, -4.291534423828125e-06, -3.993511199951172e-06, -3.6954879760742188e-06, -3.3974647521972656e-06, -3.0994415283203125e-06, -2.8014183044433594e-06, -2.5033950805664062e-06, -2.205371856689453e-06, -1.9073486328125e-06, -1.6093254089355469e-06, -1.3113021850585938e-06, -1.0132789611816406e-06, -7.152557373046875e-07, -4.172325134277344e-07, -1.1920928955078125e-07, 1.7881393432617188e-07, 4.76837158203125e-07, 7.748603820800781e-07, 1.0728836059570312e-06, 1.3709068298339844e-06, 1.6689300537109375e-06, 1.9669532775878906e-06, 2.2649765014648438e-06, 2.562999725341797e-06, 2.86102294921875e-06, 3.159046173095703e-06, 3.4570693969726562e-06, 3.7550926208496094e-06, 4.0531158447265625e-06, 4.351139068603516e-06, 4.649162292480469e-06, 4.947185516357422e-06, 5.245208740234375e-06, 5.543231964111328e-06, 5.841255187988281e-06, 6.139278411865234e-06, 6.4373016357421875e-06, 6.735324859619141e-06, 7.033348083496094e-06, 7.331371307373047e-06, 7.62939453125e-06, 7.927417755126953e-06, 8.225440979003906e-06, 8.52346420288086e-06, 8.821487426757812e-06]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 8.0, 2.0, 11.0, 8.0, 12.0, 8.0, 13.0, 23.0, 17.0, 25.0, 9.0, 19.0, 40.0, 31.0, 65.0, 25.0, 50.0, 36.0, 29.0, 54.0, 31.0, 62.0, 31.0, 47.0, 26.0, 19.0, 56.0, 24.0, 48.0, 21.0, 18.0, 28.0, 17.0, 23.0, 8.0, 16.0, 7.0, 5.0, 10.0, 7.0, 6.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-2.9206275939941406e-06, -2.835877239704132e-06, -2.7511268854141235e-06, -2.666376531124115e-06, -2.5816261768341064e-06, -2.496875822544098e-06, -2.4121254682540894e-06, -2.327375113964081e-06, -2.2426247596740723e-06, -2.1578744053840637e-06, -2.073124051094055e-06, -1.9883736968040466e-06, -1.903623342514038e-06, -1.8188729882240295e-06, -1.734122633934021e-06, -1.6493722796440125e-06, -1.564621925354004e-06, -1.4798715710639954e-06, -1.3951212167739868e-06, -1.3103708624839783e-06, -1.2256205081939697e-06, -1.1408701539039612e-06, -1.0561197996139526e-06, -9.71369445323944e-07, -8.866190910339355e-07, -8.01868736743927e-07, -7.171183824539185e-07, -6.323680281639099e-07, -5.476176738739014e-07, -4.628673195838928e-07, -3.781169652938843e-07, -2.9336661100387573e-07, -2.086162567138672e-07, -1.2386590242385864e-07, -3.91155481338501e-08, 4.563480615615845e-08, 1.30385160446167e-07, 2.1513551473617554e-07, 2.998858690261841e-07, 3.8463622331619263e-07, 4.6938657760620117e-07, 5.541369318962097e-07, 6.388872861862183e-07, 7.236376404762268e-07, 8.083879947662354e-07, 8.931383490562439e-07, 9.778887033462524e-07, 1.062639057636261e-06, 1.1473894119262695e-06, 1.232139766216278e-06, 1.3168901205062866e-06, 1.4016404747962952e-06, 1.4863908290863037e-06, 1.5711411833763123e-06, 1.6558915376663208e-06, 1.7406418919563293e-06, 1.8253922462463379e-06, 1.9101426005363464e-06, 1.994892954826355e-06, 2.0796433091163635e-06, 2.164393663406372e-06, 2.2491440176963806e-06, 2.333894371986389e-06, 2.4186447262763977e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 11.0, 6.0, 9.0, 18.0, 24.0, 19.0, 38.0, 60.0, 118.0, 233.0, 337.0, 862.0, 1559.0, 4491.0, 10897.0, 73810.0, 4032909.0, 50021.0, 11840.0, 3669.0, 1800.0, 688.0, 399.0, 170.0, 105.0, 56.0, 32.0, 24.0, 20.0, 6.0, 10.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.823902130126953e-05, -1.778826117515564e-05, -1.7337501049041748e-05, -1.6886740922927856e-05, -1.6435980796813965e-05, -1.5985220670700073e-05, -1.553446054458618e-05, -1.508370041847229e-05, -1.4632940292358398e-05, -1.4182180166244507e-05, -1.3731420040130615e-05, -1.3280659914016724e-05, -1.2829899787902832e-05, -1.237913966178894e-05, -1.1928379535675049e-05, -1.1477619409561157e-05, -1.1026859283447266e-05, -1.0576099157333374e-05, -1.0125339031219482e-05, -9.67457890510559e-06, -9.2238187789917e-06, -8.773058652877808e-06, -8.322298526763916e-06, -7.871538400650024e-06, -7.420778274536133e-06, -6.970018148422241e-06, -6.51925802230835e-06, -6.068497896194458e-06, -5.617737770080566e-06, -5.166977643966675e-06, -4.716217517852783e-06, -4.265457391738892e-06, -3.814697265625e-06, -3.3639371395111084e-06, -2.913177013397217e-06, -2.462416887283325e-06, -2.0116567611694336e-06, -1.560896635055542e-06, -1.1101365089416504e-06, -6.593763828277588e-07, -2.086162567138672e-07, 2.421438694000244e-07, 6.92903995513916e-07, 1.1436641216278076e-06, 1.5944242477416992e-06, 2.045184373855591e-06, 2.4959444999694824e-06, 2.946704626083374e-06, 3.3974647521972656e-06, 3.848224878311157e-06, 4.298985004425049e-06, 4.7497451305389404e-06, 5.200505256652832e-06, 5.651265382766724e-06, 6.102025508880615e-06, 6.552785634994507e-06, 7.0035457611083984e-06, 7.45430588722229e-06, 7.905066013336182e-06, 8.355826139450073e-06, 8.806586265563965e-06, 9.257346391677856e-06, 9.708106517791748e-06, 1.015886664390564e-05, 1.0609626770019531e-05]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 4.0, 0.0, 7.0, 2.0, 7.0, 11.0, 27.0, 0.0, 76.0, 177.0, 483.0, 2562.0, 369.0, 0.0, 149.0, 57.0, 26.0, 23.0, 17.0, 0.0, 10.0, 8.0, 4.0, 6.0, 0.0, 9.0, 2.0, 6.0, 5.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0728836059570312e-06, -1.0235235095024109e-06, -9.741634130477905e-07, -9.248033165931702e-07, -8.754432201385498e-07, -8.260831236839294e-07, -7.767230272293091e-07, -7.273629307746887e-07, -6.780028343200684e-07, -6.28642737865448e-07, -5.792826414108276e-07, -5.299225449562073e-07, -4.805624485015869e-07, -4.3120235204696655e-07, -3.818422555923462e-07, -3.3248215913772583e-07, -2.8312206268310547e-07, -2.337619662284851e-07, -1.8440186977386475e-07, -1.3504177331924438e-07, -8.568167686462402e-08, -3.632158041000366e-08, 1.30385160446167e-08, 6.239861249923706e-08, 1.1175870895385742e-07, 1.6111880540847778e-07, 2.1047890186309814e-07, 2.598389983177185e-07, 3.0919909477233887e-07, 3.5855919122695923e-07, 4.079192876815796e-07, 4.5727938413619995e-07, 5.066394805908203e-07, 5.559995770454407e-07, 6.05359673500061e-07, 6.547197699546814e-07, 7.040798664093018e-07, 7.534399628639221e-07, 8.028000593185425e-07, 8.521601557731628e-07, 9.015202522277832e-07, 9.508803486824036e-07, 1.000240445137024e-06, 1.0496005415916443e-06, 1.0989606380462646e-06, 1.148320734500885e-06, 1.1976808309555054e-06, 1.2470409274101257e-06, 1.296401023864746e-06, 1.3457611203193665e-06, 1.3951212167739868e-06, 1.4444813132286072e-06, 1.4938414096832275e-06, 1.543201506137848e-06, 1.5925616025924683e-06, 1.6419216990470886e-06, 1.691281795501709e-06, 1.7406418919563293e-06, 1.7900019884109497e-06, 1.83936208486557e-06, 1.8887221813201904e-06, 1.938082277774811e-06, 1.987442374229431e-06, 2.0368024706840515e-06, 2.086162567138672e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 3.0, 1.0, 5.0, 3.0, 9.0, 8.0, 12.0, 9.0, 21.0, 30.0, 48.0, 45.0, 62.0, 100.0, 123.0, 138.0, 102.0, 68.0, 37.0, 46.0, 22.0, 30.0, 17.0, 13.0, 9.0, 6.0, 10.0, 3.0, 4.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.8575440157728735e-06, -3.732991217475501e-06, -3.6084386465518037e-06, -3.483885848254431e-06, -3.359333277330734e-06, -3.234780479033361e-06, -3.1102276807359885e-06, -2.9856751098122913e-06, -2.8611223115149187e-06, -2.736569513217546e-06, -2.612016942293849e-06, -2.487464143996476e-06, -2.3629113456991035e-06, -2.2383587747754063e-06, -2.1138059764780337e-06, -1.989253178180661e-06, -1.8647006072569638e-06, -1.740147922646429e-06, -1.615595238035894e-06, -1.4910424397385214e-06, -1.3664897551279864e-06, -1.2419370705174515e-06, -1.1173842722200789e-06, -9.92831587609544e-07, -8.68278902999009e-07, -7.437262183884741e-07, -6.191734769345203e-07, -4.946207354805665e-07, -3.700680508700316e-07, -2.4551536625949666e-07, -1.2096262480554287e-07, 3.5901166484109126e-09, 1.2814234651159495e-07, 2.526950595438393e-07, 3.7724777257608366e-07, 5.018005140300374e-07, 6.263531986405724e-07, 7.509058832511073e-07, 8.754586247050611e-07, 1.0000113661590149e-06, 1.1245640507695498e-06, 1.2491167353800847e-06, 1.3736694199906196e-06, 1.4982222182879923e-06, 1.6227749028985272e-06, 1.7473275875090621e-06, 1.8718803858064348e-06, 1.9964331841038074e-06, 2.1209857550275046e-06, 2.2455385533248773e-06, 2.3700911242485745e-06, 2.494643922545947e-06, 2.6191964934696443e-06, 2.743749291767017e-06, 2.8683020900643896e-06, 2.992854660988087e-06, 3.1174074592854595e-06, 3.241960257582832e-06, 3.3665128285065293e-06, 3.491065626803902e-06, 3.6156184251012746e-06, 3.740170996024972e-06, 3.864723566948669e-06, 3.989276592619717e-06, 4.113829163543414e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 8.0, 4.0, 9.0, 17.0, 23.0, 13.0, 29.0, 39.0, 40.0, 48.0, 57.0, 53.0, 47.0, 54.0, 50.0, 53.0, 47.0, 50.0, 51.0, 43.0, 51.0, 31.0, 33.0, 35.0, 17.0, 25.0, 11.0, 14.0, 6.0, 14.0, 8.0, 8.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.7615498058585217e-06, -3.6581864151230548e-06, -3.5548227970139123e-06, -3.4514594062784454e-06, -3.3480960155429784e-06, -3.244732397433836e-06, -3.141369006698369e-06, -3.038005615962902e-06, -2.934642225227435e-06, -2.831278834491968e-06, -2.7279152163828257e-06, -2.6245518256473588e-06, -2.521188434911892e-06, -2.4178248168027494e-06, -2.3144614260672824e-06, -2.2110980353318155e-06, -2.107734417222673e-06, -2.004371026487206e-06, -1.9010075220649014e-06, -1.7976440176425967e-06, -1.6942806269071298e-06, -1.590917122484825e-06, -1.4875536180625204e-06, -1.3841902273270534e-06, -1.2808268365915865e-06, -1.1774633321692818e-06, -1.0740999414338148e-06, -9.707364370115101e-07, -8.673730462760432e-07, -7.640095418537385e-07, -6.606460942748527e-07, -5.572826466959668e-07, -4.5391925596049987e-07, -3.5055580838161404e-07, -2.471923608027282e-07, -1.4382888480213296e-07, -4.0465437223247136e-08, 6.289803877734812e-08, 1.6626148635623395e-07, 2.6962493393511977e-07, 3.729883815140056e-07, 4.763518290928914e-07, 5.797152766717772e-07, 6.830787242506631e-07, 7.864422286729678e-07, 8.898056762518536e-07, 9.931691238307394e-07, 1.0965325145662064e-06, 1.199896018988511e-06, 1.3032595234108157e-06, 1.4066229141462827e-06, 1.5099864185685874e-06, 1.6133498093040544e-06, 1.716713313726359e-06, 1.820076704461826e-06, 1.9234403225709684e-06, 2.0268037133064354e-06, 2.1301671040419023e-06, 2.2335307221510448e-06, 2.3368941128865117e-06, 2.4402575036219787e-06, 2.543621121731121e-06, 2.646984512466588e-06, 2.750347903202055e-06, 2.853711293937522e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 18.0, 19.0, 15.0, 32.0, 59.0, 85.0, 77.0, 210.0, 350.0, 602.0, 481.0, 1583.0, 3135.0, 6650.0, 5804.0, 22727.0, 53994.0, 144468.0, 164147.0, 403857.0, 144509.0, 54201.0, 13529.0, 14587.0, 6523.0, 3252.0, 931.0, 1156.0, 621.0, 384.0, 121.0, 180.0, 82.0, 56.0, 15.0, 34.0, 24.0, 16.0, 4.0, 2.0, 7.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.337860107421875e-06, -3.2335519790649414e-06, -3.129243850708008e-06, -3.0249357223510742e-06, -2.9206275939941406e-06, -2.816319465637207e-06, -2.7120113372802734e-06, -2.60770320892334e-06, -2.5033950805664062e-06, -2.3990869522094727e-06, -2.294778823852539e-06, -2.1904706954956055e-06, -2.086162567138672e-06, -1.9818544387817383e-06, -1.8775463104248047e-06, -1.773238182067871e-06, -1.6689300537109375e-06, -1.564621925354004e-06, -1.4603137969970703e-06, -1.3560056686401367e-06, -1.2516975402832031e-06, -1.1473894119262695e-06, -1.043081283569336e-06, -9.387731552124023e-07, -8.344650268554688e-07, -7.301568984985352e-07, -6.258487701416016e-07, -5.21540641784668e-07, -4.172325134277344e-07, -3.129243850708008e-07, -2.086162567138672e-07, -1.043081283569336e-07, 0.0, 1.043081283569336e-07, 2.086162567138672e-07, 3.129243850708008e-07, 4.172325134277344e-07, 5.21540641784668e-07, 6.258487701416016e-07, 7.301568984985352e-07, 8.344650268554688e-07, 9.387731552124023e-07, 1.043081283569336e-06, 1.1473894119262695e-06, 1.2516975402832031e-06, 1.3560056686401367e-06, 1.4603137969970703e-06, 1.564621925354004e-06, 1.6689300537109375e-06, 1.773238182067871e-06, 1.8775463104248047e-06, 1.9818544387817383e-06, 2.086162567138672e-06, 2.1904706954956055e-06, 2.294778823852539e-06, 2.3990869522094727e-06, 2.5033950805664062e-06, 2.60770320892334e-06, 2.7120113372802734e-06, 2.816319465637207e-06, 2.9206275939941406e-06, 3.0249357223510742e-06, 3.129243850708008e-06, 3.2335519790649414e-06, 3.337860107421875e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 6.0, 18.0, 20.0, 7.0, 36.0, 41.0, 49.0, 49.0, 51.0, 32.0, 65.0, 50.0, 57.0, 58.0, 61.0, 45.0, 26.0, 59.0, 39.0, 49.0, 41.0, 36.0, 8.0, 24.0, 18.0, 9.0, 15.0, 5.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.874301910400391e-06, -3.764405846595764e-06, -3.6545097827911377e-06, -3.5446137189865112e-06, -3.4347176551818848e-06, -3.3248215913772583e-06, -3.214925527572632e-06, -3.1050294637680054e-06, -2.995133399963379e-06, -2.8852373361587524e-06, -2.775341272354126e-06, -2.6654452085494995e-06, -2.555549144744873e-06, -2.4456530809402466e-06, -2.33575701713562e-06, -2.2258609533309937e-06, -2.115964889526367e-06, -2.0060688257217407e-06, -1.8961727619171143e-06, -1.7862766981124878e-06, -1.6763806343078613e-06, -1.5664845705032349e-06, -1.4565885066986084e-06, -1.346692442893982e-06, -1.2367963790893555e-06, -1.126900315284729e-06, -1.0170042514801025e-06, -9.071081876754761e-07, -7.972121238708496e-07, -6.873160600662231e-07, -5.774199962615967e-07, -4.675239324569702e-07, -3.5762786865234375e-07, -2.477318048477173e-07, -1.3783574104309082e-07, -2.7939677238464355e-08, 8.195638656616211e-08, 1.9185245037078857e-07, 3.0174851417541504e-07, 4.116445779800415e-07, 5.21540641784668e-07, 6.314367055892944e-07, 7.413327693939209e-07, 8.512288331985474e-07, 9.611248970031738e-07, 1.0710209608078003e-06, 1.1809170246124268e-06, 1.2908130884170532e-06, 1.4007091522216797e-06, 1.5106052160263062e-06, 1.6205012798309326e-06, 1.730397343635559e-06, 1.8402934074401855e-06, 1.950189471244812e-06, 2.0600855350494385e-06, 2.169981598854065e-06, 2.2798776626586914e-06, 2.389773726463318e-06, 2.4996697902679443e-06, 2.609565854072571e-06, 2.7194619178771973e-06, 2.8293579816818237e-06, 2.93925404548645e-06, 3.0491501092910767e-06, 3.159046173095703e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 3.0, 15.0, 6.0, 12.0, 12.0, 31.0, 20.0, 35.0, 36.0, 74.0, 78.0, 253.0, 1047102.0, 436.0, 164.0, 55.0, 55.0, 25.0, 31.0, 17.0, 14.0, 7.0, 15.0, 5.0, 8.0, 5.0, 8.0, 3.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.708766937255859e-06, -4.560686647891998e-06, -4.412606358528137e-06, -4.264526069164276e-06, -4.116445779800415e-06, -3.968365490436554e-06, -3.820285201072693e-06, -3.6722049117088318e-06, -3.5241246223449707e-06, -3.3760443329811096e-06, -3.2279640436172485e-06, -3.0798837542533875e-06, -2.9318034648895264e-06, -2.7837231755256653e-06, -2.635642886161804e-06, -2.487562596797943e-06, -2.339482307434082e-06, -2.191402018070221e-06, -2.04332172870636e-06, -1.8952414393424988e-06, -1.7471611499786377e-06, -1.5990808606147766e-06, -1.4510005712509155e-06, -1.3029202818870544e-06, -1.1548399925231934e-06, -1.0067597031593323e-06, -8.586794137954712e-07, -7.105991244316101e-07, -5.62518835067749e-07, -4.1443854570388794e-07, -2.6635825634002686e-07, -1.1827796697616577e-07, 2.9802322387695312e-08, 1.778826117515564e-07, 3.259629011154175e-07, 4.7404319047927856e-07, 6.221234798431396e-07, 7.702037692070007e-07, 9.182840585708618e-07, 1.066364347934723e-06, 1.214444637298584e-06, 1.362524926662445e-06, 1.5106052160263062e-06, 1.6586855053901672e-06, 1.8067657947540283e-06, 1.9548460841178894e-06, 2.1029263734817505e-06, 2.2510066628456116e-06, 2.3990869522094727e-06, 2.5471672415733337e-06, 2.695247530937195e-06, 2.843327820301056e-06, 2.991408109664917e-06, 3.139488399028778e-06, 3.287568688392639e-06, 3.4356489777565002e-06, 3.5837292671203613e-06, 3.7318095564842224e-06, 3.8798898458480835e-06, 4.027970135211945e-06, 4.176050424575806e-06, 4.324130713939667e-06, 4.472211003303528e-06, 4.620291292667389e-06, 4.76837158203125e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1021.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539063e-08, -3.4458935260772705e-08, -9.313225746154785e-09, 1.5832483768463135e-08, 4.0978193283081055e-08, 6.612390279769897e-08, 9.12696123123169e-08, 1.1641532182693481e-07, 1.4156103134155273e-07, 1.6670674085617065e-07, 1.9185245037078857e-07, 2.169981598854065e-07, 2.421438694000244e-07, 2.6728957891464233e-07, 2.9243528842926025e-07, 3.175809979438782e-07, 3.427267074584961e-07, 3.67872416973114e-07, 3.9301812648773193e-07, 4.1816383600234985e-07, 4.4330954551696777e-07, 4.684552550315857e-07, 4.936009645462036e-07, 5.187466740608215e-07, 5.438923835754395e-07, 5.690380930900574e-07, 5.941838026046753e-07, 6.193295121192932e-07, 6.444752216339111e-07, 6.69620931148529e-07, 6.94766640663147e-07, 7.199123501777649e-07, 7.450580596923828e-07, 7.702037692070007e-07, 7.953494787216187e-07, 8.204951882362366e-07, 8.456408977508545e-07, 8.707866072654724e-07, 8.959323167800903e-07, 9.210780262947083e-07, 9.462237358093262e-07, 9.71369445323944e-07, 9.96515154838562e-07, 1.02166086435318e-06, 1.0468065738677979e-06, 1.0719522833824158e-06, 1.0970979928970337e-06, 1.1222437024116516e-06, 1.1473894119262695e-06, 1.1725351214408875e-06, 1.1976808309555054e-06, 1.2228265404701233e-06, 1.2479722499847412e-06, 1.2731179594993591e-06, 1.298263669013977e-06, 1.323409378528595e-06, 1.3485550880432129e-06, 1.3737007975578308e-06, 1.3988465070724487e-06, 1.4239922165870667e-06, 1.4491379261016846e-06, 1.4742836356163025e-06, 1.4994293451309204e-06, 1.5245750546455383e-06, 1.5497207641601562e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 6.0, 4.0, 8.0, 4.0, 12.0, 17.0, 16.0, 32.0, 34.0, 39.0, 67.0, 88.0, 123.0, 128.0, 122.0, 74.0, 50.0, 41.0, 35.0, 17.0, 25.0, 16.0, 7.0, 5.0, 7.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.635193818103289e-06, -4.507486210059142e-06, -4.379779056762345e-06, -4.252071448718198e-06, -4.12436384067405e-06, -3.996656232629903e-06, -3.868949079333106e-06, -3.7412414712889586e-06, -3.6135340906184865e-06, -3.4858267099480145e-06, -3.358119101903867e-06, -3.230411721233395e-06, -3.102704340562923e-06, -2.9749967325187754e-06, -2.8472893518483033e-06, -2.7195819711778313e-06, -2.591874363133684e-06, -2.4641669824632118e-06, -2.3364593744190643e-06, -2.2087519937485922e-06, -2.0810443857044447e-06, -1.9533370050339727e-06, -1.8256296243635006e-06, -1.6979221300061909e-06, -1.570214635648881e-06, -1.4425071412915713e-06, -1.3147996469342615e-06, -1.1870922662637895e-06, -1.0593847719064797e-06, -9.3167727754917e-07, -8.03969840035279e-07, -6.762624025213881e-07, -5.485553629114293e-07, -4.208478969758289e-07, -2.931404310402286e-07, -1.6543296510462824e-07, -3.77254991690279e-08, 8.998199518828187e-08, 2.1768943270217278e-07, 3.453968702160637e-07, 4.7310436457337346e-07, 6.008118589306832e-07, 7.285192964445741e-07, 8.56226733958465e-07, 9.839342283157748e-07, 1.1116417226730846e-06, 1.2393491033435566e-06, 1.3670565977008664e-06, 1.4947640920581762e-06, 1.622471586415486e-06, 1.7501790807727957e-06, 1.8778864614432678e-06, 2.0055940694874153e-06, 2.1333014501578873e-06, 2.2610088308283594e-06, 2.388716438872507e-06, 2.516423819542979e-06, 2.644131200213451e-06, 2.7718388082575984e-06, 2.8995461889280705e-06, 3.0272535695985425e-06, 3.15496117764269e-06, 3.282668558313162e-06, 3.410375938983634e-06, 3.5380835470277816e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 9.0, 4.0, 7.0, 18.0, 23.0, 19.0, 26.0, 34.0, 49.0, 47.0, 53.0, 49.0, 45.0, 55.0, 51.0, 53.0, 49.0, 45.0, 48.0, 40.0, 57.0, 34.0, 31.0, 36.0, 21.0, 22.0, 9.0, 16.0, 8.0, 11.0, 10.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.569599812180968e-06, -3.471054469628143e-06, -3.3725091270753182e-06, -3.2739637845224934e-06, -3.1754184419696685e-06, -3.0768730994168436e-06, -2.9783277568640187e-06, -2.8797821869375184e-06, -2.781237071758369e-06, -2.682691729205544e-06, -2.5841463866527192e-06, -2.4856010440998944e-06, -2.3870557015470695e-06, -2.2885103589942446e-06, -2.1899650164414197e-06, -2.0914194465149194e-06, -1.9928741039620945e-06, -1.8943287614092696e-06, -1.7957834188564448e-06, -1.6972380763036199e-06, -1.598692733750795e-06, -1.5001473911979701e-06, -1.4016019349583075e-06, -1.3030565924054827e-06, -1.2045112498526578e-06, -1.105965907299833e-06, -1.007420564747008e-06, -9.088751653507643e-07, -8.103298227979394e-07, -7.117844802451145e-07, -6.132390808488708e-07, -5.146937382960459e-07, -4.161481683695456e-07, -3.176028258167207e-07, -2.1905745484218642e-07, -1.205120838676521e-07, -2.1966741314827232e-08, 7.657860123799765e-08, 1.7512400063424138e-07, 2.7366934318706626e-07, 3.7221468573989114e-07, 4.70760028292716e-07, 5.693053708455409e-07, 6.678507702417846e-07, 7.663961127946095e-07, 8.649414553474344e-07, 9.634868547436781e-07, 1.062032197296503e-06, 1.1605775398493279e-06, 1.2591228824021528e-06, 1.3576682249549776e-06, 1.4562135675078025e-06, 1.5547589100606274e-06, 1.6533042526134523e-06, 1.7518497088531149e-06, 1.8503950514059397e-06, 1.948940280271927e-06, 2.0474856228247518e-06, 2.1460309653775766e-06, 2.2445763079304015e-06, 2.3431216504832264e-06, 2.4416669930360513e-06, 2.540212335588876e-06, 2.6387579055153765e-06, 2.7373032480682014e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 3.0, 8.0, 5.0, 3.0, 8.0, 22.0, 24.0, 30.0, 69.0, 42.0, 82.0, 129.0, 161.0, 263.0, 381.0, 522.0, 493.0, 1082.0, 1603.0, 2466.0, 3773.0, 6170.0, 6085.0, 14035.0, 24626.0, 45487.0, 86510.0, 179101.0, 205406.0, 229519.0, 110122.0, 56007.0, 30185.0, 16828.0, 10146.0, 4374.0, 4531.0, 2731.0, 1783.0, 1228.0, 797.0, 404.0, 395.0, 270.0, 187.0, 134.0, 111.0, 73.0, 37.0, 36.0, 21.0, 18.0, 14.0, 6.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.364418029785156e-06, -5.194917321205139e-06, -5.025416612625122e-06, -4.855915904045105e-06, -4.686415195465088e-06, -4.516914486885071e-06, -4.347413778305054e-06, -4.177913069725037e-06, -4.0084123611450195e-06, -3.8389116525650024e-06, -3.6694109439849854e-06, -3.4999102354049683e-06, -3.330409526824951e-06, -3.160908818244934e-06, -2.991408109664917e-06, -2.8219074010849e-06, -2.652406692504883e-06, -2.4829059839248657e-06, -2.3134052753448486e-06, -2.1439045667648315e-06, -1.9744038581848145e-06, -1.8049031496047974e-06, -1.6354024410247803e-06, -1.4659017324447632e-06, -1.296401023864746e-06, -1.126900315284729e-06, -9.57399606704712e-07, -7.878988981246948e-07, -6.183981895446777e-07, -4.4889748096466064e-07, -2.7939677238464355e-07, -1.0989606380462646e-07, 5.960464477539063e-08, 2.2910535335540771e-07, 3.986060619354248e-07, 5.681067705154419e-07, 7.37607479095459e-07, 9.071081876754761e-07, 1.0766088962554932e-06, 1.2461096048355103e-06, 1.4156103134155273e-06, 1.5851110219955444e-06, 1.7546117305755615e-06, 1.9241124391555786e-06, 2.0936131477355957e-06, 2.263113856315613e-06, 2.43261456489563e-06, 2.602115273475647e-06, 2.771615982055664e-06, 2.941116690635681e-06, 3.1106173992156982e-06, 3.2801181077957153e-06, 3.4496188163757324e-06, 3.6191195249557495e-06, 3.7886202335357666e-06, 3.958120942115784e-06, 4.127621650695801e-06, 4.297122359275818e-06, 4.466623067855835e-06, 4.636123776435852e-06, 4.805624485015869e-06, 4.975125193595886e-06, 5.144625902175903e-06, 5.31412661075592e-06, 5.4836273193359375e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 6.0, 6.0, 7.0, 6.0, 10.0, 13.0, 23.0, 23.0, 27.0, 34.0, 33.0, 41.0, 50.0, 37.0, 47.0, 40.0, 41.0, 45.0, 34.0, 67.0, 42.0, 46.0, 49.0, 37.0, 41.0, 35.0, 23.0, 16.0, 25.0, 10.0, 19.0, 12.0, 6.0, 7.0, 10.0, 9.0, 5.0, 1.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.9073486328125e-06, -1.8458813428878784e-06, -1.7844140529632568e-06, -1.7229467630386353e-06, -1.6614794731140137e-06, -1.600012183189392e-06, -1.5385448932647705e-06, -1.477077603340149e-06, -1.4156103134155273e-06, -1.3541430234909058e-06, -1.2926757335662842e-06, -1.2312084436416626e-06, -1.169741153717041e-06, -1.1082738637924194e-06, -1.0468065738677979e-06, -9.853392839431763e-07, -9.238719940185547e-07, -8.624047040939331e-07, -8.009374141693115e-07, -7.394701242446899e-07, -6.780028343200684e-07, -6.165355443954468e-07, -5.550682544708252e-07, -4.936009645462036e-07, -4.3213367462158203e-07, -3.7066638469696045e-07, -3.0919909477233887e-07, -2.477318048477173e-07, -1.862645149230957e-07, -1.2479722499847412e-07, -6.332993507385254e-08, -1.862645149230957e-09, 5.960464477539063e-08, 1.210719347000122e-07, 1.825392246246338e-07, 2.4400651454925537e-07, 3.0547380447387695e-07, 3.6694109439849854e-07, 4.284083843231201e-07, 4.898756742477417e-07, 5.513429641723633e-07, 6.128102540969849e-07, 6.742775440216064e-07, 7.35744833946228e-07, 7.972121238708496e-07, 8.586794137954712e-07, 9.201467037200928e-07, 9.816139936447144e-07, 1.043081283569336e-06, 1.1045485734939575e-06, 1.166015863418579e-06, 1.2274831533432007e-06, 1.2889504432678223e-06, 1.3504177331924438e-06, 1.4118850231170654e-06, 1.473352313041687e-06, 1.5348196029663086e-06, 1.5962868928909302e-06, 1.6577541828155518e-06, 1.7192214727401733e-06, 1.780688762664795e-06, 1.8421560525894165e-06, 1.903623342514038e-06, 1.9650906324386597e-06, 2.0265579223632812e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 18.0, 13.0, 17.0, 28.0, 58.0, 61.0, 134.0, 152.0, 272.0, 335.0, 834.0, 1103.0, 2476.0, 3224.0, 8355.0, 11701.0, 30591.0, 46587.0, 152910.0, 334458.0, 294248.0, 74299.0, 45520.0, 17075.0, 11775.0, 4714.0, 3484.0, 1431.0, 1125.0, 519.0, 402.0, 194.0, 142.0, 72.0, 57.0, 48.0, 35.0, 17.0, 18.0, 15.0, 5.0, 4.0, 6.0, 8.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.198883056640625e-06, -5.990266799926758e-06, -5.781650543212891e-06, -5.5730342864990234e-06, -5.364418029785156e-06, -5.155801773071289e-06, -4.947185516357422e-06, -4.738569259643555e-06, -4.5299530029296875e-06, -4.32133674621582e-06, -4.112720489501953e-06, -3.904104232788086e-06, -3.6954879760742188e-06, -3.4868717193603516e-06, -3.2782554626464844e-06, -3.069639205932617e-06, -2.86102294921875e-06, -2.652406692504883e-06, -2.4437904357910156e-06, -2.2351741790771484e-06, -2.0265579223632812e-06, -1.817941665649414e-06, -1.6093254089355469e-06, -1.4007091522216797e-06, -1.1920928955078125e-06, -9.834766387939453e-07, -7.748603820800781e-07, -5.662441253662109e-07, -3.5762786865234375e-07, -1.4901161193847656e-07, 5.960464477539063e-08, 2.682209014892578e-07, 4.76837158203125e-07, 6.854534149169922e-07, 8.940696716308594e-07, 1.1026859283447266e-06, 1.3113021850585938e-06, 1.519918441772461e-06, 1.7285346984863281e-06, 1.9371509552001953e-06, 2.1457672119140625e-06, 2.3543834686279297e-06, 2.562999725341797e-06, 2.771615982055664e-06, 2.9802322387695312e-06, 3.1888484954833984e-06, 3.3974647521972656e-06, 3.606081008911133e-06, 3.814697265625e-06, 4.023313522338867e-06, 4.231929779052734e-06, 4.4405460357666016e-06, 4.649162292480469e-06, 4.857778549194336e-06, 5.066394805908203e-06, 5.27501106262207e-06, 5.4836273193359375e-06, 5.692243576049805e-06, 5.900859832763672e-06, 6.109476089477539e-06, 6.318092346191406e-06, 6.5267086029052734e-06, 6.735324859619141e-06, 6.943941116333008e-06, 7.152557373046875e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 1.0, 7.0, 3.0, 0.0, 5.0, 2.0, 10.0, 6.0, 15.0, 13.0, 0.0, 20.0, 17.0, 27.0, 31.0, 31.0, 0.0, 29.0, 37.0, 51.0, 47.0, 62.0, 0.0, 46.0, 51.0, 79.0, 53.0, 50.0, 47.0, 0.0, 36.0, 38.0, 34.0, 34.0, 26.0, 0.0, 31.0, 11.0, 13.0, 16.0, 9.0, 10.0, 0.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6689300537109375e-06, -1.6186386346817017e-06, -1.5683472156524658e-06, -1.51805579662323e-06, -1.4677643775939941e-06, -1.4174729585647583e-06, -1.3671815395355225e-06, -1.3168901205062866e-06, -1.2665987014770508e-06, -1.216307282447815e-06, -1.166015863418579e-06, -1.1157244443893433e-06, -1.0654330253601074e-06, -1.0151416063308716e-06, -9.648501873016357e-07, -9.145587682723999e-07, -8.642673492431641e-07, -8.139759302139282e-07, -7.636845111846924e-07, -7.133930921554565e-07, -6.631016731262207e-07, -6.128102540969849e-07, -5.62518835067749e-07, -5.122274160385132e-07, -4.6193599700927734e-07, -4.116445779800415e-07, -3.6135315895080566e-07, -3.110617399215698e-07, -2.60770320892334e-07, -2.1047890186309814e-07, -1.601874828338623e-07, -1.0989606380462646e-07, -5.960464477539063e-08, -9.313225746154785e-09, 4.0978193283081055e-08, 9.12696123123169e-08, 1.4156103134155273e-07, 1.9185245037078857e-07, 2.421438694000244e-07, 2.9243528842926025e-07, 3.427267074584961e-07, 3.9301812648773193e-07, 4.4330954551696777e-07, 4.936009645462036e-07, 5.438923835754395e-07, 5.941838026046753e-07, 6.444752216339111e-07, 6.94766640663147e-07, 7.450580596923828e-07, 7.953494787216187e-07, 8.456408977508545e-07, 8.959323167800903e-07, 9.462237358093262e-07, 9.96515154838562e-07, 1.0468065738677979e-06, 1.0970979928970337e-06, 1.1473894119262695e-06, 1.1976808309555054e-06, 1.2479722499847412e-06, 1.298263669013977e-06, 1.3485550880432129e-06, 1.3988465070724487e-06, 1.4491379261016846e-06, 1.4994293451309204e-06, 1.5497207641601562e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 5.0, 13.0, 10.0, 18.0, 16.0, 24.0, 39.0, 52.0, 89.0, 142.0, 170.0, 124.0, 94.0, 49.0, 38.0, 28.0, 17.0, 18.0, 14.0, 12.0, 5.0, 5.0, 1.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.876811661029933e-06, -3.7573297504422953e-06, -3.637848067228333e-06, -3.5183661566406954e-06, -3.398884473426733e-06, -3.2794025628390955e-06, -3.159920652251458e-06, -3.0404389690374956e-06, -2.920957058449858e-06, -2.80147514786222e-06, -2.681993464648258e-06, -2.5625115540606203e-06, -2.4430296434729826e-06, -2.3235479602590203e-06, -2.2040660496713826e-06, -2.084584139083745e-06, -1.9651024558697827e-06, -1.8456206589689828e-06, -1.7261388620681828e-06, -1.606656951480545e-06, -1.4871751545797451e-06, -1.3676933576789452e-06, -1.2482114470913075e-06, -1.1287296501905075e-06, -1.0092478532897076e-06, -8.897660563889076e-07, -7.702842026446888e-07, -6.5080234890047e-07, -5.3132055199967e-07, -4.1183875509887e-07, -2.923569013546512e-07, -1.7287504761043238e-07, -5.3393478083307855e-08, 6.608834723920154e-08, 1.8557017256171093e-07, 3.0505199788422033e-07, 4.245338232067297e-07, 5.440156201075297e-07, 6.634974738517485e-07, 7.829793275959673e-07, 9.024611244967673e-07, 1.0219429213975673e-06, 1.1414247182983672e-06, 1.260906628886005e-06, 1.3803884257868049e-06, 1.4998702226876048e-06, 1.6193521332752425e-06, 1.7388339301760425e-06, 1.8583157270768424e-06, 1.97779763766448e-06, 2.0972793208784424e-06, 2.21676123146608e-06, 2.3362431420537177e-06, 2.45572482526768e-06, 2.5752067358553177e-06, 2.6946886464429554e-06, 2.8141703296569176e-06, 2.9336522402445553e-06, 3.0531339234585175e-06, 3.1726158340461552e-06, 3.2920975172601175e-06, 3.411579427847755e-06, 3.531061338435393e-06, 3.650543021649355e-06, 3.7700249322369928e-06]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 5.0, 2.0, 3.0, 6.0, 4.0, 4.0, 9.0, 21.0, 14.0, 16.0, 20.0, 26.0, 29.0, 32.0, 30.0, 48.0, 39.0, 55.0, 46.0, 50.0, 51.0, 57.0, 44.0, 43.0, 40.0, 41.0, 31.0, 29.0, 25.0, 32.0, 27.0, 31.0, 27.0, 17.0, 14.0, 11.0, 5.0, 5.0, 6.0, 7.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0], "bins": [-2.649838279467076e-06, -2.5810727493080776e-06, -2.512307219149079e-06, -2.443541916363756e-06, -2.3747763862047577e-06, -2.3060108560457593e-06, -2.237245325886761e-06, -2.1684797957277624e-06, -2.0997144929424394e-06, -2.030948962783441e-06, -1.9621834326244425e-06, -1.8934180161522818e-06, -1.824652599680121e-06, -1.7558870695211226e-06, -1.6871215393621242e-06, -1.6183560092031257e-06, -1.5495904790441273e-06, -1.4808249488851288e-06, -1.4120595324129681e-06, -1.3432940022539697e-06, -1.274528585781809e-06, -1.2057630556228105e-06, -1.136997525463812e-06, -1.0682319953048136e-06, -9.994665788326529e-07, -9.307011055170733e-07, -8.619356322014937e-07, -7.931701020424953e-07, -7.244046287269157e-07, -6.556391554113361e-07, -5.868736252523377e-07, -5.181081519367581e-07, -4.4934256493434077e-07, -3.805770916187612e-07, -3.1181158988147217e-07, -2.4304608814418316e-07, -1.7428061482860358e-07, -1.0551514151302399e-07, -3.674963977573498e-08, 3.201586196155404e-08, 1.0078133527713362e-07, 1.6954682280356792e-07, 2.3831231033000222e-07, 3.0707781206729123e-07, 3.758432853828708e-07, 4.446087586984504e-07, 5.133742888574488e-07, 5.821397621730284e-07, 6.50905235488608e-07, 7.196707088041876e-07, 7.884361821197672e-07, 8.572017122787656e-07, 9.259671855943452e-07, 9.947326589099248e-07, 1.0634981890689232e-06, 1.132263605541084e-06, 1.2010291357000824e-06, 1.2697946658590809e-06, 1.3385600823312416e-06, 1.40732561249024e-06, 1.4760910289624007e-06, 1.5448565591213992e-06, 1.6136220892803976e-06, 1.682387619439396e-06, 1.7511530359115568e-06]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 5.0, 4.0, 8.0, 8.0, 16.0, 14.0, 22.0, 31.0, 28.0, 47.0, 65.0, 64.0, 118.0, 170.0, 180.0, 371.0, 621.0, 778.0, 1704.0, 3761.0, 22018.0, 3812950.0, 338364.0, 6903.0, 2107.0, 1514.0, 885.0, 431.0, 350.0, 211.0, 106.0, 97.0, 93.0, 54.0, 56.0, 38.0, 32.0, 11.0, 16.0, 12.0, 6.0, 3.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0], "bins": [-7.867813110351562e-06, -7.64802098274231e-06, -7.428228855133057e-06, -7.208436727523804e-06, -6.988644599914551e-06, -6.768852472305298e-06, -6.549060344696045e-06, -6.329268217086792e-06, -6.109476089477539e-06, -5.889683961868286e-06, -5.669891834259033e-06, -5.45009970664978e-06, -5.230307579040527e-06, -5.010515451431274e-06, -4.7907233238220215e-06, -4.5709311962127686e-06, -4.351139068603516e-06, -4.131346940994263e-06, -3.91155481338501e-06, -3.691762685775757e-06, -3.471970558166504e-06, -3.252178430557251e-06, -3.032386302947998e-06, -2.812594175338745e-06, -2.592802047729492e-06, -2.3730099201202393e-06, -2.1532177925109863e-06, -1.9334256649017334e-06, -1.7136335372924805e-06, -1.4938414096832275e-06, -1.2740492820739746e-06, -1.0542571544647217e-06, -8.344650268554688e-07, -6.146728992462158e-07, -3.948807716369629e-07, -1.7508864402770996e-07, 4.470348358154297e-08, 2.644956111907959e-07, 4.842877388000488e-07, 7.040798664093018e-07, 9.238719940185547e-07, 1.1436641216278076e-06, 1.3634562492370605e-06, 1.5832483768463135e-06, 1.8030405044555664e-06, 2.0228326320648193e-06, 2.2426247596740723e-06, 2.462416887283325e-06, 2.682209014892578e-06, 2.902001142501831e-06, 3.121793270111084e-06, 3.341585397720337e-06, 3.56137752532959e-06, 3.7811696529388428e-06, 4.000961780548096e-06, 4.220753908157349e-06, 4.4405460357666016e-06, 4.6603381633758545e-06, 4.880130290985107e-06, 5.09992241859436e-06, 5.319714546203613e-06, 5.539506673812866e-06, 5.759298801422119e-06, 5.979090929031372e-06, 6.198883056640625e-06]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 8.0, 4.0, 10.0, 10.0, 11.0, 18.0, 15.0, 19.0, 22.0, 32.0, 22.0, 32.0, 54.0, 46.0, 0.0, 54.0, 57.0, 50.0, 60.0, 63.0, 45.0, 54.0, 36.0, 38.0, 38.0, 26.0, 24.0, 25.0, 22.0, 20.0, 21.0, 20.0, 13.0, 8.0, 10.0, 3.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0265579223632812e-06, -1.9688159227371216e-06, -1.911073923110962e-06, -1.8533319234848022e-06, -1.7955899238586426e-06, -1.737847924232483e-06, -1.6801059246063232e-06, -1.6223639249801636e-06, -1.564621925354004e-06, -1.5068799257278442e-06, -1.4491379261016846e-06, -1.391395926475525e-06, -1.3336539268493652e-06, -1.2759119272232056e-06, -1.218169927597046e-06, -1.1604279279708862e-06, -1.1026859283447266e-06, -1.044943928718567e-06, -9.872019290924072e-07, -9.294599294662476e-07, -8.717179298400879e-07, -8.139759302139282e-07, -7.562339305877686e-07, -6.984919309616089e-07, -6.407499313354492e-07, -5.830079317092896e-07, -5.252659320831299e-07, -4.675239324569702e-07, -4.0978193283081055e-07, -3.520399332046509e-07, -2.942979335784912e-07, -2.3655593395233154e-07, -1.7881393432617188e-07, -1.210719347000122e-07, -6.332993507385254e-08, -5.587935447692871e-09, 5.21540641784668e-08, 1.0989606380462646e-07, 1.6763806343078613e-07, 2.253800630569458e-07, 2.8312206268310547e-07, 3.4086406230926514e-07, 3.986060619354248e-07, 4.5634806156158447e-07, 5.140900611877441e-07, 5.718320608139038e-07, 6.295740604400635e-07, 6.873160600662231e-07, 7.450580596923828e-07, 8.028000593185425e-07, 8.605420589447021e-07, 9.182840585708618e-07, 9.760260581970215e-07, 1.0337680578231812e-06, 1.0915100574493408e-06, 1.1492520570755005e-06, 1.2069940567016602e-06, 1.2647360563278198e-06, 1.3224780559539795e-06, 1.3802200555801392e-06, 1.4379620552062988e-06, 1.4957040548324585e-06, 1.5534460544586182e-06, 1.6111880540847778e-06, 1.6689300537109375e-06]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 9.0, 16.0, 45.0, 59.0, 70.0, 156.0, 285.0, 536.0, 799.0, 1832.0, 4019.0, 9009.0, 110202.0, 4028118.0, 27903.0, 5410.0, 2854.0, 1341.0, 735.0, 333.0, 243.0, 117.0, 69.0, 29.0, 20.0, 18.0, 9.0, 10.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-9.953975677490234e-06, -9.671784937381744e-06, -9.389594197273254e-06, -9.107403457164764e-06, -8.825212717056274e-06, -8.543021976947784e-06, -8.260831236839294e-06, -7.978640496730804e-06, -7.696449756622314e-06, -7.4142590165138245e-06, -7.1320682764053345e-06, -6.8498775362968445e-06, -6.5676867961883545e-06, -6.2854960560798645e-06, -6.0033053159713745e-06, -5.7211145758628845e-06, -5.4389238357543945e-06, -5.1567330956459045e-06, -4.8745423555374146e-06, -4.5923516154289246e-06, -4.3101608753204346e-06, -4.027970135211945e-06, -3.7457793951034546e-06, -3.4635886549949646e-06, -3.1813979148864746e-06, -2.8992071747779846e-06, -2.6170164346694946e-06, -2.3348256945610046e-06, -2.0526349544525146e-06, -1.7704442143440247e-06, -1.4882534742355347e-06, -1.2060627341270447e-06, -9.238719940185547e-07, -6.416812539100647e-07, -3.594905138015747e-07, -7.729977369308472e-08, 2.0489096641540527e-07, 4.870817065238953e-07, 7.692724466323853e-07, 1.0514631867408752e-06, 1.3336539268493652e-06, 1.6158446669578552e-06, 1.8980354070663452e-06, 2.180226147174835e-06, 2.462416887283325e-06, 2.744607627391815e-06, 3.026798367500305e-06, 3.308989107608795e-06, 3.591179847717285e-06, 3.873370587825775e-06, 4.155561327934265e-06, 4.437752068042755e-06, 4.719942808151245e-06, 5.002133548259735e-06, 5.284324288368225e-06, 5.566515028476715e-06, 5.848705768585205e-06, 6.130896508693695e-06, 6.413087248802185e-06, 6.695277988910675e-06, 6.977468729019165e-06, 7.259659469127655e-06, 7.541850209236145e-06, 7.824040949344635e-06, 8.106231689453125e-06]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 0.0, 12.0, 7.0, 0.0, 13.0, 0.0, 27.0, 76.0, 0.0, 319.0, 3145.0, 0.0, 356.0, 55.0, 0.0, 26.0, 8.0, 0.0, 6.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.430511474609375e-06, -1.391395926475525e-06, -1.3522803783416748e-06, -1.3131648302078247e-06, -1.2740492820739746e-06, -1.2349337339401245e-06, -1.1958181858062744e-06, -1.1567026376724243e-06, -1.1175870895385742e-06, -1.0784715414047241e-06, -1.039355993270874e-06, -1.000240445137024e-06, -9.611248970031738e-07, -9.220093488693237e-07, -8.828938007354736e-07, -8.437782526016235e-07, -8.046627044677734e-07, -7.655471563339233e-07, -7.264316082000732e-07, -6.873160600662231e-07, -6.48200511932373e-07, -6.09084963798523e-07, -5.699694156646729e-07, -5.308538675308228e-07, -4.917383193969727e-07, -4.5262277126312256e-07, -4.1350722312927246e-07, -3.7439167499542236e-07, -3.3527612686157227e-07, -2.9616057872772217e-07, -2.5704503059387207e-07, -2.1792948246002197e-07, -1.7881393432617188e-07, -1.3969838619232178e-07, -1.0058283805847168e-07, -6.146728992462158e-08, -2.2351741790771484e-08, 1.6763806343078613e-08, 5.587935447692871e-08, 9.499490261077881e-08, 1.341104507446289e-07, 1.73225998878479e-07, 2.123415470123291e-07, 2.514570951461792e-07, 2.905726432800293e-07, 3.296881914138794e-07, 3.688037395477295e-07, 4.079192876815796e-07, 4.470348358154297e-07, 4.861503839492798e-07, 5.252659320831299e-07, 5.6438148021698e-07, 6.034970283508301e-07, 6.426125764846802e-07, 6.817281246185303e-07, 7.208436727523804e-07, 7.599592208862305e-07, 7.990747690200806e-07, 8.381903171539307e-07, 8.773058652877808e-07, 9.164214134216309e-07, 9.55536961555481e-07, 9.94652509689331e-07, 1.0337680578231812e-06, 1.0728836059570312e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 6.0, 8.0, 9.0, 12.0, 9.0, 14.0, 22.0, 25.0, 26.0, 31.0, 44.0, 74.0, 112.0, 133.0, 97.0, 93.0, 58.0, 51.0, 47.0, 33.0, 17.0, 18.0, 15.0, 10.0, 7.0, 1.0, 6.0, 4.0, 6.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.343038431718014e-06, -2.2643962438451126e-06, -2.1857538285985356e-06, -2.1071114133519586e-06, -2.028469225479057e-06, -1.9498270376061555e-06, -1.8711846223595785e-06, -1.7925423207998392e-06, -1.7139000192401e-06, -1.6352577176803607e-06, -1.5566154161206214e-06, -1.477973114560882e-06, -1.3993308130011428e-06, -1.3206885114414035e-06, -1.2420462098816643e-06, -1.163403908321925e-06, -1.0847616067621857e-06, -1.0061193052024464e-06, -9.274770036427071e-07, -8.488347020829679e-07, -7.701924005232286e-07, -6.915500989634893e-07, -6.1290779740375e-07, -5.342654958440107e-07, -4.5562319428427145e-07, -3.7698089272453217e-07, -2.983385911647929e-07, -2.196962896050536e-07, -1.4105398804531433e-07, -6.241168648557505e-08, 1.6230615074164234e-08, 9.487291663390351e-08, 1.7351544556731824e-07, 2.521577471270575e-07, 3.308000486867968e-07, 4.094423502465361e-07, 4.880846518062754e-07, 5.667269533660146e-07, 6.453692549257539e-07, 7.240115564854932e-07, 8.026538580452325e-07, 8.812961596049718e-07, 9.59938461164711e-07, 1.0385807627244503e-06, 1.1172230642841896e-06, 1.1958653658439289e-06, 1.2745076674036682e-06, 1.3531499689634074e-06, 1.4317922705231467e-06, 1.510434572082886e-06, 1.5890768736426253e-06, 1.6677191752023646e-06, 1.7463614767621038e-06, 1.8250037783218431e-06, 1.9036460798815824e-06, 1.982288267754484e-06, 2.060930683001061e-06, 2.139573098247638e-06, 2.2182152861205395e-06, 2.296857473993441e-06, 2.375499889240018e-06, 2.454142304486595e-06, 2.5327844923594967e-06, 2.6114266802323982e-06, 2.6900690954789752e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 5.0, 13.0, 13.0, 16.0, 21.0, 28.0, 28.0, 30.0, 44.0, 36.0, 44.0, 48.0, 48.0, 63.0, 52.0, 51.0, 60.0, 53.0, 54.0, 35.0, 38.0, 32.0, 31.0, 24.0, 27.0, 19.0, 19.0, 23.0, 8.0, 7.0, 7.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.5493052362435265e-06, -2.4852354272297816e-06, -2.4211658455897123e-06, -2.3570960365759674e-06, -2.2930262275622226e-06, -2.2289566459221533e-06, -2.1648868369084084e-06, -2.100817255268339e-06, -2.0367474462545943e-06, -1.9726776372408494e-06, -1.90860805560078e-06, -1.8445382465870352e-06, -1.7804685512601282e-06, -1.716398855933221e-06, -1.6523290469194762e-06, -1.5882593515925691e-06, -1.524189656265662e-06, -1.460119960938755e-06, -1.3960502656118479e-06, -1.331980456598103e-06, -1.267910761271196e-06, -1.2038410659442889e-06, -1.139771256930544e-06, -1.075701561603637e-06, -1.0116318662767299e-06, -9.475621709498228e-07, -8.834924187794968e-07, -8.194226666091708e-07, -7.553529712822638e-07, -6.912832759553567e-07, -6.272135237850307e-07, -5.631437716147047e-07, -4.990741899746354e-07, -4.3500446622601885e-07, -3.709347424774023e-07, -3.068650187287858e-07, -2.427952949801693e-07, -1.7872557123155275e-07, -1.1465584748293622e-07, -5.05861237343197e-08, 1.3483600014296826e-08, 7.755332376291335e-08, 1.4162304751152988e-07, 2.056927712601464e-07, 2.697624950087629e-07, 3.3383221875737945e-07, 3.97901942505996e-07, 4.619716662546125e-07, 5.26041390003229e-07, 5.901110853301361e-07, 6.541808375004621e-07, 7.18250589670788e-07, 7.823202849976951e-07, 8.463899803246022e-07, 9.104597324949282e-07, 9.745294846652541e-07, 1.0385991799921612e-06, 1.1026688753190683e-06, 1.1667386843328131e-06, 1.2308083796597202e-06, 1.2948780749866273e-06, 1.3589477703135344e-06, 1.4230174656404415e-06, 1.4870872746541863e-06, 1.5511569699810934e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 1.0, 2.0, 7.0, 3.0, 6.0, 15.0, 10.0, 38.0, 17.0, 26.0, 92.0, 80.0, 115.0, 333.0, 289.0, 933.0, 891.0, 1221.0, 4888.0, 4782.0, 7650.0, 34623.0, 40188.0, 248806.0, 358603.0, 171112.0, 117897.0, 21723.0, 12914.0, 12330.0, 2963.0, 3137.0, 863.0, 576.0, 675.0, 180.0, 129.0, 190.0, 56.0, 76.0, 29.0, 19.0, 21.0, 14.0, 12.0, 12.0, 6.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2649765014648438e-06, -2.1830201148986816e-06, -2.1010637283325195e-06, -2.0191073417663574e-06, -1.9371509552001953e-06, -1.8551945686340332e-06, -1.773238182067871e-06, -1.691281795501709e-06, -1.6093254089355469e-06, -1.5273690223693848e-06, -1.4454126358032227e-06, -1.3634562492370605e-06, -1.2814998626708984e-06, -1.1995434761047363e-06, -1.1175870895385742e-06, -1.0356307029724121e-06, -9.5367431640625e-07, -8.717179298400879e-07, -7.897615432739258e-07, -7.078051567077637e-07, -6.258487701416016e-07, -5.438923835754395e-07, -4.6193599700927734e-07, -3.7997961044311523e-07, -2.980232238769531e-07, -2.1606683731079102e-07, -1.341104507446289e-07, -5.21540641784668e-08, 2.9802322387695312e-08, 1.1175870895385742e-07, 1.9371509552001953e-07, 2.7567148208618164e-07, 3.5762786865234375e-07, 4.3958425521850586e-07, 5.21540641784668e-07, 6.034970283508301e-07, 6.854534149169922e-07, 7.674098014831543e-07, 8.493661880493164e-07, 9.313225746154785e-07, 1.0132789611816406e-06, 1.0952353477478027e-06, 1.1771917343139648e-06, 1.259148120880127e-06, 1.341104507446289e-06, 1.4230608940124512e-06, 1.5050172805786133e-06, 1.5869736671447754e-06, 1.6689300537109375e-06, 1.7508864402770996e-06, 1.8328428268432617e-06, 1.914799213409424e-06, 1.996755599975586e-06, 2.078711986541748e-06, 2.16066837310791e-06, 2.2426247596740723e-06, 2.3245811462402344e-06, 2.4065375328063965e-06, 2.4884939193725586e-06, 2.5704503059387207e-06, 2.652406692504883e-06, 2.734363079071045e-06, 2.816319465637207e-06, 2.898275852203369e-06, 2.9802322387695312e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 1.0, 3.0, 3.0, 7.0, 11.0, 16.0, 35.0, 19.0, 32.0, 27.0, 41.0, 36.0, 49.0, 78.0, 43.0, 57.0, 37.0, 63.0, 49.0, 54.0, 89.0, 34.0, 43.0, 34.0, 16.0, 18.0, 18.0, 40.0, 17.0, 7.0, 5.0, 5.0, 3.0, 6.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.6226043701171875e-06, -2.5546178221702576e-06, -2.4866312742233276e-06, -2.4186447262763977e-06, -2.3506581783294678e-06, -2.282671630382538e-06, -2.214685082435608e-06, -2.146698534488678e-06, -2.078711986541748e-06, -2.010725438594818e-06, -1.942738890647888e-06, -1.8747523427009583e-06, -1.8067657947540283e-06, -1.7387792468070984e-06, -1.6707926988601685e-06, -1.6028061509132385e-06, -1.5348196029663086e-06, -1.4668330550193787e-06, -1.3988465070724487e-06, -1.3308599591255188e-06, -1.2628734111785889e-06, -1.194886863231659e-06, -1.126900315284729e-06, -1.058913767337799e-06, -9.909272193908691e-07, -9.229406714439392e-07, -8.549541234970093e-07, -7.869675755500793e-07, -7.189810276031494e-07, -6.509944796562195e-07, -5.830079317092896e-07, -5.150213837623596e-07, -4.470348358154297e-07, -3.7904828786849976e-07, -3.110617399215698e-07, -2.430751919746399e-07, -1.7508864402770996e-07, -1.0710209608078003e-07, -3.91155481338501e-08, 2.8870999813079834e-08, 9.685754776000977e-08, 1.648440957069397e-07, 2.3283064365386963e-07, 3.0081719160079956e-07, 3.688037395477295e-07, 4.367902874946594e-07, 5.047768354415894e-07, 5.727633833885193e-07, 6.407499313354492e-07, 7.087364792823792e-07, 7.767230272293091e-07, 8.44709575176239e-07, 9.126961231231689e-07, 9.806826710700989e-07, 1.0486692190170288e-06, 1.1166557669639587e-06, 1.1846423149108887e-06, 1.2526288628578186e-06, 1.3206154108047485e-06, 1.3886019587516785e-06, 1.4565885066986084e-06, 1.5245750546455383e-06, 1.5925616025924683e-06, 1.6605481505393982e-06, 1.7285346984863281e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 10.0, 6.0, 11.0, 14.0, 11.0, 15.0, 22.0, 23.0, 32.0, 54.0, 56.0, 106.0, 101.0, 163.0, 216.0, 360.0, 515.0, 816.0, 1467.0, 2614.0, 5805.0, 0.0, 1023630.0, 5847.0, 2720.0, 1484.0, 760.0, 506.0, 350.0, 212.0, 161.0, 103.0, 119.0, 59.0, 34.0, 25.0, 17.0, 28.0, 22.0, 12.0, 7.0, 8.0, 1.0, 11.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 1.0, 1.0], "bins": [-1.8477439880371094e-06, -1.7900019884109497e-06, -1.73225998878479e-06, -1.6745179891586304e-06, -1.6167759895324707e-06, -1.559033989906311e-06, -1.5012919902801514e-06, -1.4435499906539917e-06, -1.385807991027832e-06, -1.3280659914016724e-06, -1.2703239917755127e-06, -1.212581992149353e-06, -1.1548399925231934e-06, -1.0970979928970337e-06, -1.039355993270874e-06, -9.816139936447144e-07, -9.238719940185547e-07, -8.66129994392395e-07, -8.083879947662354e-07, -7.506459951400757e-07, -6.92903995513916e-07, -6.351619958877563e-07, -5.774199962615967e-07, -5.19677996635437e-07, -4.6193599700927734e-07, -4.041939973831177e-07, -3.46451997756958e-07, -2.8870999813079834e-07, -2.3096799850463867e-07, -1.73225998878479e-07, -1.1548399925231934e-07, -5.774199962615967e-08, 0.0, 5.774199962615967e-08, 1.1548399925231934e-07, 1.73225998878479e-07, 2.3096799850463867e-07, 2.8870999813079834e-07, 3.46451997756958e-07, 4.041939973831177e-07, 4.6193599700927734e-07, 5.19677996635437e-07, 5.774199962615967e-07, 6.351619958877563e-07, 6.92903995513916e-07, 7.506459951400757e-07, 8.083879947662354e-07, 8.66129994392395e-07, 9.238719940185547e-07, 9.816139936447144e-07, 1.039355993270874e-06, 1.0970979928970337e-06, 1.1548399925231934e-06, 1.212581992149353e-06, 1.2703239917755127e-06, 1.3280659914016724e-06, 1.385807991027832e-06, 1.4435499906539917e-06, 1.5012919902801514e-06, 1.559033989906311e-06, 1.6167759895324707e-06, 1.6745179891586304e-06, 1.73225998878479e-06, 1.7900019884109497e-06, 1.8477439880371094e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 974.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -4.041939973831177e-07, -3.91155481338501e-07, -3.781169652938843e-07, -3.650784492492676e-07, -3.520399332046509e-07, -3.390014171600342e-07, -3.259629011154175e-07, -3.129243850708008e-07, -2.998858690261841e-07, -2.868473529815674e-07, -2.738088369369507e-07, -2.60770320892334e-07, -2.477318048477173e-07, -2.3469328880310059e-07, -2.2165477275848389e-07, -2.086162567138672e-07, -1.955777406692505e-07, -1.825392246246338e-07, -1.695007085800171e-07, -1.564621925354004e-07, -1.434236764907837e-07, -1.30385160446167e-07, -1.1734664440155029e-07, -1.043081283569336e-07, -9.12696123123169e-08, -7.82310962677002e-08, -6.51925802230835e-08, -5.21540641784668e-08, -3.91155481338501e-08, -2.60770320892334e-08, -1.30385160446167e-08, 0.0, 1.30385160446167e-08, 2.60770320892334e-08, 3.91155481338501e-08, 5.21540641784668e-08, 6.51925802230835e-08, 7.82310962677002e-08, 9.12696123123169e-08, 1.043081283569336e-07, 1.1734664440155029e-07, 1.30385160446167e-07, 1.434236764907837e-07, 1.564621925354004e-07, 1.695007085800171e-07, 1.825392246246338e-07, 1.955777406692505e-07, 2.086162567138672e-07, 2.2165477275848389e-07, 2.3469328880310059e-07, 2.477318048477173e-07, 2.60770320892334e-07, 2.738088369369507e-07, 2.868473529815674e-07, 2.998858690261841e-07, 3.129243850708008e-07, 3.259629011154175e-07, 3.390014171600342e-07, 3.520399332046509e-07, 3.650784492492676e-07, 3.781169652938843e-07, 3.91155481338501e-07, 4.041939973831177e-07, 4.172325134277344e-07]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 56.0, 36.0, 0.0, 33.0, 0.0, 43.0, 0.0, 140.0, 0.0, 204.0, 0.0, 353.0, 849.0, 0.0, 1641.0, 0.0, 3443.0, 0.0, 1034853.0, 0.0, 3609.0, 0.0, 1602.0, 833.0, 0.0, 363.0, 0.0, 212.0, 0.0, 145.0, 0.0, 35.0, 0.0, 40.0, 27.0, 0.0, 38.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-8.940696716308594e-07, -8.614733815193176e-07, -8.288770914077759e-07, -7.962808012962341e-07, -7.636845111846924e-07, -7.310882210731506e-07, -6.984919309616089e-07, -6.658956408500671e-07, -6.332993507385254e-07, -6.007030606269836e-07, -5.681067705154419e-07, -5.355104804039001e-07, -5.029141902923584e-07, -4.7031790018081665e-07, -4.377216100692749e-07, -4.0512531995773315e-07, -3.725290298461914e-07, -3.3993273973464966e-07, -3.073364496231079e-07, -2.7474015951156616e-07, -2.421438694000244e-07, -2.0954757928848267e-07, -1.7695128917694092e-07, -1.4435499906539917e-07, -1.1175870895385742e-07, -7.916241884231567e-08, -4.6566128730773926e-08, -1.3969838619232178e-08, 1.862645149230957e-08, 5.122274160385132e-08, 8.381903171539307e-08, 1.1641532182693481e-07, 1.4901161193847656e-07, 1.816079020500183e-07, 2.1420419216156006e-07, 2.468004822731018e-07, 2.7939677238464355e-07, 3.119930624961853e-07, 3.4458935260772705e-07, 3.771856427192688e-07, 4.0978193283081055e-07, 4.423782229423523e-07, 4.7497451305389404e-07, 5.075708031654358e-07, 5.401670932769775e-07, 5.727633833885193e-07, 6.05359673500061e-07, 6.379559636116028e-07, 6.705522537231445e-07, 7.031485438346863e-07, 7.35744833946228e-07, 7.683411240577698e-07, 8.009374141693115e-07, 8.335337042808533e-07, 8.66129994392395e-07, 8.987262845039368e-07, 9.313225746154785e-07, 9.639188647270203e-07, 9.96515154838562e-07, 1.0291114449501038e-06, 1.0617077350616455e-06, 1.0943040251731873e-06, 1.126900315284729e-06, 1.1594966053962708e-06, 1.1920928955078125e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 994.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 17.0], "bins": [-1.1920928955078125e-07, -1.1641532182693481e-07, -1.1362135410308838e-07, -1.1082738637924194e-07, -1.0803341865539551e-07, -1.0523945093154907e-07, -1.0244548320770264e-07, -9.96515154838562e-08, -9.685754776000977e-08, -9.406358003616333e-08, -9.12696123123169e-08, -8.847564458847046e-08, -8.568167686462402e-08, -8.288770914077759e-08, -8.009374141693115e-08, -7.729977369308472e-08, -7.450580596923828e-08, -7.171183824539185e-08, -6.891787052154541e-08, -6.612390279769897e-08, -6.332993507385254e-08, -6.05359673500061e-08, -5.774199962615967e-08, -5.494803190231323e-08, -5.21540641784668e-08, -4.936009645462036e-08, -4.6566128730773926e-08, -4.377216100692749e-08, -4.0978193283081055e-08, -3.818422555923462e-08, -3.5390257835388184e-08, -3.259629011154175e-08, -2.9802322387695312e-08, -2.7008354663848877e-08, -2.421438694000244e-08, -2.1420419216156006e-08, -1.862645149230957e-08, -1.5832483768463135e-08, -1.30385160446167e-08, -1.0244548320770264e-08, -7.450580596923828e-09, -4.6566128730773926e-09, -1.862645149230957e-09, 9.313225746154785e-10, 3.725290298461914e-09, 6.51925802230835e-09, 9.313225746154785e-09, 1.210719347000122e-08, 1.4901161193847656e-08, 1.7695128917694092e-08, 2.0489096641540527e-08, 2.3283064365386963e-08, 2.60770320892334e-08, 2.8870999813079834e-08, 3.166496753692627e-08, 3.4458935260772705e-08, 3.725290298461914e-08, 4.0046870708465576e-08, 4.284083843231201e-08, 4.563480615615845e-08, 4.842877388000488e-08, 5.122274160385132e-08, 5.4016709327697754e-08, 5.681067705154419e-08, 5.960464477539063e-08]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 14.0, 20.0, 37.0, 73.0, 133.0, 0.0, 274.0, 467.0, 1048.0, 3128.0, 9993.0, 1018117.0, 10014.0, 3173.0, 1035.0, 0.0, 494.0, 220.0, 112.0, 92.0, 49.0, 27.0, 9.0, 12.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4901161193847656e-06, -1.4360994100570679e-06, -1.3820827007293701e-06, -1.3280659914016724e-06, -1.2740492820739746e-06, -1.2200325727462769e-06, -1.166015863418579e-06, -1.1119991540908813e-06, -1.0579824447631836e-06, -1.0039657354354858e-06, -9.499490261077881e-07, -8.959323167800903e-07, -8.419156074523926e-07, -7.878988981246948e-07, -7.338821887969971e-07, -6.798654794692993e-07, -6.258487701416016e-07, -5.718320608139038e-07, -5.178153514862061e-07, -4.637986421585083e-07, -4.0978193283081055e-07, -3.557652235031128e-07, -3.0174851417541504e-07, -2.477318048477173e-07, -1.9371509552001953e-07, -1.3969838619232178e-07, -8.568167686462402e-08, -3.166496753692627e-08, 2.2351741790771484e-08, 7.636845111846924e-08, 1.30385160446167e-07, 1.8440186977386475e-07, 2.384185791015625e-07, 2.9243528842926025e-07, 3.46451997756958e-07, 4.0046870708465576e-07, 4.544854164123535e-07, 5.085021257400513e-07, 5.62518835067749e-07, 6.165355443954468e-07, 6.705522537231445e-07, 7.245689630508423e-07, 7.7858567237854e-07, 8.326023817062378e-07, 8.866190910339355e-07, 9.406358003616333e-07, 9.94652509689331e-07, 1.0486692190170288e-06, 1.1026859283447266e-06, 1.1567026376724243e-06, 1.210719347000122e-06, 1.2647360563278198e-06, 1.3187527656555176e-06, 1.3727694749832153e-06, 1.426786184310913e-06, 1.4808028936386108e-06, 1.5348196029663086e-06, 1.5888363122940063e-06, 1.642853021621704e-06, 1.6968697309494019e-06, 1.7508864402770996e-06, 1.8049031496047974e-06, 1.8589198589324951e-06, 1.912936568260193e-06, 1.9669532775878906e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 980.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7881393432617188e-07, -1.7229467630386353e-07, -1.6577541828155518e-07, -1.5925616025924683e-07, -1.5273690223693848e-07, -1.4621764421463013e-07, -1.3969838619232178e-07, -1.3317912817001343e-07, -1.2665987014770508e-07, -1.2014061212539673e-07, -1.1362135410308838e-07, -1.0710209608078003e-07, -1.0058283805847168e-07, -9.406358003616333e-08, -8.754432201385498e-08, -8.102506399154663e-08, -7.450580596923828e-08, -6.798654794692993e-08, -6.146728992462158e-08, -5.494803190231323e-08, -4.842877388000488e-08, -4.190951585769653e-08, -3.5390257835388184e-08, -2.8870999813079834e-08, -2.2351741790771484e-08, -1.5832483768463135e-08, -9.313225746154785e-09, -2.7939677238464355e-09, 3.725290298461914e-09, 1.0244548320770264e-08, 1.6763806343078613e-08, 2.3283064365386963e-08, 2.9802322387695312e-08, 3.632158041000366e-08, 4.284083843231201e-08, 4.936009645462036e-08, 5.587935447692871e-08, 6.239861249923706e-08, 6.891787052154541e-08, 7.543712854385376e-08, 8.195638656616211e-08, 8.847564458847046e-08, 9.499490261077881e-08, 1.0151416063308716e-07, 1.0803341865539551e-07, 1.1455267667770386e-07, 1.210719347000122e-07, 1.2759119272232056e-07, 1.341104507446289e-07, 1.4062970876693726e-07, 1.471489667892456e-07, 1.5366822481155396e-07, 1.601874828338623e-07, 1.6670674085617065e-07, 1.73225998878479e-07, 1.7974525690078735e-07, 1.862645149230957e-07, 1.9278377294540405e-07, 1.993030309677124e-07, 2.0582228899002075e-07, 2.123415470123291e-07, 2.1886080503463745e-07, 2.253800630569458e-07, 2.3189932107925415e-07, 2.384185791015625e-07]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 5.0, 10.0, 4.0, 8.0, 13.0, 7.0, 19.0, 16.0, 36.0, 27.0, 40.0, 69.0, 82.0, 140.0, 111.0, 99.0, 78.0, 54.0, 42.0, 33.0, 27.0, 22.0, 10.0, 9.0, 8.0, 12.0, 4.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5368556180183077e-06, -2.4582443529652664e-06, -2.3796333152859006e-06, -2.3010220502328593e-06, -2.222410785179818e-06, -2.1437995201267768e-06, -2.065188482447411e-06, -1.9865772173943697e-06, -1.907966179715004e-06, -1.8293550283488003e-06, -1.750743763295759e-06, -1.6721326119295554e-06, -1.5935213468765141e-06, -1.5149101955103106e-06, -1.436299044144107e-06, -1.3576877790910657e-06, -1.2790765140380245e-06, -1.200465362671821e-06, -1.1218540976187796e-06, -1.043242946252576e-06, -9.646316811995348e-07, -8.860205298333312e-07, -8.074093784671277e-07, -7.287981702575053e-07, -6.501869620478828e-07, -5.715757538382604e-07, -4.92964545628638e-07, -4.1435339426243445e-07, -3.3574218605281203e-07, -2.571309778431896e-07, -1.7851979805527662e-07, -9.990861826736364e-08, -2.129763743141666e-08, 5.731355656735104e-08, 1.3592475056611875e-07, 2.1453594456488645e-07, 2.9314713856365415e-07, 3.7175834677327657e-07, 4.5036952656118956e-07, 5.289807063491025e-07, 6.07591914558725e-07, 6.862031227683474e-07, 7.648143309779698e-07, 8.434254823441734e-07, 9.220366905537958e-07, 1.0006478987634182e-06, 1.0792590501296218e-06, 1.1578702014958253e-06, 1.2364814665488666e-06, 1.3150926179150702e-06, 1.3937038829681114e-06, 1.472315034334315e-06, 1.5509262993873563e-06, 1.6295374507535598e-06, 1.7081486021197634e-06, 1.7867598671728047e-06, 1.8653710185390082e-06, 1.9439821699052118e-06, 2.022593434958253e-06, 2.1012047000112943e-06, 2.17981573769066e-06, 2.2584270027437015e-06, 2.3370382677967427e-06, 2.4156493054761086e-06, 2.49426057052915e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 3.0, 5.0, 7.0, 14.0, 12.0, 19.0, 21.0, 24.0, 30.0, 28.0, 48.0, 36.0, 41.0, 48.0, 50.0, 61.0, 54.0, 50.0, 58.0, 52.0, 55.0, 40.0, 36.0, 29.0, 33.0, 23.0, 27.0, 19.0, 21.0, 20.0, 8.0, 7.0, 10.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.4545765882066917e-06, -2.3929519556986634e-06, -2.331327323190635e-06, -2.2697026906826068e-06, -2.2080780581745785e-06, -2.14645342566655e-06, -2.084828793158522e-06, -2.0232041606504936e-06, -1.9615795281424653e-06, -1.899954895634437e-06, -1.8383302631264087e-06, -1.7767056306183804e-06, -1.715080998110352e-06, -1.6534563656023238e-06, -1.5918317330942955e-06, -1.5302071005862672e-06, -1.4685825817650766e-06, -1.4069579492570483e-06, -1.34533331674902e-06, -1.2837086842409917e-06, -1.2220840517329634e-06, -1.1604594192249351e-06, -1.0988349004037445e-06, -1.0372102678957162e-06, -9.75585635387688e-07, -9.139610028796596e-07, -8.523363703716313e-07, -7.90711737863603e-07, -7.290871053555747e-07, -6.674624728475465e-07, -6.05837897182937e-07, -5.442132646749087e-07, -4.825885753234616e-07, -4.2096394281543326e-07, -3.5933931030740496e-07, -2.977147062210861e-07, -2.360900737130578e-07, -1.744654412050295e-07, -1.1284083711871062e-07, -5.1216204610682325e-08, 1.0408427897345973e-08, 7.203305329994691e-08, 1.3365767870254786e-07, 1.9528229699972144e-07, 2.5690692950774974e-07, 3.1853156201577804e-07, 3.801561661020969e-07, 4.417807986101252e-07, 5.034054311181535e-07, 5.650300636261818e-07, 6.266546961342101e-07, 6.882793286422384e-07, 7.499039611502667e-07, 8.11528593658295e-07, 8.731531693229044e-07, 9.347778018309327e-07, 9.964023774955422e-07, 1.0580270100035705e-06, 1.1196516425115988e-06, 1.181276275019627e-06, 1.2429009075276554e-06, 1.3045255400356837e-06, 1.366150172543712e-06, 1.4277748050517403e-06, 1.4893994375597686e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 4.0, 1.0, 6.0, 3.0, 18.0, 8.0, 33.0, 57.0, 74.0, 62.0, 164.0, 236.0, 435.0, 521.0, 1216.0, 2148.0, 4018.0, 4732.0, 12931.0, 27598.0, 63686.0, 95720.0, 399593.0, 277768.0, 88080.0, 27139.0, 21041.0, 10283.0, 4985.0, 1940.0, 1756.0, 957.0, 549.0, 217.0, 215.0, 119.0, 84.0, 30.0, 45.0, 31.0, 19.0, 6.0, 7.0, 9.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0], "bins": [-5.364418029785156e-06, -5.200505256652832e-06, -5.036592483520508e-06, -4.872679710388184e-06, -4.708766937255859e-06, -4.544854164123535e-06, -4.380941390991211e-06, -4.217028617858887e-06, -4.0531158447265625e-06, -3.889203071594238e-06, -3.725290298461914e-06, -3.56137752532959e-06, -3.3974647521972656e-06, -3.2335519790649414e-06, -3.069639205932617e-06, -2.905726432800293e-06, -2.7418136596679688e-06, -2.5779008865356445e-06, -2.4139881134033203e-06, -2.250075340270996e-06, -2.086162567138672e-06, -1.9222497940063477e-06, -1.7583370208740234e-06, -1.5944242477416992e-06, -1.430511474609375e-06, -1.2665987014770508e-06, -1.1026859283447266e-06, -9.387731552124023e-07, -7.748603820800781e-07, -6.109476089477539e-07, -4.470348358154297e-07, -2.8312206268310547e-07, -1.1920928955078125e-07, 4.470348358154297e-08, 2.086162567138672e-07, 3.725290298461914e-07, 5.364418029785156e-07, 7.003545761108398e-07, 8.642673492431641e-07, 1.0281801223754883e-06, 1.1920928955078125e-06, 1.3560056686401367e-06, 1.519918441772461e-06, 1.6838312149047852e-06, 1.8477439880371094e-06, 2.0116567611694336e-06, 2.175569534301758e-06, 2.339482307434082e-06, 2.5033950805664062e-06, 2.6673078536987305e-06, 2.8312206268310547e-06, 2.995133399963379e-06, 3.159046173095703e-06, 3.3229589462280273e-06, 3.4868717193603516e-06, 3.6507844924926758e-06, 3.814697265625e-06, 3.978610038757324e-06, 4.1425228118896484e-06, 4.306435585021973e-06, 4.470348358154297e-06, 4.634261131286621e-06, 4.798173904418945e-06, 4.9620866775512695e-06, 5.125999450683594e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 7.0, 5.0, 0.0, 10.0, 15.0, 17.0, 23.0, 25.0, 21.0, 35.0, 47.0, 55.0, 57.0, 77.0, 71.0, 0.0, 67.0, 64.0, 68.0, 69.0, 39.0, 48.0, 47.0, 23.0, 21.0, 19.0, 18.0, 29.0, 0.0, 7.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1457672119140625e-06, -2.0908191800117493e-06, -2.035871148109436e-06, -1.980923116207123e-06, -1.9259750843048096e-06, -1.8710270524024963e-06, -1.816079020500183e-06, -1.7611309885978699e-06, -1.7061829566955566e-06, -1.6512349247932434e-06, -1.5962868928909302e-06, -1.541338860988617e-06, -1.4863908290863037e-06, -1.4314427971839905e-06, -1.3764947652816772e-06, -1.321546733379364e-06, -1.2665987014770508e-06, -1.2116506695747375e-06, -1.1567026376724243e-06, -1.101754605770111e-06, -1.0468065738677979e-06, -9.918585419654846e-07, -9.369105100631714e-07, -8.819624781608582e-07, -8.270144462585449e-07, -7.720664143562317e-07, -7.171183824539185e-07, -6.621703505516052e-07, -6.07222318649292e-07, -5.522742867469788e-07, -4.973262548446655e-07, -4.423782229423523e-07, -3.8743019104003906e-07, -3.3248215913772583e-07, -2.775341272354126e-07, -2.2258609533309937e-07, -1.6763806343078613e-07, -1.126900315284729e-07, -5.774199962615967e-08, -2.7939677238464355e-09, 5.21540641784668e-08, 1.0710209608078003e-07, 1.6205012798309326e-07, 2.169981598854065e-07, 2.7194619178771973e-07, 3.2689422369003296e-07, 3.818422555923462e-07, 4.367902874946594e-07, 4.917383193969727e-07, 5.466863512992859e-07, 6.016343832015991e-07, 6.565824151039124e-07, 7.115304470062256e-07, 7.664784789085388e-07, 8.21426510810852e-07, 8.763745427131653e-07, 9.313225746154785e-07, 9.862706065177917e-07, 1.041218638420105e-06, 1.0961666703224182e-06, 1.1511147022247314e-06, 1.2060627341270447e-06, 1.261010766029358e-06, 1.3159587979316711e-06, 1.3709068298339844e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 11.0, 4.0, 11.0, 26.0, 22.0, 63.0, 61.0, 119.0, 147.0, 267.0, 336.0, 480.0, 1338.0, 1577.0, 4677.0, 5814.0, 18287.0, 24879.0, 47450.0, 187000.0, 320740.0, 289639.0, 67281.0, 45229.0, 13746.0, 10248.0, 3474.0, 1979.0, 1702.0, 604.0, 558.0, 213.0, 245.0, 80.0, 68.0, 60.0, 28.0, 21.0, 20.0, 24.0, 4.0, 9.0, 2.0, 1.0, 4.0, 0.0, 6.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.887580871582031e-06, -4.742294549942017e-06, -4.597008228302002e-06, -4.451721906661987e-06, -4.306435585021973e-06, -4.161149263381958e-06, -4.015862941741943e-06, -3.870576620101929e-06, -3.725290298461914e-06, -3.5800039768218994e-06, -3.4347176551818848e-06, -3.28943133354187e-06, -3.1441450119018555e-06, -2.998858690261841e-06, -2.853572368621826e-06, -2.7082860469818115e-06, -2.562999725341797e-06, -2.4177134037017822e-06, -2.2724270820617676e-06, -2.127140760421753e-06, -1.9818544387817383e-06, -1.8365681171417236e-06, -1.691281795501709e-06, -1.5459954738616943e-06, -1.4007091522216797e-06, -1.255422830581665e-06, -1.1101365089416504e-06, -9.648501873016357e-07, -8.195638656616211e-07, -6.742775440216064e-07, -5.289912223815918e-07, -3.8370490074157715e-07, -2.384185791015625e-07, -9.313225746154785e-08, 5.21540641784668e-08, 1.9744038581848145e-07, 3.427267074584961e-07, 4.880130290985107e-07, 6.332993507385254e-07, 7.7858567237854e-07, 9.238719940185547e-07, 1.0691583156585693e-06, 1.214444637298584e-06, 1.3597309589385986e-06, 1.5050172805786133e-06, 1.650303602218628e-06, 1.7955899238586426e-06, 1.9408762454986572e-06, 2.086162567138672e-06, 2.2314488887786865e-06, 2.376735210418701e-06, 2.522021532058716e-06, 2.6673078536987305e-06, 2.812594175338745e-06, 2.9578804969787598e-06, 3.1031668186187744e-06, 3.248453140258789e-06, 3.3937394618988037e-06, 3.5390257835388184e-06, 3.684312105178833e-06, 3.829598426818848e-06, 3.974884748458862e-06, 4.120171070098877e-06, 4.265457391738892e-06, 4.410743713378906e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 7.0, 2.0, 0.0, 5.0, 10.0, 0.0, 20.0, 0.0, 29.0, 29.0, 0.0, 45.0, 54.0, 0.0, 55.0, 0.0, 67.0, 90.0, 0.0, 85.0, 79.0, 0.0, 63.0, 0.0, 67.0, 73.0, 0.0, 68.0, 47.0, 0.0, 34.0, 0.0, 24.0, 22.0, 0.0, 12.0, 16.0, 0.0, 5.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0728836059570312e-06, -1.0356307029724121e-06, -9.98377799987793e-07, -9.611248970031738e-07, -9.238719940185547e-07, -8.866190910339355e-07, -8.493661880493164e-07, -8.121132850646973e-07, -7.748603820800781e-07, -7.37607479095459e-07, -7.003545761108398e-07, -6.631016731262207e-07, -6.258487701416016e-07, -5.885958671569824e-07, -5.513429641723633e-07, -5.140900611877441e-07, -4.76837158203125e-07, -4.3958425521850586e-07, -4.023313522338867e-07, -3.650784492492676e-07, -3.2782554626464844e-07, -2.905726432800293e-07, -2.5331974029541016e-07, -2.1606683731079102e-07, -1.7881393432617188e-07, -1.4156103134155273e-07, -1.043081283569336e-07, -6.705522537231445e-08, -2.9802322387695312e-08, 7.450580596923828e-09, 4.470348358154297e-08, 8.195638656616211e-08, 1.1920928955078125e-07, 1.564621925354004e-07, 1.9371509552001953e-07, 2.3096799850463867e-07, 2.682209014892578e-07, 3.0547380447387695e-07, 3.427267074584961e-07, 3.7997961044311523e-07, 4.172325134277344e-07, 4.544854164123535e-07, 4.917383193969727e-07, 5.289912223815918e-07, 5.662441253662109e-07, 6.034970283508301e-07, 6.407499313354492e-07, 6.780028343200684e-07, 7.152557373046875e-07, 7.525086402893066e-07, 7.897615432739258e-07, 8.270144462585449e-07, 8.642673492431641e-07, 9.015202522277832e-07, 9.387731552124023e-07, 9.760260581970215e-07, 1.0132789611816406e-06, 1.0505318641662598e-06, 1.087784767150879e-06, 1.125037670135498e-06, 1.1622905731201172e-06, 1.1995434761047363e-06, 1.2367963790893555e-06, 1.2740492820739746e-06, 1.3113021850585938e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 6.0, 8.0, 9.0, 13.0, 23.0, 20.0, 24.0, 40.0, 46.0, 106.0, 103.0, 141.0, 125.0, 96.0, 56.0, 28.0, 33.0, 27.0, 13.0, 17.0, 3.0, 15.0, 6.0, 8.0, 4.0, 7.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.205072178185219e-06, -2.13540351978736e-06, -2.065734861389501e-06, -1.996066202991642e-06, -1.926397544593783e-06, -1.8567288861959241e-06, -1.7870601141112274e-06, -1.7173914557133685e-06, -1.6477227973155095e-06, -1.5780541389176506e-06, -1.5083854805197916e-06, -1.4387168221219326e-06, -1.369048050037236e-06, -1.299379391639377e-06, -1.229710733241518e-06, -1.160042074843659e-06, -1.0903734164458e-06, -1.0207047580479411e-06, -9.510360996500822e-07, -8.813673844088044e-07, -8.116987260109454e-07, -7.420300676130864e-07, -6.723613523718086e-07, -6.026926939739496e-07, -5.330240355760907e-07, -4.633553771782317e-07, -3.9368669035866333e-07, -3.2401800353909493e-07, -2.5434934514123597e-07, -1.84680686743377e-07, -1.1501199992380862e-07, -4.5343313104240224e-08, 2.432534529361874e-08, 9.399401790233242e-08, 1.636626905110461e-07, 2.3333136311975977e-07, 3.0300003572847345e-07, 3.726686941263324e-07, 4.423373809459008e-07, 5.120060677654692e-07, 5.816747261633282e-07, 6.513433845611871e-07, 7.210120429590461e-07, 7.906807582003239e-07, 8.603494165981829e-07, 9.300180749960418e-07, 9.996867902373197e-07, 1.0693554486351786e-06, 1.1390241070330376e-06, 1.2086927654308965e-06, 1.2783614238287555e-06, 1.3480300822266145e-06, 1.4176987406244734e-06, 1.4873673990223324e-06, 1.557036171107029e-06, 1.626704829504888e-06, 1.696373487902747e-06, 1.766042146300606e-06, 1.835710804698465e-06, 1.9053794630963239e-06, 1.9750482351810206e-06, 2.0447168935788795e-06, 2.1143855519767385e-06, 2.1840542103745975e-06, 2.2537228687724564e-06]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 7.0, 9.0, 12.0, 17.0, 13.0, 18.0, 16.0, 36.0, 34.0, 35.0, 47.0, 59.0, 50.0, 50.0, 62.0, 48.0, 43.0, 52.0, 53.0, 50.0, 36.0, 30.0, 21.0, 34.0, 29.0, 24.0, 28.0, 25.0, 15.0, 12.0, 7.0, 7.0, 1.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.925745436892612e-06, -1.8744856333796633e-06, -1.8232259435535525e-06, -1.771966140040604e-06, -1.720706450214493e-06, -1.6694466467015445e-06, -1.618186843188596e-06, -1.5669271533624851e-06, -1.5156674635363743e-06, -1.4644076600234257e-06, -1.4131479701973149e-06, -1.3618881666843663e-06, -1.3106284768582555e-06, -1.2593686733453069e-06, -1.2081088698323583e-06, -1.1568491800062475e-06, -1.105589376493299e-06, -1.0543295729803503e-06, -1.0030698831542395e-06, -9.518100796412909e-07, -9.005503898151801e-07, -8.492905863022315e-07, -7.980308396327018e-07, -7.467710929631721e-07, -6.955113462936424e-07, -6.442515996241127e-07, -5.92991852954583e-07, -5.417321062850533e-07, -4.904723027721047e-07, -4.3921258452428447e-07, -3.8795280943304533e-07, -3.3669306276351563e-07, -2.854333160939859e-07, -2.3417356942445622e-07, -1.829138085440718e-07, -1.3165404766368738e-07, -8.039430099415767e-08, -2.913455432462797e-08, 2.2125220766611164e-08, 7.338496743614087e-08, 1.2464471410567057e-07, 1.7590446077520028e-07, 2.271642216555847e-07, 2.784239825359691e-07, 3.296837292054988e-07, 3.809434758750285e-07, 4.3220325096626766e-07, 4.834629976357974e-07, 5.347227443053271e-07, 5.859824909748568e-07, 6.372422376443865e-07, 6.88502041157335e-07, 7.397617309834459e-07, 7.910215344963945e-07, 8.422812811659242e-07, 8.935410278354539e-07, 9.448007745049836e-07, 9.960605211745133e-07, 1.0473203246874618e-06, 1.0985800145135727e-06, 1.1498398180265212e-06, 1.201099507852632e-06, 1.2523593113655807e-06, 1.3036190011916915e-06, 1.35487880470464e-06]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 1.0, 12.0, 7.0, 13.0, 10.0, 4.0, 27.0, 27.0, 17.0, 32.0, 31.0, 77.0, 104.0, 60.0, 147.0, 110.0, 345.0, 483.0, 361.0, 1173.0, 977.0, 6017.0, 25252.0, 3944122.0, 204282.0, 4759.0, 2678.0, 694.0, 862.0, 512.0, 178.0, 275.0, 100.0, 148.0, 122.0, 49.0, 52.0, 24.0, 48.0, 29.0, 9.0, 16.0, 4.0, 12.0, 7.0, 4.0, 6.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.0994415283203125e-06, -3.0044466257095337e-06, -2.909451723098755e-06, -2.814456820487976e-06, -2.7194619178771973e-06, -2.6244670152664185e-06, -2.5294721126556396e-06, -2.434477210044861e-06, -2.339482307434082e-06, -2.2444874048233032e-06, -2.1494925022125244e-06, -2.0544975996017456e-06, -1.959502696990967e-06, -1.864507794380188e-06, -1.7695128917694092e-06, -1.6745179891586304e-06, -1.5795230865478516e-06, -1.4845281839370728e-06, -1.389533281326294e-06, -1.2945383787155151e-06, -1.1995434761047363e-06, -1.1045485734939575e-06, -1.0095536708831787e-06, -9.145587682723999e-07, -8.195638656616211e-07, -7.245689630508423e-07, -6.295740604400635e-07, -5.345791578292847e-07, -4.3958425521850586e-07, -3.4458935260772705e-07, -2.4959444999694824e-07, -1.5459954738616943e-07, -5.960464477539063e-08, 3.5390257835388184e-08, 1.30385160446167e-07, 2.253800630569458e-07, 3.203749656677246e-07, 4.153698682785034e-07, 5.103647708892822e-07, 6.05359673500061e-07, 7.003545761108398e-07, 7.953494787216187e-07, 8.903443813323975e-07, 9.853392839431763e-07, 1.080334186553955e-06, 1.1753290891647339e-06, 1.2703239917755127e-06, 1.3653188943862915e-06, 1.4603137969970703e-06, 1.5553086996078491e-06, 1.650303602218628e-06, 1.7452985048294067e-06, 1.8402934074401855e-06, 1.9352883100509644e-06, 2.030283212661743e-06, 2.125278115272522e-06, 2.2202730178833008e-06, 2.3152679204940796e-06, 2.4102628231048584e-06, 2.505257725715637e-06, 2.600252628326416e-06, 2.695247530937195e-06, 2.7902424335479736e-06, 2.8852373361587524e-06, 2.9802322387695312e-06]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 0.0, 6.0, 4.0, 0.0, 11.0, 10.0, 9.0, 0.0, 27.0, 20.0, 0.0, 28.0, 35.0, 0.0, 43.0, 55.0, 68.0, 0.0, 74.0, 76.0, 0.0, 72.0, 61.0, 70.0, 0.0, 54.0, 54.0, 0.0, 38.0, 41.0, 0.0, 26.0, 31.0, 21.0, 0.0, 16.0, 20.0, 0.0, 9.0, 5.0, 0.0, 4.0, 4.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.430511474609375e-06, -1.3886019587516785e-06, -1.346692442893982e-06, -1.3047829270362854e-06, -1.2628734111785889e-06, -1.2209638953208923e-06, -1.1790543794631958e-06, -1.1371448636054993e-06, -1.0952353477478027e-06, -1.0533258318901062e-06, -1.0114163160324097e-06, -9.695068001747131e-07, -9.275972843170166e-07, -8.856877684593201e-07, -8.437782526016235e-07, -8.01868736743927e-07, -7.599592208862305e-07, -7.180497050285339e-07, -6.761401891708374e-07, -6.342306733131409e-07, -5.923211574554443e-07, -5.504116415977478e-07, -5.085021257400513e-07, -4.6659260988235474e-07, -4.246830940246582e-07, -3.8277357816696167e-07, -3.4086406230926514e-07, -2.989545464515686e-07, -2.5704503059387207e-07, -2.1513551473617554e-07, -1.73225998878479e-07, -1.3131648302078247e-07, -8.940696716308594e-08, -4.7497451305389404e-08, -5.587935447692871e-09, 3.632158041000366e-08, 7.82310962677002e-08, 1.2014061212539673e-07, 1.6205012798309326e-07, 2.039596438407898e-07, 2.4586915969848633e-07, 2.8777867555618286e-07, 3.296881914138794e-07, 3.7159770727157593e-07, 4.1350722312927246e-07, 4.55416738986969e-07, 4.973262548446655e-07, 5.392357707023621e-07, 5.811452865600586e-07, 6.230548024177551e-07, 6.649643182754517e-07, 7.068738341331482e-07, 7.487833499908447e-07, 7.906928658485413e-07, 8.326023817062378e-07, 8.745118975639343e-07, 9.164214134216309e-07, 9.583309292793274e-07, 1.000240445137024e-06, 1.0421499609947205e-06, 1.084059476852417e-06, 1.1259689927101135e-06, 1.16787850856781e-06, 1.2097880244255066e-06, 1.2516975402832031e-06]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 11.0, 13.0, 28.0, 43.0, 93.0, 125.0, 275.0, 641.0, 1214.0, 5144.0, 180464.0, 3995714.0, 6828.0, 2223.0, 752.0, 382.0, 109.0, 91.0, 48.0, 34.0, 14.0, 13.0, 6.0, 1.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0192394256591797e-05, -9.910203516483307e-06, -9.628012776374817e-06, -9.345822036266327e-06, -9.063631296157837e-06, -8.781440556049347e-06, -8.499249815940857e-06, -8.217059075832367e-06, -7.934868335723877e-06, -7.652677595615387e-06, -7.370486855506897e-06, -7.088296115398407e-06, -6.806105375289917e-06, -6.523914635181427e-06, -6.241723895072937e-06, -5.959533154964447e-06, -5.677342414855957e-06, -5.395151674747467e-06, -5.112960934638977e-06, -4.830770194530487e-06, -4.548579454421997e-06, -4.266388714313507e-06, -3.984197974205017e-06, -3.702007234096527e-06, -3.419816493988037e-06, -3.137625753879547e-06, -2.855435013771057e-06, -2.573244273662567e-06, -2.291053533554077e-06, -2.008862793445587e-06, -1.7266720533370972e-06, -1.4444813132286072e-06, -1.1622905731201172e-06, -8.800998330116272e-07, -5.979090929031372e-07, -3.157183527946472e-07, -3.3527612686157227e-08, 2.4866312742233276e-07, 5.308538675308228e-07, 8.130446076393127e-07, 1.0952353477478027e-06, 1.3774260878562927e-06, 1.6596168279647827e-06, 1.9418075680732727e-06, 2.2239983081817627e-06, 2.5061890482902527e-06, 2.7883797883987427e-06, 3.0705705285072327e-06, 3.3527612686157227e-06, 3.6349520087242126e-06, 3.917142748832703e-06, 4.199333488941193e-06, 4.481524229049683e-06, 4.763714969158173e-06, 5.045905709266663e-06, 5.328096449375153e-06, 5.610287189483643e-06, 5.8924779295921326e-06, 6.1746686697006226e-06, 6.4568594098091125e-06, 6.7390501499176025e-06, 7.0212408900260925e-06, 7.3034316301345825e-06, 7.5856223702430725e-06, 7.867813110351562e-06]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 6.0, 0.0, 30.0, 219.0, 0.0, 3547.0, 0.0, 223.0, 25.0, 0.0, 9.0, 0.0, 6.0, 5.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.940696716308594e-07, -8.577480912208557e-07, -8.21426510810852e-07, -7.851049304008484e-07, -7.487833499908447e-07, -7.124617695808411e-07, -6.761401891708374e-07, -6.398186087608337e-07, -6.034970283508301e-07, -5.671754479408264e-07, -5.308538675308228e-07, -4.945322871208191e-07, -4.5821070671081543e-07, -4.2188912630081177e-07, -3.855675458908081e-07, -3.4924596548080444e-07, -3.129243850708008e-07, -2.766028046607971e-07, -2.4028122425079346e-07, -2.039596438407898e-07, -1.6763806343078613e-07, -1.3131648302078247e-07, -9.499490261077881e-08, -5.8673322200775146e-08, -2.2351741790771484e-08, 1.3969838619232178e-08, 5.029141902923584e-08, 8.66129994392395e-08, 1.2293457984924316e-07, 1.5925616025924683e-07, 1.955777406692505e-07, 2.3189932107925415e-07, 2.682209014892578e-07, 3.045424818992615e-07, 3.4086406230926514e-07, 3.771856427192688e-07, 4.1350722312927246e-07, 4.498288035392761e-07, 4.861503839492798e-07, 5.224719643592834e-07, 5.587935447692871e-07, 5.951151251792908e-07, 6.314367055892944e-07, 6.677582859992981e-07, 7.040798664093018e-07, 7.404014468193054e-07, 7.767230272293091e-07, 8.130446076393127e-07, 8.493661880493164e-07, 8.856877684593201e-07, 9.220093488693237e-07, 9.583309292793274e-07, 9.94652509689331e-07, 1.0309740900993347e-06, 1.0672956705093384e-06, 1.103617250919342e-06, 1.1399388313293457e-06, 1.1762604117393494e-06, 1.212581992149353e-06, 1.2489035725593567e-06, 1.2852251529693604e-06, 1.321546733379364e-06, 1.3578683137893677e-06, 1.3941898941993713e-06, 1.430511474609375e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 5.0, 5.0, 4.0, 11.0, 10.0, 12.0, 9.0, 11.0, 19.0, 32.0, 39.0, 53.0, 74.0, 125.0, 137.0, 125.0, 90.0, 55.0, 39.0, 31.0, 35.0, 14.0, 21.0, 8.0, 8.0, 2.0, 7.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6175649761862587e-06, -1.5544302414127742e-06, -1.4912955066392897e-06, -1.4281607718658051e-06, -1.3650260370923206e-06, -1.3018914160056738e-06, -1.2387566812321893e-06, -1.1756219464587048e-06, -1.1124872116852202e-06, -1.0493524769117357e-06, -9.862177421382512e-07, -9.230830642081855e-07, -8.59948329434701e-07, -7.968135946612165e-07, -7.336789167311508e-07, -6.705441819576663e-07, -6.074094471841818e-07, -5.442747124106972e-07, -4.811399776372127e-07, -4.1800529970714706e-07, -3.5487056493366254e-07, -2.91735830160178e-07, -2.2860112380840292e-07, -1.6546641745662782e-07, -1.023316826831433e-07, -3.919696212051349e-08, 2.393775844211632e-08, 8.707247900474613e-08, 1.5020719956737594e-07, 2.1334193434086046e-07, 2.7647664069263556e-07, 3.3961134704441065e-07, 4.027460818178952e-07, 4.658808165913797e-07, 5.290155513648642e-07, 5.921502292949299e-07, 6.552849640684144e-07, 7.184196988418989e-07, 7.815543767719646e-07, 8.446891115454491e-07, 9.078238463189336e-07, 9.709585810924182e-07, 1.0340933158659027e-06, 1.0972280506393872e-06, 1.160362671726034e-06, 1.2234975201863563e-06, 1.286632141273003e-06, 1.3497668760464876e-06, 1.4129016108199721e-06, 1.4760363455934566e-06, 1.5391710803669412e-06, 1.6023058151404257e-06, 1.6654405499139102e-06, 1.728575171000557e-06, 1.7917099057740415e-06, 1.854844640547526e-06, 1.917979261634173e-06, 1.9811138827208197e-06, 2.044248731181142e-06, 2.1073833522677887e-06, 2.170518200728111e-06, 2.2336528218147578e-06, 2.29678767027508e-06, 2.359922291361727e-06, 2.423057139822049e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 5.0, 4.0, 9.0, 11.0, 16.0, 23.0, 27.0, 33.0, 39.0, 53.0, 39.0, 51.0, 63.0, 63.0, 49.0, 47.0, 73.0, 41.0, 53.0, 43.0, 43.0, 36.0, 31.0, 20.0, 21.0, 31.0, 27.0, 10.0, 12.0, 2.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.1186735921219224e-06, -2.067048171738861e-06, -2.0154227513558e-06, -1.963797558346414e-06, -1.9121721379633527e-06, -1.8605467175802914e-06, -1.8089212971972302e-06, -1.7572958768141689e-06, -1.7056705701179453e-06, -1.654045149734884e-06, -1.6024198430386605e-06, -1.5507944226555992e-06, -1.499169002272538e-06, -1.4475436955763143e-06, -1.395918275193253e-06, -1.3442929684970295e-06, -1.2926675481139682e-06, -1.241042127730907e-06, -1.1894168210346834e-06, -1.137791400651622e-06, -1.0861660939553985e-06, -1.0345406735723373e-06, -9.82915253189276e-07, -9.312898896496336e-07, -8.796645261099911e-07, -8.280391625703487e-07, -7.764137990307063e-07, -7.24788378647645e-07, -6.731630151080026e-07, -6.215376515683602e-07, -5.699122311852989e-07, -5.182868676456565e-07, -4.6666161779285176e-07, -4.1503625425320934e-07, -3.634108622918575e-07, -3.1178547033050563e-07, -2.601601067908632e-07, -2.085347432512208e-07, -1.5690935128986894e-07, -1.0528395932851708e-07, -5.3658595788874663e-08, -2.0332180383775267e-09, 4.959215971211961e-08, 1.0121753746261675e-07, 1.5284291521311388e-07, 2.044682787527563e-07, 2.5609367071410816e-07, 3.0771906267546e-07, 3.5934442621510243e-07, 4.1096978975474485e-07, 4.625951817160967e-07, 5.142205736774486e-07, 5.65845937217091e-07, 6.174713007567334e-07, 6.690967211397947e-07, 7.207220846794371e-07, 7.723474482190795e-07, 8.239728117587219e-07, 8.755981752983644e-07, 9.272235956814256e-07, 9.788489023776492e-07, 1.0304743227607105e-06, 1.0820997431437718e-06, 1.133725163526833e-06, 1.1853504702230566e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 7.0, 4.0, 3.0, 17.0, 21.0, 33.0, 24.0, 82.0, 168.0, 123.0, 437.0, 886.0, 1764.0, 1626.0, 6048.0, 16310.0, 52997.0, 71483.0, 568732.0, 247349.0, 52775.0, 10492.0, 9705.0, 3934.0, 1037.0, 1200.0, 605.0, 332.0, 87.0, 127.0, 61.0, 29.0, 11.0, 22.0, 11.0, 5.0, 4.0, 7.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86102294921875e-06, -2.757646143436432e-06, -2.6542693376541138e-06, -2.5508925318717957e-06, -2.4475157260894775e-06, -2.3441389203071594e-06, -2.2407621145248413e-06, -2.137385308742523e-06, -2.034008502960205e-06, -1.930631697177887e-06, -1.8272548913955688e-06, -1.7238780856132507e-06, -1.6205012798309326e-06, -1.5171244740486145e-06, -1.4137476682662964e-06, -1.3103708624839783e-06, -1.2069940567016602e-06, -1.103617250919342e-06, -1.000240445137024e-06, -8.968636393547058e-07, -7.934868335723877e-07, -6.901100277900696e-07, -5.867332220077515e-07, -4.833564162254333e-07, -3.7997961044311523e-07, -2.766028046607971e-07, -1.73225998878479e-07, -6.984919309616089e-08, 3.3527612686157227e-08, 1.3690441846847534e-07, 2.4028122425079346e-07, 3.4365803003311157e-07, 4.470348358154297e-07, 5.504116415977478e-07, 6.537884473800659e-07, 7.57165253162384e-07, 8.605420589447021e-07, 9.639188647270203e-07, 1.0672956705093384e-06, 1.1706724762916565e-06, 1.2740492820739746e-06, 1.3774260878562927e-06, 1.4808028936386108e-06, 1.584179699420929e-06, 1.687556505203247e-06, 1.7909333109855652e-06, 1.8943101167678833e-06, 1.9976869225502014e-06, 2.1010637283325195e-06, 2.2044405341148376e-06, 2.3078173398971558e-06, 2.411194145679474e-06, 2.514570951461792e-06, 2.61794775724411e-06, 2.7213245630264282e-06, 2.8247013688087463e-06, 2.9280781745910645e-06, 3.0314549803733826e-06, 3.1348317861557007e-06, 3.238208591938019e-06, 3.341585397720337e-06, 3.444962203502655e-06, 3.548339009284973e-06, 3.6517158150672913e-06, 3.7550926208496094e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 6.0, 10.0, 12.0, 18.0, 0.0, 23.0, 20.0, 38.0, 43.0, 0.0, 34.0, 54.0, 70.0, 57.0, 0.0, 77.0, 72.0, 87.0, 63.0, 0.0, 62.0, 60.0, 43.0, 36.0, 0.0, 36.0, 17.0, 22.0, 7.0, 0.0, 15.0, 17.0, 4.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-1.9669532775878906e-06, -1.9194558262825012e-06, -1.8719583749771118e-06, -1.8244609236717224e-06, -1.776963472366333e-06, -1.7294660210609436e-06, -1.6819685697555542e-06, -1.6344711184501648e-06, -1.5869736671447754e-06, -1.539476215839386e-06, -1.4919787645339966e-06, -1.4444813132286072e-06, -1.3969838619232178e-06, -1.3494864106178284e-06, -1.301988959312439e-06, -1.2544915080070496e-06, -1.2069940567016602e-06, -1.1594966053962708e-06, -1.1119991540908813e-06, -1.064501702785492e-06, -1.0170042514801025e-06, -9.695068001747131e-07, -9.220093488693237e-07, -8.745118975639343e-07, -8.270144462585449e-07, -7.795169949531555e-07, -7.320195436477661e-07, -6.845220923423767e-07, -6.370246410369873e-07, -5.895271897315979e-07, -5.420297384262085e-07, -4.945322871208191e-07, -4.470348358154297e-07, -3.995373845100403e-07, -3.520399332046509e-07, -3.045424818992615e-07, -2.5704503059387207e-07, -2.0954757928848267e-07, -1.6205012798309326e-07, -1.1455267667770386e-07, -6.705522537231445e-08, -1.955777406692505e-08, 2.7939677238464355e-08, 7.543712854385376e-08, 1.2293457984924316e-07, 1.7043203115463257e-07, 2.1792948246002197e-07, 2.654269337654114e-07, 3.129243850708008e-07, 3.604218363761902e-07, 4.079192876815796e-07, 4.55416738986969e-07, 5.029141902923584e-07, 5.504116415977478e-07, 5.979090929031372e-07, 6.454065442085266e-07, 6.92903995513916e-07, 7.404014468193054e-07, 7.878988981246948e-07, 8.353963494300842e-07, 8.828938007354736e-07, 9.30391252040863e-07, 9.778887033462524e-07, 1.0253861546516418e-06, 1.0728836059570312e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 1.0, 11.0, 7.0, 9.0, 8.0, 18.0, 39.0, 26.0, 40.0, 56.0, 61.0, 210.0, 115.0, 176.0, 202.0, 304.0, 811.0, 572.0, 948.0, 1287.0, 1758.0, 7481.0, 9689.0, 1000787.0, 9667.0, 4800.0, 4539.0, 1287.0, 972.0, 603.0, 457.0, 635.0, 180.0, 180.0, 114.0, 107.0, 152.0, 56.0, 40.0, 30.0, 20.0, 43.0, 15.0, 6.0, 13.0, 6.0, 11.0, 5.0, 1.0, 1.0, 2.0], "bins": [-2.6226043701171875e-06, -2.5508925318717957e-06, -2.479180693626404e-06, -2.407468855381012e-06, -2.33575701713562e-06, -2.2640451788902283e-06, -2.1923333406448364e-06, -2.1206215023994446e-06, -2.0489096641540527e-06, -1.977197825908661e-06, -1.905485987663269e-06, -1.8337741494178772e-06, -1.7620623111724854e-06, -1.6903504729270935e-06, -1.6186386346817017e-06, -1.5469267964363098e-06, -1.475214958190918e-06, -1.4035031199455261e-06, -1.3317912817001343e-06, -1.2600794434547424e-06, -1.1883676052093506e-06, -1.1166557669639587e-06, -1.044943928718567e-06, -9.73232090473175e-07, -9.015202522277832e-07, -8.298084139823914e-07, -7.580965757369995e-07, -6.863847374916077e-07, -6.146728992462158e-07, -5.42961061000824e-07, -4.7124922275543213e-07, -3.995373845100403e-07, -3.2782554626464844e-07, -2.561137080192566e-07, -1.8440186977386475e-07, -1.126900315284729e-07, -4.0978193283081055e-08, 3.073364496231079e-08, 1.0244548320770264e-07, 1.7415732145309448e-07, 2.4586915969848633e-07, 3.175809979438782e-07, 3.8929283618927e-07, 4.6100467443466187e-07, 5.327165126800537e-07, 6.044283509254456e-07, 6.761401891708374e-07, 7.478520274162292e-07, 8.195638656616211e-07, 8.912757039070129e-07, 9.629875421524048e-07, 1.0346993803977966e-06, 1.1064112186431885e-06, 1.1781230568885803e-06, 1.2498348951339722e-06, 1.321546733379364e-06, 1.3932585716247559e-06, 1.4649704098701477e-06, 1.5366822481155396e-06, 1.6083940863609314e-06, 1.6801059246063232e-06, 1.751817762851715e-06, 1.823529601097107e-06, 1.8952414393424988e-06, 1.9669532775878906e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 25.0, 0.0, 0.0, 0.0, 0.0, 933.0, 0.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.980232238769531e-07, -2.868473529815674e-07, -2.7567148208618164e-07, -2.644956111907959e-07, -2.5331974029541016e-07, -2.421438694000244e-07, -2.3096799850463867e-07, -2.1979212760925293e-07, -2.086162567138672e-07, -1.9744038581848145e-07, -1.862645149230957e-07, -1.7508864402770996e-07, -1.6391277313232422e-07, -1.5273690223693848e-07, -1.4156103134155273e-07, -1.30385160446167e-07, -1.1920928955078125e-07, -1.0803341865539551e-07, -9.685754776000977e-08, -8.568167686462402e-08, -7.450580596923828e-08, -6.332993507385254e-08, -5.21540641784668e-08, -4.0978193283081055e-08, -2.9802322387695312e-08, -1.862645149230957e-08, -7.450580596923828e-09, 3.725290298461914e-09, 1.4901161193847656e-08, 2.60770320892334e-08, 3.725290298461914e-08, 4.842877388000488e-08, 5.960464477539063e-08, 7.078051567077637e-08, 8.195638656616211e-08, 9.313225746154785e-08, 1.043081283569336e-07, 1.1548399925231934e-07, 1.2665987014770508e-07, 1.3783574104309082e-07, 1.4901161193847656e-07, 1.601874828338623e-07, 1.7136335372924805e-07, 1.825392246246338e-07, 1.9371509552001953e-07, 2.0489096641540527e-07, 2.1606683731079102e-07, 2.2724270820617676e-07, 2.384185791015625e-07, 2.4959444999694824e-07, 2.60770320892334e-07, 2.7194619178771973e-07, 2.8312206268310547e-07, 2.942979335784912e-07, 3.0547380447387695e-07, 3.166496753692627e-07, 3.2782554626464844e-07, 3.390014171600342e-07, 3.501772880554199e-07, 3.6135315895080566e-07, 3.725290298461914e-07, 3.8370490074157715e-07, 3.948807716369629e-07, 4.0605664253234863e-07, 4.172325134277344e-07]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 9.0, 4.0, 10.0, 8.0, 11.0, 24.0, 18.0, 18.0, 39.0, 47.0, 68.0, 96.0, 137.0, 134.0, 93.0, 73.0, 39.0, 32.0, 31.0, 24.0, 18.0, 11.0, 7.0, 5.0, 7.0, 6.0, 8.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.774855832081812e-06, -1.717669761092111e-06, -1.66048369010241e-06, -1.603297619112709e-06, -1.5461115481230081e-06, -1.4889254771333071e-06, -1.4317392924567685e-06, -1.3745532214670675e-06, -1.3173671504773665e-06, -1.2601810794876656e-06, -1.2029950084979646e-06, -1.1458089375082636e-06, -1.0886228665185627e-06, -1.0314367955288617e-06, -9.742507245391607e-07, -9.170645967060409e-07, -8.598785825597588e-07, -8.026925115700578e-07, -7.455064405803569e-07, -6.883203695906559e-07, -6.311342986009549e-07, -5.73948227611254e-07, -5.167620997781341e-07, -4.595760287884332e-07, -4.023899577987322e-07, -3.4520388680903125e-07, -2.880178158193303e-07, -2.3083171640791988e-07, -1.7364564541821892e-07, -1.1645957442851795e-07, -5.927347501710756e-08, -2.087404027406592e-09, 5.509855327545665e-08, 1.1228463137058498e-07, 1.694707094657133e-07, 2.2665679466626898e-07, 2.8384286565596994e-07, 3.410289366456709e-07, 3.982150360570813e-07, 4.5540110704678227e-07, 5.125871780364832e-07, 5.697732490261842e-07, 6.269593200158852e-07, 6.84145447849005e-07, 7.41331518838706e-07, 7.985175898284069e-07, 8.557036608181079e-07, 9.128897318078089e-07, 9.700758027975098e-07, 1.0272618737872108e-06, 1.0844479447769118e-06, 1.1416340157666127e-06, 1.1988200867563137e-06, 1.2560061577460147e-06, 1.3131923424225533e-06, 1.3703784134122543e-06, 1.4275644844019553e-06, 1.4847505553916562e-06, 1.5419366263813572e-06, 1.5991226973710582e-06, 1.6563087683607591e-06, 1.71349483935046e-06, 1.770680910340161e-06, 1.827866981329862e-06, 1.885053052319563e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 12.0, 4.0, 5.0, 8.0, 14.0, 15.0, 23.0, 25.0, 36.0, 40.0, 48.0, 40.0, 57.0, 60.0, 60.0, 54.0, 49.0, 73.0, 40.0, 52.0, 42.0, 42.0, 38.0, 25.0, 22.0, 26.0, 28.0, 24.0, 11.0, 11.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.9624881133495364e-06, -1.91462277143728e-06, -1.8667574295250233e-06, -1.8188922012996045e-06, -1.771026859387348e-06, -1.7231615174750914e-06, -1.6752962892496726e-06, -1.627430947337416e-06, -1.5795656054251594e-06, -1.5317002635129029e-06, -1.4838349216006463e-06, -1.4359696933752275e-06, -1.388104351462971e-06, -1.3402390095507144e-06, -1.2923737813252956e-06, -1.244508439413039e-06, -1.1966430975007825e-06, -1.148777755588526e-06, -1.1009124136762694e-06, -1.0530471854508505e-06, -1.005181843538594e-06, -9.573165016263374e-07, -9.094512165574997e-07, -8.61585931488662e-07, -8.137205895764055e-07, -7.658552476641489e-07, -7.179899625953112e-07, -6.701246775264735e-07, -6.22259335614217e-07, -5.743939937019604e-07, -5.265287086331227e-07, -4.78663423564285e-07, -4.307981953388662e-07, -3.829328818483191e-07, -3.3506756835777196e-07, -2.8720225486722484e-07, -2.393369413766777e-07, -1.914716278861306e-07, -1.4360631439558347e-07, -9.574100090503634e-08, -4.787568741448922e-08, -1.0373923942097463e-11, 4.7854939566605026e-08, 9.572025305715215e-08, 1.4358556654769927e-07, 1.914508800382464e-07, 2.393161935287935e-07, 2.8718150701934064e-07, 3.3504682050988777e-07, 3.829121340004349e-07, 4.30777447490982e-07, 4.786427325598197e-07, 5.265080744720763e-07, 5.743734163843328e-07, 6.222387014531705e-07, 6.701039865220082e-07, 7.179693284342648e-07, 7.658346703465213e-07, 8.13699955415359e-07, 8.615652404841967e-07, 9.094305823964532e-07, 9.572959243087098e-07, 1.0051612662209664e-06, 1.0530264944463852e-06, 1.1008918363586417e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 7.0, 11.0, 10.0, 12.0, 21.0, 24.0, 41.0, 62.0, 104.0, 175.0, 464.0, 610.0, 1080.0, 1936.0, 3448.0, 6064.0, 11296.0, 20607.0, 40722.0, 87913.0, 241585.0, 369437.0, 141689.0, 58725.0, 28565.0, 15093.0, 8297.0, 4638.0, 2573.0, 1387.0, 778.0, 582.0, 219.0, 128.0, 76.0, 51.0, 39.0, 24.0, 12.0, 16.0, 8.0, 10.0, 8.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.933906555175781e-06, -3.8119032979011536e-06, -3.689900040626526e-06, -3.567896783351898e-06, -3.4458935260772705e-06, -3.323890268802643e-06, -3.201887011528015e-06, -3.0798837542533875e-06, -2.9578804969787598e-06, -2.835877239704132e-06, -2.7138739824295044e-06, -2.5918707251548767e-06, -2.469867467880249e-06, -2.3478642106056213e-06, -2.2258609533309937e-06, -2.103857696056366e-06, -1.9818544387817383e-06, -1.8598511815071106e-06, -1.737847924232483e-06, -1.6158446669578552e-06, -1.4938414096832275e-06, -1.3718381524085999e-06, -1.2498348951339722e-06, -1.1278316378593445e-06, -1.0058283805847168e-06, -8.838251233100891e-07, -7.618218660354614e-07, -6.398186087608337e-07, -5.178153514862061e-07, -3.9581209421157837e-07, -2.738088369369507e-07, -1.51805579662323e-07, -2.9802322387695312e-08, 9.220093488693237e-08, 2.1420419216156006e-07, 3.3620744943618774e-07, 4.5821070671081543e-07, 5.802139639854431e-07, 7.022172212600708e-07, 8.242204785346985e-07, 9.462237358093262e-07, 1.0682269930839539e-06, 1.1902302503585815e-06, 1.3122335076332092e-06, 1.434236764907837e-06, 1.5562400221824646e-06, 1.6782432794570923e-06, 1.80024653673172e-06, 1.9222497940063477e-06, 2.0442530512809753e-06, 2.166256308555603e-06, 2.2882595658302307e-06, 2.4102628231048584e-06, 2.532266080379486e-06, 2.6542693376541138e-06, 2.7762725949287415e-06, 2.898275852203369e-06, 3.020279109477997e-06, 3.1422823667526245e-06, 3.264285624027252e-06, 3.38628888130188e-06, 3.5082921385765076e-06, 3.6302953958511353e-06, 3.752298653125763e-06, 3.874301910400391e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 8.0, 7.0, 7.0, 0.0, 16.0, 28.0, 28.0, 0.0, 41.0, 43.0, 58.0, 60.0, 0.0, 86.0, 79.0, 88.0, 0.0, 74.0, 68.0, 77.0, 0.0, 53.0, 35.0, 44.0, 0.0, 26.0, 32.0, 13.0, 13.0, 0.0, 9.0, 10.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7285346984863281e-06, -1.6828998923301697e-06, -1.6372650861740112e-06, -1.5916302800178528e-06, -1.5459954738616943e-06, -1.5003606677055359e-06, -1.4547258615493774e-06, -1.409091055393219e-06, -1.3634562492370605e-06, -1.317821443080902e-06, -1.2721866369247437e-06, -1.2265518307685852e-06, -1.1809170246124268e-06, -1.1352822184562683e-06, -1.0896474123001099e-06, -1.0440126061439514e-06, -9.98377799987793e-07, -9.527429938316345e-07, -9.071081876754761e-07, -8.614733815193176e-07, -8.158385753631592e-07, -7.702037692070007e-07, -7.245689630508423e-07, -6.789341568946838e-07, -6.332993507385254e-07, -5.876645445823669e-07, -5.420297384262085e-07, -4.9639493227005e-07, -4.507601261138916e-07, -4.0512531995773315e-07, -3.594905138015747e-07, -3.1385570764541626e-07, -2.682209014892578e-07, -2.2258609533309937e-07, -1.7695128917694092e-07, -1.3131648302078247e-07, -8.568167686462402e-08, -4.0046870708465576e-08, 5.587935447692871e-09, 5.122274160385132e-08, 9.685754776000977e-08, 1.424923539161682e-07, 1.8812716007232666e-07, 2.337619662284851e-07, 2.7939677238464355e-07, 3.25031578540802e-07, 3.7066638469696045e-07, 4.163011908531189e-07, 4.6193599700927734e-07, 5.075708031654358e-07, 5.532056093215942e-07, 5.988404154777527e-07, 6.444752216339111e-07, 6.901100277900696e-07, 7.35744833946228e-07, 7.813796401023865e-07, 8.270144462585449e-07, 8.726492524147034e-07, 9.182840585708618e-07, 9.639188647270203e-07, 1.0095536708831787e-06, 1.0551884770393372e-06, 1.1008232831954956e-06, 1.146458089351654e-06, 1.1920928955078125e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 4.0, 3.0, 6.0, 3.0, 9.0, 14.0, 18.0, 29.0, 29.0, 38.0, 68.0, 85.0, 158.0, 229.0, 743.0, 931.0, 1708.0, 3232.0, 6201.0, 12221.0, 24981.0, 106484.0, 250174.0, 395180.0, 140859.0, 54398.0, 25073.0, 12086.0, 8073.0, 2455.0, 1299.0, 695.0, 402.0, 217.0, 142.0, 148.0, 37.0, 41.0, 18.0, 12.0, 18.0, 7.0, 16.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.874301910400391e-06, -3.74671071767807e-06, -3.6191195249557495e-06, -3.491528332233429e-06, -3.3639371395111084e-06, -3.236345946788788e-06, -3.1087547540664673e-06, -2.9811635613441467e-06, -2.853572368621826e-06, -2.7259811758995056e-06, -2.598389983177185e-06, -2.4707987904548645e-06, -2.343207597732544e-06, -2.2156164050102234e-06, -2.088025212287903e-06, -1.9604340195655823e-06, -1.8328428268432617e-06, -1.7052516341209412e-06, -1.5776604413986206e-06, -1.4500692486763e-06, -1.3224780559539795e-06, -1.194886863231659e-06, -1.0672956705093384e-06, -9.397044777870178e-07, -8.121132850646973e-07, -6.845220923423767e-07, -5.569308996200562e-07, -4.293397068977356e-07, -3.0174851417541504e-07, -1.7415732145309448e-07, -4.6566128730773926e-08, 8.102506399154663e-08, 2.086162567138672e-07, 3.3620744943618774e-07, 4.637986421585083e-07, 5.913898348808289e-07, 7.189810276031494e-07, 8.4657222032547e-07, 9.741634130477905e-07, 1.101754605770111e-06, 1.2293457984924316e-06, 1.3569369912147522e-06, 1.4845281839370728e-06, 1.6121193766593933e-06, 1.7397105693817139e-06, 1.8673017621040344e-06, 1.994892954826355e-06, 2.1224841475486755e-06, 2.250075340270996e-06, 2.3776665329933167e-06, 2.505257725715637e-06, 2.6328489184379578e-06, 2.7604401111602783e-06, 2.888031303882599e-06, 3.0156224966049194e-06, 3.14321368932724e-06, 3.2708048820495605e-06, 3.398396074771881e-06, 3.5259872674942017e-06, 3.6535784602165222e-06, 3.7811696529388428e-06, 3.908760845661163e-06, 4.036352038383484e-06, 4.1639432311058044e-06, 4.291534423828125e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 7.0, 0.0, 0.0, 22.0, 0.0, 27.0, 0.0, 30.0, 0.0, 59.0, 0.0, 0.0, 56.0, 0.0, 72.0, 0.0, 84.0, 0.0, 0.0, 97.0, 0.0, 98.0, 0.0, 79.0, 0.0, 88.0, 0.0, 0.0, 63.0, 0.0, 72.0, 0.0, 43.0, 0.0, 0.0, 41.0, 0.0, 26.0, 0.0, 21.0, 0.0, 11.0, 0.0, 0.0, 5.0, 0.0, 7.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.940696716308594e-07, -8.67992639541626e-07, -8.419156074523926e-07, -8.158385753631592e-07, -7.897615432739258e-07, -7.636845111846924e-07, -7.37607479095459e-07, -7.115304470062256e-07, -6.854534149169922e-07, -6.593763828277588e-07, -6.332993507385254e-07, -6.07222318649292e-07, -5.811452865600586e-07, -5.550682544708252e-07, -5.289912223815918e-07, -5.029141902923584e-07, -4.76837158203125e-07, -4.507601261138916e-07, -4.246830940246582e-07, -3.986060619354248e-07, -3.725290298461914e-07, -3.46451997756958e-07, -3.203749656677246e-07, -2.942979335784912e-07, -2.682209014892578e-07, -2.421438694000244e-07, -2.1606683731079102e-07, -1.8998980522155762e-07, -1.6391277313232422e-07, -1.3783574104309082e-07, -1.1175870895385742e-07, -8.568167686462402e-08, -5.960464477539063e-08, -3.3527612686157227e-08, -7.450580596923828e-09, 1.862645149230957e-08, 4.470348358154297e-08, 7.078051567077637e-08, 9.685754776000977e-08, 1.2293457984924316e-07, 1.4901161193847656e-07, 1.7508864402770996e-07, 2.0116567611694336e-07, 2.2724270820617676e-07, 2.5331974029541016e-07, 2.7939677238464355e-07, 3.0547380447387695e-07, 3.3155083656311035e-07, 3.5762786865234375e-07, 3.8370490074157715e-07, 4.0978193283081055e-07, 4.3585896492004395e-07, 4.6193599700927734e-07, 4.880130290985107e-07, 5.140900611877441e-07, 5.401670932769775e-07, 5.662441253662109e-07, 5.923211574554443e-07, 6.183981895446777e-07, 6.444752216339111e-07, 6.705522537231445e-07, 6.966292858123779e-07, 7.227063179016113e-07, 7.487833499908447e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 0.0, 5.0, 0.0, 4.0, 2.0, 1.0, 3.0, 4.0, 7.0, 10.0, 6.0, 17.0, 17.0, 18.0, 14.0, 39.0, 47.0, 56.0, 75.0, 121.0, 132.0, 109.0, 67.0, 66.0, 41.0, 34.0, 16.0, 14.0, 17.0, 11.0, 10.0, 2.0, 5.0, 9.0, 3.0, 3.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.7180251461468288e-06, -1.6706817405065522e-06, -1.6233384485531133e-06, -1.5759951565996744e-06, -1.5286517509593978e-06, -1.4813083453191211e-06, -1.4339650533656823e-06, -1.3866217614122434e-06, -1.3392783557719667e-06, -1.2919349501316901e-06, -1.2445916581782512e-06, -1.1972483662248123e-06, -1.1499049605845357e-06, -1.1025615549442591e-06, -1.0552182629908202e-06, -1.0078749710373813e-06, -9.605315653971047e-07, -9.13188216600247e-07, -8.658448678033892e-07, -8.185015190065315e-07, -7.711581702096737e-07, -7.238148214128159e-07, -6.764714726159582e-07, -6.291281238191004e-07, -5.817847750222427e-07, -5.344414262253849e-07, -4.870980774285272e-07, -4.397547286316694e-07, -3.9241137983481167e-07, -3.450680310379539e-07, -2.9772468224109616e-07, -2.503813334442384e-07, -2.0303787096054293e-07, -1.5569452216368518e-07, -1.0835117336682742e-07, -6.100782456996967e-08, -1.3664475773111917e-08, 3.3678873023745837e-08, 8.102222182060359e-08, 1.2836557061746134e-07, 1.757089194143191e-07, 2.2305226821117685e-07, 2.703956170080346e-07, 3.1773896580489236e-07, 3.650823146017501e-07, 4.1242566339860787e-07, 4.597690121954656e-07, 5.071123609923234e-07, 5.544557097891811e-07, 6.017990585860389e-07, 6.491424073828966e-07, 6.964857561797544e-07, 7.438291049766121e-07, 7.911724537734699e-07, 8.385158025703277e-07, 8.858591513671854e-07, 9.332025001640432e-07, 9.80545792117482e-07, 1.0278891977577587e-06, 1.0752326033980353e-06, 1.1225758953514742e-06, 1.169919187304913e-06, 1.2172625929451897e-06, 1.2646059985854663e-06, 1.3119492905389052e-06]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 6.0, 8.0, 14.0, 15.0, 22.0, 14.0, 24.0, 35.0, 38.0, 39.0, 42.0, 55.0, 47.0, 49.0, 58.0, 56.0, 65.0, 48.0, 55.0, 45.0, 37.0, 38.0, 32.0, 26.0, 33.0, 15.0, 21.0, 12.0, 11.0, 10.0, 9.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.677600153016101e-06, -1.6327179537256598e-06, -1.5878356407483807e-06, -1.5429534414579393e-06, -1.498071242167498e-06, -1.4531890428770566e-06, -1.4083068435866153e-06, -1.3634245306093362e-06, -1.3185423313188949e-06, -1.2736601320284535e-06, -1.2287778190511744e-06, -1.183895619760733e-06, -1.1390134204702917e-06, -1.0941312211798504e-06, -1.049249021889409e-06, -1.00436670891213e-06, -9.594845096216886e-07, -9.146023103312473e-07, -8.697200541973871e-07, -8.248377980635269e-07, -7.799555987730855e-07, -7.350733994826442e-07, -6.90191143348784e-07, -6.453088872149237e-07, -6.004266879244824e-07, -5.55544488634041e-07, -5.106622325001808e-07, -4.6578000478803006e-07, -4.208977770758793e-07, -3.760155493637285e-07, -3.311333216515777e-07, -2.8625109393942694e-07, -2.4136886622727616e-07, -1.9648663851512538e-07, -1.516044108029746e-07, -1.0672218309082382e-07, -6.183995537867304e-08, -1.695772766652226e-08, 2.792450004562852e-08, 7.28067277577793e-08, 1.1768895546993008e-07, 1.6257118318208086e-07, 2.0745341089423164e-07, 2.523356386063824e-07, 2.972178663185332e-07, 3.42100094030684e-07, 3.8698232174283476e-07, 4.3186454945498554e-07, 4.767467771671363e-07, 5.216289764575777e-07, 5.665112325914379e-07, 6.113934887252981e-07, 6.562756880157394e-07, 7.011578873061808e-07, 7.46040143440041e-07, 7.909223995739012e-07, 8.358045988643426e-07, 8.806867981547839e-07, 9.255690542886441e-07, 9.704513104225043e-07, 1.0153335097129457e-06, 1.060215709003387e-06, 1.1050979082938284e-06, 1.1499802212711074e-06, 1.1948624205615488e-06]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 8.0, 10.0, 14.0, 13.0, 27.0, 43.0, 61.0, 57.0, 136.0, 228.0, 166.0, 491.0, 857.0, 2197.0, 10218.0, 4052689.0, 122508.0, 2456.0, 497.0, 617.0, 369.0, 216.0, 84.0, 104.0, 75.0, 30.0, 36.0, 23.0, 11.0, 3.0, 7.0, 9.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.993511199951172e-06, -3.890134394168854e-06, -3.7867575883865356e-06, -3.6833807826042175e-06, -3.5800039768218994e-06, -3.4766271710395813e-06, -3.373250365257263e-06, -3.269873559474945e-06, -3.166496753692627e-06, -3.063119947910309e-06, -2.9597431421279907e-06, -2.8563663363456726e-06, -2.7529895305633545e-06, -2.6496127247810364e-06, -2.5462359189987183e-06, -2.4428591132164e-06, -2.339482307434082e-06, -2.236105501651764e-06, -2.132728695869446e-06, -2.0293518900871277e-06, -1.9259750843048096e-06, -1.8225982785224915e-06, -1.7192214727401733e-06, -1.6158446669578552e-06, -1.5124678611755371e-06, -1.409091055393219e-06, -1.3057142496109009e-06, -1.2023374438285828e-06, -1.0989606380462646e-06, -9.955838322639465e-07, -8.922070264816284e-07, -7.888302206993103e-07, -6.854534149169922e-07, -5.820766091346741e-07, -4.78699803352356e-07, -3.7532299757003784e-07, -2.7194619178771973e-07, -1.685693860054016e-07, -6.51925802230835e-08, 3.818422555923462e-08, 1.4156103134155273e-07, 2.4493783712387085e-07, 3.4831464290618896e-07, 4.516914486885071e-07, 5.550682544708252e-07, 6.584450602531433e-07, 7.618218660354614e-07, 8.651986718177795e-07, 9.685754776000977e-07, 1.0719522833824158e-06, 1.1753290891647339e-06, 1.278705894947052e-06, 1.3820827007293701e-06, 1.4854595065116882e-06, 1.5888363122940063e-06, 1.6922131180763245e-06, 1.7955899238586426e-06, 1.8989667296409607e-06, 2.002343535423279e-06, 2.105720341205597e-06, 2.209097146987915e-06, 2.312473952770233e-06, 2.4158507585525513e-06, 2.5192275643348694e-06, 2.6226043701171875e-06]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 0.0, 12.0, 9.0, 0.0, 15.0, 21.0, 0.0, 25.0, 35.0, 42.0, 0.0, 56.0, 69.0, 0.0, 92.0, 84.0, 79.0, 0.0, 89.0, 93.0, 0.0, 66.0, 47.0, 0.0, 38.0, 43.0, 30.0, 0.0, 18.0, 12.0, 0.0, 3.0, 11.0, 0.0, 5.0, 8.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5497207641601562e-06, -1.5078112483024597e-06, -1.4659017324447632e-06, -1.4239922165870667e-06, -1.3820827007293701e-06, -1.3401731848716736e-06, -1.298263669013977e-06, -1.2563541531562805e-06, -1.214444637298584e-06, -1.1725351214408875e-06, -1.130625605583191e-06, -1.0887160897254944e-06, -1.0468065738677979e-06, -1.0048970580101013e-06, -9.629875421524048e-07, -9.210780262947083e-07, -8.791685104370117e-07, -8.372589945793152e-07, -7.953494787216187e-07, -7.534399628639221e-07, -7.115304470062256e-07, -6.69620931148529e-07, -6.277114152908325e-07, -5.85801899433136e-07, -5.438923835754395e-07, -5.019828677177429e-07, -4.600733518600464e-07, -4.1816383600234985e-07, -3.762543201446533e-07, -3.343448042869568e-07, -2.9243528842926025e-07, -2.505257725715637e-07, -2.086162567138672e-07, -1.6670674085617065e-07, -1.2479722499847412e-07, -8.288770914077759e-08, -4.0978193283081055e-08, 9.313225746154785e-10, 4.284083843231201e-08, 8.475035429000854e-08, 1.2665987014770508e-07, 1.685693860054016e-07, 2.1047890186309814e-07, 2.523884177207947e-07, 2.942979335784912e-07, 3.3620744943618774e-07, 3.781169652938843e-07, 4.200264811515808e-07, 4.6193599700927734e-07, 5.038455128669739e-07, 5.457550287246704e-07, 5.876645445823669e-07, 6.295740604400635e-07, 6.7148357629776e-07, 7.133930921554565e-07, 7.553026080131531e-07, 7.972121238708496e-07, 8.391216397285461e-07, 8.810311555862427e-07, 9.229406714439392e-07, 9.648501873016357e-07, 1.0067597031593323e-06, 1.0486692190170288e-06, 1.0905787348747253e-06, 1.1324882507324219e-06]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 18.0, 34.0, 74.0, 146.0, 690.0, 1989.0, 8912.0, 4150851.0, 27028.0, 3266.0, 677.0, 405.0, 78.0, 57.0, 20.0, 10.0, 5.0, 10.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.271766662597656e-06, -7.062219083309174e-06, -6.852671504020691e-06, -6.643123924732208e-06, -6.433576345443726e-06, -6.224028766155243e-06, -6.01448118686676e-06, -5.804933607578278e-06, -5.595386028289795e-06, -5.385838449001312e-06, -5.17629086971283e-06, -4.966743290424347e-06, -4.757195711135864e-06, -4.547648131847382e-06, -4.338100552558899e-06, -4.128552973270416e-06, -3.919005393981934e-06, -3.709457814693451e-06, -3.4999102354049683e-06, -3.2903626561164856e-06, -3.080815076828003e-06, -2.8712674975395203e-06, -2.6617199182510376e-06, -2.452172338962555e-06, -2.2426247596740723e-06, -2.0330771803855896e-06, -1.823529601097107e-06, -1.6139820218086243e-06, -1.4044344425201416e-06, -1.194886863231659e-06, -9.853392839431763e-07, -7.757917046546936e-07, -5.662441253662109e-07, -3.5669654607772827e-07, -1.471489667892456e-07, 6.239861249923706e-08, 2.7194619178771973e-07, 4.814937710762024e-07, 6.910413503646851e-07, 9.005889296531677e-07, 1.1101365089416504e-06, 1.319684088230133e-06, 1.5292316675186157e-06, 1.7387792468070984e-06, 1.948326826095581e-06, 2.1578744053840637e-06, 2.3674219846725464e-06, 2.576969563961029e-06, 2.7865171432495117e-06, 2.9960647225379944e-06, 3.205612301826477e-06, 3.4151598811149597e-06, 3.6247074604034424e-06, 3.834255039691925e-06, 4.043802618980408e-06, 4.25335019826889e-06, 4.462897777557373e-06, 4.672445356845856e-06, 4.881992936134338e-06, 5.091540515422821e-06, 5.301088094711304e-06, 5.510635673999786e-06, 5.720183253288269e-06, 5.929730832576752e-06, 6.139278411865234e-06]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 15.0, 0.0, 0.0, 147.0, 0.0, 0.0, 0.0, 3739.0, 0.0, 0.0, 156.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.364418029785156e-07, -5.187466740608215e-07, -5.010515451431274e-07, -4.833564162254333e-07, -4.6566128730773926e-07, -4.4796615839004517e-07, -4.302710294723511e-07, -4.12575900554657e-07, -3.948807716369629e-07, -3.771856427192688e-07, -3.594905138015747e-07, -3.417953848838806e-07, -3.241002559661865e-07, -3.0640512704849243e-07, -2.8870999813079834e-07, -2.7101486921310425e-07, -2.5331974029541016e-07, -2.3562461137771606e-07, -2.1792948246002197e-07, -2.0023435354232788e-07, -1.825392246246338e-07, -1.648440957069397e-07, -1.471489667892456e-07, -1.2945383787155151e-07, -1.1175870895385742e-07, -9.406358003616333e-08, -7.636845111846924e-08, -5.8673322200775146e-08, -4.0978193283081055e-08, -2.3283064365386963e-08, -5.587935447692871e-09, 1.210719347000122e-08, 2.9802322387695312e-08, 4.7497451305389404e-08, 6.51925802230835e-08, 8.288770914077759e-08, 1.0058283805847168e-07, 1.1827796697616577e-07, 1.3597309589385986e-07, 1.5366822481155396e-07, 1.7136335372924805e-07, 1.8905848264694214e-07, 2.0675361156463623e-07, 2.2444874048233032e-07, 2.421438694000244e-07, 2.598389983177185e-07, 2.775341272354126e-07, 2.952292561531067e-07, 3.129243850708008e-07, 3.3061951398849487e-07, 3.4831464290618896e-07, 3.6600977182388306e-07, 3.8370490074157715e-07, 4.0140002965927124e-07, 4.1909515857696533e-07, 4.367902874946594e-07, 4.544854164123535e-07, 4.721805453300476e-07, 4.898756742477417e-07, 5.075708031654358e-07, 5.252659320831299e-07, 5.42961061000824e-07, 5.606561899185181e-07, 5.783513188362122e-07, 5.960464477539062e-07]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 8.0, 7.0, 5.0, 8.0, 16.0, 15.0, 22.0, 30.0, 21.0, 42.0, 73.0, 81.0, 105.0, 112.0, 105.0, 81.0, 52.0, 48.0, 22.0, 19.0, 18.0, 15.0, 13.0, 13.0, 9.0, 3.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.226264430442825e-06, -1.1882001444973866e-06, -1.1501357448651106e-06, -1.1120714589196723e-06, -1.0740070592873963e-06, -1.035942773341958e-06, -9.978784873965196e-07, -9.598140877642436e-07, -9.217498018188053e-07, -8.836854590299481e-07, -8.456211162410909e-07, -8.075568302956526e-07, -7.694924875067954e-07, -7.314281447179383e-07, -6.933638019290811e-07, -6.552994591402239e-07, -6.172351163513667e-07, -5.791707735625096e-07, -5.411064307736524e-07, -5.030420879847952e-07, -4.649778020393569e-07, -4.2691345925049973e-07, -3.8884911646164255e-07, -3.507848020944948e-07, -3.1272045930563763e-07, -2.7465611651678046e-07, -2.365918021496327e-07, -1.9852745936077554e-07, -1.6046313078277308e-07, -1.2239880220477062e-07, -8.433445941591344e-08, -4.62701450487657e-08, -8.205802259908523e-09, 2.9858529870807615e-08, 6.792286200152375e-08, 1.0598719768495357e-07, 1.4405152626295603e-07, 1.821158548409585e-07, 2.2018019762981567e-07, 2.582445119969634e-07, 2.963088547858206e-07, 3.3437319757467776e-07, 3.724375119418255e-07, 4.105018547306827e-07, 4.4856619751953986e-07, 4.866304834649782e-07, 5.246948830972542e-07, 5.627591690426925e-07, 6.008235118315497e-07, 6.388878546204069e-07, 6.76952197409264e-07, 7.150165401981212e-07, 7.530808261435595e-07, 7.911451689324167e-07, 8.292095117212739e-07, 8.672737976667122e-07, 9.053381972989882e-07, 9.434025400878454e-07, 9.814668828767026e-07, 1.019531168822141e-06, 1.057595568454417e-06, 1.0956598543998552e-06, 1.1337242540321313e-06, 1.1717885399775696e-06, 1.209852825923008e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 7.0, 9.0, 3.0, 5.0, 10.0, 8.0, 17.0, 22.0, 16.0, 32.0, 43.0, 41.0, 42.0, 41.0, 60.0, 53.0, 53.0, 54.0, 58.0, 56.0, 42.0, 50.0, 55.0, 32.0, 42.0, 32.0, 25.0, 25.0, 12.0, 13.0, 12.0, 9.0, 9.0, 6.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5392382692880346e-06, -1.4984263998485403e-06, -1.4576146440958837e-06, -1.4168027746563894e-06, -1.3759910189037328e-06, -1.3351791494642384e-06, -1.2943673937115818e-06, -1.2535555242720875e-06, -1.2127436548325932e-06, -1.1719317853930988e-06, -1.1311200296404422e-06, -1.090308160200948e-06, -1.0494964044482913e-06, -1.008684535008797e-06, -9.678726655693026e-07, -9.27060909816646e-07, -8.862491540639894e-07, -8.454373414679139e-07, -8.046255288718385e-07, -7.638136594323441e-07, -7.230019036796875e-07, -6.821900342401932e-07, -6.413782216441177e-07, -6.005664090480423e-07, -5.597545964519668e-07, -5.189427838558913e-07, -4.781309712598159e-07, -4.3731913024203095e-07, -3.965073176459555e-07, -3.5569550504988e-07, -3.148836640320951e-07, -2.7407185143601964e-07, -2.332601525267819e-07, -1.9244833993070642e-07, -1.5163651312377624e-07, -1.1082468631684605e-07, -7.001287372077059e-08, -2.9201061124695116e-08, 1.1610779893089784e-08, 5.2422592489165254e-08, 9.323440508524072e-08, 1.340462176813162e-07, 1.7485804448824638e-07, 2.1566987129517656e-07, 2.5648168389125203e-07, 2.972934964873275e-07, 3.381053375051124e-07, 3.7891715010118787e-07, 4.1972896269726334e-07, 4.605407752933388e-07, 5.013525878894143e-07, 5.421644573289086e-07, 5.829762130815652e-07, 6.237880825210596e-07, 6.64599895117135e-07, 7.054117077132105e-07, 7.46223520309286e-07, 7.870353329053614e-07, 8.278471455014369e-07, 8.686589580975124e-07, 9.094708275370067e-07, 9.502825832896633e-07, 9.910944527291576e-07, 1.031906322168652e-06, 1.0727180779213086e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 0.0, 5.0, 15.0, 18.0, 0.0, 34.0, 63.0, 114.0, 0.0, 136.0, 321.0, 472.0, 0.0, 829.0, 1476.0, 2764.0, 0.0, 5366.0, 10763.0, 23551.0, 0.0, 57256.0, 172945.0, 495399.0, 0.0, 173908.0, 57592.0, 23169.0, 0.0, 10768.0, 5372.0, 2681.0, 0.0, 1535.0, 861.0, 473.0, 0.0, 274.0, 155.0, 84.0, 0.0, 70.0, 31.0, 22.0, 0.0, 15.0, 10.0, 8.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3709068298339844e-06, -1.3262033462524414e-06, -1.2814998626708984e-06, -1.2367963790893555e-06, -1.1920928955078125e-06, -1.1473894119262695e-06, -1.1026859283447266e-06, -1.0579824447631836e-06, -1.0132789611816406e-06, -9.685754776000977e-07, -9.238719940185547e-07, -8.791685104370117e-07, -8.344650268554688e-07, -7.897615432739258e-07, -7.450580596923828e-07, -7.003545761108398e-07, -6.556510925292969e-07, -6.109476089477539e-07, -5.662441253662109e-07, -5.21540641784668e-07, -4.76837158203125e-07, -4.3213367462158203e-07, -3.8743019104003906e-07, -3.427267074584961e-07, -2.980232238769531e-07, -2.5331974029541016e-07, -2.086162567138672e-07, -1.6391277313232422e-07, -1.1920928955078125e-07, -7.450580596923828e-08, -2.9802322387695312e-08, 1.4901161193847656e-08, 5.960464477539063e-08, 1.043081283569336e-07, 1.4901161193847656e-07, 1.9371509552001953e-07, 2.384185791015625e-07, 2.8312206268310547e-07, 3.2782554626464844e-07, 3.725290298461914e-07, 4.172325134277344e-07, 4.6193599700927734e-07, 5.066394805908203e-07, 5.513429641723633e-07, 5.960464477539062e-07, 6.407499313354492e-07, 6.854534149169922e-07, 7.301568984985352e-07, 7.748603820800781e-07, 8.195638656616211e-07, 8.642673492431641e-07, 9.08970832824707e-07, 9.5367431640625e-07, 9.98377799987793e-07, 1.043081283569336e-06, 1.087784767150879e-06, 1.1324882507324219e-06, 1.1771917343139648e-06, 1.2218952178955078e-06, 1.2665987014770508e-06, 1.3113021850585938e-06, 1.3560056686401367e-06, 1.4007091522216797e-06, 1.4454126358032227e-06, 1.4901161193847656e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 7.0, 0.0, 12.0, 0.0, 12.0, 16.0, 0.0, 28.0, 0.0, 30.0, 0.0, 44.0, 0.0, 69.0, 0.0, 79.0, 0.0, 88.0, 0.0, 78.0, 0.0, 92.0, 96.0, 0.0, 75.0, 0.0, 75.0, 0.0, 53.0, 0.0, 58.0, 0.0, 33.0, 0.0, 13.0, 0.0, 15.0, 13.0, 0.0, 10.0, 0.0, 8.0, 0.0, 7.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.0132789611816406e-06, -9.816139936447144e-07, -9.499490261077881e-07, -9.182840585708618e-07, -8.866190910339355e-07, -8.549541234970093e-07, -8.23289155960083e-07, -7.916241884231567e-07, -7.599592208862305e-07, -7.282942533493042e-07, -6.966292858123779e-07, -6.649643182754517e-07, -6.332993507385254e-07, -6.016343832015991e-07, -5.699694156646729e-07, -5.383044481277466e-07, -5.066394805908203e-07, -4.7497451305389404e-07, -4.4330954551696777e-07, -4.116445779800415e-07, -3.7997961044311523e-07, -3.4831464290618896e-07, -3.166496753692627e-07, -2.849847078323364e-07, -2.5331974029541016e-07, -2.2165477275848389e-07, -1.8998980522155762e-07, -1.5832483768463135e-07, -1.2665987014770508e-07, -9.499490261077881e-08, -6.332993507385254e-08, -3.166496753692627e-08, 0.0, 3.166496753692627e-08, 6.332993507385254e-08, 9.499490261077881e-08, 1.2665987014770508e-07, 1.5832483768463135e-07, 1.8998980522155762e-07, 2.2165477275848389e-07, 2.5331974029541016e-07, 2.849847078323364e-07, 3.166496753692627e-07, 3.4831464290618896e-07, 3.7997961044311523e-07, 4.116445779800415e-07, 4.4330954551696777e-07, 4.7497451305389404e-07, 5.066394805908203e-07, 5.383044481277466e-07, 5.699694156646729e-07, 6.016343832015991e-07, 6.332993507385254e-07, 6.649643182754517e-07, 6.966292858123779e-07, 7.282942533493042e-07, 7.599592208862305e-07, 7.916241884231567e-07, 8.23289155960083e-07, 8.549541234970093e-07, 8.866190910339355e-07, 9.182840585708618e-07, 9.499490261077881e-07, 9.816139936447144e-07, 1.0132789611816406e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 4.0, 3.0, 0.0, 2.0, 2.0, 6.0, 0.0, 1.0, 11.0, 13.0, 0.0, 64.0, 55.0, 34.0, 0.0, 74.0, 138.0, 225.0, 0.0, 311.0, 646.0, 1236.0, 0.0, 2311.0, 1038075.0, 2639.0, 0.0, 1146.0, 637.0, 331.0, 0.0, 228.0, 147.0, 62.0, 0.0, 62.0, 25.0, 22.0, 0.0, 8.0, 11.0, 10.0, 0.0, 6.0, 7.0, 6.0, 0.0, 3.0, 2.0, 2.0, 2.0], "bins": [-1.6689300537109375e-06, -1.6242265701293945e-06, -1.5795230865478516e-06, -1.5348196029663086e-06, -1.4901161193847656e-06, -1.4454126358032227e-06, -1.4007091522216797e-06, -1.3560056686401367e-06, -1.3113021850585938e-06, -1.2665987014770508e-06, -1.2218952178955078e-06, -1.1771917343139648e-06, -1.1324882507324219e-06, -1.087784767150879e-06, -1.043081283569336e-06, -9.98377799987793e-07, -9.5367431640625e-07, -9.08970832824707e-07, -8.642673492431641e-07, -8.195638656616211e-07, -7.748603820800781e-07, -7.301568984985352e-07, -6.854534149169922e-07, -6.407499313354492e-07, -5.960464477539062e-07, -5.513429641723633e-07, -5.066394805908203e-07, -4.6193599700927734e-07, -4.172325134277344e-07, -3.725290298461914e-07, -3.2782554626464844e-07, -2.8312206268310547e-07, -2.384185791015625e-07, -1.9371509552001953e-07, -1.4901161193847656e-07, -1.043081283569336e-07, -5.960464477539063e-08, -1.4901161193847656e-08, 2.9802322387695312e-08, 7.450580596923828e-08, 1.1920928955078125e-07, 1.6391277313232422e-07, 2.086162567138672e-07, 2.5331974029541016e-07, 2.980232238769531e-07, 3.427267074584961e-07, 3.8743019104003906e-07, 4.3213367462158203e-07, 4.76837158203125e-07, 5.21540641784668e-07, 5.662441253662109e-07, 6.109476089477539e-07, 6.556510925292969e-07, 7.003545761108398e-07, 7.450580596923828e-07, 7.897615432739258e-07, 8.344650268554688e-07, 8.791685104370117e-07, 9.238719940185547e-07, 9.685754776000977e-07, 1.0132789611816406e-06, 1.0579824447631836e-06, 1.1026859283447266e-06, 1.1473894119262695e-06, 1.1920928955078125e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1002.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1362135410308838e-07, -1.0803341865539551e-07, -1.0244548320770264e-07, -9.685754776000977e-08, -9.12696123123169e-08, -8.568167686462402e-08, -8.009374141693115e-08, -7.450580596923828e-08, -6.891787052154541e-08, -6.332993507385254e-08, -5.774199962615967e-08, -5.21540641784668e-08, -4.6566128730773926e-08, -4.0978193283081055e-08, -3.5390257835388184e-08, -2.9802322387695312e-08, -2.421438694000244e-08, -1.862645149230957e-08, -1.30385160446167e-08, -7.450580596923828e-09, -1.862645149230957e-09, 3.725290298461914e-09, 9.313225746154785e-09, 1.4901161193847656e-08, 2.0489096641540527e-08, 2.60770320892334e-08, 3.166496753692627e-08, 3.725290298461914e-08, 4.284083843231201e-08, 4.842877388000488e-08, 5.4016709327697754e-08, 5.960464477539063e-08, 6.51925802230835e-08, 7.078051567077637e-08, 7.636845111846924e-08, 8.195638656616211e-08, 8.754432201385498e-08, 9.313225746154785e-08, 9.872019290924072e-08, 1.043081283569336e-07, 1.0989606380462646e-07, 1.1548399925231934e-07, 1.210719347000122e-07, 1.2665987014770508e-07, 1.3224780559539795e-07, 1.3783574104309082e-07, 1.434236764907837e-07, 1.4901161193847656e-07, 1.5459954738616943e-07, 1.601874828338623e-07, 1.6577541828155518e-07, 1.7136335372924805e-07, 1.7695128917694092e-07, 1.825392246246338e-07, 1.8812716007232666e-07, 1.9371509552001953e-07, 1.993030309677124e-07, 2.0489096641540527e-07, 2.1047890186309814e-07, 2.1606683731079102e-07, 2.2165477275848389e-07, 2.2724270820617676e-07, 2.3283064365386963e-07, 2.384185791015625e-07]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 8.0, 11.0, 12.0, 11.0, 25.0, 24.0, 32.0, 47.0, 43.0, 86.0, 100.0, 123.0, 109.0, 80.0, 61.0, 36.0, 31.0, 35.0, 19.0, 15.0, 11.0, 8.0, 11.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1085492133133812e-06, -1.0694345746742329e-06, -1.0303199360350845e-06, -9.91205411082774e-07, -9.520907724436256e-07, -9.129761338044773e-07, -8.73861495165329e-07, -8.347468565261806e-07, -7.956322747304512e-07, -7.565176360913028e-07, -7.174030542955734e-07, -6.782884156564251e-07, -6.391737770172767e-07, -6.000591952215473e-07, -5.609445565823989e-07, -5.218299747866695e-07, -4.827153361475212e-07, -4.4360072593008226e-07, -4.0448611571264337e-07, -3.6537147707349504e-07, -3.2625686685605615e-07, -2.8714225663861725e-07, -2.4802761799946893e-07, -2.0891300778203004e-07, -1.6979839756459114e-07, -1.3068378734715225e-07, -9.156916291885864e-08, -5.2454545595992386e-08, -1.3339928273126134e-08, 2.577468194431276e-08, 6.488930637260637e-08, 1.0400393080089998e-07, 1.4311854101833887e-07, 1.8223315123577777e-07, 2.2134777566407138e-07, 2.60462400092365e-07, 2.995770103098039e-07, 3.386916205272428e-07, 3.778062591663911e-07, 4.1692086938383e-07, 4.560354796012689e-07, 4.951501182404172e-07, 5.342647000361467e-07, 5.73379338675295e-07, 6.124939773144433e-07, 6.516085591101728e-07, 6.907231977493211e-07, 7.298377795450506e-07, 7.689524181841989e-07, 8.080670568233472e-07, 8.471816386190767e-07, 8.86296277258225e-07, 9.254108590539545e-07, 9.645254976931028e-07, 1.0036401363322511e-06, 1.0427547749713995e-06, 1.0818694136105478e-06, 1.120984052249696e-06, 1.1600986908888444e-06, 1.199213215841155e-06, 1.2383278544803034e-06, 1.2774424931194517e-06, 1.3165571317586e-06, 1.3556717703977483e-06, 1.394786295350059e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 10.0, 6.0, 4.0, 9.0, 8.0, 14.0, 24.0, 16.0, 27.0, 45.0, 40.0, 38.0, 47.0, 54.0, 54.0, 55.0, 49.0, 53.0, 69.0, 44.0, 43.0, 57.0, 35.0, 37.0, 32.0, 33.0, 25.0, 13.0, 13.0, 9.0, 10.0, 11.0, 6.0, 5.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.405195121151337e-06, -1.3681097925655195e-06, -1.3310245776665397e-06, -1.2939392490807222e-06, -1.2568540341817425e-06, -1.219768705595925e-06, -1.1826834906969452e-06, -1.1455981621111277e-06, -1.1085128335253103e-06, -1.0714275049394928e-06, -1.034342290040513e-06, -9.972569614546956e-07, -9.601717465557158e-07, -9.230864179698983e-07, -8.860011462274997e-07, -8.489158744851011e-07, -8.118306595861213e-07, -7.747453878437227e-07, -7.376601161013241e-07, -7.005748443589255e-07, -6.634895726165269e-07, -6.264042440307094e-07, -5.893189722883108e-07, -5.522337005459121e-07, -5.151484288035135e-07, -4.780631570611149e-07, -4.409778853187163e-07, -4.0389258515460824e-07, -3.668073134122096e-07, -3.29722041669811e-07, -2.9263674150570296e-07, -2.5555146976330434e-07, -2.18466084334068e-07, -1.8138081259166938e-07, -1.4429552663841605e-07, -1.0721024779059007e-07, -7.01249689427641e-08, -3.303969720036548e-08, 4.045588752887852e-09, 4.1130874706141185e-08, 7.82161464485398e-08, 1.1530142529636578e-07, 1.5238670414419175e-07, 1.8947199009744509e-07, 2.265572618398437e-07, 2.636425335822423e-07, 3.0072783374635037e-07, 3.37813105488749e-07, 3.748983772311476e-07, 4.119836489735462e-07, 4.4906892071594484e-07, 4.861541924583435e-07, 5.232394642007421e-07, 5.603247927865596e-07, 5.974100645289582e-07, 6.344953362713568e-07, 6.715806080137554e-07, 7.08665879756154e-07, 7.457511514985526e-07, 7.828364232409513e-07, 8.199217518267687e-07, 8.570069667257485e-07, 8.94092295311566e-07, 9.311775670539646e-07, 9.682628387963632e-07]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 3.0, 10.0, 9.0, 6.0, 15.0, 14.0, 14.0, 44.0, 40.0, 40.0, 208.0, 135.0, 188.0, 633.0, 484.0, 700.0, 2255.0, 1941.0, 2745.0, 9525.0, 8134.0, 12194.0, 48651.0, 49925.0, 86512.0, 433593.0, 166392.0, 86809.0, 79282.0, 18677.0, 12230.0, 13755.0, 3879.0, 2757.0, 3239.0, 959.0, 701.0, 880.0, 249.0, 212.0, 248.0, 72.0, 45.0, 54.0, 21.0, 21.0, 33.0, 8.0, 3.0, 3.0, 4.0, 0.0, 8.0, 3.0, 2.0, 2.0], "bins": [-2.682209014892578e-06, -2.6030465960502625e-06, -2.5238841772079468e-06, -2.444721758365631e-06, -2.3655593395233154e-06, -2.2863969206809998e-06, -2.207234501838684e-06, -2.1280720829963684e-06, -2.0489096641540527e-06, -1.969747245311737e-06, -1.8905848264694214e-06, -1.8114224076271057e-06, -1.73225998878479e-06, -1.6530975699424744e-06, -1.5739351511001587e-06, -1.494772732257843e-06, -1.4156103134155273e-06, -1.3364478945732117e-06, -1.257285475730896e-06, -1.1781230568885803e-06, -1.0989606380462646e-06, -1.019798219203949e-06, -9.406358003616333e-07, -8.614733815193176e-07, -7.82310962677002e-07, -7.031485438346863e-07, -6.239861249923706e-07, -5.448237061500549e-07, -4.6566128730773926e-07, -3.864988684654236e-07, -3.073364496231079e-07, -2.2817403078079224e-07, -1.4901161193847656e-07, -6.984919309616089e-08, 9.313225746154785e-09, 8.847564458847046e-08, 1.6763806343078613e-07, 2.468004822731018e-07, 3.259629011154175e-07, 4.0512531995773315e-07, 4.842877388000488e-07, 5.634501576423645e-07, 6.426125764846802e-07, 7.217749953269958e-07, 8.009374141693115e-07, 8.800998330116272e-07, 9.592622518539429e-07, 1.0384246706962585e-06, 1.1175870895385742e-06, 1.1967495083808899e-06, 1.2759119272232056e-06, 1.3550743460655212e-06, 1.434236764907837e-06, 1.5133991837501526e-06, 1.5925616025924683e-06, 1.671724021434784e-06, 1.7508864402770996e-06, 1.8300488591194153e-06, 1.909211277961731e-06, 1.9883736968040466e-06, 2.0675361156463623e-06, 2.146698534488678e-06, 2.2258609533309937e-06, 2.3050233721733093e-06, 2.384185791015625e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 11.0, 0.0, 11.0, 13.0, 0.0, 15.0, 0.0, 31.0, 31.0, 0.0, 50.0, 0.0, 88.0, 0.0, 104.0, 92.0, 0.0, 123.0, 0.0, 93.0, 0.0, 98.0, 74.0, 0.0, 59.0, 0.0, 42.0, 27.0, 0.0, 14.0, 0.0, 15.0, 0.0, 12.0, 8.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1576339602470398e-06, -1.123175024986267e-06, -1.0887160897254944e-06, -1.0542571544647217e-06, -1.019798219203949e-06, -9.853392839431763e-07, -9.508803486824036e-07, -9.164214134216309e-07, -8.819624781608582e-07, -8.475035429000854e-07, -8.130446076393127e-07, -7.7858567237854e-07, -7.441267371177673e-07, -7.096678018569946e-07, -6.752088665962219e-07, -6.407499313354492e-07, -6.062909960746765e-07, -5.718320608139038e-07, -5.373731255531311e-07, -5.029141902923584e-07, -4.684552550315857e-07, -4.33996319770813e-07, -3.995373845100403e-07, -3.650784492492676e-07, -3.3061951398849487e-07, -2.9616057872772217e-07, -2.6170164346694946e-07, -2.2724270820617676e-07, -1.9278377294540405e-07, -1.5832483768463135e-07, -1.2386590242385864e-07, -8.940696716308594e-08, -5.494803190231323e-08, -2.0489096641540527e-08, 1.3969838619232178e-08, 4.842877388000488e-08, 8.288770914077759e-08, 1.1734664440155029e-07, 1.51805579662323e-07, 1.862645149230957e-07, 2.207234501838684e-07, 2.551823854446411e-07, 2.896413207054138e-07, 3.241002559661865e-07, 3.5855919122695923e-07, 3.9301812648773193e-07, 4.2747706174850464e-07, 4.6193599700927734e-07, 4.9639493227005e-07, 5.308538675308228e-07, 5.653128027915955e-07, 5.997717380523682e-07, 6.342306733131409e-07, 6.686896085739136e-07, 7.031485438346863e-07, 7.37607479095459e-07, 7.720664143562317e-07, 8.065253496170044e-07, 8.409842848777771e-07, 8.754432201385498e-07, 9.099021553993225e-07, 9.443610906600952e-07, 9.78820025920868e-07, 1.0132789611816406e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 11.0, 2.0, 15.0, 8.0, 4.0, 15.0, 26.0, 6.0, 85.0, 46.0, 161.0, 438.0, 328.0, 1471.0, 1342.0, 5032.0, 4709.0, 17416.0, 16663.0, 72019.0, 82725.0, 470595.0, 172688.0, 128186.0, 26744.0, 27186.0, 7060.0, 7787.0, 3225.0, 855.0, 934.0, 210.0, 292.0, 68.0, 84.0, 24.0, 32.0, 21.0, 20.0, 0.0, 14.0, 2.0, 6.0, 10.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4437904357910156e-06, -2.3525208234786987e-06, -2.261251211166382e-06, -2.169981598854065e-06, -2.078711986541748e-06, -1.987442374229431e-06, -1.8961727619171143e-06, -1.8049031496047974e-06, -1.7136335372924805e-06, -1.6223639249801636e-06, -1.5310943126678467e-06, -1.4398247003555298e-06, -1.3485550880432129e-06, -1.257285475730896e-06, -1.166015863418579e-06, -1.0747462511062622e-06, -9.834766387939453e-07, -8.922070264816284e-07, -8.009374141693115e-07, -7.096678018569946e-07, -6.183981895446777e-07, -5.271285772323608e-07, -4.3585896492004395e-07, -3.4458935260772705e-07, -2.5331974029541016e-07, -1.6205012798309326e-07, -7.078051567077637e-08, 2.0489096641540527e-08, 1.1175870895385742e-07, 2.0302832126617432e-07, 2.942979335784912e-07, 3.855675458908081e-07, 4.76837158203125e-07, 5.681067705154419e-07, 6.593763828277588e-07, 7.506459951400757e-07, 8.419156074523926e-07, 9.331852197647095e-07, 1.0244548320770264e-06, 1.1157244443893433e-06, 1.2069940567016602e-06, 1.298263669013977e-06, 1.389533281326294e-06, 1.4808028936386108e-06, 1.5720725059509277e-06, 1.6633421182632446e-06, 1.7546117305755615e-06, 1.8458813428878784e-06, 1.9371509552001953e-06, 2.028420567512512e-06, 2.119690179824829e-06, 2.210959792137146e-06, 2.302229404449463e-06, 2.3934990167617798e-06, 2.4847686290740967e-06, 2.5760382413864136e-06, 2.6673078536987305e-06, 2.7585774660110474e-06, 2.8498470783233643e-06, 2.941116690635681e-06, 3.032386302947998e-06, 3.123655915260315e-06, 3.214925527572632e-06, 3.3061951398849487e-06, 3.3974647521972656e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 13.0, 0.0, 15.0, 0.0, 0.0, 32.0, 0.0, 0.0, 43.0, 0.0, 50.0, 0.0, 0.0, 64.0, 0.0, 0.0, 91.0, 0.0, 108.0, 0.0, 0.0, 121.0, 0.0, 0.0, 120.0, 0.0, 106.0, 0.0, 0.0, 85.0, 0.0, 0.0, 59.0, 0.0, 49.0, 0.0, 0.0, 26.0, 0.0, 0.0, 20.0, 0.0, 12.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-8.344650268554688e-07, -8.121132850646973e-07, -7.897615432739258e-07, -7.674098014831543e-07, -7.450580596923828e-07, -7.227063179016113e-07, -7.003545761108398e-07, -6.780028343200684e-07, -6.556510925292969e-07, -6.332993507385254e-07, -6.109476089477539e-07, -5.885958671569824e-07, -5.662441253662109e-07, -5.438923835754395e-07, -5.21540641784668e-07, -4.991888999938965e-07, -4.76837158203125e-07, -4.544854164123535e-07, -4.3213367462158203e-07, -4.0978193283081055e-07, -3.8743019104003906e-07, -3.650784492492676e-07, -3.427267074584961e-07, -3.203749656677246e-07, -2.980232238769531e-07, -2.7567148208618164e-07, -2.5331974029541016e-07, -2.3096799850463867e-07, -2.086162567138672e-07, -1.862645149230957e-07, -1.6391277313232422e-07, -1.4156103134155273e-07, -1.1920928955078125e-07, -9.685754776000977e-08, -7.450580596923828e-08, -5.21540641784668e-08, -2.9802322387695312e-08, -7.450580596923828e-09, 1.4901161193847656e-08, 3.725290298461914e-08, 5.960464477539063e-08, 8.195638656616211e-08, 1.043081283569336e-07, 1.2665987014770508e-07, 1.4901161193847656e-07, 1.7136335372924805e-07, 1.9371509552001953e-07, 2.1606683731079102e-07, 2.384185791015625e-07, 2.60770320892334e-07, 2.8312206268310547e-07, 3.0547380447387695e-07, 3.2782554626464844e-07, 3.501772880554199e-07, 3.725290298461914e-07, 3.948807716369629e-07, 4.172325134277344e-07, 4.3958425521850586e-07, 4.6193599700927734e-07, 4.842877388000488e-07, 5.066394805908203e-07, 5.289912223815918e-07, 5.513429641723633e-07, 5.736947059631348e-07, 5.960464477539062e-07]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 9.0, 13.0, 10.0, 14.0, 28.0, 23.0, 55.0, 58.0, 98.0, 128.0, 146.0, 103.0, 77.0, 47.0, 38.0, 28.0, 24.0, 20.0, 10.0, 11.0, 8.0, 6.0, 1.0, 4.0, 8.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2982030739294714e-06, -1.2539267117972486e-06, -1.2096503496650257e-06, -1.1653739875328029e-06, -1.12109762540058e-06, -1.0768212632683571e-06, -1.032545014822972e-06, -9.882685390039114e-07, -9.439922337151074e-07, -8.997158715828846e-07, -8.554395094506617e-07, -8.111632041618577e-07, -7.668868420296349e-07, -7.22610479897412e-07, -6.783341177651891e-07, -6.340577556329663e-07, -5.897813935007434e-07, -5.455050313685206e-07, -5.012286692362977e-07, -4.569523355257843e-07, -4.1267597339356143e-07, -3.683996112613386e-07, -3.2412327755082515e-07, -2.798469154186023e-07, -2.3557055328637944e-07, -1.9129419115415658e-07, -1.4701784323278844e-07, -1.027414953114203e-07, -5.846513317919744e-08, -1.418877104697458e-08, 3.008756266353885e-08, 7.43639247957617e-08, 1.1864040061482228e-07, 1.6291676274704514e-07, 2.0719311066841328e-07, 2.514694585897814e-07, 2.957458207220043e-07, 3.4002218285422714e-07, 3.8429851656474057e-07, 4.285748786969634e-07, 4.728512408291863e-07, 5.171276029614091e-07, 5.61403965093632e-07, 6.05680270382436e-07, 6.499566325146588e-07, 6.942329946468817e-07, 7.385093567791046e-07, 7.827857189113274e-07, 8.270620810435503e-07, 8.713384431757731e-07, 9.15614805307996e-07, 9.598911674402189e-07, 1.0041675295724417e-06, 1.0484438917046646e-06, 1.0927201401500497e-06, 1.1369966159691103e-06, 1.1812728644144954e-06, 1.2255492265467183e-06, 1.2698255886789411e-06, 1.314101950811164e-06, 1.3583783129433868e-06, 1.4026546750756097e-06, 1.4469310372078326e-06, 1.4912072856532177e-06, 1.5354837614722783e-06]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 12.0, 6.0, 7.0, 12.0, 14.0, 20.0, 18.0, 15.0, 34.0, 34.0, 33.0, 32.0, 33.0, 45.0, 38.0, 46.0, 44.0, 55.0, 60.0, 44.0, 59.0, 38.0, 57.0, 36.0, 33.0, 27.0, 32.0, 22.0, 20.0, 11.0, 20.0, 9.0, 8.0, 7.0, 5.0, 4.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1146156566610443e-06, -1.0822859621839598e-06, -1.049956381393713e-06, -1.0176266869166284e-06, -9.852969924395438e-07, -9.529672979624593e-07, -9.206376603287936e-07, -8.883080226951279e-07, -8.559783282180433e-07, -8.236486337409588e-07, -7.913189961072931e-07, -7.589893584736274e-07, -7.266596639965428e-07, -6.943299695194582e-07, -6.620003318857925e-07, -6.296706942521269e-07, -5.973409997750423e-07, -5.650113052979577e-07, -5.32681667664292e-07, -5.003520300306263e-07, -4.680223355535418e-07, -4.3569266949816665e-07, -4.033630034427915e-07, -3.710333373874164e-07, -3.3870367133204127e-07, -3.0637400527666614e-07, -2.74044339221291e-07, -2.417146731659159e-07, -2.0938500711054076e-07, -1.7705534105516563e-07, -1.447256749997905e-07, -1.1239600894441537e-07, -8.006645657587796e-08, -4.7736790520502836e-08, -1.540712446512771e-08, 1.692254159024742e-08, 4.925220764562255e-08, 8.158187370099768e-08, 1.139115397563728e-07, 1.4624120581174793e-07, 1.7857087186712306e-07, 2.109005379224982e-07, 2.432302039778733e-07, 2.7555987003324844e-07, 3.0788953608862357e-07, 3.402192021439987e-07, 3.7254886819937383e-07, 4.0487853425474896e-07, 4.372082003101241e-07, 4.695378663654992e-07, 5.018675324208743e-07, 5.3419717005454e-07, 5.665268645316246e-07, 5.988565590087092e-07, 6.311861966423749e-07, 6.635158342760406e-07, 6.958455287531251e-07, 7.281752232302097e-07, 7.605048608638754e-07, 7.928344984975411e-07, 8.251641929746256e-07, 8.574938874517102e-07, 8.898235250853759e-07, 9.221531627190416e-07, 9.544828571961261e-07]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 10.0, 27.0, 15.0, 43.0, 22.0, 74.0, 133.0, 104.0, 295.0, 164.0, 487.0, 895.0, 474.0, 1860.0, 1228.0, 3899.0, 7957.0, 7622.0, 102769.0, 3927626.0, 112216.0, 8430.0, 8306.0, 4088.0, 1159.0, 1781.0, 481.0, 841.0, 446.0, 139.0, 250.0, 82.0, 111.0, 81.0, 29.0, 47.0, 15.0, 26.0, 14.0, 7.0, 12.0, 4.0, 9.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.8014183044433594e-06, -2.7064234018325806e-06, -2.6114284992218018e-06, -2.516433596611023e-06, -2.421438694000244e-06, -2.3264437913894653e-06, -2.2314488887786865e-06, -2.1364539861679077e-06, -2.041459083557129e-06, -1.94646418094635e-06, -1.8514692783355713e-06, -1.7564743757247925e-06, -1.6614794731140137e-06, -1.5664845705032349e-06, -1.471489667892456e-06, -1.3764947652816772e-06, -1.2814998626708984e-06, -1.1865049600601196e-06, -1.0915100574493408e-06, -9.96515154838562e-07, -9.015202522277832e-07, -8.065253496170044e-07, -7.115304470062256e-07, -6.165355443954468e-07, -5.21540641784668e-07, -4.2654573917388916e-07, -3.3155083656311035e-07, -2.3655593395233154e-07, -1.4156103134155273e-07, -4.6566128730773926e-08, 4.842877388000488e-08, 1.434236764907837e-07, 2.384185791015625e-07, 3.334134817123413e-07, 4.284083843231201e-07, 5.234032869338989e-07, 6.183981895446777e-07, 7.133930921554565e-07, 8.083879947662354e-07, 9.033828973770142e-07, 9.98377799987793e-07, 1.0933727025985718e-06, 1.1883676052093506e-06, 1.2833625078201294e-06, 1.3783574104309082e-06, 1.473352313041687e-06, 1.5683472156524658e-06, 1.6633421182632446e-06, 1.7583370208740234e-06, 1.8533319234848022e-06, 1.948326826095581e-06, 2.04332172870636e-06, 2.1383166313171387e-06, 2.2333115339279175e-06, 2.3283064365386963e-06, 2.423301339149475e-06, 2.518296241760254e-06, 2.6132911443710327e-06, 2.7082860469818115e-06, 2.8032809495925903e-06, 2.898275852203369e-06, 2.993270754814148e-06, 3.0882656574249268e-06, 3.1832605600357056e-06, 3.2782554626464844e-06]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 8.0, 0.0, 0.0, 21.0, 0.0, 0.0, 22.0, 0.0, 0.0, 50.0, 0.0, 0.0, 73.0, 0.0, 0.0, 98.0, 0.0, 0.0, 131.0, 0.0, 0.0, 173.0, 0.0, 0.0, 156.0, 0.0, 117.0, 0.0, 0.0, 84.0, 0.0, 0.0, 45.0, 0.0, 0.0, 20.0, 0.0, 0.0, 11.0, 0.0, 0.0, 5.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.755573511123657e-07, -5.550682544708252e-07, -5.345791578292847e-07, -5.140900611877441e-07, -4.936009645462036e-07, -4.731118679046631e-07, -4.5262277126312256e-07, -4.3213367462158203e-07, -4.116445779800415e-07, -3.91155481338501e-07, -3.7066638469696045e-07, -3.501772880554199e-07, -3.296881914138794e-07, -3.0919909477233887e-07, -2.8870999813079834e-07, -2.682209014892578e-07, -2.477318048477173e-07, -2.2724270820617676e-07, -2.0675361156463623e-07, -1.862645149230957e-07, -1.6577541828155518e-07, -1.4528632164001465e-07, -1.2479722499847412e-07, -1.043081283569336e-07, -8.381903171539307e-08, -6.332993507385254e-08, -4.284083843231201e-08, -2.2351741790771484e-08, -1.862645149230957e-09, 1.862645149230957e-08, 3.91155481338501e-08, 5.960464477539063e-08, 8.009374141693115e-08, 1.0058283805847168e-07, 1.210719347000122e-07, 1.4156103134155273e-07, 1.6205012798309326e-07, 1.825392246246338e-07, 2.0302832126617432e-07, 2.2351741790771484e-07, 2.4400651454925537e-07, 2.644956111907959e-07, 2.849847078323364e-07, 3.0547380447387695e-07, 3.259629011154175e-07, 3.46451997756958e-07, 3.6694109439849854e-07, 3.8743019104003906e-07, 4.079192876815796e-07, 4.284083843231201e-07, 4.4889748096466064e-07, 4.6938657760620117e-07, 4.898756742477417e-07, 5.103647708892822e-07, 5.308538675308228e-07, 5.513429641723633e-07, 5.718320608139038e-07, 5.923211574554443e-07, 6.128102540969849e-07, 6.332993507385254e-07, 6.537884473800659e-07, 6.742775440216064e-07, 6.94766640663147e-07, 7.152557373046875e-07]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 6.0, 8.0, 10.0, 23.0, 29.0, 24.0, 75.0, 101.0, 289.0, 381.0, 847.0, 4242.0, 9115.0, 113397.0, 4011707.0, 38974.0, 11192.0, 1984.0, 1080.0, 299.0, 172.0, 141.0, 70.0, 57.0, 18.0, 15.0, 7.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.635883331298828e-06, -3.4924596548080444e-06, -3.3490359783172607e-06, -3.205612301826477e-06, -3.0621886253356934e-06, -2.9187649488449097e-06, -2.775341272354126e-06, -2.6319175958633423e-06, -2.4884939193725586e-06, -2.345070242881775e-06, -2.201646566390991e-06, -2.0582228899002075e-06, -1.914799213409424e-06, -1.7713755369186401e-06, -1.6279518604278564e-06, -1.4845281839370728e-06, -1.341104507446289e-06, -1.1976808309555054e-06, -1.0542571544647217e-06, -9.10833477973938e-07, -7.674098014831543e-07, -6.239861249923706e-07, -4.805624485015869e-07, -3.371387720108032e-07, -1.9371509552001953e-07, -5.029141902923584e-08, 9.313225746154785e-08, 2.3655593395233154e-07, 3.7997961044311523e-07, 5.234032869338989e-07, 6.668269634246826e-07, 8.102506399154663e-07, 9.5367431640625e-07, 1.0970979928970337e-06, 1.2405216693878174e-06, 1.383945345878601e-06, 1.5273690223693848e-06, 1.6707926988601685e-06, 1.8142163753509521e-06, 1.957640051841736e-06, 2.1010637283325195e-06, 2.2444874048233032e-06, 2.387911081314087e-06, 2.5313347578048706e-06, 2.6747584342956543e-06, 2.818182110786438e-06, 2.9616057872772217e-06, 3.1050294637680054e-06, 3.248453140258789e-06, 3.3918768167495728e-06, 3.5353004932403564e-06, 3.67872416973114e-06, 3.822147846221924e-06, 3.9655715227127075e-06, 4.108995199203491e-06, 4.252418875694275e-06, 4.395842552185059e-06, 4.539266228675842e-06, 4.682689905166626e-06, 4.82611358165741e-06, 4.969537258148193e-06, 5.112960934638977e-06, 5.256384611129761e-06, 5.3998082876205444e-06, 5.543231964111328e-06]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 0.0, 0.0, 11.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 32.0, 0.0, 0.0, 97.0, 0.0, 0.0, 3756.0, 0.0, 0.0, 100.0, 0.0, 0.0, 38.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 10.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-07, -3.986060619354248e-07, -3.7997961044311523e-07, -3.6135315895080566e-07, -3.427267074584961e-07, -3.241002559661865e-07, -3.0547380447387695e-07, -2.868473529815674e-07, -2.682209014892578e-07, -2.4959444999694824e-07, -2.3096799850463867e-07, -2.123415470123291e-07, -1.9371509552001953e-07, -1.7508864402770996e-07, -1.564621925354004e-07, -1.3783574104309082e-07, -1.1920928955078125e-07, -1.0058283805847168e-07, -8.195638656616211e-08, -6.332993507385254e-08, -4.470348358154297e-08, -2.60770320892334e-08, -7.450580596923828e-09, 1.1175870895385742e-08, 2.9802322387695312e-08, 4.842877388000488e-08, 6.705522537231445e-08, 8.568167686462402e-08, 1.043081283569336e-07, 1.2293457984924316e-07, 1.4156103134155273e-07, 1.601874828338623e-07, 1.7881393432617188e-07, 1.9744038581848145e-07, 2.1606683731079102e-07, 2.3469328880310059e-07, 2.5331974029541016e-07, 2.7194619178771973e-07, 2.905726432800293e-07, 3.0919909477233887e-07, 3.2782554626464844e-07, 3.46451997756958e-07, 3.650784492492676e-07, 3.8370490074157715e-07, 4.023313522338867e-07, 4.209578037261963e-07, 4.3958425521850586e-07, 4.5821070671081543e-07, 4.76837158203125e-07, 4.954636096954346e-07, 5.140900611877441e-07, 5.327165126800537e-07, 5.513429641723633e-07, 5.699694156646729e-07, 5.885958671569824e-07, 6.07222318649292e-07, 6.258487701416016e-07, 6.444752216339111e-07, 6.631016731262207e-07, 6.817281246185303e-07, 7.003545761108398e-07, 7.189810276031494e-07, 7.37607479095459e-07, 7.562339305877686e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 9.0, 17.0, 22.0, 27.0, 38.0, 49.0, 93.0, 144.0, 195.0, 138.0, 75.0, 53.0, 40.0, 30.0, 23.0, 11.0, 7.0, 3.0, 7.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.147329157902277e-06, -1.10557584775961e-06, -1.063822537616943e-06, -1.022069227474276e-06, -9.803160310184467e-07, -9.385627208757796e-07, -8.968094107331126e-07, -8.550561005904456e-07, -8.133027904477785e-07, -7.715494803051115e-07, -7.297962270058633e-07, -6.880429168631963e-07, -6.462896067205293e-07, -6.045363534212811e-07, -5.627830432786141e-07, -5.21029733135947e-07, -4.792764798366989e-07, -4.3752319811574125e-07, -3.957698879730742e-07, -3.540166062521166e-07, -3.122632961094496e-07, -2.70510014388492e-07, -2.2875673266753438e-07, -1.8700342252486735e-07, -1.4525014080390974e-07, -1.0349684487209743e-07, -6.174355604571247e-08, -1.9990267219327507e-08, 2.176302871248481e-08, 6.351632464429713e-08, 1.0526960636525473e-07, 1.4702291650792176e-07, 1.8877619822887937e-07, 2.3052949416069168e-07, 2.72282790092504e-07, 3.140360718134616e-07, 3.5578938195612864e-07, 3.9754266367708624e-07, 4.3929594539804384e-07, 4.810492555407109e-07, 5.228025656833779e-07, 5.645558758260449e-07, 6.063091291252931e-07, 6.480624392679601e-07, 6.898157494106272e-07, 7.315690027098753e-07, 7.733223128525424e-07, 8.150756229952094e-07, 8.568288762944576e-07, 8.985821864371246e-07, 9.403354397363728e-07, 9.820887498790398e-07, 1.0238420600217069e-06, 1.0655953701643739e-06, 1.107348680307041e-06, 1.149101990449708e-06, 1.1908551869055373e-06, 1.2326084970482043e-06, 1.2743618071908713e-06, 1.3161150036467006e-06, 1.3578683137893677e-06, 1.3996216239320347e-06, 1.4413749340747017e-06, 1.4831282442173688e-06, 1.5248815543600358e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 6.0, 6.0, 11.0, 11.0, 17.0, 15.0, 15.0, 14.0, 19.0, 29.0, 24.0, 37.0, 38.0, 42.0, 42.0, 42.0, 51.0, 44.0, 55.0, 61.0, 45.0, 39.0, 39.0, 41.0, 47.0, 37.0, 35.0, 22.0, 21.0, 30.0, 11.0, 8.0, 10.0, 9.0, 9.0, 5.0, 10.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.610336527046456e-07, -6.386528639268363e-07, -6.162720751490269e-07, -5.938912863712176e-07, -5.715104407499894e-07, -5.4912965197218e-07, -5.267488631943706e-07, -5.043680744165613e-07, -4.819872856387519e-07, -4.5960649686094257e-07, -4.372256796614238e-07, -4.148448908836144e-07, -3.9246407368409564e-07, -3.700832849062863e-07, -3.477024961284769e-07, -3.2532170735066757e-07, -3.0294086172943935e-07, -2.8056007295163e-07, -2.581792557521112e-07, -2.3579846697430185e-07, -2.1341766398563777e-07, -1.910368609969737e-07, -1.6865607221916434e-07, -1.4627526923050027e-07, -1.238944662418362e-07, -1.0151366325317213e-07, -7.913286736993541e-08, -5.6752071486698696e-08, -3.4371268498034624e-08, -1.1990465509370551e-08, 1.0390323268438806e-08, 3.277112625710288e-08, 5.515192924576695e-08, 7.753273223443102e-08, 9.991352811766774e-08, 1.2229432400090445e-07, 1.4467512698956853e-07, 1.670559299782326e-07, 1.8943671875604196e-07, 2.1181752174470603e-07, 2.341983247333701e-07, 2.5657911351117946e-07, 2.7895993071069825e-07, 3.013407194885076e-07, 3.2372150826631696e-07, 3.4610232546583575e-07, 3.684831142436451e-07, 3.908639314431639e-07, 4.1324472022097325e-07, 4.356255089987826e-07, 4.580063261983014e-07, 4.803871433978202e-07, 5.027679321756295e-07, 5.251487209534389e-07, 5.475295097312483e-07, 5.699102985090576e-07, 5.922911441302858e-07, 6.146719329080952e-07, 6.370527216859045e-07, 6.594335673071328e-07, 6.818143560849421e-07, 7.041951448627515e-07, 7.265759336405608e-07, 7.489567224183702e-07, 7.713375111961795e-07]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 6.0, 9.0, 14.0, 0.0, 26.0, 53.0, 86.0, 144.0, 0.0, 222.0, 368.0, 523.0, 923.0, 0.0, 1514.0, 2824.0, 4877.0, 9975.0, 0.0, 21814.0, 53991.0, 166454.0, 520695.0, 0.0, 166191.0, 54470.0, 21811.0, 9780.0, 0.0, 4925.0, 2797.0, 1569.0, 935.0, 0.0, 548.0, 378.0, 238.0, 118.0, 0.0, 87.0, 73.0, 43.0, 15.0, 0.0, 21.0, 23.0, 9.0, 6.0, 0.0, 1.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3709068298339844e-06, -1.323409378528595e-06, -1.2759119272232056e-06, -1.2284144759178162e-06, -1.1809170246124268e-06, -1.1334195733070374e-06, -1.085922122001648e-06, -1.0384246706962585e-06, -9.909272193908691e-07, -9.434297680854797e-07, -8.959323167800903e-07, -8.484348654747009e-07, -8.009374141693115e-07, -7.534399628639221e-07, -7.059425115585327e-07, -6.584450602531433e-07, -6.109476089477539e-07, -5.634501576423645e-07, -5.159527063369751e-07, -4.684552550315857e-07, -4.209578037261963e-07, -3.734603524208069e-07, -3.259629011154175e-07, -2.784654498100281e-07, -2.3096799850463867e-07, -1.8347054719924927e-07, -1.3597309589385986e-07, -8.847564458847046e-08, -4.0978193283081055e-08, 6.51925802230835e-09, 5.4016709327697754e-08, 1.0151416063308716e-07, 1.4901161193847656e-07, 1.9650906324386597e-07, 2.4400651454925537e-07, 2.915039658546448e-07, 3.390014171600342e-07, 3.864988684654236e-07, 4.33996319770813e-07, 4.814937710762024e-07, 5.289912223815918e-07, 5.764886736869812e-07, 6.239861249923706e-07, 6.7148357629776e-07, 7.189810276031494e-07, 7.664784789085388e-07, 8.139759302139282e-07, 8.614733815193176e-07, 9.08970832824707e-07, 9.564682841300964e-07, 1.0039657354354858e-06, 1.0514631867408752e-06, 1.0989606380462646e-06, 1.146458089351654e-06, 1.1939555406570435e-06, 1.2414529919624329e-06, 1.2889504432678223e-06, 1.3364478945732117e-06, 1.383945345878601e-06, 1.4314427971839905e-06, 1.4789402484893799e-06, 1.5264376997947693e-06, 1.5739351511001587e-06, 1.621432602405548e-06, 1.6689300537109375e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 31.0, 0.0, 0.0, 57.0, 0.0, 0.0, 66.0, 0.0, 0.0, 0.0, 108.0, 0.0, 0.0, 146.0, 0.0, 0.0, 164.0, 0.0, 0.0, 0.0, 151.0, 0.0, 0.0, 115.0, 0.0, 0.0, 0.0, 77.0, 0.0, 0.0, 39.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 5.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.591420292854309e-07, -4.414469003677368e-07, -4.237517714500427e-07, -4.0605664253234863e-07, -3.8836151361465454e-07, -3.7066638469696045e-07, -3.5297125577926636e-07, -3.3527612686157227e-07, -3.175809979438782e-07, -2.998858690261841e-07, -2.8219074010849e-07, -2.644956111907959e-07, -2.468004822731018e-07, -2.2910535335540771e-07, -2.1141022443771362e-07, -1.9371509552001953e-07, -1.7601996660232544e-07, -1.5832483768463135e-07, -1.4062970876693726e-07, -1.2293457984924316e-07, -1.0523945093154907e-07, -8.754432201385498e-08, -6.984919309616089e-08, -5.21540641784668e-08, -3.4458935260772705e-08, -1.6763806343078613e-08, 9.313225746154785e-10, 1.862645149230957e-08, 3.632158041000366e-08, 5.4016709327697754e-08, 7.171183824539185e-08, 8.940696716308594e-08, 1.0710209608078003e-07, 1.2479722499847412e-07, 1.424923539161682e-07, 1.601874828338623e-07, 1.778826117515564e-07, 1.955777406692505e-07, 2.1327286958694458e-07, 2.3096799850463867e-07, 2.4866312742233276e-07, 2.6635825634002686e-07, 2.8405338525772095e-07, 3.0174851417541504e-07, 3.1944364309310913e-07, 3.371387720108032e-07, 3.548339009284973e-07, 3.725290298461914e-07, 3.902241587638855e-07, 4.079192876815796e-07, 4.256144165992737e-07, 4.4330954551696777e-07, 4.6100467443466187e-07, 4.78699803352356e-07, 4.9639493227005e-07, 5.140900611877441e-07, 5.317851901054382e-07, 5.494803190231323e-07, 5.671754479408264e-07, 5.848705768585205e-07, 6.025657057762146e-07, 6.202608346939087e-07, 6.379559636116028e-07, 6.556510925292969e-07]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 12.0, 20.0, 0.0, 21.0, 20.0, 0.0, 40.0, 53.0, 0.0, 160.0, 151.0, 0.0, 244.0, 398.0, 0.0, 827.0, 1300.0, 0.0, 2223.0, 4177.0, 0.0, 7286.0, 15301.0, 0.0, 983980.0, 15383.0, 0.0, 7334.0, 0.0, 4168.0, 2234.0, 0.0, 1278.0, 796.0, 0.0, 401.0, 230.0, 0.0, 175.0, 197.0, 0.0, 58.0, 29.0, 0.0, 24.0, 23.0, 0.0, 12.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 7.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.0728836059570312e-06, -1.0337680578231812e-06, -9.94652509689331e-07, -9.55536961555481e-07, -9.164214134216309e-07, -8.773058652877808e-07, -8.381903171539307e-07, -7.990747690200806e-07, -7.599592208862305e-07, -7.208436727523804e-07, -6.817281246185303e-07, -6.426125764846802e-07, -6.034970283508301e-07, -5.6438148021698e-07, -5.252659320831299e-07, -4.861503839492798e-07, -4.470348358154297e-07, -4.079192876815796e-07, -3.688037395477295e-07, -3.296881914138794e-07, -2.905726432800293e-07, -2.514570951461792e-07, -2.123415470123291e-07, -1.73225998878479e-07, -1.341104507446289e-07, -9.499490261077881e-08, -5.587935447692871e-08, -1.6763806343078613e-08, 2.2351741790771484e-08, 6.146728992462158e-08, 1.0058283805847168e-07, 1.3969838619232178e-07, 1.7881393432617188e-07, 2.1792948246002197e-07, 2.5704503059387207e-07, 2.9616057872772217e-07, 3.3527612686157227e-07, 3.7439167499542236e-07, 4.1350722312927246e-07, 4.5262277126312256e-07, 4.917383193969727e-07, 5.308538675308228e-07, 5.699694156646729e-07, 6.09084963798523e-07, 6.48200511932373e-07, 6.873160600662231e-07, 7.264316082000732e-07, 7.655471563339233e-07, 8.046627044677734e-07, 8.437782526016235e-07, 8.828938007354736e-07, 9.220093488693237e-07, 9.611248970031738e-07, 1.000240445137024e-06, 1.039355993270874e-06, 1.0784715414047241e-06, 1.1175870895385742e-06, 1.1567026376724243e-06, 1.1958181858062744e-06, 1.2349337339401245e-06, 1.2740492820739746e-06, 1.3131648302078247e-06, 1.3522803783416748e-06, 1.391395926475525e-06, 1.430511474609375e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 884.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0], "bins": [-1.7881393432617188e-07, -1.7415732145309448e-07, -1.695007085800171e-07, -1.648440957069397e-07, -1.601874828338623e-07, -1.555308699607849e-07, -1.5087425708770752e-07, -1.4621764421463013e-07, -1.4156103134155273e-07, -1.3690441846847534e-07, -1.3224780559539795e-07, -1.2759119272232056e-07, -1.2293457984924316e-07, -1.1827796697616577e-07, -1.1362135410308838e-07, -1.0896474123001099e-07, -1.043081283569336e-07, -9.96515154838562e-08, -9.499490261077881e-08, -9.033828973770142e-08, -8.568167686462402e-08, -8.102506399154663e-08, -7.636845111846924e-08, -7.171183824539185e-08, -6.705522537231445e-08, -6.239861249923706e-08, -5.774199962615967e-08, -5.3085386753082275e-08, -4.842877388000488e-08, -4.377216100692749e-08, -3.91155481338501e-08, -3.4458935260772705e-08, -2.9802322387695312e-08, -2.514570951461792e-08, -2.0489096641540527e-08, -1.5832483768463135e-08, -1.1175870895385742e-08, -6.51925802230835e-09, -1.862645149230957e-09, 2.7939677238464355e-09, 7.450580596923828e-09, 1.210719347000122e-08, 1.6763806343078613e-08, 2.1420419216156006e-08, 2.60770320892334e-08, 3.073364496231079e-08, 3.5390257835388184e-08, 4.0046870708465576e-08, 4.470348358154297e-08, 4.936009645462036e-08, 5.4016709327697754e-08, 5.8673322200775146e-08, 6.332993507385254e-08, 6.798654794692993e-08, 7.264316082000732e-08, 7.729977369308472e-08, 8.195638656616211e-08, 8.66129994392395e-08, 9.12696123123169e-08, 9.592622518539429e-08, 1.0058283805847168e-07, 1.0523945093154907e-07, 1.0989606380462646e-07, 1.1455267667770386e-07, 1.1920928955078125e-07]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 6.0, 4.0, 10.0, 11.0, 19.0, 31.0, 29.0, 51.0, 99.0, 159.0, 211.0, 116.0, 74.0, 60.0, 35.0, 21.0, 20.0, 15.0, 10.0, 4.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.09175901395065e-07, -7.711817033850821e-07, -7.331875053750991e-07, -6.951933073651162e-07, -6.571991093551333e-07, -6.192049113451503e-07, -5.812106564917485e-07, -5.432165153251844e-07, -5.052222604717826e-07, -4.672280624617997e-07, -4.2923386445181677e-07, -3.9123966644183383e-07, -3.532454684318509e-07, -3.1525127042186796e-07, -2.772570439901756e-07, -2.3926284598019265e-07, -2.0126867639191914e-07, -1.632744783819362e-07, -1.2528028037195327e-07, -8.728606815111561e-08, -4.9291870141132677e-08, -1.1297672131149739e-08, 2.6696540089687915e-08, 6.469073809967085e-08, 1.0268493610965379e-07, 1.4067913411963673e-07, 1.7867333212961967e-07, 2.1666754435045732e-07, 2.5466175657129497e-07, 2.926559545812779e-07, 3.3065015259126085e-07, 3.686443506012438e-07, 4.066386054546456e-07, 4.446328034646285e-07, 4.826270014746115e-07, 5.206211994845944e-07, 5.586153974945773e-07, 5.966095955045603e-07, 6.346037935145432e-07, 6.72598048367945e-07, 7.105921895345091e-07, 7.48586387544492e-07, 7.86580585554475e-07, 8.245747835644579e-07, 8.625689815744408e-07, 9.005631795844238e-07, 9.385573775944067e-07, 9.765516324478085e-07, 1.0145458873012103e-06, 1.0525401421546121e-06, 1.0905342833211762e-06, 1.128528538174578e-06, 1.166522679341142e-06, 1.2045169341945439e-06, 1.242511075361108e-06, 1.2805053302145097e-06, 1.3184994713810738e-06, 1.3564937262344756e-06, 1.3944878674010397e-06, 1.4324821222544415e-06, 1.4704762634210056e-06, 1.5084705182744074e-06, 1.5464646594409714e-06, 1.5844589142943732e-06, 1.6224530554609373e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 6.0, 14.0, 17.0, 15.0, 13.0, 14.0, 23.0, 27.0, 20.0, 38.0, 32.0, 43.0, 45.0, 41.0, 40.0, 52.0, 56.0, 61.0, 44.0, 43.0, 39.0, 39.0, 50.0, 34.0, 37.0, 21.0, 28.0, 26.0, 14.0, 11.0, 10.0, 10.0, 8.0, 3.0, 12.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.834446028529783e-07, -5.638614197778224e-07, -5.442782367026666e-07, -5.246949967840919e-07, -5.051118137089361e-07, -4.855286306337803e-07, -4.6594544755862444e-07, -4.463622644834686e-07, -4.2677905298660335e-07, -4.071958699114475e-07, -3.8761265841458226e-07, -3.680294753394264e-07, -3.484462922642706e-07, -3.2886308076740534e-07, -3.092798976922495e-07, -2.8969668619538425e-07, -2.701135031202284e-07, -2.505303200450726e-07, -2.3094710854820732e-07, -2.113639254730515e-07, -1.9178072818704095e-07, -1.721975309010304e-07, -1.5261434782587457e-07, -1.3303115053986403e-07, -1.1344795325385348e-07, -9.386475596784294e-08, -7.428156578725975e-08, -5.4698372053962885e-08, -3.511517832066602e-08, -1.5531981034655473e-08, 4.0512091459277144e-09, 2.3634399326510902e-08, 4.321759661252145e-08, 6.280079389853199e-08, 8.238398407911518e-08, 1.0196717425969837e-07, 1.215503715457089e-07, 1.4113356883171946e-07, 1.607167519068753e-07, 1.8029994919288583e-07, 1.9988314647889638e-07, 2.1946634376490692e-07, 2.3904954105091747e-07, 2.586327241260733e-07, 2.7821590720122913e-07, 2.977991186980944e-07, 3.173823017732502e-07, 3.369655132701155e-07, 3.565486963452713e-07, 3.7613187942042714e-07, 3.957150909172924e-07, 4.1529827399244823e-07, 4.348814854893135e-07, 4.544646685644693e-07, 4.7404785163962515e-07, 4.93631034714781e-07, 5.132142177899368e-07, 5.327974008650926e-07, 5.523805839402485e-07, 5.719638238588232e-07, 5.91547006933979e-07, 6.111301900091348e-07, 6.307133730842907e-07, 6.502965561594465e-07, 6.698797960780212e-07]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 4.0, 0.0, 3.0, 12.0, 1.0, 16.0, 2.0, 6.0, 44.0, 25.0, 60.0, 41.0, 63.0, 193.0, 269.0, 404.0, 597.0, 684.0, 1003.0, 2257.0, 3473.0, 14801.0, 18680.0, 33742.0, 74793.0, 157868.0, 430100.0, 158359.0, 74669.0, 52367.0, 9237.0, 5568.0, 3525.0, 2271.0, 1030.0, 664.0, 609.0, 666.0, 128.0, 66.0, 79.0, 32.0, 57.0, 29.0, 28.0, 11.0, 4.0, 13.0, 0.0, 10.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9669532775878906e-06, -1.8998980522155762e-06, -1.8328428268432617e-06, -1.7657876014709473e-06, -1.6987323760986328e-06, -1.6316771507263184e-06, -1.564621925354004e-06, -1.4975666999816895e-06, -1.430511474609375e-06, -1.3634562492370605e-06, -1.296401023864746e-06, -1.2293457984924316e-06, -1.1622905731201172e-06, -1.0952353477478027e-06, -1.0281801223754883e-06, -9.611248970031738e-07, -8.940696716308594e-07, -8.270144462585449e-07, -7.599592208862305e-07, -6.92903995513916e-07, -6.258487701416016e-07, -5.587935447692871e-07, -4.917383193969727e-07, -4.246830940246582e-07, -3.5762786865234375e-07, -2.905726432800293e-07, -2.2351741790771484e-07, -1.564621925354004e-07, -8.940696716308594e-08, -2.2351741790771484e-08, 4.470348358154297e-08, 1.1175870895385742e-07, 1.7881393432617188e-07, 2.4586915969848633e-07, 3.129243850708008e-07, 3.7997961044311523e-07, 4.470348358154297e-07, 5.140900611877441e-07, 5.811452865600586e-07, 6.48200511932373e-07, 7.152557373046875e-07, 7.82310962677002e-07, 8.493661880493164e-07, 9.164214134216309e-07, 9.834766387939453e-07, 1.0505318641662598e-06, 1.1175870895385742e-06, 1.1846423149108887e-06, 1.2516975402832031e-06, 1.3187527656555176e-06, 1.385807991027832e-06, 1.4528632164001465e-06, 1.519918441772461e-06, 1.5869736671447754e-06, 1.6540288925170898e-06, 1.7210841178894043e-06, 1.7881393432617188e-06, 1.8551945686340332e-06, 1.9222497940063477e-06, 1.989305019378662e-06, 2.0563602447509766e-06, 2.123415470123291e-06, 2.1904706954956055e-06, 2.25752592086792e-06, 2.3245811462402344e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 199.0, 0.0, 0.0, 0.0, 0.0, 0.0, 265.0, 0.0, 0.0, 0.0, 0.0, 233.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.980232238769531e-07, -2.8777867555618286e-07, -2.775341272354126e-07, -2.6728957891464233e-07, -2.5704503059387207e-07, -2.468004822731018e-07, -2.3655593395233154e-07, -2.2631138563156128e-07, -2.1606683731079102e-07, -2.0582228899002075e-07, -1.955777406692505e-07, -1.8533319234848022e-07, -1.7508864402770996e-07, -1.648440957069397e-07, -1.5459954738616943e-07, -1.4435499906539917e-07, -1.341104507446289e-07, -1.2386590242385864e-07, -1.1362135410308838e-07, -1.0337680578231812e-07, -9.313225746154785e-08, -8.288770914077759e-08, -7.264316082000732e-08, -6.239861249923706e-08, -5.21540641784668e-08, -4.190951585769653e-08, -3.166496753692627e-08, -2.1420419216156006e-08, -1.1175870895385742e-08, -9.313225746154785e-10, 9.313225746154785e-09, 1.955777406692505e-08, 2.9802322387695312e-08, 4.0046870708465576e-08, 5.029141902923584e-08, 6.05359673500061e-08, 7.078051567077637e-08, 8.102506399154663e-08, 9.12696123123169e-08, 1.0151416063308716e-07, 1.1175870895385742e-07, 1.2200325727462769e-07, 1.3224780559539795e-07, 1.424923539161682e-07, 1.5273690223693848e-07, 1.6298145055770874e-07, 1.73225998878479e-07, 1.8347054719924927e-07, 1.9371509552001953e-07, 2.039596438407898e-07, 2.1420419216156006e-07, 2.2444874048233032e-07, 2.3469328880310059e-07, 2.4493783712387085e-07, 2.551823854446411e-07, 2.654269337654114e-07, 2.7567148208618164e-07, 2.859160304069519e-07, 2.9616057872772217e-07, 3.0640512704849243e-07, 3.166496753692627e-07, 3.2689422369003296e-07, 3.371387720108032e-07, 3.473833203315735e-07, 3.5762786865234375e-07]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 6.0, 0.0, 0.0, 23.0, 0.0, 19.0, 0.0, 64.0, 0.0, 0.0, 170.0, 0.0, 280.0, 0.0, 877.0, 0.0, 2151.0, 0.0, 0.0, 5060.0, 0.0, 14281.0, 0.0, 44610.0, 0.0, 0.0, 157181.0, 0.0, 600021.0, 0.0, 156683.0, 0.0, 44487.0, 0.0, 0.0, 14064.0, 0.0, 5199.0, 0.0, 2023.0, 0.0, 0.0, 771.0, 0.0, 297.0, 0.0, 173.0, 0.0, 83.0, 0.0, 0.0, 20.0, 0.0, 16.0, 0.0, 4.0, 0.0, 4.0], "bins": [-8.940696716308594e-07, -8.67992639541626e-07, -8.419156074523926e-07, -8.158385753631592e-07, -7.897615432739258e-07, -7.636845111846924e-07, -7.37607479095459e-07, -7.115304470062256e-07, -6.854534149169922e-07, -6.593763828277588e-07, -6.332993507385254e-07, -6.07222318649292e-07, -5.811452865600586e-07, -5.550682544708252e-07, -5.289912223815918e-07, -5.029141902923584e-07, -4.76837158203125e-07, -4.507601261138916e-07, -4.246830940246582e-07, -3.986060619354248e-07, -3.725290298461914e-07, -3.46451997756958e-07, -3.203749656677246e-07, -2.942979335784912e-07, -2.682209014892578e-07, -2.421438694000244e-07, -2.1606683731079102e-07, -1.8998980522155762e-07, -1.6391277313232422e-07, -1.3783574104309082e-07, -1.1175870895385742e-07, -8.568167686462402e-08, -5.960464477539063e-08, -3.3527612686157227e-08, -7.450580596923828e-09, 1.862645149230957e-08, 4.470348358154297e-08, 7.078051567077637e-08, 9.685754776000977e-08, 1.2293457984924316e-07, 1.4901161193847656e-07, 1.7508864402770996e-07, 2.0116567611694336e-07, 2.2724270820617676e-07, 2.5331974029541016e-07, 2.7939677238464355e-07, 3.0547380447387695e-07, 3.3155083656311035e-07, 3.5762786865234375e-07, 3.8370490074157715e-07, 4.0978193283081055e-07, 4.3585896492004395e-07, 4.6193599700927734e-07, 4.880130290985107e-07, 5.140900611877441e-07, 5.401670932769775e-07, 5.662441253662109e-07, 5.923211574554443e-07, 6.183981895446777e-07, 6.444752216339111e-07, 6.705522537231445e-07, 6.966292858123779e-07, 7.227063179016113e-07, 7.487833499908447e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 105.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 239.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 319.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 237.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.980232238769531e-07, -2.896413207054138e-07, -2.812594175338745e-07, -2.728775143623352e-07, -2.644956111907959e-07, -2.561137080192566e-07, -2.477318048477173e-07, -2.39349901676178e-07, -2.3096799850463867e-07, -2.2258609533309937e-07, -2.1420419216156006e-07, -2.0582228899002075e-07, -1.9744038581848145e-07, -1.8905848264694214e-07, -1.8067657947540283e-07, -1.7229467630386353e-07, -1.6391277313232422e-07, -1.555308699607849e-07, -1.471489667892456e-07, -1.387670636177063e-07, -1.30385160446167e-07, -1.2200325727462769e-07, -1.1362135410308838e-07, -1.0523945093154907e-07, -9.685754776000977e-08, -8.847564458847046e-08, -8.009374141693115e-08, -7.171183824539185e-08, -6.332993507385254e-08, -5.494803190231323e-08, -4.6566128730773926e-08, -3.818422555923462e-08, -2.9802322387695312e-08, -2.1420419216156006e-08, -1.30385160446167e-08, -4.6566128730773926e-09, 3.725290298461914e-09, 1.210719347000122e-08, 2.0489096641540527e-08, 2.8870999813079834e-08, 3.725290298461914e-08, 4.563480615615845e-08, 5.4016709327697754e-08, 6.239861249923706e-08, 7.078051567077637e-08, 7.916241884231567e-08, 8.754432201385498e-08, 9.592622518539429e-08, 1.043081283569336e-07, 1.126900315284729e-07, 1.210719347000122e-07, 1.2945383787155151e-07, 1.3783574104309082e-07, 1.4621764421463013e-07, 1.5459954738616943e-07, 1.6298145055770874e-07, 1.7136335372924805e-07, 1.7974525690078735e-07, 1.8812716007232666e-07, 1.9650906324386597e-07, 2.0489096641540527e-07, 2.1327286958694458e-07, 2.2165477275848389e-07, 2.300366759300232e-07, 2.384185791015625e-07]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 6.0, 7.0, 3.0, 5.0, 8.0, 12.0, 10.0, 13.0, 24.0, 22.0, 33.0, 52.0, 70.0, 110.0, 195.0, 138.0, 87.0, 55.0, 36.0, 37.0, 19.0, 15.0, 14.0, 10.0, 9.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.910504677965946e-07, -7.699920274717442e-07, -7.489335871468938e-07, -7.278751468220435e-07, -7.068167064971931e-07, -6.857582661723427e-07, -6.646997690040735e-07, -6.436413286792231e-07, -6.225828883543727e-07, -6.015244480295223e-07, -5.804660077046719e-07, -5.594075673798216e-07, -5.383491270549712e-07, -5.172906867301208e-07, -4.962322464052704e-07, -4.751737776587106e-07, -4.5411536575556966e-07, -4.330569254307193e-07, -4.119984851058689e-07, -3.909400447810185e-07, -3.6988160445616813e-07, -3.4882316413131775e-07, -3.2776469538475794e-07, -3.0670625505990756e-07, -2.856478147350572e-07, -2.645893744102068e-07, -2.435309340853564e-07, -2.2247247954965133e-07, -2.0141403922480094e-07, -1.8035559889995056e-07, -1.5929714436424547e-07, -1.382387040393951e-07, -1.1718026371454471e-07, -9.612182338969433e-08, -7.506337595941659e-08, -5.400492852913885e-08, -3.294648820428847e-08, -1.188804787943809e-08, 9.170406656267005e-09, 3.0228846981117385e-08, 5.1287287305967766e-08, 7.234572763081815e-08, 9.340417506109588e-08, 1.1446262249137362e-07, 1.35521062816224e-07, 1.5657950314107438e-07, 1.7763795767677948e-07, 1.9869639800162986e-07, 2.1975483832648024e-07, 2.408132786513306e-07, 2.61871718976181e-07, 2.829301593010314e-07, 3.0398859962588176e-07, 3.2504703995073214e-07, 3.4610550869729195e-07, 3.6716394902214233e-07, 3.882223893469927e-07, 4.092808296718431e-07, 4.303392699966935e-07, 4.513977387432533e-07, 4.7245617906810367e-07, 4.93514619392954e-07, 5.145730597178044e-07, 5.356315000426548e-07, 5.566899403675052e-07]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 5.0, 10.0, 8.0, 8.0, 19.0, 13.0, 21.0, 15.0, 15.0, 15.0, 28.0, 40.0, 39.0, 26.0, 47.0, 54.0, 29.0, 55.0, 49.0, 44.0, 63.0, 38.0, 27.0, 37.0, 36.0, 25.0, 40.0, 26.0, 25.0, 25.0, 31.0, 14.0, 15.0, 8.0, 9.0, 14.0, 7.0, 10.0, 7.0, 0.0, 7.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.668282317903504e-07, -3.549787663814641e-07, -3.431293293942872e-07, -3.312798639854009e-07, -3.1943039857651456e-07, -3.0758093316762825e-07, -2.9573149618045136e-07, -2.8388203077156504e-07, -2.7203259378438815e-07, -2.6018312837550184e-07, -2.4833369138832495e-07, -2.3648422597943863e-07, -2.2463476057055232e-07, -2.1278530937252071e-07, -2.009358581744891e-07, -1.890863927656028e-07, -1.7723692735671648e-07, -1.6538747615868488e-07, -1.5353801074979856e-07, -1.4168855955176696e-07, -1.2983909414288064e-07, -1.1798964294484904e-07, -1.0614019174681744e-07, -9.429073344335848e-08, -8.244127513989952e-08, -7.059181683644056e-08, -5.8742362085695277e-08, -4.6892907334949996e-08, -3.5043449031491036e-08, -2.3193990728032077e-08, -1.1344539530000475e-08, 5.049187734584848e-10, 1.2354348655208014e-08, 2.4203805182310134e-08, 3.6053261709412254e-08, 4.7902716460157535e-08, 5.97521747636165e-08, 7.160163306707545e-08, 8.345108426510706e-08, 9.530054256856602e-08, 1.0715000087202498e-07, 1.1899945917548393e-07, 1.308489174789429e-07, 1.426983686769745e-07, 1.545478198750061e-07, 1.6639728528389242e-07, 1.7824673648192402e-07, 1.9009618767995562e-07, 2.0194565308884194e-07, 2.1379510428687354e-07, 2.2564456969575986e-07, 2.3749402089379146e-07, 2.493434863026778e-07, 2.611929517115641e-07, 2.73042388698741e-07, 2.848918541076273e-07, 2.967412910948042e-07, 3.085907565036905e-07, 3.204401934908674e-07, 3.322896588997537e-07, 3.4413912430864e-07, 3.559885612958169e-07, 3.678380267047032e-07, 3.7968749211358954e-07, 3.9153695752247586e-07]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 26.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.0, 0.0, 0.0, 0.0, 0.0, 158.0, 0.0, 0.0, 0.0, 0.0, 0.0, 312.0, 0.0, 0.0, 0.0, 0.0, 0.0, 612.0, 0.0, 0.0, 0.0, 0.0, 0.0, 768.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1222.0, 0.0, 0.0, 0.0, 0.0, 4191050.0], "bins": [-6.556510925292969e-07, -6.454065442085266e-07, -6.351619958877563e-07, -6.249174475669861e-07, -6.146728992462158e-07, -6.044283509254456e-07, -5.941838026046753e-07, -5.83939254283905e-07, -5.736947059631348e-07, -5.634501576423645e-07, -5.532056093215942e-07, -5.42961061000824e-07, -5.327165126800537e-07, -5.224719643592834e-07, -5.122274160385132e-07, -5.019828677177429e-07, -4.917383193969727e-07, -4.814937710762024e-07, -4.7124922275543213e-07, -4.6100467443466187e-07, -4.507601261138916e-07, -4.4051557779312134e-07, -4.302710294723511e-07, -4.200264811515808e-07, -4.0978193283081055e-07, -3.995373845100403e-07, -3.8929283618927e-07, -3.7904828786849976e-07, -3.688037395477295e-07, -3.5855919122695923e-07, -3.4831464290618896e-07, -3.380700945854187e-07, -3.2782554626464844e-07, -3.175809979438782e-07, -3.073364496231079e-07, -2.9709190130233765e-07, -2.868473529815674e-07, -2.766028046607971e-07, -2.6635825634002686e-07, -2.561137080192566e-07, -2.4586915969848633e-07, -2.3562461137771606e-07, -2.253800630569458e-07, -2.1513551473617554e-07, -2.0489096641540527e-07, -1.94646418094635e-07, -1.8440186977386475e-07, -1.7415732145309448e-07, -1.6391277313232422e-07, -1.5366822481155396e-07, -1.434236764907837e-07, -1.3317912817001343e-07, -1.2293457984924316e-07, -1.126900315284729e-07, -1.0244548320770264e-07, -9.220093488693237e-08, -8.195638656616211e-08, -7.171183824539185e-08, -6.146728992462158e-08, -5.122274160385132e-08, -4.0978193283081055e-08, -3.073364496231079e-08, -2.0489096641540527e-08, -1.0244548320770264e-08, 0.0]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1022.0], "bins": [-5.960464477539063e-08, -5.8673322200775146e-08, -5.774199962615967e-08, -5.681067705154419e-08, -5.587935447692871e-08, -5.494803190231323e-08, -5.4016709327697754e-08, -5.3085386753082275e-08, -5.21540641784668e-08, -5.122274160385132e-08, -5.029141902923584e-08, -4.936009645462036e-08, -4.842877388000488e-08, -4.7497451305389404e-08, -4.6566128730773926e-08, -4.563480615615845e-08, -4.470348358154297e-08, -4.377216100692749e-08, -4.284083843231201e-08, -4.190951585769653e-08, -4.0978193283081055e-08, -4.0046870708465576e-08, -3.91155481338501e-08, -3.818422555923462e-08, -3.725290298461914e-08, -3.632158041000366e-08, -3.5390257835388184e-08, -3.4458935260772705e-08, -3.3527612686157227e-08, -3.259629011154175e-08, -3.166496753692627e-08, -3.073364496231079e-08, -2.9802322387695312e-08, -2.8870999813079834e-08, -2.7939677238464355e-08, -2.7008354663848877e-08, -2.60770320892334e-08, -2.514570951461792e-08, -2.421438694000244e-08, -2.3283064365386963e-08, -2.2351741790771484e-08, -2.1420419216156006e-08, -2.0489096641540527e-08, -1.955777406692505e-08, -1.862645149230957e-08, -1.7695128917694092e-08, -1.6763806343078613e-08, -1.5832483768463135e-08, -1.4901161193847656e-08, -1.3969838619232178e-08, -1.30385160446167e-08, -1.210719347000122e-08, -1.1175870895385742e-08, -1.0244548320770264e-08, -9.313225746154785e-09, -8.381903171539307e-09, -7.450580596923828e-09, -6.51925802230835e-09, -5.587935447692871e-09, -4.6566128730773926e-09, -3.725290298461914e-09, -2.7939677238464355e-09, -1.862645149230957e-09, -9.313225746154785e-10, 0.0]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4096.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 2.0, 1.0, 2.0, 3.0, 6.0, 10.0, 9.0, 9.0, 8.0, 15.0, 17.0, 17.0, 14.0, 22.0, 33.0, 58.0, 63.0, 108.0, 127.0, 97.0, 98.0, 49.0, 45.0, 38.0, 23.0, 18.0, 23.0, 17.0, 12.0, 7.0, 7.0, 5.0, 3.0, 9.0, 3.0, 4.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1229239517169844e-08, -4.950540599679698e-08, -4.778157247642412e-08, -4.605773895605125e-08, -4.433390543567839e-08, -4.2610071915305525e-08, -4.088623839493266e-08, -3.91624048745598e-08, -3.7438571354186934e-08, -3.571473783381407e-08, -3.3990904313441206e-08, -3.226707079306834e-08, -3.054323727269548e-08, -2.8819403752322614e-08, -2.709557023194975e-08, -2.5371736711576887e-08, -2.3647903191204023e-08, -2.192406967083116e-08, -2.0200236150458295e-08, -1.847640263008543e-08, -1.6752569109712567e-08, -1.5028735589339703e-08, -1.330490206896684e-08, -1.1581068548593976e-08, -9.857235028221112e-09, -8.133401507848248e-09, -6.409567987475384e-09, -4.68573446710252e-09, -2.9619009467296564e-09, -1.2380674263567926e-09, 4.857660940160713e-10, 2.209599614388935e-09, 3.93342958204812e-09, 5.657263102420984e-09, 7.381096622793848e-09, 9.104930143166712e-09, 1.0828763663539576e-08, 1.255259718391244e-08, 1.4276430704285303e-08, 1.6000264224658167e-08, 1.772409774503103e-08, 1.9447931265403895e-08, 2.117176478577676e-08, 2.2895598306149623e-08, 2.4619431826522487e-08, 2.634326534689535e-08, 2.8067098867268214e-08, 2.9790932387641078e-08, 3.151476590801394e-08, 3.3238599428386806e-08, 3.496243294875967e-08, 3.6686266469132534e-08, 3.84100999895054e-08, 4.013393350987826e-08, 4.1857767030251125e-08, 4.358160055062399e-08, 4.530543407099685e-08, 4.7029267591369717e-08, 4.875310111174258e-08, 5.0476934632115444e-08, 5.220076815248831e-08, 5.392460167286117e-08, 5.5648435193234036e-08, 5.73722687136069e-08, 5.9096102233979764e-08]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 11.0, 9.0, 17.0, 12.0, 19.0, 13.0, 22.0, 13.0, 29.0, 36.0, 35.0, 31.0, 46.0, 54.0, 38.0, 40.0, 58.0, 50.0, 60.0, 40.0, 27.0, 36.0, 39.0, 29.0, 35.0, 33.0, 22.0, 26.0, 25.0, 17.0, 14.0, 11.0, 10.0, 11.0, 9.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.400312292318631e-08, -4.255564078903262e-08, -4.1108155102165256e-08, -3.966067296801157e-08, -3.82131872811442e-08, -3.676570514699051e-08, -3.5318223012836825e-08, -3.387073732596946e-08, -3.242325163910209e-08, -3.09757695049484e-08, -2.9528283818081036e-08, -2.8080801683927348e-08, -2.663331599705998e-08, -2.5185833862906293e-08, -2.3738349952395765e-08, -2.2290866041885238e-08, -2.084338390773155e-08, -1.9395899997221022e-08, -1.7948416086710495e-08, -1.6500933952556807e-08, -1.505344826568944e-08, -1.3605965243357332e-08, -1.2158482221025224e-08, -1.0710998310514697e-08, -9.263514400004169e-09, -7.816030489493642e-09, -6.368547023072324e-09, -4.921063556651006e-09, -3.473579646140479e-09, -2.0260957356299514e-09, -5.786127132978436e-10, 8.688711972126839e-10, 2.31635866043689e-09, 3.763842570947418e-09, 5.211326037368735e-09, 6.658809503790053e-09, 8.10629341430058e-09, 9.553777324811108e-09, 1.1001260347143216e-08, 1.2448744257653743e-08, 1.389622816816427e-08, 1.5343712078674798e-08, 1.6791195989185326e-08, 1.8238679899695853e-08, 1.968616203384954e-08, 2.1133647720716908e-08, 2.2581129854870596e-08, 2.4028613765381124e-08, 2.547609767589165e-08, 2.692358158640218e-08, 2.8371065496912706e-08, 2.9818547631066394e-08, 3.126603331793376e-08, 3.271351545208745e-08, 3.416099758624114e-08, 3.5608483273108504e-08, 3.705596895997587e-08, 3.850345109412956e-08, 3.9950936780996926e-08, 4.1398418915150614e-08, 4.284590460201798e-08, 4.429338673617167e-08, 4.574086887032536e-08, 4.7188354557192724e-08, 4.863583669134641e-08]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 416.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1047724.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 408.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1020.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 7.0, 7.0, 4.0, 3.0, 7.0, 10.0, 13.0, 10.0, 14.0, 20.0, 24.0, 29.0, 43.0, 55.0, 82.0, 122.0, 147.0, 98.0, 63.0, 47.0, 46.0, 29.0, 14.0, 17.0, 10.0, 9.0, 15.0, 11.0, 7.0, 7.0, 4.0, 7.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.651341794532527e-08, -5.481421894160121e-08, -5.311502349059083e-08, -5.141582448686677e-08, -4.971662548314271e-08, -4.8017430032132324e-08, -4.631823102840826e-08, -4.461903557739788e-08, -4.291983657367382e-08, -4.122063756994976e-08, -3.9521442118939376e-08, -3.7822243115215315e-08, -3.6123044111491254e-08, -3.442384866048087e-08, -3.272464965675681e-08, -3.102545065303275e-08, -2.9326253425665527e-08, -2.7627056198298305e-08, -2.5927857194574244e-08, -2.4228659967207022e-08, -2.25294627398398e-08, -2.083026373611574e-08, -1.9131066508748518e-08, -1.7431869281381296e-08, -1.5732670277657235e-08, -1.4033472162111593e-08, -1.2334274934744371e-08, -1.063507681919873e-08, -8.935879591831508e-09, -7.236681476285867e-09, -5.537483360740225e-09, -3.838286133373003e-09, -2.1390889060057816e-09, -4.398911235270475e-10, 1.2593066589516866e-09, 2.958504552452723e-09, 4.657702223909155e-09, 6.3568998953655864e-09, 8.056098010911228e-09, 9.75529523827845e-09, 1.1454493353824091e-08, 1.3153691469369733e-08, 1.4852888696736954e-08, 1.6552085924104176e-08, 1.8251284927828237e-08, 1.995048215519546e-08, 2.164967938256268e-08, 2.3348878386286742e-08, 2.5048075613653964e-08, 2.6747272841021186e-08, 2.8446471844745247e-08, 3.014567084846931e-08, 3.184486629947969e-08, 3.354406530320375e-08, 3.5243260754214134e-08, 3.6942459757938195e-08, 3.8641658761662256e-08, 4.034085776538632e-08, 4.20400532163967e-08, 4.373925222012076e-08, 4.543845122384482e-08, 4.7137646674855205e-08, 4.8836845678579266e-08, 5.053604468230333e-08, 5.223524013331371e-08]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 14.0, 8.0, 17.0, 12.0, 20.0, 13.0, 21.0, 15.0, 26.0, 33.0, 41.0, 32.0, 46.0, 54.0, 37.0, 42.0, 54.0, 52.0, 60.0, 39.0, 31.0, 31.0, 34.0, 35.0, 32.0, 35.0, 24.0, 25.0, 24.0, 19.0, 13.0, 11.0, 8.0, 13.0, 9.0, 5.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.104957795902919e-08, -3.969759632127534e-08, -3.834561468352149e-08, -3.699363304576764e-08, -3.5641651408013786e-08, -3.4289669770259934e-08, -3.2937684579792403e-08, -3.158570294203855e-08, -3.02337213042847e-08, -2.8881739666530848e-08, -2.7529758028776996e-08, -2.6177776391023144e-08, -2.4825792976912453e-08, -2.34738113391586e-08, -2.212182970140475e-08, -2.0769846287294058e-08, -1.9417866425897046e-08, -1.8065884788143194e-08, -1.6713903150389342e-08, -1.536191973627865e-08, -1.4009938098524799e-08, -1.2657956460770947e-08, -1.1305974823017095e-08, -9.953992297084824e-09, -8.602010659330972e-09, -7.25002857748791e-09, -5.898046495644849e-09, -4.546064857890997e-09, -3.194082776047935e-09, -1.8421006942048734e-09, -4.901190564510216e-10, 8.618634694812499e-10, 2.2138451072351018e-09, 3.5658271890781634e-09, 4.917809270921225e-09, 6.269790908675077e-09, 7.621773434607348e-09, 8.9737550723612e-09, 1.0325736710115052e-08, 1.1677719236047324e-08, 1.3029700873801175e-08, 1.4381682511555027e-08, 1.57336650374873e-08, 1.708564667524115e-08, 1.8437628312995002e-08, 1.9789609950748854e-08, 2.1141591588502706e-08, 2.2493575002613397e-08, 2.384555664036725e-08, 2.51975382781211e-08, 2.6549519915874953e-08, 2.7901503329985644e-08, 2.9253484967739496e-08, 3.060546660549335e-08, 3.19574482432472e-08, 3.330942988100105e-08, 3.46614115187549e-08, 3.6013393156508755e-08, 3.736537479426261e-08, 3.871735643201646e-08, 4.006933806977031e-08, 4.142132326023784e-08, 4.2773301345278014e-08, 4.4125286535745545e-08, 4.5477268173499397e-08]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 9.0, 10.0, 18.0, 15.0, 16.0, 25.0, 39.0, 47.0, 93.0, 168.0, 202.0, 101.0, 68.0, 49.0, 40.0, 25.0, 18.0, 12.0, 12.0, 6.0, 6.0, 4.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.375671025513839e-08, -4.257916330629996e-08, -4.1401619910175214e-08, -4.022407296133679e-08, -3.904652601249836e-08, -3.7868979063659935e-08, -3.669143211482151e-08, -3.551388871869676e-08, -3.4336341769858336e-08, -3.315879482101991e-08, -3.198125142489516e-08, -3.080370447605674e-08, -2.962615752721831e-08, -2.8448610578379885e-08, -2.7271065405898298e-08, -2.609352023341671e-08, -2.4915973284578286e-08, -2.373842633573986e-08, -2.2560881163258273e-08, -2.1383335990776686e-08, -2.020578904193826e-08, -1.9028242093099834e-08, -1.7850696920618248e-08, -1.667315174813666e-08, -1.5495604799298235e-08, -1.4318058738638229e-08, -1.3140512677978222e-08, -1.1962966617318216e-08, -1.078542055665821e-08, -9.607874495998203e-09, -8.430328435338197e-09, -7.2527823746781905e-09, -6.075232761304505e-09, -4.897686700644499e-09, -3.7201406399844927e-09, -2.5425945793244864e-09, -1.36504851866448e-09, -1.8750245800447374e-10, 9.900436026555326e-10, 2.167589663315539e-09, 3.3451357239755453e-09, 4.522681784635552e-09, 5.700227845295558e-09, 6.877773905955564e-09, 8.05531996661557e-09, 9.232866027275577e-09, 1.0410412087935583e-08, 1.158795814859559e-08, 1.2765504209255596e-08, 1.3943050269915602e-08, 1.512059633057561e-08, 1.6298141503057195e-08, 1.747568845189562e-08, 1.8653235400734047e-08, 1.9830780573215634e-08, 2.100832574569722e-08, 2.2185872694535647e-08, 2.3363419643374073e-08, 2.454096481585566e-08, 2.5718509988337246e-08, 2.6896056937175672e-08, 2.8073603886014098e-08, 2.9251149058495685e-08, 3.042869423097727e-08, 3.16062411798157e-08]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 7.0, 12.0, 14.0, 12.0, 14.0, 22.0, 13.0, 21.0, 21.0, 32.0, 40.0, 32.0, 41.0, 52.0, 45.0, 36.0, 61.0, 51.0, 62.0, 44.0, 36.0, 31.0, 31.0, 40.0, 31.0, 32.0, 27.0, 23.0, 27.0, 19.0, 15.0, 11.0, 8.0, 9.0, 10.0, 6.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1673029593216597e-08, -2.098673590467115e-08, -2.0300443992482542e-08, -1.9614150303937095e-08, -1.8927858391748487e-08, -1.824156470320304e-08, -1.755527279101443e-08, -1.6868979102468984e-08, -1.6182685413923537e-08, -1.549639172537809e-08, -1.4810099813189481e-08, -1.4123806124644034e-08, -1.3437514212455426e-08, -1.2751220523909979e-08, -1.2064927723542951e-08, -1.1378634923175923e-08, -1.0692343010987315e-08, -1.0006050210620288e-08, -9.31975741025326e-09, -8.633463721707813e-09, -7.947171809519205e-09, -7.260878565062967e-09, -6.5745853206067295e-09, -5.888292520239702e-09, -5.201999719872674e-09, -4.5157069195056465e-09, -3.829414119138619e-09, -3.1431208746823813e-09, -2.4568280743153537e-09, -1.770535273948326e-09, -1.0842420294920885e-09, -3.979492291250608e-10, 2.8834179488512746e-10, 9.746347062744576e-10, 1.6609276176637877e-09, 2.3472206400754203e-09, 3.033513440442448e-09, 3.7198062408094756e-09, 4.406099485265713e-09, 5.092392285632741e-09, 5.7786850859997685e-09, 6.464977886366796e-09, 7.151270686733824e-09, 7.837563487100851e-09, 8.523857175646299e-09, 9.210149087834907e-09, 9.896442776380354e-09, 1.0582735576747382e-08, 1.126902837711441e-08, 1.1955321177481437e-08, 1.2641613977848465e-08, 1.3327907666393912e-08, 1.401419957858252e-08, 1.4700493267127968e-08, 1.5386785179316576e-08, 1.6073078867862023e-08, 1.675937255640747e-08, 1.7445666244952918e-08, 1.8131958157141526e-08, 1.8818251845686973e-08, 1.950454375787558e-08, 2.0190837446421028e-08, 2.0877131134966476e-08, 2.1563423047155084e-08, 2.224971495934369e-08]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4096.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 7.0, 6.0, 8.0, 11.0, 18.0, 16.0, 19.0, 36.0, 38.0, 37.0, 72.0, 99.0, 147.0, 133.0, 92.0, 64.0, 56.0, 28.0, 32.0, 15.0, 19.0, 9.0, 11.0, 6.0, 4.0, 1.0, 3.0, 3.0, 2.0, 5.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4245914448096642e-09, -1.3711008994832241e-09, -1.3176102431344816e-09, -1.2641196978080416e-09, -1.2106291524816015e-09, -1.157138496132859e-09, -1.103647950806419e-09, -1.0501572944576765e-09, -9.966667491312364e-10, -9.431762038047964e-10, -8.896855474560539e-10, -8.361950021296138e-10, -7.827044012920226e-10, -7.292138004544313e-10, -6.757232551279913e-10, -6.222326542904e-10, -5.687420534528087e-10, -5.152514526152174e-10, -4.6176087953320177e-10, -4.082703064511861e-10, -3.5477970561359484e-10, -3.0128910477600357e-10, -2.477985316939879e-10, -1.9430795861197225e-10, -1.4081735777438098e-10, -8.732677081457751e-11, -3.383618385477405e-11, 1.9654403105029417e-11, 7.314499006483288e-11, 1.2663559090242416e-10, 1.8012616398443981e-10, 2.3361673706645547e-10, 2.871072268817443e-10, 3.4059782771933556e-10, 3.940884008013512e-10, 4.4757897388336687e-10, 5.010695747209581e-10, 5.545601755585494e-10, 6.080507208849895e-10, 6.615413217225807e-10, 7.15031922560172e-10, 7.685225233977633e-10, 8.220131242353546e-10, 8.755036695617946e-10, 9.289942703993859e-10, 9.824848712369771e-10, 1.0359754165634172e-09, 1.0894660729121597e-09, 1.1429566182385997e-09, 1.1964471635650398e-09, 1.2499378199137823e-09, 1.3034283652402223e-09, 1.3569190215889648e-09, 1.4104095669154049e-09, 1.463900112241845e-09, 1.517390657568285e-09, 1.5708813139170275e-09, 1.6243718592434675e-09, 1.67786251559221e-09, 1.73135306091865e-09, 1.78484360624509e-09, 1.8383342625938326e-09, 1.891824918942575e-09, 1.945315464269015e-09, 1.998806009595455e-09]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 0.0, 5.0, 4.0, 6.0, 14.0, 7.0, 21.0, 15.0, 13.0, 20.0, 19.0, 25.0, 35.0, 35.0, 28.0, 49.0, 51.0, 47.0, 39.0, 59.0, 60.0, 52.0, 46.0, 32.0, 35.0, 32.0, 35.0, 28.0, 33.0, 28.0, 23.0, 27.0, 20.0, 9.0, 8.0, 10.0, 5.0, 10.0, 8.0, 3.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1960727963611362e-09, -1.1566636537452268e-09, -1.117254400107015e-09, -1.0778452574911057e-09, -1.038436003852894e-09, -9.990268612369846e-10, -9.596176075987728e-10, -9.202084649828635e-10, -8.807992113446517e-10, -8.413900132175911e-10, -8.019808150905305e-10, -7.6257161696347e-10, -7.231624188364094e-10, -6.837532207093489e-10, -6.443440225822883e-10, -6.04934879966379e-10, -5.655256818393184e-10, -5.261164837122578e-10, -4.867072855851973e-10, -4.472980874581367e-10, -4.0788888933107614e-10, -3.684796912040156e-10, -3.2907052083253063e-10, -2.8966132270547007e-10, -2.502521245784095e-10, -2.1084292645134894e-10, -1.7143372832428838e-10, -1.3202454407501563e-10, -9.261534594795506e-11, -5.32061478208945e-11, -1.3796963571621745e-11, 2.5612234555438818e-11, 6.502143268249938e-11, 1.0443063080955994e-10, 1.438398289366205e-10, 1.8324901318589326e-10, 2.2265821131295382e-10, 2.620674233178022e-10, 3.0147659368928714e-10, 3.408857918163477e-10, 3.8029498994340827e-10, 4.1970418807046883e-10, 4.591133861975294e-10, 4.985225565690143e-10, 5.379317546960749e-10, 5.773409528231355e-10, 6.16750150950196e-10, 6.561593490772566e-10, 6.955685472043172e-10, 7.349777453313777e-10, 7.743869434584383e-10, 8.137961415854988e-10, 8.532053397125594e-10, 8.9261453783962e-10, 9.320236804555293e-10, 9.71432934093741e-10, 1.0108420767096504e-09, 1.0502512193255598e-09, 1.0896604729637716e-09, 1.1290696155796809e-09, 1.1684788692178927e-09, 1.207888011833802e-09, 1.2472972654720138e-09, 1.2867064080879231e-09, 1.326115661726135e-09]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 3.0, 0.0, 4.0, 4.0, 5.0, 10.0, 11.0, 6.0, 10.0, 11.0, 28.0, 29.0, 35.0, 49.0, 53.0, 101.0, 128.0, 123.0, 109.0, 89.0, 53.0, 39.0, 22.0, 13.0, 11.0, 19.0, 12.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5629708638442708e-09, -1.5170935618868953e-09, -1.4712161489072173e-09, -1.4253387359275393e-09, -1.3794614339701639e-09, -1.3335841320127884e-09, -1.2877067190331104e-09, -1.2418293060534324e-09, -1.195952004096057e-09, -1.1500747021386815e-09, -1.1041972891590035e-09, -1.0583198761793255e-09, -1.01244257422195e-09, -9.665652722645746e-10, -9.206878592848966e-10, -8.748105018163699e-10, -8.289331443478432e-10, -7.830557868793164e-10, -7.371784294107897e-10, -6.91301071942263e-10, -6.454237144737363e-10, -5.995463570052095e-10, -5.536689995366828e-10, -5.077916420681561e-10, -4.6191428459962935e-10, -4.1603692713110263e-10, -3.701595696625759e-10, -3.242822121940492e-10, -2.7840485472552245e-10, -2.3252749725699573e-10, -1.86650139788469e-10, -1.4077278231994228e-10, -9.489542485141556e-11, -4.901806738288883e-11, -3.1407099143621053e-12, 4.273664755416462e-11, 8.861400502269134e-11, 1.3449136249121807e-10, 1.803687199597448e-10, 2.2624607742827152e-10, 2.7212343489679824e-10, 3.1800079236532497e-10, 3.638781498338517e-10, 4.097555073023784e-10, 4.5563286477090514e-10, 5.015102222394319e-10, 5.473875797079586e-10, 5.932649371764853e-10, 6.39142294645012e-10, 6.850196521135388e-10, 7.308970095820655e-10, 7.767743670505922e-10, 8.226517245191189e-10, 8.685290819876457e-10, 9.144064394561724e-10, 9.602838524358503e-10, 1.0061611543932258e-09, 1.0520384563506013e-09, 1.0979158693302793e-09, 1.1437932823099572e-09, 1.1896705842673327e-09, 1.2355478862247082e-09, 1.2814252992043862e-09, 1.3273027121840641e-09, 1.3731800141414396e-09]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 12.0, 9.0, 17.0, 14.0, 16.0, 14.0, 20.0, 19.0, 30.0, 38.0, 28.0, 29.0, 52.0, 44.0, 52.0, 56.0, 38.0, 65.0, 46.0, 46.0, 37.0, 27.0, 30.0, 35.0, 30.0, 33.0, 30.0, 26.0, 21.0, 17.0, 11.0, 7.0, 10.0, 6.0, 10.0, 8.0, 2.0, 4.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.002027461005639e-09, -9.687313173856182e-10, -9.354351737655975e-10, -9.021389746344255e-10, -8.688427755032535e-10, -8.355466318832327e-10, -8.02250488263212e-10, -7.689543446431912e-10, -7.356581455120192e-10, -7.023620018919985e-10, -6.690658027608265e-10, -6.357696591408057e-10, -6.02473515520785e-10, -5.69177316389613e-10, -5.358811727695922e-10, -5.025849736384203e-10, -4.692888300183995e-10, -4.359926586428031e-10, -4.0269648726720675e-10, -3.69400343647186e-10, -3.361041722715896e-10, -3.0280800089599325e-10, -2.695118572759725e-10, -2.362156859003761e-10, -2.0291951452477974e-10, -1.6962334314918337e-10, -1.363271856513748e-10, -1.0303102121467234e-10, -6.973485677796987e-11, -3.6438685402373494e-11, -3.142527904564929e-12, 3.0153629593243636e-11, 6.344991199114247e-11, 9.674607642784494e-11, 1.300422408645474e-10, 1.6333839836235597e-10, 1.9663456973795235e-10, 2.2993074111354872e-10, 2.632268847335695e-10, 2.9652305610916585e-10, 3.298192274847622e-10, 3.631153988603586e-10, 3.9641157023595497e-10, 4.2970771385597573e-10, 4.630038852315721e-10, 4.963000566071685e-10, 5.295962002271892e-10, 5.628923993583612e-10, 5.96188542978382e-10, 6.294846865984027e-10, 6.627808857295747e-10, 6.960770293495955e-10, 7.293732284807675e-10, 7.626693721007882e-10, 7.95965515720809e-10, 8.292616593408297e-10, 8.625578584720017e-10, 8.958540020920225e-10, 9.291502012231945e-10, 9.624463448432152e-10, 9.95742488463236e-10, 1.0290386320832567e-09, 1.06233488672558e-09, 1.0956310303456007e-09, 1.1289271739656215e-09]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 9.0, 9.0, 11.0, 7.0, 12.0, 26.0, 24.0, 33.0, 41.0, 65.0, 88.0, 125.0, 150.0, 105.0, 67.0, 52.0, 26.0, 22.0, 23.0, 20.0, 18.0, 8.0, 4.0, 11.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.239785910189255e-10, -6.0327309814312e-10, -5.825676607784658e-10, -5.618621679026603e-10, -5.411567305380061e-10, -5.204512376622006e-10, -4.997458002975463e-10, -4.790403074217409e-10, -4.58334842301511e-10, -4.3762937718128114e-10, -4.169239120610513e-10, -3.962184469408214e-10, -3.7551295406501595e-10, -3.548075167003617e-10, -3.3410202382455623e-10, -3.1339655870432637e-10, -2.926910935840965e-10, -2.7198562846386665e-10, -2.512801633436368e-10, -2.3057468434561912e-10, -2.0986921922538926e-10, -1.891637541051594e-10, -1.6845827510714173e-10, -1.4775280998691187e-10, -1.27047344866682e-10, -1.0634187974645215e-10, -8.563640768732839e-11, -6.493093562820462e-11, -4.422547050797476e-11, -2.3520005387744902e-11, -2.8145263897272343e-12, 1.7890938730502626e-11, 3.8596348339581255e-11, 5.930181345981111e-11, 8.000728551893488e-11, 1.0071275757805864e-10, 1.214182226982885e-10, 1.4212368781851836e-10, 1.6282916681653603e-10, 1.835346319367659e-10, 2.0424009705699575e-10, 2.249455621772256e-10, 2.4565102729745547e-10, 2.6635649241768533e-10, 2.870619852934908e-10, 3.0776742265814505e-10, 3.2847291553395053e-10, 3.491783806541804e-10, 3.6988384577441025e-10, 3.905893108946401e-10, 4.1129477601486997e-10, 4.3200026889067544e-10, 4.527057062553297e-10, 4.734111991311352e-10, 4.941166364957894e-10, 5.148221293715949e-10, 5.355276222474004e-10, 5.562331151232058e-10, 5.769385524878601e-10, 5.976440453636656e-10, 6.183494827283198e-10, 6.390549756041253e-10, 6.597604684799308e-10, 6.80465905844585e-10, 7.011713432092392e-10]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 3.0, 5.0, 8.0, 12.0, 14.0, 18.0, 15.0, 20.0, 17.0, 17.0, 40.0, 35.0, 32.0, 40.0, 57.0, 49.0, 59.0, 50.0, 61.0, 56.0, 45.0, 46.0, 25.0, 31.0, 38.0, 33.0, 33.0, 28.0, 30.0, 13.0, 19.0, 7.0, 7.0, 7.0, 10.0, 10.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.129451308150124e-10, -4.97073104899215e-10, -4.812010234722663e-10, -4.6532899755646895e-10, -4.4945697164067155e-10, -4.3358491796929854e-10, -4.1771286429792553e-10, -4.0184083838212814e-10, -3.8596878471075513e-10, -3.700967310393821e-10, -3.5422470512358473e-10, -3.383526514522117e-10, -3.224805977808387e-10, -3.066085718650413e-10, -2.907365181936683e-10, -2.748644645222953e-10, -2.589924386064979e-10, -2.431203849351249e-10, -2.272483590193275e-10, -2.1137630534795449e-10, -1.9550426555436928e-10, -1.7963222576078408e-10, -1.6376017208941107e-10, -1.4788813229582587e-10, -1.3201609250224067e-10, -1.1614405270865547e-10, -1.0027200597617636e-10, -8.439995924369725e-11, -6.852791945011205e-11, -5.265587965652685e-11, -3.6783832924047744e-11, -2.0911786191568638e-11, -5.039690886832204e-12, 1.083235237619995e-11, 2.6704395639232104e-11, 4.257643890226426e-11, 5.844848216529641e-11, 7.432052195888161e-11, 9.019256869136072e-11, 1.0606461542383983e-10, 1.2193665521742503e-10, 1.3780869501101023e-10, 1.5368073480459543e-10, 1.6955278847596844e-10, 1.8542482826955364e-10, 2.0129686806313885e-10, 2.1716892173451185e-10, 2.3304097540588486e-10, 2.4891300132168226e-10, 2.6478505499305527e-10, 2.8065708090885266e-10, 2.9652913458022567e-10, 3.1240116049602307e-10, 3.282732141673961e-10, 3.441452678387691e-10, 3.600172937545665e-10, 3.758893474259395e-10, 3.917614010973125e-10, 4.076334270131099e-10, 4.235054806844829e-10, 4.393775343558559e-10, 4.552495602716533e-10, 4.711215861874507e-10, 4.869936676143993e-10, 5.028656935301967e-10]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4096.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 8.0, 5.0, 13.0, 9.0, 31.0, 56.0, 76.0, 142.0, 236.0, 177.0, 101.0, 53.0, 39.0, 25.0, 12.0, 13.0, 11.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2214536326826675e-10, -1.1935062660395346e-10, -1.1655588993964017e-10, -1.1376116021422078e-10, -1.1096642354990749e-10, -1.081716868855942e-10, -1.0537695022128091e-10, -1.0258222049586152e-10, -9.978748383154823e-11, -9.699274716723494e-11, -9.419801050292165e-11, -9.140328077750226e-11, -8.860854411318897e-11, -8.581380744887568e-11, -8.301907078456239e-11, -8.0224341059143e-11, -7.742960439482971e-11, -7.463486773051642e-11, -7.184013106620313e-11, -6.904540134078374e-11, -6.625066467647045e-11, -6.345592801215716e-11, -6.066119134784387e-11, -5.786645815297753e-11, -5.5071718019217286e-11, -5.2276981354903995e-11, -4.9482248160037656e-11, -4.6687511495724365e-11, -4.3892778300858026e-11, -4.1098041636544735e-11, -3.8303304972231444e-11, -3.5508571777365106e-11, -3.2713838582498767e-11, -2.9919101918185476e-11, -2.7124368723319137e-11, -2.4329632059005846e-11, -2.1534898864139507e-11, -1.8740162199826216e-11, -1.59454272702364e-11, -1.3150692340646586e-11, -1.0355957411056771e-11, -7.561222481466956e-12, -4.766487118196272e-12, -1.971751754925588e-12, 8.229831746642269e-13, 3.617718104254042e-12, 6.412453901205595e-12, 9.20718883079541e-12, 1.2001923760385225e-11, 1.479665868997504e-11, 1.7591393619564855e-11, 2.0386130283878146e-11, 2.3180863478744484e-11, 2.5975600143057775e-11, 2.877033507264759e-11, 3.1565070002237405e-11, 3.4359806666550696e-11, 3.715454333086399e-11, 3.9949276525730326e-11, 4.274401319004362e-11, 4.5538746384909956e-11, 4.833348304922325e-11, 5.112821971353654e-11, 5.392295290840288e-11, 5.6717686103269216e-11]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 5.0, 5.0, 13.0, 10.0, 16.0, 10.0, 19.0, 26.0, 24.0, 21.0, 24.0, 31.0, 42.0, 47.0, 46.0, 65.0, 45.0, 57.0, 49.0, 52.0, 55.0, 36.0, 29.0, 34.0, 29.0, 40.0, 36.0, 18.0, 25.0, 13.0, 14.0, 7.0, 11.0, 13.0, 3.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.7555934057076357e-11, -3.634250886341839e-11, -3.512908366976042e-11, -3.391565847610245e-11, -3.270223328244448e-11, -3.148880808878651e-11, -3.0275382895128544e-11, -2.9061957701470575e-11, -2.7848532507812607e-11, -2.6635107314154638e-11, -2.542168212049667e-11, -2.42082569268387e-11, -2.2994831733180732e-11, -2.1781406539522763e-11, -2.0567981345864794e-11, -1.9354556152206825e-11, -1.8141132693272333e-11, -1.6927707499614364e-11, -1.5714282305956395e-11, -1.4500857112298426e-11, -1.3287431918640458e-11, -1.2074006724982489e-11, -1.0860582398686258e-11, -9.64715720502829e-12, -8.43373201137032e-12, -7.220306817712352e-12, -6.006881624054383e-12, -4.7934568640772834e-12, -3.5800316704193147e-12, -2.366606476761346e-12, -1.1531817167842462e-12, 6.024347687372256e-14, 1.2736686705316913e-12, 2.48709386418966e-12, 3.700519057847629e-12, 4.9139438178247286e-12, 6.127369011482697e-12, 7.340794638821535e-12, 8.554218965117766e-12, 9.767644158775735e-12, 1.0981069352433703e-11, 1.2194494546091672e-11, 1.340791973974964e-11, 1.462134406604587e-11, 1.583476925970384e-11, 1.704819445336181e-11, 1.8261619647019778e-11, 1.9475044840677747e-11, 2.0688470034335715e-11, 2.1901895227993684e-11, 2.3115320421651653e-11, 2.432874561530962e-11, 2.554217080896759e-11, 2.675559600262556e-11, 2.7969019461560052e-11, 2.918244465521802e-11, 3.039586984887599e-11, 3.160929504253396e-11, 3.282272023619193e-11, 3.4036145429849896e-11, 3.5249570623507864e-11, 3.646299581716583e-11, 3.76764210108238e-11, 3.888984620448177e-11, 4.010327139813974e-11]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 7.0, 14.0, 12.0, 29.0, 54.0, 74.0, 104.0, 190.0, 200.0, 122.0, 74.0, 41.0, 26.0, 21.0, 10.0, 8.0, 7.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.358668007219961e-11, -9.141291890113479e-11, -8.923916466896387e-11, -8.706540349789904e-11, -8.489164926572812e-11, -8.27178880946633e-11, -8.054413386249237e-11, -7.837037269142755e-11, -7.619661845925663e-11, -7.40228572881918e-11, -7.184910305602088e-11, -6.967534188495605e-11, -6.750158765278513e-11, -6.532782648172031e-11, -6.315407224954939e-11, -6.098031107848456e-11, -5.880655684631364e-11, -5.663279914469577e-11, -5.4459041443077894e-11, -5.228528374146002e-11, -5.011152603984215e-11, -4.7937768338224274e-11, -4.57640106366064e-11, -4.3590249465541575e-11, -4.141648829447675e-11, -3.9242730592858877e-11, -3.7068972891241003e-11, -3.489521518962313e-11, -3.2721457488005257e-11, -3.0547699786387383e-11, -2.8373940350046034e-11, -2.620018264842816e-11, -2.4026430150980715e-11, -2.1852672449362842e-11, -1.967891474774497e-11, -1.7505157046127096e-11, -1.5331399344509222e-11, -1.3157640775529611e-11, -1.098388220655e-11, -8.810124504932126e-12, -6.636366803314253e-12, -4.46260910169638e-12, -2.2888509663976375e-12, -1.1509283109889523e-13, 2.058664870518978e-12, 4.232422572136851e-12, 6.406181141116463e-12, 8.579938842734336e-12, 1.075369654435221e-11, 1.2927454245970083e-11, 1.5101211947587956e-11, 1.727496964920583e-11, 1.9448727350823702e-11, 2.1622485052441576e-11, 2.3796244488782925e-11, 2.5970002190400798e-11, 2.814375989201867e-11, 3.031751932836002e-11, 3.2491277029977894e-11, 3.466503473159577e-11, 3.683879243321364e-11, 3.9012550134831514e-11, 4.118630783644939e-11, 4.336006553806726e-11, 4.5533823239685134e-11]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 6.0, 8.0, 12.0, 11.0, 11.0, 16.0, 20.0, 28.0, 21.0, 25.0, 22.0, 36.0, 39.0, 48.0, 44.0, 66.0, 50.0, 52.0, 52.0, 53.0, 43.0, 33.0, 32.0, 36.0, 26.0, 41.0, 31.0, 21.0, 24.0, 16.0, 12.0, 7.0, 8.0, 9.0, 10.0, 8.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.813636997001101e-11, -2.722126690724025e-11, -2.6306162109746012e-11, -2.539105904697525e-11, -2.447595598420449e-11, -2.3560851186710252e-11, -2.264574812393949e-11, -2.173064506116873e-11, -2.0815540263674492e-11, -1.990043720090373e-11, -1.8985332403409494e-11, -1.8070229340638733e-11, -1.715512627786797e-11, -1.624002321509721e-11, -1.5324918417602973e-11, -1.4409815354832212e-11, -1.349471229206145e-11, -1.2579608361928951e-11, -1.166450529915819e-11, -1.074940136902569e-11, -9.83429830625493e-12, -8.91919437612243e-12, -8.004090445989931e-12, -7.088986949538301e-12, -6.1738834530866704e-12, -5.25877995663504e-12, -4.34367646018341e-12, -3.4285725300509107e-12, -2.5134690335992804e-12, -1.5983655371476502e-12, -6.832616070151509e-13, 2.318418894364793e-13, 1.1469436511646336e-12, 2.062047147616264e-12, 2.9771508609083286e-12, 3.892254574200393e-12, 4.8073580706520236e-12, 5.722461567103654e-12, 6.637565497236153e-12, 7.552668560006914e-12, 8.467772490139414e-12, 9.382876420271913e-12, 1.0297979483042674e-11, 1.1213083413175173e-11, 1.2128187343307673e-11, 1.3043290406078434e-11, 1.3958394336210933e-11, 1.4873498266343432e-11, 1.5788601329114194e-11, 1.6703704391884955e-11, 1.7618809189379192e-11, 1.8533912252149953e-11, 1.9449015314920715e-11, 2.0364120112414952e-11, 2.1279223175185713e-11, 2.2194326237956474e-11, 2.310943103545071e-11, 2.4024534098221473e-11, 2.493963889571571e-11, 2.585474195848647e-11, 2.6769845021257233e-11, 2.7684948084027994e-11, 2.860005288152223e-11, 2.951515767901647e-11, 3.0430259007063754e-11]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 4.0, 11.0, 20.0, 24.0, 60.0, 102.0, 222.0, 237.0, 139.0, 93.0, 37.0, 30.0, 11.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7954349812443482e-11, -1.634721524812477e-11, -1.4740080683806056e-11, -1.3132947854210819e-11, -1.1525813289892106e-11, -9.918678725573393e-12, -8.311545028616418e-12, -6.704411331659443e-12, -5.0972767673407304e-12, -3.4901426367028865e-12, -1.8830085060650426e-12, -2.758743754271986e-13, 1.3312597552106453e-12, 2.9383943195293583e-12, 4.545528016486333e-12, 6.152661713443308e-12, 7.759796277762021e-12, 9.366930842080734e-12, 1.0974064539037709e-11, 1.2581198235994684e-11, 1.4188332800313397e-11, 1.579546736463211e-11, 1.7402600194227347e-11, 1.900973475854606e-11, 2.0616869322864773e-11, 2.2224003887183486e-11, 2.38311384515022e-11, 2.5438271281097435e-11, 2.7045405845416148e-11, 2.865254040973486e-11, 3.02596732393301e-11, 3.186680780364881e-11, 3.347393889852057e-11, 3.5081073462839285e-11, 3.6688208027158e-11, 3.829534259147671e-11, 3.9902477155795424e-11, 4.1509608250667185e-11, 4.31167428149859e-11, 4.472387737930461e-11, 4.6331011943623324e-11, 4.7938146507942037e-11, 4.954528107226075e-11, 5.115241563657946e-11, 5.2759546731451223e-11, 5.436668476521689e-11, 5.597381586008865e-11, 5.758095042440736e-11, 5.918808498872608e-11, 6.079521608359784e-11, 6.24023541173635e-11, 6.400948521223526e-11, 6.561662324600093e-11, 6.722375434087269e-11, 6.883089237463835e-11, 7.043802346951011e-11, 7.204516150327578e-11, 7.365229259814754e-11, 7.52594306319132e-11, 7.686656172678497e-11, 7.847369976055063e-11, 8.008083085542239e-11, 8.168796888918806e-11, 8.329509998405982e-11, 8.490223107893158e-11]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 5.0, 14.0, 8.0, 10.0, 13.0, 27.0, 26.0, 25.0, 19.0, 31.0, 32.0, 42.0, 50.0, 58.0, 61.0, 53.0, 55.0, 66.0, 44.0, 39.0, 39.0, 31.0, 34.0, 39.0, 26.0, 29.0, 24.0, 15.0, 12.0, 9.0, 8.0, 10.0, 9.0, 9.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7040936370338322e-11, -1.6514919640164827e-11, -1.598890290999133e-11, -1.5462886179817836e-11, -1.493686944964434e-11, -1.4410852719470846e-11, -1.388483598929735e-11, -1.3358819259123855e-11, -1.283280252895036e-11, -1.2306785798776865e-11, -1.178076906860337e-11, -1.1254752338429874e-11, -1.0728735608256379e-11, -1.0202718878082884e-11, -9.676702147909388e-12, -9.150685417735893e-12, -8.624669554924136e-12, -8.09865282475064e-12, -7.572636094577145e-12, -7.04661936440365e-12, -6.520602634230155e-12, -5.9945859040566596e-12, -5.468569607564033e-12, -4.942552877390538e-12, -4.416536147217043e-12, -3.8905194170435475e-12, -3.3645026868700523e-12, -2.8384861735369915e-12, -2.3124694433634962e-12, -1.786452713190001e-12, -1.2604361998569402e-12, -7.34419469683445e-13, -2.084027395099497e-13, 3.1761393645343694e-13, 8.436306124168236e-13, 1.3696472341701016e-12, 1.895663964343597e-12, 2.421680694517092e-12, 2.947697207850153e-12, 3.473713938023648e-12, 3.999730668197143e-12, 4.525747398370639e-12, 5.051764128544134e-12, 5.57778042503676e-12, 6.1037971552102555e-12, 6.629813885383751e-12, 7.155830615557246e-12, 7.681847345730741e-12, 8.207864075904237e-12, 8.733880806077732e-12, 9.259897536251227e-12, 9.785914266424722e-12, 1.0311930996598218e-11, 1.0837947726771713e-11, 1.136396358958347e-11, 1.1889980319756965e-11, 1.241599704993046e-11, 1.2942013780103956e-11, 1.3468030510277451e-11, 1.3994047240450946e-11, 1.4520063970624442e-11, 1.5046080700797937e-11, 1.5572097430971432e-11, 1.6098114161144927e-11, 1.6624130891318423e-11]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4096.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 6.0, 10.0, 10.0, 11.0, 16.0, 29.0, 56.0, 76.0, 126.0, 183.0, 185.0, 107.0, 68.0, 56.0, 26.0, 14.0, 11.0, 8.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1079044799633397e-11, -1.0387407080314492e-11, -9.695770228357325e-12, -9.00413250903842e-12, -8.312495657081254e-12, -7.620857937762349e-12, -6.929220652124313e-12, -6.237583366486277e-12, -5.545946080848241e-12, -4.854308795210205e-12, -4.162671509572169e-12, -3.4710340070936985e-12, -2.7793967214556625e-12, -2.0877594358176266e-12, -1.3961219333391561e-12, -7.044846477011202e-13, -1.2847362063084233e-14, 6.787899777850603e-13, 1.370427317633205e-12, 2.062064711691458e-12, 2.753701997329494e-12, 3.44533928296753e-12, 4.1369767854460004e-12, 4.828614071084036e-12, 5.520251356722072e-12, 6.211888642360108e-12, 6.903525927998144e-12, 7.59516321363618e-12, 8.286800932955085e-12, 8.978437784912252e-12, 9.670075504231157e-12, 1.0361713223550062e-11, 1.1053350942868967e-11, 1.1744988662187872e-11, 1.2436625514145039e-11, 1.3128263233463944e-11, 1.381990008542111e-11, 1.4511537804740016e-11, 1.520317552405892e-11, 1.5894813243377826e-11, 1.6586449227973254e-11, 1.727808694729216e-11, 1.7969724666611064e-11, 1.8661360651206493e-11, 1.9352998370525398e-11, 2.0044636089844303e-11, 2.0736273809163208e-11, 2.1427911528482113e-11, 2.2119549247801018e-11, 2.2811186967119923e-11, 2.3502824686438828e-11, 2.4194460671034257e-11, 2.4886098390353162e-11, 2.5577736109672067e-11, 2.6269373828990972e-11, 2.69610098135864e-11, 2.7652647532905306e-11, 2.834428525222421e-11, 2.9035922971543116e-11, 2.972756069086202e-11, 3.0419198410180925e-11, 3.111083266005288e-11, 3.1802470379371783e-11, 3.249410809869069e-11, 3.318574581800959e-11]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 5.0, 7.0, 13.0, 14.0, 16.0, 21.0, 21.0, 25.0, 34.0, 32.0, 33.0, 43.0, 52.0, 67.0, 63.0, 71.0, 64.0, 50.0, 56.0, 50.0, 36.0, 38.0, 32.0, 29.0, 21.0, 16.0, 13.0, 13.0, 10.0, 10.0, 6.0, 12.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1060822396879999e-11, -1.0698978161749473e-11, -1.0337133926618947e-11, -9.97528969148842e-12, -9.613445456357894e-12, -9.251601221227368e-12, -8.889756986096842e-12, -8.527912750966316e-12, -8.16606851583579e-12, -7.804224280705263e-12, -7.442380045574737e-12, -7.080535810444211e-12, -6.7186915753136844e-12, -6.356847340183158e-12, -5.995003105052632e-12, -5.633158869922106e-12, -5.2713146347915796e-12, -4.909470399661053e-12, -4.547626164530527e-12, -4.185781929400001e-12, -3.823937694269475e-12, -3.4620934591389485e-12, -3.1002492240084223e-12, -2.738404988877896e-12, -2.37656075374737e-12, -2.0147165186168436e-12, -1.6528722834863174e-12, -1.2910280483557912e-12, -9.29183813225265e-13, -5.673395780947388e-13, -2.0549534296421257e-13, 1.5634889216631365e-13, 5.181939946585779e-13, 8.800382297891041e-13, 1.2418824649196303e-12, 1.6037267000501565e-12, 1.9655709351806827e-12, 2.327415170311209e-12, 2.689259405441735e-12, 3.0511036405722614e-12, 3.4129478757027876e-12, 3.774792110833314e-12, 4.13663634596384e-12, 4.498480581094366e-12, 4.8603248162248924e-12, 5.222169051355419e-12, 5.584013286485945e-12, 5.945857521616471e-12, 6.307701756746997e-12, 6.6695459918775235e-12, 7.03139022700805e-12, 7.393234462138576e-12, 7.755078697269102e-12, 8.116922932399628e-12, 8.478767167530155e-12, 8.84061140266068e-12, 9.202455637791207e-12, 9.564299872921733e-12, 9.92614410805226e-12, 1.0287988343182786e-11, 1.0649832578313312e-11, 1.1011676813443838e-11, 1.1373521048574364e-11, 1.173536528370489e-11, 1.2097209518835417e-11]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 8.0, 7.0, 5.0, 8.0, 18.0, 9.0, 18.0, 19.0, 33.0, 39.0, 49.0, 83.0, 95.0, 124.0, 113.0, 96.0, 57.0, 63.0, 39.0, 34.0, 15.0, 12.0, 15.0, 11.0, 7.0, 8.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.364377329124096e-12, -9.01724528379333e-12, -8.670113238462562e-12, -8.322981193131795e-12, -7.975849147801028e-12, -7.628717102470262e-12, -7.281585057139495e-12, -6.934453011808728e-12, -6.587320966477961e-12, -6.240188921147194e-12, -5.893056875816427e-12, -5.54592483048566e-12, -5.198792785154893e-12, -4.851660739824126e-12, -4.504528694493359e-12, -4.1573966491625924e-12, -3.8102646038318255e-12, -3.4631325585010586e-12, -3.1160005131702917e-12, -2.7688684678395248e-12, -2.421736422508758e-12, -2.074604377177991e-12, -1.727472331847224e-12, -1.3803402865164571e-12, -1.0332082411856902e-12, -6.860761958549233e-13, -3.389441505241564e-13, 8.18789480661053e-15, 3.5531994013737744e-13, 7.024519854681444e-13, 1.0495840307989113e-12, 1.3967160761296782e-12, 1.743848988822183e-12, 2.09098103415295e-12, 2.438113079483717e-12, 2.785245124814484e-12, 3.1323771701452507e-12, 3.4795092154760177e-12, 3.8266412608067846e-12, 4.1737733061375515e-12, 4.520905351468318e-12, 4.868037396799085e-12, 5.215169442129852e-12, 5.562301487460619e-12, 5.909433532791386e-12, 6.256565578122153e-12, 6.60369762345292e-12, 6.950829668783687e-12, 7.297961714114454e-12, 7.64509375944522e-12, 7.992225804775988e-12, 8.339357850106754e-12, 8.686489895437521e-12, 9.033621940768288e-12, 9.380753986099055e-12, 9.727886031429822e-12, 1.0075018076760589e-11, 1.0422150122091356e-11, 1.0769282167422123e-11, 1.111641421275289e-11, 1.1463546258083657e-11, 1.1810678303414424e-11, 1.215781034874519e-11, 1.2504942394075957e-11, 1.2852074439406724e-11]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 4.0, 4.0, 6.0, 13.0, 14.0, 12.0, 20.0, 27.0, 30.0, 26.0, 26.0, 32.0, 46.0, 58.0, 62.0, 58.0, 68.0, 73.0, 55.0, 51.0, 41.0, 40.0, 33.0, 37.0, 27.0, 30.0, 20.0, 16.0, 8.0, 11.0, 10.0, 7.0, 12.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.017454317972184e-12, -8.734143616684342e-12, -8.4508329153965e-12, -8.167522214108658e-12, -7.884212380182554e-12, -7.600901678894711e-12, -7.31759097760687e-12, -7.034280276319027e-12, -6.750969575031185e-12, -6.467658873743343e-12, -6.1843481724555005e-12, -5.901037904848527e-12, -5.617727203560685e-12, -5.334416502272843e-12, -5.05110623466587e-12, -4.7677955333780275e-12, -4.484484832090185e-12, -4.201174130802343e-12, -3.917863429514501e-12, -3.6345531619075278e-12, -3.3512424606196856e-12, -3.0679317593318434e-12, -2.7846212748844357e-12, -2.501310790437028e-12, -2.2180000891491858e-12, -1.9346893878613436e-12, -1.6513789034139359e-12, -1.368068310546311e-12, -1.084757717678686e-12, -8.014471248110611e-13, -5.181365319434361e-13, -2.348260474960284e-13, 4.848552115355176e-14, 3.317961140211767e-13, 6.151067068888016e-13, 8.984172997564266e-13, 1.1817278926240515e-12, 1.4650384854916765e-12, 1.7483490783593014e-12, 2.031659562806709e-12, 2.3149702640945513e-12, 2.5982809653823935e-12, 2.881591449829801e-12, 3.164901934277209e-12, 3.448212635565051e-12, 3.731523336852893e-12, 4.0148336044598665e-12, 4.298144305747709e-12, 4.581455007035551e-12, 4.864765708323393e-12, 5.148076409611235e-12, 5.4313866772182084e-12, 5.714697378506051e-12, 5.998008079793893e-12, 6.281318347400866e-12, 6.564629048688708e-12, 6.8479397499765504e-12, 7.131250451264393e-12, 7.414561152552235e-12, 7.697871853840077e-12, 7.981181687766181e-12, 8.264492389054023e-12, 8.547803090341866e-12, 8.831113791629708e-12, 9.11442449291755e-12]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 5.0, 6.0, 18.0, 61.0, 138.0, 318.0, 304.0, 105.0, 34.0, 16.0, 6.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.104065603668163e-12, -5.228696815795519e-12, -4.353327594242007e-12, -3.477958589528929e-12, -2.602589584815851e-12, -1.7272203632623384e-12, -8.518515753896949e-13, 2.351721248294858e-14, 8.988864340364611e-13, 1.774255438749539e-12, 2.649624443462617e-12, 3.524993448175695e-12, 4.400362452888773e-12, 5.2757316744422855e-12, 6.151100462314929e-12, 7.0264692501875725e-12, 7.901838905421954e-12, 8.777208126975466e-12, 9.652577348528979e-12, 1.0527945702720753e-11, 1.1403314924274266e-11, 1.2278684145827778e-11, 1.3154052500019553e-11, 1.4029421721573065e-11, 1.4904790943126578e-11, 1.578016016468009e-11, 1.6655529386233603e-11, 1.7530898607787115e-11, 1.8406266094617152e-11, 1.9281635316170664e-11, 2.0157004537724177e-11, 2.103237375927769e-11, 2.1907742980831202e-11, 2.2783112202384714e-11, 2.3658481423938227e-11, 2.453385064549174e-11, 2.5409219867045252e-11, 2.6284589088598764e-11, 2.71599565754288e-11, 2.8035325796982313e-11, 2.8910695018535826e-11, 2.978606250536586e-11, 3.0661431726919375e-11, 3.153680094847289e-11, 3.24121701700264e-11, 3.328753939157991e-11, 3.4162908613133425e-11, 3.503827783468694e-11, 3.591364705624045e-11, 3.678901627779396e-11, 3.7664385499347475e-11, 3.853975472090099e-11, 3.94151239424545e-11, 4.029049316400801e-11, 4.1165862385561525e-11, 4.204123160711504e-11, 4.291660082866855e-11, 4.379197005022206e-11, 4.4667339271775575e-11, 4.554270849332909e-11, 4.64180777148826e-11, 4.729344693643611e-11, 4.8168816157989625e-11, 4.904418537954314e-11, 4.99195511316497e-11]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 10.0, 16.0, 12.0, 12.0, 28.0, 29.0, 26.0, 23.0, 32.0, 41.0, 56.0, 64.0, 55.0, 60.0, 75.0, 68.0, 48.0, 45.0, 42.0, 34.0, 41.0, 26.0, 36.0, 15.0, 20.0, 9.0, 13.0, 13.0, 6.0, 11.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.916381963678608e-12, -6.702289764848324e-12, -6.488197999698908e-12, -6.2741058008686235e-12, -6.060013602038339e-12, -5.845921836888923e-12, -5.6318296380586386e-12, -5.417737439228354e-12, -5.203645674078938e-12, -4.989553475248654e-12, -4.775461710099238e-12, -4.561369511268953e-12, -4.347277312438669e-12, -4.133185547289253e-12, -3.9190933484589685e-12, -3.705001583309553e-12, -3.4909091676388337e-12, -3.2768171856489836e-12, -3.062724986818699e-12, -2.848633004828849e-12, -2.6345410228389987e-12, -2.420448824008714e-12, -2.206356842018864e-12, -1.992264860029014e-12, -1.7781727696189464e-12, -1.564080679208879e-12, -1.349988697219029e-12, -1.1358966068089615e-12, -9.218045163988942e-13, -7.07712534409044e-13, -4.936204439989766e-13, -2.795284620091265e-13, -6.543637159905913e-14, 1.4865567815342678e-13, 3.627477279059127e-13, 5.768397912109258e-13, 7.909318274108845e-13, 1.0050238636108433e-12, 1.2191159540209107e-12, 1.4332079360107608e-12, 1.6473000264208282e-12, 1.8613921168308956e-12, 2.0754840988207457e-12, 2.289576080810596e-12, 2.5036682796408805e-12, 2.7177602616307306e-12, 2.9318522436205807e-12, 3.1459444424508654e-12, 3.3600364244407155e-12, 3.5741284064305656e-12, 3.78822060526085e-12, 4.002312370410266e-12, 4.2164045692405505e-12, 4.430496768070835e-12, 4.644588533220251e-12, 4.8586807320505354e-12, 5.07277293088082e-12, 5.286865129711105e-12, 5.50095689486052e-12, 5.715049093690805e-12, 5.9291412925210896e-12, 6.143233057670505e-12, 6.35732525650079e-12, 6.5714170216502055e-12, 6.78550922048049e-12]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4096.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 10.0, 37.0, 120.0, 559.0, 211.0, 40.0, 16.0, 8.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.1113080034274034e-11, -2.071926311075778e-11, -2.0325446187241525e-11, -1.993162926372527e-11, -1.9537812340209015e-11, -1.914399541669276e-11, -1.8750178493176506e-11, -1.835636156966025e-11, -1.7962544646143996e-11, -1.7568727722627742e-11, -1.7174910799111487e-11, -1.6781093875595232e-11, -1.6387276952078977e-11, -1.5993460028562723e-11, -1.5599643105046468e-11, -1.5205826181530213e-11, -1.4812007523290482e-11, -1.4418190599774228e-11, -1.4024373676257973e-11, -1.3630556752741718e-11, -1.3236739829225463e-11, -1.2842922905709209e-11, -1.2449105114831216e-11, -1.2055288191314961e-11, -1.1661471267798706e-11, -1.1267654344282452e-11, -1.0873837420766197e-11, -1.0480020497249942e-11, -1.008620270637195e-11, -9.692385782855695e-12, -9.29856885933944e-12, -8.904751935823185e-12, -8.51093501230693e-12, -8.117118088790676e-12, -7.723301165274421e-12, -7.329484241758166e-12, -6.9356668845610425e-12, -6.541849961044788e-12, -6.148032603847664e-12, -5.754215680331409e-12, -5.3603987568151545e-12, -4.9665818332989e-12, -4.572764909782645e-12, -4.178947552585521e-12, -3.7851306290692666e-12, -3.391313705553012e-12, -2.9974965651963226e-12, -2.6036794248396333e-12, -2.2098625013233786e-12, -1.8160454693869066e-12, -1.4222284374504346e-12, -1.0284114055139626e-12, -6.345943735774906e-13, -2.4077745006123585e-13, 1.530396902954534e-13, 5.468568306521426e-13, 9.406737541683974e-13, 1.3344907861048694e-12, 1.7283078180413414e-12, 2.1221249583980306e-12, 2.5159418819142854e-12, 2.90975880543054e-12, 3.3035759457872294e-12, 3.6973930861439186e-12, 4.091210009660173e-12]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 2.0, 8.0, 10.0, 15.0, 19.0, 22.0, 26.0, 26.0, 40.0, 56.0, 77.0, 91.0, 105.0, 91.0, 103.0, 77.0, 48.0, 33.0, 37.0, 19.0, 20.0, 13.0, 13.0, 14.0, 9.0, 7.0, 3.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.554231553850375e-12, -5.4116338146781295e-12, -5.269036509186753e-12, -5.1264387700145075e-12, -4.983841464523131e-12, -4.8412437253508855e-12, -4.698646419859509e-12, -4.5560486806872635e-12, -4.413451375195887e-12, -4.2708536360236415e-12, -4.128256330532265e-12, -3.9856585913600195e-12, -3.843061285868643e-12, -3.7004635466963975e-12, -3.5578660243645865e-12, -3.4152685020327755e-12, -3.27267076286053e-12, -3.130073240528719e-12, -2.987475718196908e-12, -2.844878195865097e-12, -2.702280673533286e-12, -2.5596829343610406e-12, -2.4170854120292296e-12, -2.2744878896974186e-12, -2.1318903673656076e-12, -1.9892928450337966e-12, -1.8466953227019856e-12, -1.7040976919499573e-12, -1.5615001696181463e-12, -1.4189026472863353e-12, -1.276305016534307e-12, -1.133707494202496e-12, -9.91109971870685e-13, -8.485124495388741e-13, -7.059148729969544e-13, -5.633172964550348e-13, -4.207197741232238e-13, -2.781222517914128e-13, -1.3552467524949319e-13, 7.072901292426437e-15, 1.4967042362423744e-13, 2.9226797306110275e-13, 4.3486552249796806e-13, 5.774630990398877e-13, 7.200606213716987e-13, 8.626581437035097e-13, 1.005255774455538e-12, 1.147853296787349e-12, 1.29045081911916e-12, 1.433048341450971e-12, 1.575645863782782e-12, 1.7182434945348102e-12, 1.860840908446404e-12, 2.0034386476186494e-12, 2.1460361699504604e-12, 2.2886336922822714e-12, 2.4312312146140824e-12, 2.5738287369458934e-12, 2.7164262592777044e-12, 2.8590237816095154e-12, 3.001621520781761e-12, 3.1442188262731374e-12, 3.286816565445383e-12, 3.429414087777194e-12, 3.572011610109005e-12]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 15.0, 29.0, 67.0, 168.0, 406.0, 180.0, 73.0, 39.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.422361336661965e-12, -7.24354820916262e-12, -7.064735081663276e-12, -6.885921954163932e-12, -6.707108826664587e-12, -6.528295699165243e-12, -6.349482571665899e-12, -6.170669444166554e-12, -5.99185631666721e-12, -5.813043189167866e-12, -5.6342300616685215e-12, -5.455416934169177e-12, -5.276603806669833e-12, -5.0977906791704886e-12, -4.918977551671144e-12, -4.7401644241718e-12, -4.561351296672456e-12, -4.382538169173111e-12, -4.203725041673767e-12, -4.024911914174423e-12, -3.8460987866750784e-12, -3.667285659175734e-12, -3.48847253167639e-12, -3.3096594041770455e-12, -3.1308462766777012e-12, -2.952033149178357e-12, -2.7732200216790126e-12, -2.5944068941796683e-12, -2.415593766680324e-12, -2.2367806391809797e-12, -2.0579675116816354e-12, -1.879154384182291e-12, -1.7003416903638158e-12, -1.5215285628644715e-12, -1.3427154353651272e-12, -1.1639023078657829e-12, -9.850891803664386e-13, -8.062760528670943e-13, -6.274629253677499e-13, -4.4864979786840564e-13, -2.6983667036906134e-13, -9.102354286971703e-14, 8.778958462962727e-14, 2.666027121289716e-13, 4.454158396283159e-13, 6.242289671276602e-13, 8.030420946270045e-13, 9.818552221263488e-13, 1.160668349625693e-12, 1.3394814771250374e-12, 1.5182946046243817e-12, 1.697107732123726e-12, 1.8759208596230703e-12, 2.0547339871224146e-12, 2.233547114621759e-12, 2.4123602421211032e-12, 2.5911733696204475e-12, 2.769986497119792e-12, 2.948799624619136e-12, 3.1276127521184804e-12, 3.3064258796178247e-12, 3.485239007117169e-12, 3.664052134616513e-12, 3.842865262115858e-12, 4.021678389615202e-12]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 7.0, 14.0, 13.0, 21.0, 27.0, 23.0, 37.0, 51.0, 76.0, 91.0, 110.0, 99.0, 108.0, 82.0, 49.0, 42.0, 36.0, 24.0, 14.0, 13.0, 15.0, 15.0, 8.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.262165928011318e-12, -3.1809791346121274e-12, -3.0997925580533714e-12, -3.018605764654181e-12, -2.9374189712549903e-12, -2.8562321778557997e-12, -2.7750456012970437e-12, -2.693858807897853e-12, -2.612672231339097e-12, -2.5314854379399065e-12, -2.4502988613811505e-12, -2.36911206798196e-12, -2.2879252745827694e-12, -2.2067386980240133e-12, -2.1255519046248228e-12, -2.0443651112256322e-12, -1.9631783178264417e-12, -1.881991524427251e-12, -1.8008048394482778e-12, -1.7196181544693045e-12, -1.638431361070114e-12, -1.5572446760911407e-12, -1.4760579911121674e-12, -1.3948711977129769e-12, -1.3136845127340036e-12, -1.2324978277550303e-12, -1.1513110343558397e-12, -1.0701243493768664e-12, -9.889376643978931e-13, -9.077508709987026e-13, -8.265641860197293e-13, -7.453774468306473e-13, -6.641907076415654e-13, -5.830039684524835e-13, -5.018172292634016e-13, -4.2063054428442825e-13, -3.3944380509534633e-13, -2.582570659062644e-13, -1.770703809272911e-13, -9.588364173820918e-14, -1.4696902549127255e-14, 6.648982308742751e-14, 1.4767654872398228e-13, 2.288632608080099e-13, 3.100499999970918e-13, 3.9123673918617374e-13, 4.72423424165147e-13, 5.53610163354229e-13, 6.347969025433109e-13, 7.159836417323928e-13, 7.971703809214747e-13, 8.78357065900448e-13, 9.595438592996386e-13, 1.0407305442786119e-12, 1.1219172292575852e-12, 1.2031040226567757e-12, 1.284290707635749e-12, 1.3654773926147223e-12, 1.4466641860139129e-12, 1.5278508709928862e-12, 1.6090375559718595e-12, 1.69022434937105e-12, 1.7714110343500233e-12, 1.8525977193289966e-12, 1.933784512728187e-12]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 14.0, 31.0, 110.0, 403.0, 295.0, 98.0, 32.0, 16.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9282919445223756e-12, -1.7509946400803833e-12, -1.573697335638391e-12, -1.3964000311963987e-12, -1.2191027267544063e-12, -1.041805422312414e-12, -8.645081178704217e-13, -6.872108134284294e-13, -5.099135089864371e-13, -3.3261620454444474e-13, -1.5531890010245242e-13, 2.1978404339539903e-14, 1.9927570878153222e-13, 3.7657301322352454e-13, 5.538703176655169e-13, 7.311676221075092e-13, 9.084649265495015e-13, 1.0857622309914938e-12, 1.2630595354334861e-12, 1.4403568398754785e-12, 1.6176541443174708e-12, 1.7949514487594631e-12, 1.9722487532014554e-12, 2.149546166063665e-12, 2.32684336208544e-12, 2.504140558107215e-12, 2.6814379709694247e-12, 2.8587353838316343e-12, 3.0360325798534094e-12, 3.2133297758751844e-12, 3.390627188737394e-12, 3.5679246015996036e-12, 3.745222014461813e-12, 3.922519427324023e-12, 4.099816840186232e-12, 4.277113819367573e-12, 4.4544112322297824e-12, 4.631708645091992e-12, 4.8090056242733326e-12, 4.986303037135542e-12, 5.163600449997752e-12, 5.340897862859961e-12, 5.518195275722171e-12, 5.6954922549035114e-12, 5.872789667765721e-12, 6.0500870806279305e-12, 6.227384059809271e-12, 6.404681472671481e-12, 6.58197888553369e-12, 6.7592762983959e-12, 6.936573711258109e-12, 7.11387069043945e-12, 7.29116766962079e-12, 7.468465082483e-12, 7.64576249534521e-12, 7.82305990820742e-12, 8.000357321069629e-12, 8.177654733931838e-12, 8.354952146794048e-12, 8.532249559656258e-12, 8.709546972518467e-12, 8.886843518018939e-12, 9.064140930881148e-12, 9.241438343743358e-12, 9.418735756605567e-12]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 6.0, 3.0, 10.0, 8.0, 15.0, 19.0, 31.0, 28.0, 35.0, 58.0, 80.0, 87.0, 119.0, 107.0, 99.0, 76.0, 51.0, 46.0, 25.0, 21.0, 13.0, 12.0, 16.0, 13.0, 6.0, 4.0, 2.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.4258915189145913e-12, -2.366644857518252e-12, -2.3073981961219125e-12, -2.248151534725573e-12, -2.1889048733292338e-12, -2.1296582119328944e-12, -2.070411550536555e-12, -2.0111648891402156e-12, -1.9519182277438762e-12, -1.892671566347537e-12, -1.8334249049511975e-12, -1.774178243554858e-12, -1.7149315821585187e-12, -1.6556849207621793e-12, -1.59643825936584e-12, -1.5371915979695006e-12, -1.4779449365731612e-12, -1.4186982751768218e-12, -1.3594516137804824e-12, -1.300204952384143e-12, -1.2409582909878036e-12, -1.1817116295914643e-12, -1.1224649681951249e-12, -1.0632183067987855e-12, -1.003971645402446e-12, -9.447249840061067e-13, -8.854783226097673e-13, -8.262316612134279e-13, -7.669849998170886e-13, -7.077383384207492e-13, -6.484916770244098e-13, -5.892450156280704e-13, -5.299982458115138e-13, -4.707515844151744e-13, -4.11504923018835e-13, -3.5225826162249563e-13, -2.9301160022615624e-13, -2.3376493882981686e-13, -1.7451827743347748e-13, -1.152716160371381e-13, -5.602495464079871e-14, 3.2217067555406764e-15, 6.246836815188006e-14, 1.2171502954821944e-13, 1.8096169094455883e-13, 2.402083523408982e-13, 2.994550137372376e-13, 3.58701675133577e-13, 4.1794833652991636e-13, 4.771949979262557e-13, 5.364416593225951e-13, 5.956883207189345e-13, 6.549349821152739e-13, 7.141816435116133e-13, 7.734283049079527e-13, 8.326749663042921e-13, 8.919216277006314e-13, 9.511682890969708e-13, 1.0104149504933102e-12, 1.0696616118896496e-12, 1.128908273285989e-12, 1.1881549346823284e-12, 1.2474015960786677e-12, 1.3066482574750071e-12, 1.3658949188713465e-12]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4194304.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4096.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 11.0, 16.0, 27.0, 48.0, 95.0, 189.0, 333.0, 134.0, 65.0, 39.0, 14.0, 6.0, 14.0, 1.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3050500310567434e-12, -2.247944668951063e-12, -2.1908393068453824e-12, -2.1337337278992674e-12, -2.076628365793587e-12, -2.0195230036879064e-12, -1.962417641582226e-12, -1.9053122794765454e-12, -1.8482067005304303e-12, -1.7911013384247498e-12, -1.733995867898852e-12, -1.6768905057931716e-12, -1.6197850352672738e-12, -1.5626796731615933e-12, -1.5055743110559128e-12, -1.448468840530015e-12, -1.3913634784243345e-12, -1.334258116318654e-12, -1.2771526457927562e-12, -1.2200472836870757e-12, -1.162941813161178e-12, -1.1058364510554974e-12, -1.0487309805295997e-12, -9.916256184239192e-13, -9.345202563182387e-13, -8.774148400024495e-13, -8.203094236866604e-13, -7.632040615809799e-13, -7.060985910550821e-13, -6.489932289494016e-13, -5.918878126336125e-13, -5.347823963178233e-13, -4.776768173717083e-13, -4.2057140105591917e-13, -3.6346598474013003e-13, -3.063605955293952e-13, -2.4925517921360607e-13, -1.9214976289781693e-13, -1.350443736870821e-13, -7.793895737129297e-14, -2.0833541055503835e-14, 3.6271868484021724e-14, 9.337727802354728e-14, 1.5048268078680926e-13, 2.075880971025984e-13, 2.6469351341838754e-13, 3.2179890262912236e-13, 3.789043189449115e-13, 4.3600973526070064e-13, 4.931151515764898e-13, 5.502205678922789e-13, 6.073259299979594e-13, 6.644314005238572e-13, 7.215367626295377e-13, 7.786421789453268e-13, 8.35747595261116e-13, 8.928530115769051e-13, 9.499584278926942e-13, 1.0070637899983748e-12, 1.0641692605242725e-12, 1.121274622629953e-12, 1.1783800931558508e-12, 1.2354854552615313e-12, 1.2925908173672118e-12, 1.3496962878931096e-12]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 10.0, 10.0, 9.0, 20.0, 22.0, 28.0, 39.0, 61.0, 58.0, 93.0, 114.0, 144.0, 88.0, 84.0, 48.0, 41.0, 29.0, 17.0, 16.0, 18.0, 9.0, 7.0, 6.0, 5.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.5836924870463176e-12, -1.5459505420603592e-12, -1.5082085970744008e-12, -1.4704666520884424e-12, -1.4327245986822668e-12, -1.3949826536963084e-12, -1.35724070871035e-12, -1.3194987637243916e-12, -1.2817568187384332e-12, -1.2440148737524748e-12, -1.2062729287665164e-12, -1.168530983780558e-12, -1.1307890387945996e-12, -1.093046985388424e-12, -1.0553050404024655e-12, -1.0175630954165071e-12, -9.798211504305487e-13, -9.420792054445903e-13, -9.043372604586319e-13, -8.665952612625649e-13, -8.288533162766065e-13, -7.911113712906481e-13, -7.533693720945811e-13, -7.156274271086227e-13, -6.778854821226643e-13, -6.401435371367059e-13, -6.024015921507475e-13, -5.646595929546805e-13, -5.269176479687221e-13, -4.891757029827637e-13, -4.51433730891751e-13, -4.1369175880073827e-13, -3.759499222349971e-13, -3.3820797724903873e-13, -3.00466005158026e-13, -2.627240330670133e-13, -2.249820880810549e-13, -1.8724012954256936e-13, -1.494981710040838e-13, -1.1175619891307109e-13, -7.40142539271127e-14, -3.627229538862714e-14, 1.4696631498584134e-15, 3.921162168834397e-14, 7.695358022682952e-14, 1.1469553876531507e-13, 1.5243749730380063e-13, 1.9017946939481334e-13, 2.2792141438077174e-13, 2.6566335936673013e-13, 3.0340533145774284e-13, 3.4114730354875555e-13, 3.7888924853471395e-13, 4.1663119352067235e-13, 4.5437316561168506e-13, 4.921151377026978e-13, 5.298570826886562e-13, 5.675990276746146e-13, 6.05340972660573e-13, 6.4308297185664e-13, 6.808249168425984e-13, 7.185668618285568e-13, 7.563088610246238e-13, 7.940508060105822e-13, 8.317927509965406e-13]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 8.0, 8.0, 7.0, 15.0, 26.0, 34.0, 43.0, 63.0, 115.0, 247.0, 180.0, 86.0, 56.0, 34.0, 27.0, 19.0, 7.0, 9.0, 4.0, 5.0, 4.0, 0.0, 4.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0480735203322045e-12, -1.0140208984987797e-12, -9.79968276665355e-13, -9.459156548319303e-13, -9.118631414187228e-13, -8.778105195852981e-13, -8.437578977518734e-13, -8.097052759184487e-13, -7.756526540850239e-13, -7.416000322515992e-13, -7.075474646282831e-13, -6.734948427948584e-13, -6.394422209614337e-13, -6.053896533381176e-13, -5.713370315046928e-13, -5.372844096712681e-13, -5.03231842047952e-13, -4.691792202145273e-13, -4.351266254861569e-13, -4.0107403075778647e-13, -3.6702140892436175e-13, -3.3296881419599134e-13, -2.989162194676209e-13, -2.648635976341962e-13, -2.308110029058258e-13, -1.9675839462492822e-13, -1.6270578634403066e-13, -1.2865319161566025e-13, -9.460058333476268e-14, -6.054797505386511e-14, -2.64953803254947e-14, 7.557241507930024e-15, 4.1609836236300435e-14, 7.5662444517198e-14, 1.0971504602183199e-13, 1.4376764752646598e-13, 1.7782025580736355e-13, 2.1187286408826111e-13, 2.4592545881663153e-13, 2.7997808065005625e-13, 3.1403067537842666e-13, 3.4808327010679707e-13, 3.821358919402218e-13, 4.161884866685922e-13, 4.502410813969626e-13, 4.842937032303873e-13, 5.183463250638121e-13, 5.523989468972368e-13, 5.864515145205529e-13, 6.205041363539776e-13, 6.545567039772937e-13, 6.886093258107184e-13, 7.226619476441432e-13, 7.567145694775679e-13, 7.90767137100884e-13, 8.248197589343087e-13, 8.588723265576248e-13, 8.929249483910495e-13, 9.269775702244742e-13, 9.610300836376817e-13, 9.950827054711064e-13, 1.0291353273045312e-12, 1.0631879491379559e-12, 1.0972405709713806e-12, 1.1312931928048053e-12]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 8.0, 7.0, 12.0, 16.0, 26.0, 24.0, 40.0, 61.0, 66.0, 87.0, 129.0, 138.0, 107.0, 68.0, 50.0, 40.0, 27.0, 14.0, 19.0, 16.0, 6.0, 7.0, 7.0, 5.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.1494251730970184e-12, -1.122018385320278e-12, -1.0946115975435378e-12, -1.0672048097667974e-12, -1.0397980219900571e-12, -1.0123912342133168e-12, -9.849844464365765e-13, -9.575775502396189e-13, -9.301708708830958e-13, -9.027640831063555e-13, -8.753572953296151e-13, -8.479505075528748e-13, -8.205437197761345e-13, -7.931369319993942e-13, -7.657300900125452e-13, -7.383233022358049e-13, -7.109164602489559e-13, -6.835096724722156e-13, -6.561028846954753e-13, -6.28696096918735e-13, -6.012893091419946e-13, -5.738825213652543e-13, -5.464756793784054e-13, -5.19068891601665e-13, -4.916621038249247e-13, -4.642553160481844e-13, -4.3684852827144405e-13, -4.094417133896494e-13, -3.820349256129091e-13, -3.5462813783616876e-13, -3.272213229543741e-13, -2.998145351776338e-13, -2.7240769319078484e-13, -2.450009054140445e-13, -2.1759410408477703e-13, -1.9018730275550955e-13, -1.6278051497876922e-13, -1.353737272020289e-13, -1.0796692587276141e-13, -8.056012454349393e-14, -5.31533367667536e-14, -2.5746542213749696e-14, 1.660252339254209e-15, 2.9067046892258114e-14, 5.647384144526202e-14, 8.388062922200235e-14, 1.1128743055126983e-13, 1.386942318805373e-13, 1.6610101965727764e-13, 1.9350780743401796e-13, 2.2091460876328545e-13, 2.4832141009255293e-13, 2.7572819786929326e-13, 3.031349856460336e-13, 3.305418005278282e-13, 3.5794858830456855e-13, 3.853553760813089e-13, 4.127621638580492e-13, 4.4016895163478953e-13, 4.675757394115299e-13, 4.949825271882702e-13, 5.223893149650105e-13, 5.497961569518595e-13, 5.772029447285998e-13, 6.046097325053401e-13]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 13.0, 19.0, 40.0, 37.0, 52.0, 73.0, 141.0, 227.0, 133.0, 70.0, 46.0, 25.0, 31.0, 16.0, 13.0, 7.0, 8.0, 8.0, 5.0, 3.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.475739420547469e-13, -9.165148024195546e-13, -8.854556627843624e-13, -8.543965231491701e-13, -8.233373835139779e-13, -7.922782438787856e-13, -7.61219158453702e-13, -7.301600188185098e-13, -6.991008791833175e-13, -6.680417395481253e-13, -6.36982599912933e-13, -6.059234602777408e-13, -5.748643748526572e-13, -5.438052352174649e-13, -5.127460955822727e-13, -4.816869559470804e-13, -4.506278163118882e-13, -4.1956867667669595e-13, -3.885095370415037e-13, -3.5745042451136577e-13, -3.2639128487617353e-13, -2.953321452409813e-13, -2.6427303271084335e-13, -2.332138930756511e-13, -2.0215475344045886e-13, -1.710956138052666e-13, -1.4003648772260152e-13, -1.0897735486367285e-13, -7.791822200474419e-14, -4.685908236955194e-14, -1.579995628688685e-14, 1.5259169795778238e-14, 4.631841785118773e-14, 7.73775507101164e-14, 1.0843668356904507e-13, 1.3949580965171016e-13, 1.705549492869024e-13, 2.0161408892209465e-13, 2.326732014522326e-13, 2.6373234108742483e-13, 2.9479148072261707e-13, 3.258506203578093e-13, 3.5690975999300156e-13, 3.879688725231395e-13, 4.1902801215833174e-13, 4.50087151793524e-13, 4.811462643236619e-13, 5.122054039588542e-13, 5.432645435940464e-13, 5.743236832292387e-13, 6.053828228644309e-13, 6.364419624996231e-13, 6.675011021348154e-13, 6.985602417700076e-13, 7.296193271950913e-13, 7.606784668302835e-13, 7.917376064654758e-13, 8.22796746100668e-13, 8.538558857358602e-13, 8.849150253710525e-13, 9.159741107961361e-13, 9.470332504313284e-13, 9.780923900665206e-13, 1.0091515297017128e-12, 1.040210669336905e-12]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 4.0, 11.0, 9.0, 18.0, 19.0, 29.0, 35.0, 55.0, 69.0, 90.0, 147.0, 154.0, 100.0, 69.0, 52.0, 32.0, 23.0, 19.0, 15.0, 12.0, 5.0, 9.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.308724392219297e-12, -2.2548980911640815e-12, -2.2010715732684316e-12, -2.1472452722132163e-12, -2.093418971158001e-12, -2.039592453262351e-12, -1.9857661522071357e-12, -1.9319398511519204e-12, -1.8781133332562705e-12, -1.824287032201055e-12, -1.7704606227256225e-12, -1.71663421325019e-12, -1.6628078037747573e-12, -1.6089813942993247e-12, -1.5551550932441094e-12, -1.5013286837686768e-12, -1.4475022742932442e-12, -1.3936758648178116e-12, -1.3398495637625962e-12, -1.2860231542871636e-12, -1.232196744811731e-12, -1.1783703353362984e-12, -1.124544034281083e-12, -1.0707176248056505e-12, -1.0168913237504351e-12, -9.630649142750025e-13, -9.092385590096785e-13, -8.554122037443546e-13, -8.01585794268922e-13, -7.47759439003598e-13, -6.93933083738274e-13, -6.401066742628414e-13, -5.862802647874088e-13, -5.324539095220848e-13, -4.786275000466522e-13, -4.2480114478132824e-13, -3.7097473530589564e-13, -3.1714838004057166e-13, -2.633219976701934e-13, -2.0949561529981509e-13, -1.556692329294368e-13, -1.0184285055905851e-13, -4.8016474964943795e-14, 5.8099006291709165e-15, 5.96362829995492e-14, 1.1346265181740034e-13, 1.6728903418777863e-13, 2.2111541655815692e-13, 2.749417989285352e-13, 3.287681812989135e-13, 3.825945636692918e-13, 4.3642091893461576e-13, 4.902473284100484e-13, 5.440736836753723e-13, 5.979000931508049e-13, 6.517264484161289e-13, 7.055528036814529e-13, 7.593791589467769e-13, 8.132055684222095e-13, 8.670319236875335e-13, 9.20858333162966e-13, 9.746847426383987e-13, 1.028511043693614e-12, 1.0823374531690466e-12, 1.1361638626444792e-12]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 4.0, 1.0, 3.0, 10.0, 9.0, 16.0, 22.0, 35.0, 41.0, 72.0, 104.0, 203.0, 423.0, 6286.0, 516027.0, 485.0, 178.0, 103.0, 68.0, 42.0, 23.0, 27.0, 16.0, 13.0, 13.0, 5.0, 8.0, 6.0, 2.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2974462610125812e-11, -2.2299564972350083e-11, -2.162466906929783e-11, -2.0949771431522102e-11, -2.027487552846985e-11, -1.959997789069412e-11, -1.892508025291839e-11, -1.8250182615142663e-11, -1.757528671209041e-11, -1.690038907431468e-11, -1.622549317126243e-11, -1.55505955334867e-11, -1.487569789571097e-11, -1.4200801992658718e-11, -1.352590435488299e-11, -1.2851007584468999e-11, -1.2176110814055008e-11, -1.1501214043641017e-11, -1.0826317273227026e-11, -1.0151419635451298e-11, -9.476522865037307e-12, -8.801626094623316e-12, -8.126728456847587e-12, -7.451831686433597e-12, -6.776934916019606e-12, -6.102038145605615e-12, -5.427140941510755e-12, -4.7522437374158955e-12, -4.077346967001905e-12, -3.4024499797474794e-12, -2.727552992493054e-12, -2.0526557883981944e-12, -1.3777590179842036e-12, -7.028620307297784e-13, -2.7965043475353113e-14, 6.469319437790721e-13, 1.3218289310334974e-12, 1.9967259182879227e-12, 2.671622905542348e-12, 3.3465201096372077e-12, 4.0214168800511985e-12, 4.696313650465189e-12, 5.371210854560049e-12, 6.046108058654909e-12, 6.7210048290688995e-12, 7.39590159948289e-12, 8.070799237258619e-12, 8.74569600767261e-12, 9.4205927780866e-12, 1.0095489548500591e-11, 1.0770386318914582e-11, 1.1445283956690311e-11, 1.2120180727104302e-11, 1.2795077497518292e-11, 1.3469975135294021e-11, 1.4144871905708012e-11, 1.4819768676122003e-11, 1.549466631389773e-11, 1.6169562216949984e-11, 1.6844459854725713e-11, 1.7519357492501442e-11, 1.8194253395553694e-11, 1.8869151033329423e-11, 1.9544046936381676e-11, 2.0218944574157405e-11]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 7.0, 12.0, 7.0, 22.0, 19.0, 36.0, 51.0, 58.0, 92.0, 124.0, 1221.0, 104.0, 76.0, 56.0, 34.0, 23.0, 19.0, 17.0, 7.0, 6.0, 9.0, 5.0, 4.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 3.0], "bins": [-3.8593149509491553e-11, -3.771956011422439e-11, -3.684596724951028e-11, -3.597237785424312e-11, -3.509878845897596e-11, -3.422519559426185e-11, -3.335160619899469e-11, -3.247801680372753e-11, -3.1604423939013415e-11, -3.0730834543746255e-11, -2.985724167903214e-11, -2.8983652283764982e-11, -2.8110061153774346e-11, -2.723647002378371e-11, -2.636288062851655e-11, -2.5489289498525913e-11, -2.4615700103258753e-11, -2.3742108973268117e-11, -2.2868519578000956e-11, -2.199492844801032e-11, -2.1121337318019684e-11, -2.0247747922752524e-11, -1.9374156792761887e-11, -1.850056566277125e-11, -1.762697626750409e-11, -1.6753385137513455e-11, -1.5879795742246294e-11, -1.5006204612255658e-11, -1.4132613482265022e-11, -1.3259023219636124e-11, -1.2385432957007225e-11, -1.1511841827016589e-11, -1.0638252431749429e-11, -9.76466216912053e-12, -8.891071039129894e-12, -8.017480776500996e-12, -7.143890080191229e-12, -6.270299383881461e-12, -5.396709121252563e-12, -4.523118424942796e-12, -3.6495277286330285e-12, -2.7759370323232613e-12, -1.9023465528539285e-12, -1.0287560733845957e-12, -1.5516537707482847e-13, 7.184253192349388e-13, 1.592015581863837e-12, 2.4656062781736043e-12, 3.3391969744833716e-12, 4.212787670793139e-12, 5.086378367102906e-12, 5.9599686297318044e-12, 6.833559326041572e-12, 7.707150022351339e-12, 8.580740284980237e-12, 9.454331414970873e-12, 1.0327921677599772e-11, 1.120151194022867e-11, 1.2075103070219306e-11, 1.2948693332848205e-11, 1.3822283595477103e-11, 1.469587472546774e-11, 1.5569465855458375e-11, 1.6443055250725536e-11, 1.7316646380716172e-11]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 3.0, 11.0, 16.0, 23.0, 34.0, 55.0, 80.0, 117.0, 215.0, 313.0, 527.0, 1103.0, 2113.0, 5197.0, 12312.0, 29976.0, 338192.0, 30812522.0, 30543.0, 13763.0, 4537.0, 1306.0, 604.0, 341.0, 216.0, 148.0, 101.0, 65.0, 45.0, 27.0, 21.0, 8.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.75, -35.6376953125, -34.525390625, -33.4130859375, -32.30078125, -31.1884765625, -30.076171875, -28.9638671875, -27.8515625, -26.7392578125, -25.626953125, -24.5146484375, -23.40234375, -22.2900390625, -21.177734375, -20.0654296875, -18.953125, -17.8408203125, -16.728515625, -15.6162109375, -14.50390625, -13.3916015625, -12.279296875, -11.1669921875, -10.0546875, -8.9423828125, -7.830078125, -6.7177734375, -5.60546875, -4.4931640625, -3.380859375, -2.2685546875, -1.15625, -0.0439453125, 1.068359375, 2.1806640625, 3.29296875, 4.4052734375, 5.517578125, 6.6298828125, 7.7421875, 8.8544921875, 9.966796875, 11.0791015625, 12.19140625, 13.3037109375, 14.416015625, 15.5283203125, 16.640625, 17.7529296875, 18.865234375, 19.9775390625, 21.08984375, 22.2021484375, 23.314453125, 24.4267578125, 25.5390625, 26.6513671875, 27.763671875, 28.8759765625, 29.98828125, 31.1005859375, 32.212890625, 33.3251953125, 34.4375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 7.0, 15.0, 18.0, 34.0, 50.0, 67.0, 128.0, 222.0, 384.0, 644.0, 1161.0, 1901.0, 3275.0, 6156.0, 11866.0, 24626.0, 58121.0, 168989.0, 872437.0, 4445039.0, 486666.0, 121441.0, 45222.0, 20456.0, 9897.0, 5412.0, 2965.0, 1743.0, 1001.0, 628.0, 379.0, 200.0, 106.0, 65.0, 51.0, 31.0, 17.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.76171875, -4.61895751953125, -4.4761962890625, -4.33343505859375, -4.190673828125, -4.04791259765625, -3.9051513671875, -3.76239013671875, -3.61962890625, -3.47686767578125, -3.3341064453125, -3.19134521484375, -3.048583984375, -2.90582275390625, -2.7630615234375, -2.62030029296875, -2.4775390625, -2.33477783203125, -2.1920166015625, -2.04925537109375, -1.906494140625, -1.76373291015625, -1.6209716796875, -1.47821044921875, -1.33544921875, -1.19268798828125, -1.0499267578125, -0.90716552734375, -0.764404296875, -0.62164306640625, -0.4788818359375, -0.33612060546875, -0.193359375, -0.05059814453125, 0.0921630859375, 0.23492431640625, 0.377685546875, 0.52044677734375, 0.6632080078125, 0.80596923828125, 0.94873046875, 1.09149169921875, 1.2342529296875, 1.37701416015625, 1.519775390625, 1.66253662109375, 1.8052978515625, 1.94805908203125, 2.0908203125, 2.23358154296875, 2.3763427734375, 2.51910400390625, 2.661865234375, 2.80462646484375, 2.9473876953125, 3.09014892578125, 3.23291015625, 3.37567138671875, 3.5184326171875, 3.66119384765625, 3.803955078125, 3.94671630859375, 4.0894775390625, 4.23223876953125, 4.375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 8.0, 6.0, 8.0, 10.0, 5.0, 12.0, 11.0, 18.0, 20.0, 28.0, 31.0, 40.0, 40.0, 64.0, 99.0, 118.0, 162.0, 218.0, 264.0, 190.0, 146.0, 100.0, 76.0, 71.0, 55.0, 40.0, 31.0, 25.0, 22.0, 19.0, 15.0, 13.0, 11.0, 8.0, 9.0, 10.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.5107421875, -1.470367431640625, -1.42999267578125, -1.389617919921875, -1.3492431640625, -1.308868408203125, -1.26849365234375, -1.228118896484375, -1.187744140625, -1.147369384765625, -1.10699462890625, -1.066619873046875, -1.0262451171875, -0.985870361328125, -0.94549560546875, -0.905120849609375, -0.86474609375, -0.824371337890625, -0.78399658203125, -0.743621826171875, -0.7032470703125, -0.662872314453125, -0.62249755859375, -0.582122802734375, -0.541748046875, -0.501373291015625, -0.46099853515625, -0.420623779296875, -0.3802490234375, -0.339874267578125, -0.29949951171875, -0.259124755859375, -0.21875, -0.178375244140625, -0.13800048828125, -0.097625732421875, -0.0572509765625, -0.016876220703125, 0.02349853515625, 0.063873291015625, 0.104248046875, 0.144622802734375, 0.18499755859375, 0.225372314453125, 0.2657470703125, 0.306121826171875, 0.34649658203125, 0.386871337890625, 0.42724609375, 0.467620849609375, 0.50799560546875, 0.548370361328125, 0.5887451171875, 0.629119873046875, 0.66949462890625, 0.709869384765625, 0.750244140625, 0.790618896484375, 0.83099365234375, 0.871368408203125, 0.9117431640625, 0.952117919921875, 0.99249267578125, 1.032867431640625, 1.0732421875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 5.0, 4.0, 6.0, 5.0, 14.0, 21.0, 17.0, 26.0, 57.0, 75.0, 82.0, 104.0, 151.0, 241.0, 410.0, 541.0, 730.0, 925.0, 1452.0, 2073.0, 2751.0, 4269.0, 6548.0, 10431.0, 18328.0, 32654.0, 64699.0, 151930.0, 453156.0, 3210342.0, 1736039.0, 343371.0, 122369.0, 54909.0, 28313.0, 15931.0, 9457.0, 5976.0, 3958.0, 2543.0, 1786.0, 1305.0, 962.0, 715.0, 497.0, 368.0, 249.0, 154.0, 121.0, 83.0, 80.0, 55.0, 39.0, 38.0, 31.0, 21.0, 8.0, 16.0, 2.0, 4.0, 4.0, 0.0, 2.0], "bins": [-1.626953125, -1.57427978515625, -1.5216064453125, -1.46893310546875, -1.416259765625, -1.36358642578125, -1.3109130859375, -1.25823974609375, -1.20556640625, -1.15289306640625, -1.1002197265625, -1.04754638671875, -0.994873046875, -0.94219970703125, -0.8895263671875, -0.83685302734375, -0.7841796875, -0.73150634765625, -0.6788330078125, -0.62615966796875, -0.573486328125, -0.52081298828125, -0.4681396484375, -0.41546630859375, -0.36279296875, -0.31011962890625, -0.2574462890625, -0.20477294921875, -0.152099609375, -0.09942626953125, -0.0467529296875, 0.00592041015625, 0.05859375, 0.11126708984375, 0.1639404296875, 0.21661376953125, 0.269287109375, 0.32196044921875, 0.3746337890625, 0.42730712890625, 0.47998046875, 0.53265380859375, 0.5853271484375, 0.63800048828125, 0.690673828125, 0.74334716796875, 0.7960205078125, 0.84869384765625, 0.9013671875, 0.95404052734375, 1.0067138671875, 1.05938720703125, 1.112060546875, 1.16473388671875, 1.2174072265625, 1.27008056640625, 1.32275390625, 1.37542724609375, 1.4281005859375, 1.48077392578125, 1.533447265625, 1.58612060546875, 1.6387939453125, 1.69146728515625, 1.744140625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 7.0, 9.0, 5.0, 10.0, 9.0, 10.0, 11.0, 28.0, 24.0, 28.0, 59.0, 80.0, 104.0, 150.0, 216.0, 423.0, 304.0, 152.0, 76.0, 77.0, 47.0, 42.0, 36.0, 17.0, 21.0, 17.0, 12.0, 10.0, 5.0, 3.0, 4.0, 5.0, 5.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.7177734375, -1.661834716796875, -1.60589599609375, -1.549957275390625, -1.4940185546875, -1.438079833984375, -1.38214111328125, -1.326202392578125, -1.270263671875, -1.214324951171875, -1.15838623046875, -1.102447509765625, -1.0465087890625, -0.990570068359375, -0.93463134765625, -0.878692626953125, -0.82275390625, -0.766815185546875, -0.71087646484375, -0.654937744140625, -0.5989990234375, -0.543060302734375, -0.48712158203125, -0.431182861328125, -0.375244140625, -0.319305419921875, -0.26336669921875, -0.207427978515625, -0.1514892578125, -0.095550537109375, -0.03961181640625, 0.016326904296875, 0.072265625, 0.128204345703125, 0.18414306640625, 0.240081787109375, 0.2960205078125, 0.351959228515625, 0.40789794921875, 0.463836669921875, 0.519775390625, 0.575714111328125, 0.63165283203125, 0.687591552734375, 0.7435302734375, 0.799468994140625, 0.85540771484375, 0.911346435546875, 0.96728515625, 1.023223876953125, 1.07916259765625, 1.135101318359375, 1.1910400390625, 1.246978759765625, 1.30291748046875, 1.358856201171875, 1.414794921875, 1.470733642578125, 1.52667236328125, 1.582611083984375, 1.6385498046875, 1.694488525390625, 1.75042724609375, 1.806365966796875, 1.8623046875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 5.0, 11.0, 6.0, 9.0, 8.0, 5.0, 16.0, 27.0, 43.0, 31.0, 47.0, 53.0, 80.0, 96.0, 110.0, 145.0, 234.0, 273.0, 327.0, 493.0, 693.0, 1083.0, 1700.0, 3138.0, 5949.0, 12906.0, 33487.0, 259506.0, 5890329.0, 46928.0, 16259.0, 7414.0, 3784.0, 1992.0, 1280.0, 787.0, 484.0, 408.0, 281.0, 243.0, 183.0, 138.0, 108.0, 63.0, 74.0, 48.0, 48.0, 27.0, 18.0, 21.0, 15.0, 10.0, 4.0, 5.0, 5.0, 2.0, 5.0, 6.0, 3.0], "bins": [-10.4296875, -10.1148681640625, -9.800048828125, -9.4852294921875, -9.17041015625, -8.8555908203125, -8.540771484375, -8.2259521484375, -7.9111328125, -7.5963134765625, -7.281494140625, -6.9666748046875, -6.65185546875, -6.3370361328125, -6.022216796875, -5.7073974609375, -5.392578125, -5.0777587890625, -4.762939453125, -4.4481201171875, -4.13330078125, -3.8184814453125, -3.503662109375, -3.1888427734375, -2.8740234375, -2.5592041015625, -2.244384765625, -1.9295654296875, -1.61474609375, -1.2999267578125, -0.985107421875, -0.6702880859375, -0.35546875, -0.0406494140625, 0.274169921875, 0.5889892578125, 0.90380859375, 1.2186279296875, 1.533447265625, 1.8482666015625, 2.1630859375, 2.4779052734375, 2.792724609375, 3.1075439453125, 3.42236328125, 3.7371826171875, 4.052001953125, 4.3668212890625, 4.681640625, 4.9964599609375, 5.311279296875, 5.6260986328125, 5.94091796875, 6.2557373046875, 6.570556640625, 6.8853759765625, 7.2001953125, 7.5150146484375, 7.829833984375, 8.1446533203125, 8.45947265625, 8.7742919921875, 9.089111328125, 9.4039306640625, 9.71875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 5.0, 8.0, 7.0, 8.0, 9.0, 12.0, 11.0, 10.0, 12.0, 28.0, 18.0, 30.0, 41.0, 51.0, 78.0, 118.0, 322.0, 585.0, 252.0, 117.0, 48.0, 42.0, 35.0, 22.0, 23.0, 20.0, 18.0, 10.0, 14.0, 15.0, 10.0, 4.0, 4.0, 6.0, 5.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.87890625, -3.76544189453125, -3.6519775390625, -3.53851318359375, -3.425048828125, -3.31158447265625, -3.1981201171875, -3.08465576171875, -2.97119140625, -2.85772705078125, -2.7442626953125, -2.63079833984375, -2.517333984375, -2.40386962890625, -2.2904052734375, -2.17694091796875, -2.0634765625, -1.95001220703125, -1.8365478515625, -1.72308349609375, -1.609619140625, -1.49615478515625, -1.3826904296875, -1.26922607421875, -1.15576171875, -1.04229736328125, -0.9288330078125, -0.81536865234375, -0.701904296875, -0.58843994140625, -0.4749755859375, -0.36151123046875, -0.248046875, -0.13458251953125, -0.0211181640625, 0.09234619140625, 0.205810546875, 0.31927490234375, 0.4327392578125, 0.54620361328125, 0.65966796875, 0.77313232421875, 0.8865966796875, 1.00006103515625, 1.113525390625, 1.22698974609375, 1.3404541015625, 1.45391845703125, 1.5673828125, 1.68084716796875, 1.7943115234375, 1.90777587890625, 2.021240234375, 2.13470458984375, 2.2481689453125, 2.36163330078125, 2.47509765625, 2.58856201171875, 2.7020263671875, 2.81549072265625, 2.928955078125, 3.04241943359375, 3.1558837890625, 3.26934814453125, 3.3828125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 11.0, 24.0, 850.0, 64.0, 24.0, 16.0, 14.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.95986557006836, -43.192745208740234, -40.425628662109375, -37.65850830078125, -34.891387939453125, -32.124267578125, -29.357149124145508, -26.590030670166016, -23.82291030883789, -21.055789947509766, -18.288671493530273, -15.521552085876465, -12.754432678222656, -9.987313270568848, -7.220193862915039, -4.453075408935547, -1.6859550476074219, 1.0811643600463867, 3.8482837677001953, 6.615403175354004, 9.382522583007812, 12.149641990661621, 14.91676139831543, 17.683879852294922, 20.451000213623047, 23.218120574951172, 25.985239028930664, 28.752357482910156, 31.51947784423828, 34.286598205566406, 37.05371856689453, 39.82083511352539, 42.58795166015625, 45.355072021484375, 48.1221923828125, 50.88930892944336, 53.656429290771484, 56.42354965209961, 59.19066619873047, 61.957786560058594, 64.72490692138672, 67.49202728271484, 70.25914764404297, 73.0262680053711, 75.79338073730469, 78.56050109863281, 81.32762145996094, 84.09474182128906, 86.86186218261719, 89.62898254394531, 92.39610290527344, 95.16322326660156, 97.93034362792969, 100.69745635986328, 103.4645767211914, 106.23169708251953, 108.99881744384766, 111.76593780517578, 114.5330581665039, 117.30017852783203, 120.06729125976562, 122.83441162109375, 125.60153198242188, 128.36865234375, 131.13577270507812]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 15.0, 37.0, 591.0, 312.0, 36.0, 14.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.775489807128906, -59.28103256225586, -55.78657531738281, -52.2921142578125, -48.79765701293945, -45.303199768066406, -41.808738708496094, -38.31428146362305, -34.81982421875, -31.325366973876953, -27.830907821655273, -24.336448669433594, -20.841991424560547, -17.3475341796875, -13.85307502746582, -10.35861587524414, -6.864158630371094, -3.3697004318237305, 0.12475776672363281, 3.619215965270996, 7.113674163818359, 10.608131408691406, 14.102590560913086, 17.597049713134766, 21.091506958007812, 24.58596420288086, 28.08042335510254, 31.57488250732422, 35.069339752197266, 38.56379699707031, 42.058258056640625, 45.55271530151367, 49.04718017578125, 52.5416374206543, 56.036094665527344, 59.530555725097656, 63.0250129699707, 66.51947021484375, 70.01393127441406, 73.50839233398438, 77.00284576416016, 80.49730682373047, 83.99176025390625, 87.48622131347656, 90.98068237304688, 94.47513580322266, 97.96959686279297, 101.46405029296875, 104.95851135253906, 108.45297241210938, 111.94742584228516, 115.44188690185547, 118.93634033203125, 122.43080139160156, 125.92526245117188, 129.4197235107422, 132.9141845703125, 136.4086456298828, 139.90310668945312, 143.39755249023438, 146.8920135498047, 150.386474609375, 153.8809356689453, 157.37539672851562, 160.86984252929688]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 7.0, 9.0, 17.0, 22.0, 38.0, 54.0, 53.0, 91.0, 133.0, 151.0, 218.0, 281.0, 379.0, 520.0, 764.0, 1092.0, 1741.0, 2895.0, 5953.0, 14008.0, 43643.0, 431560.0, 3579013.0, 71188.0, 20494.0, 9063.0, 4524.0, 2476.0, 1398.0, 805.0, 480.0, 323.0, 239.0, 152.0, 137.0, 85.0, 61.0, 50.0, 36.0, 34.0, 16.0, 23.0, 12.0, 15.0, 10.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.060333251953125, -0.05851411819458008, -0.056694984436035156, -0.054875850677490234, -0.05305671691894531, -0.05123758316040039, -0.04941844940185547, -0.04759931564331055, -0.045780181884765625, -0.0439610481262207, -0.04214191436767578, -0.04032278060913086, -0.03850364685058594, -0.036684513092041016, -0.034865379333496094, -0.03304624557495117, -0.03122711181640625, -0.029407978057861328, -0.027588844299316406, -0.025769710540771484, -0.023950576782226562, -0.02213144302368164, -0.02031230926513672, -0.018493175506591797, -0.016674041748046875, -0.014854907989501953, -0.013035774230957031, -0.01121664047241211, -0.009397506713867188, -0.007578372955322266, -0.005759239196777344, -0.003940105438232422, -0.0021209716796875, -0.0003018379211425781, 0.0015172958374023438, 0.0033364295959472656, 0.0051555633544921875, 0.006974697113037109, 0.008793830871582031, 0.010612964630126953, 0.012432098388671875, 0.014251232147216797, 0.01607036590576172, 0.01788949966430664, 0.019708633422851562, 0.021527767181396484, 0.023346900939941406, 0.025166034698486328, 0.02698516845703125, 0.028804302215576172, 0.030623435974121094, 0.032442569732666016, 0.03426170349121094, 0.03608083724975586, 0.03789997100830078, 0.0397191047668457, 0.041538238525390625, 0.04335737228393555, 0.04517650604248047, 0.04699563980102539, 0.04881477355957031, 0.050633907318115234, 0.052453041076660156, 0.05427217483520508, 0.05609130859375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 9.0, 13.0, 8.0, 9.0, 23.0, 45.0, 203.0, 314.0, 223.0, 78.0, 21.0, 12.0, 10.0, 9.0, 2.0, 4.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004657745361328125, -0.004494845867156982, -0.00433194637298584, -0.004169046878814697, -0.004006147384643555, -0.003843247890472412, -0.0036803483963012695, -0.003517448902130127, -0.0033545494079589844, -0.003191649913787842, -0.0030287504196166992, -0.0028658509254455566, -0.002702951431274414, -0.0025400519371032715, -0.002377152442932129, -0.0022142529487609863, -0.0020513534545898438, -0.0018884539604187012, -0.0017255544662475586, -0.001562654972076416, -0.0013997554779052734, -0.0012368559837341309, -0.0010739564895629883, -0.0009110569953918457, -0.0007481575012207031, -0.0005852580070495605, -0.00042235851287841797, -0.0002594590187072754, -9.655952453613281e-05, 6.633996963500977e-05, 0.00022923946380615234, 0.0003921389579772949, 0.0005550384521484375, 0.0007179379463195801, 0.0008808374404907227, 0.0010437369346618652, 0.0012066364288330078, 0.0013695359230041504, 0.001532435417175293, 0.0016953349113464355, 0.0018582344055175781, 0.0020211338996887207, 0.0021840333938598633, 0.002346932888031006, 0.0025098323822021484, 0.002672731876373291, 0.0028356313705444336, 0.002998530864715576, 0.0031614303588867188, 0.0033243298530578613, 0.003487229347229004, 0.0036501288414001465, 0.003813028335571289, 0.003975927829742432, 0.004138827323913574, 0.004301726818084717, 0.004464626312255859, 0.004627525806427002, 0.0047904253005981445, 0.004953324794769287, 0.00511622428894043, 0.005279123783111572, 0.005442023277282715, 0.005604922771453857, 0.005767822265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 14.0, 15.0, 30.0, 45.0, 69.0, 132.0, 274.0, 485.0, 1062.0, 2649.0, 9933.0, 69874.0, 3570208.0, 499209.0, 29801.0, 6151.0, 2026.0, 969.0, 532.0, 300.0, 173.0, 109.0, 69.0, 53.0, 28.0, 14.0, 20.0, 6.0, 9.0, 4.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09271240234375, -0.08970260620117188, -0.08669281005859375, -0.08368301391601562, -0.0806732177734375, -0.07766342163085938, -0.07465362548828125, -0.07164382934570312, -0.068634033203125, -0.06562423706054688, -0.06261444091796875, -0.059604644775390625, -0.0565948486328125, -0.053585052490234375, -0.05057525634765625, -0.047565460205078125, -0.0445556640625, -0.041545867919921875, -0.03853607177734375, -0.035526275634765625, -0.0325164794921875, -0.029506683349609375, -0.02649688720703125, -0.023487091064453125, -0.020477294921875, -0.017467498779296875, -0.01445770263671875, -0.011447906494140625, -0.0084381103515625, -0.005428314208984375, -0.00241851806640625, 0.000591278076171875, 0.00360107421875, 0.006610870361328125, 0.00962066650390625, 0.012630462646484375, 0.0156402587890625, 0.018650054931640625, 0.02165985107421875, 0.024669647216796875, 0.027679443359375, 0.030689239501953125, 0.03369903564453125, 0.036708831787109375, 0.0397186279296875, 0.042728424072265625, 0.04573822021484375, 0.048748016357421875, 0.0517578125, 0.054767608642578125, 0.05777740478515625, 0.060787200927734375, 0.0637969970703125, 0.06680679321289062, 0.06981658935546875, 0.07282638549804688, 0.075836181640625, 0.07884597778320312, 0.08185577392578125, 0.08486557006835938, 0.0878753662109375, 0.09088516235351562, 0.09389495849609375, 0.09690475463867188, 0.09991455078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 10.0, 10.0, 12.0, 12.0, 20.0, 23.0, 31.0, 50.0, 67.0, 75.0, 103.0, 135.0, 210.0, 253.0, 344.0, 895.0, 585.0, 293.0, 209.0, 160.0, 132.0, 116.0, 81.0, 65.0, 40.0, 40.0, 25.0, 23.0, 14.0, 8.0, 5.0, 3.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.011260986328125, -0.01097095012664795, -0.010680913925170898, -0.010390877723693848, -0.010100841522216797, -0.009810805320739746, -0.009520769119262695, -0.009230732917785645, -0.008940696716308594, -0.008650660514831543, -0.008360624313354492, -0.008070588111877441, -0.007780551910400391, -0.00749051570892334, -0.007200479507446289, -0.006910443305969238, -0.0066204071044921875, -0.006330370903015137, -0.006040334701538086, -0.005750298500061035, -0.005460262298583984, -0.005170226097106934, -0.004880189895629883, -0.004590153694152832, -0.004300117492675781, -0.0040100812911987305, -0.0037200450897216797, -0.003430008888244629, -0.003139972686767578, -0.0028499364852905273, -0.0025599002838134766, -0.0022698640823364258, -0.001979827880859375, -0.0016897916793823242, -0.0013997554779052734, -0.0011097192764282227, -0.0008196830749511719, -0.0005296468734741211, -0.0002396106719970703, 5.042552947998047e-05, 0.00034046173095703125, 0.000630497932434082, 0.0009205341339111328, 0.0012105703353881836, 0.0015006065368652344, 0.0017906427383422852, 0.002080678939819336, 0.0023707151412963867, 0.0026607513427734375, 0.0029507875442504883, 0.003240823745727539, 0.00353085994720459, 0.0038208961486816406, 0.004110932350158691, 0.004400968551635742, 0.004691004753112793, 0.004981040954589844, 0.0052710771560668945, 0.005561113357543945, 0.005851149559020996, 0.006141185760498047, 0.006431221961975098, 0.0067212581634521484, 0.007011294364929199, 0.00730133056640625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 13.0, 37.0, 143.0, 589.0, 189.0, 25.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5849619507789612, -0.5602219700813293, -0.5354820489883423, -0.5107420682907104, -0.486002117395401, -0.46126216650009155, -0.4365222156047821, -0.41178226470947266, -0.3870422840118408, -0.36230233311653137, -0.3375623822212219, -0.3128224015235901, -0.28808245062828064, -0.2633424997329712, -0.23860254883766174, -0.2138625830411911, -0.18912264704704285, -0.1643826961517334, -0.13964273035526276, -0.11490277945995331, -0.09016282111406326, -0.06542286276817322, -0.04068291187286377, -0.015942946076393127, 0.00879700481891632, 0.033536963164806366, 0.05827691778540611, 0.08301687240600586, 0.1077568307518959, 0.13249678909778595, 0.1572367399930954, 0.18197670578956604, 0.2067166566848755, 0.23145660758018494, 0.2561965584754944, 0.2809365391731262, 0.30567649006843567, 0.3304164409637451, 0.35515639185905457, 0.379896342754364, 0.40463632345199585, 0.4293762743473053, 0.45411622524261475, 0.4788562059402466, 0.5035961270332336, 0.5283361077308655, 0.5530760288238525, 0.5778160095214844, 0.6025559902191162, 0.627295970916748, 0.6520358920097351, 0.6767758727073669, 0.701515793800354, 0.7262557744979858, 0.7509957551956177, 0.7757356762886047, 0.8004755973815918, 0.8252155780792236, 0.8499554991722107, 0.8746954798698425, 0.8994354009628296, 0.9241753816604614, 0.9489153623580933, 0.9736552834510803, 0.9983952641487122]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 5.0, 4.0, 10.0, 13.0, 19.0, 18.0, 25.0, 33.0, 44.0, 38.0, 49.0, 61.0, 65.0, 64.0, 67.0, 79.0, 62.0, 51.0, 41.0, 50.0, 40.0, 45.0, 26.0, 26.0, 18.0, 11.0, 9.0, 8.0, 7.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08179694414138794, -0.07945909351110458, -0.07712124288082123, -0.07478339225053787, -0.07244554162025452, -0.07010768353939056, -0.06776983290910721, -0.06543198227882385, -0.0630941316485405, -0.06075628101825714, -0.058418430387973785, -0.05608057603240013, -0.053742725402116776, -0.05140487477183342, -0.049067020416259766, -0.04672916978597641, -0.044391319155693054, -0.0420534685254097, -0.03971561789512634, -0.03737776353955269, -0.03503991290926933, -0.03270206227898598, -0.030364209786057472, -0.028026357293128967, -0.02568850666284561, -0.023350656032562256, -0.02101280353963375, -0.018674951046705246, -0.01633710041642189, -0.01399924885481596, -0.01166139729321003, -0.009323544800281525, -0.006985694169998169, -0.004647842608392239, -0.0023099910467863083, 2.786051481962204e-05, 0.0023657120764255524, 0.004703563638031483, 0.007041415199637413, 0.009379267692565918, 0.011717118322849274, 0.014054969884455204, 0.016392821446061134, 0.01873067393898964, 0.021068524569272995, 0.02340637519955635, 0.025744227692484856, 0.02808208018541336, 0.030419930815696716, 0.03275778144598007, 0.03509563207626343, 0.03743348643183708, 0.03977133706212044, 0.04210918769240379, 0.04444704204797745, 0.0467848926782608, 0.04912274330854416, 0.051460593938827515, 0.05379844456911087, 0.056136298924684525, 0.05847414955496788, 0.060812000185251236, 0.06314985454082489, 0.06548770517110825, 0.0678255558013916]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 4.0, 8.0, 6.0, 8.0, 14.0, 11.0, 23.0, 37.0, 46.0, 59.0, 87.0, 110.0, 201.0, 273.0, 428.0, 708.0, 1374.0, 2726.0, 6383.0, 21516.0, 315369.0, 655724.0, 28909.0, 7617.0, 3053.0, 1548.0, 857.0, 482.0, 296.0, 199.0, 135.0, 90.0, 73.0, 43.0, 39.0, 20.0, 12.0, 14.0, 10.0, 10.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.066650390625, -0.06457328796386719, -0.062496185302734375, -0.06041908264160156, -0.05834197998046875, -0.05626487731933594, -0.054187774658203125, -0.05211067199707031, -0.0500335693359375, -0.04795646667480469, -0.045879364013671875, -0.04380226135253906, -0.04172515869140625, -0.03964805603027344, -0.037570953369140625, -0.03549385070800781, -0.033416748046875, -0.03133964538574219, -0.029262542724609375, -0.027185440063476562, -0.02510833740234375, -0.023031234741210938, -0.020954132080078125, -0.018877029418945312, -0.0167999267578125, -0.014722824096679688, -0.012645721435546875, -0.010568618774414062, -0.00849151611328125, -0.0064144134521484375, -0.004337310791015625, -0.0022602081298828125, -0.00018310546875, 0.0018939971923828125, 0.003971099853515625, 0.0060482025146484375, 0.00812530517578125, 0.010202407836914062, 0.012279510498046875, 0.014356613159179688, 0.0164337158203125, 0.018510818481445312, 0.020587921142578125, 0.022665023803710938, 0.02474212646484375, 0.026819229125976562, 0.028896331787109375, 0.030973434448242188, 0.033050537109375, 0.03512763977050781, 0.037204742431640625, 0.03928184509277344, 0.04135894775390625, 0.04343605041503906, 0.045513153076171875, 0.04759025573730469, 0.0496673583984375, 0.05174446105957031, 0.053821563720703125, 0.05589866638183594, 0.05797576904296875, 0.06005287170410156, 0.062129974365234375, 0.06420707702636719, 0.0662841796875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 7.0, 10.0, 14.0, 27.0, 48.0, 78.0, 132.0, 136.0, 152.0, 136.0, 95.0, 70.0, 34.0, 15.0, 10.0, 5.0, 5.0, 1.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.005352020263671875, -0.005211681127548218, -0.0050713419914245605, -0.004931002855300903, -0.004790663719177246, -0.004650324583053589, -0.004509985446929932, -0.004369646310806274, -0.004229307174682617, -0.00408896803855896, -0.003948628902435303, -0.0038082897663116455, -0.0036679506301879883, -0.003527611494064331, -0.003387272357940674, -0.0032469332218170166, -0.0031065940856933594, -0.002966254949569702, -0.002825915813446045, -0.0026855766773223877, -0.0025452375411987305, -0.0024048984050750732, -0.002264559268951416, -0.002124220132827759, -0.0019838809967041016, -0.0018435418605804443, -0.0017032027244567871, -0.0015628635883331299, -0.0014225244522094727, -0.0012821853160858154, -0.0011418461799621582, -0.001001507043838501, -0.0008611679077148438, -0.0007208287715911865, -0.0005804896354675293, -0.00044015049934387207, -0.00029981136322021484, -0.00015947222709655762, -1.913309097290039e-05, 0.00012120604515075684, 0.00026154518127441406, 0.0004018843173980713, 0.0005422234535217285, 0.0006825625896453857, 0.000822901725769043, 0.0009632408618927002, 0.0011035799980163574, 0.0012439191341400146, 0.0013842582702636719, 0.001524597406387329, 0.0016649365425109863, 0.0018052756786346436, 0.0019456148147583008, 0.002085953950881958, 0.0022262930870056152, 0.0023666322231292725, 0.0025069713592529297, 0.002647310495376587, 0.002787649631500244, 0.0029279887676239014, 0.0030683279037475586, 0.003208667039871216, 0.003349006175994873, 0.0034893453121185303, 0.0036296844482421875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 4.0, 9.0, 20.0, 10.0, 15.0, 27.0, 53.0, 69.0, 93.0, 171.0, 293.0, 605.0, 1397.0, 3796.0, 14025.0, 192244.0, 796060.0, 30015.0, 5928.0, 1930.0, 826.0, 380.0, 191.0, 141.0, 76.0, 64.0, 32.0, 18.0, 26.0, 11.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10504150390625, -0.10177898406982422, -0.09851646423339844, -0.09525394439697266, -0.09199142456054688, -0.0887289047241211, -0.08546638488769531, -0.08220386505126953, -0.07894134521484375, -0.07567882537841797, -0.07241630554199219, -0.0691537857055664, -0.06589126586914062, -0.06262874603271484, -0.05936622619628906, -0.05610370635986328, -0.0528411865234375, -0.04957866668701172, -0.04631614685058594, -0.043053627014160156, -0.039791107177734375, -0.036528587341308594, -0.03326606750488281, -0.03000354766845703, -0.02674102783203125, -0.02347850799560547, -0.020215988159179688, -0.016953468322753906, -0.013690948486328125, -0.010428428649902344, -0.0071659088134765625, -0.0039033889770507812, -0.000640869140625, 0.0026216506958007812, 0.0058841705322265625, 0.009146690368652344, 0.012409210205078125, 0.015671730041503906, 0.018934249877929688, 0.02219676971435547, 0.02545928955078125, 0.02872180938720703, 0.03198432922363281, 0.035246849060058594, 0.038509368896484375, 0.041771888732910156, 0.04503440856933594, 0.04829692840576172, 0.0515594482421875, 0.05482196807861328, 0.05808448791503906, 0.061347007751464844, 0.06460952758789062, 0.0678720474243164, 0.07113456726074219, 0.07439708709716797, 0.07765960693359375, 0.08092212677001953, 0.08418464660644531, 0.0874471664428711, 0.09070968627929688, 0.09397220611572266, 0.09723472595214844, 0.10049724578857422, 0.103759765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 6.0, 7.0, 8.0, 5.0, 6.0, 11.0, 9.0, 12.0, 12.0, 20.0, 19.0, 22.0, 28.0, 25.0, 24.0, 41.0, 38.0, 35.0, 38.0, 42.0, 32.0, 37.0, 42.0, 32.0, 44.0, 42.0, 40.0, 41.0, 35.0, 29.0, 25.0, 17.0, 22.0, 16.0, 32.0, 18.0, 9.0, 20.0, 14.0, 11.0, 8.0, 10.0, 2.0, 8.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014801025390625, -0.014285802841186523, -0.013770580291748047, -0.01325535774230957, -0.012740135192871094, -0.012224912643432617, -0.01170969009399414, -0.011194467544555664, -0.010679244995117188, -0.010164022445678711, -0.009648799896240234, -0.009133577346801758, -0.008618354797363281, -0.008103132247924805, -0.007587909698486328, -0.0070726871490478516, -0.006557464599609375, -0.0060422420501708984, -0.005527019500732422, -0.005011796951293945, -0.004496574401855469, -0.003981351852416992, -0.0034661293029785156, -0.002950906753540039, -0.0024356842041015625, -0.001920461654663086, -0.0014052391052246094, -0.0008900165557861328, -0.00037479400634765625, 0.0001404285430908203, 0.0006556510925292969, 0.0011708736419677734, 0.00168609619140625, 0.0022013187408447266, 0.002716541290283203, 0.0032317638397216797, 0.0037469863891601562, 0.004262208938598633, 0.004777431488037109, 0.005292654037475586, 0.0058078765869140625, 0.006323099136352539, 0.006838321685791016, 0.007353544235229492, 0.007868766784667969, 0.008383989334106445, 0.008899211883544922, 0.009414434432983398, 0.009929656982421875, 0.010444879531860352, 0.010960102081298828, 0.011475324630737305, 0.011990547180175781, 0.012505769729614258, 0.013020992279052734, 0.013536214828491211, 0.014051437377929688, 0.014566659927368164, 0.01508188247680664, 0.015597105026245117, 0.016112327575683594, 0.01662755012512207, 0.017142772674560547, 0.017657995223999023, 0.0181732177734375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 4.0, 0.0, 4.0, 3.0, 8.0, 11.0, 9.0, 15.0, 43.0, 57.0, 92.0, 248.0, 573.0, 2015.0, 10628.0, 835537.0, 190008.0, 6834.0, 1484.0, 531.0, 220.0, 79.0, 41.0, 26.0, 27.0, 15.0, 14.0, 6.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1466064453125, -0.14200973510742188, -0.13741302490234375, -0.13281631469726562, -0.1282196044921875, -0.12362289428710938, -0.11902618408203125, -0.11442947387695312, -0.109832763671875, -0.10523605346679688, -0.10063934326171875, -0.09604263305664062, -0.0914459228515625, -0.08684921264648438, -0.08225250244140625, -0.07765579223632812, -0.07305908203125, -0.06846237182617188, -0.06386566162109375, -0.059268951416015625, -0.0546722412109375, -0.050075531005859375, -0.04547882080078125, -0.040882110595703125, -0.036285400390625, -0.031688690185546875, -0.02709197998046875, -0.022495269775390625, -0.0178985595703125, -0.013301849365234375, -0.00870513916015625, -0.004108428955078125, 0.00048828125, 0.005084991455078125, 0.00968170166015625, 0.014278411865234375, 0.0188751220703125, 0.023471832275390625, 0.02806854248046875, 0.032665252685546875, 0.037261962890625, 0.041858673095703125, 0.04645538330078125, 0.051052093505859375, 0.0556488037109375, 0.060245513916015625, 0.06484222412109375, 0.06943893432617188, 0.07403564453125, 0.07863235473632812, 0.08322906494140625, 0.08782577514648438, 0.0924224853515625, 0.09701919555664062, 0.10161590576171875, 0.10621261596679688, 0.110809326171875, 0.11540603637695312, 0.12000274658203125, 0.12459945678710938, 0.1291961669921875, 0.13379287719726562, 0.13838958740234375, 0.14298629760742188, 0.1475830078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 7.0, 8.0, 10.0, 10.0, 21.0, 28.0, 34.0, 47.0, 71.0, 83.0, 114.0, 116.0, 113.0, 81.0, 77.0, 48.0, 35.0, 22.0, 19.0, 17.0, 11.0, 9.0, 5.0, 3.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006356239318847656, -0.0006187111139297485, -0.0006017982959747314, -0.0005848854780197144, -0.0005679726600646973, -0.0005510598421096802, -0.0005341470241546631, -0.000517234206199646, -0.0005003213882446289, -0.0004834085702896118, -0.0004664957523345947, -0.00044958293437957764, -0.00043267011642456055, -0.00041575729846954346, -0.00039884448051452637, -0.0003819316625595093, -0.0003650188446044922, -0.0003481060266494751, -0.000331193208694458, -0.0003142803907394409, -0.00029736757278442383, -0.00028045475482940674, -0.00026354193687438965, -0.00024662911891937256, -0.00022971630096435547, -0.00021280348300933838, -0.0001958906650543213, -0.0001789778470993042, -0.0001620650291442871, -0.00014515221118927002, -0.00012823939323425293, -0.00011132657527923584, -9.441375732421875e-05, -7.750093936920166e-05, -6.058812141418457e-05, -4.367530345916748e-05, -2.676248550415039e-05, -9.8496675491333e-06, 7.063150405883789e-06, 2.397596836090088e-05, 4.088878631591797e-05, 5.780160427093506e-05, 7.471442222595215e-05, 9.162724018096924e-05, 0.00010854005813598633, 0.00012545287609100342, 0.0001423656940460205, 0.0001592785120010376, 0.0001761913299560547, 0.00019310414791107178, 0.00021001696586608887, 0.00022692978382110596, 0.00024384260177612305, 0.00026075541973114014, 0.0002776682376861572, 0.0002945810556411743, 0.0003114938735961914, 0.0003284066915512085, 0.0003453195095062256, 0.0003622323274612427, 0.00037914514541625977, 0.00039605796337127686, 0.00041297078132629395, 0.00042988359928131104, 0.0004467964172363281]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 8.0, 7.0, 5.0, 7.0, 15.0, 20.0, 29.0, 45.0, 61.0, 88.0, 194.0, 306.0, 565.0, 1120.0, 2806.0, 8958.0, 59182.0, 930608.0, 33269.0, 6621.0, 2354.0, 1036.0, 520.0, 268.0, 152.0, 104.0, 73.0, 38.0, 30.0, 16.0, 12.0, 12.0, 4.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11602783203125, -0.11208057403564453, -0.10813331604003906, -0.1041860580444336, -0.10023880004882812, -0.09629154205322266, -0.09234428405761719, -0.08839702606201172, -0.08444976806640625, -0.08050251007080078, -0.07655525207519531, -0.07260799407958984, -0.06866073608398438, -0.0647134780883789, -0.06076622009277344, -0.05681896209716797, -0.0528717041015625, -0.04892444610595703, -0.04497718811035156, -0.041029930114746094, -0.037082672119140625, -0.033135414123535156, -0.029188156127929688, -0.02524089813232422, -0.02129364013671875, -0.01734638214111328, -0.013399124145507812, -0.009451866149902344, -0.005504608154296875, -0.0015573501586914062, 0.0023899078369140625, 0.006337165832519531, 0.010284423828125, 0.014231681823730469, 0.018178939819335938, 0.022126197814941406, 0.026073455810546875, 0.030020713806152344, 0.03396797180175781, 0.03791522979736328, 0.04186248779296875, 0.04580974578857422, 0.04975700378417969, 0.053704261779785156, 0.057651519775390625, 0.061598777770996094, 0.06554603576660156, 0.06949329376220703, 0.0734405517578125, 0.07738780975341797, 0.08133506774902344, 0.0852823257446289, 0.08922958374023438, 0.09317684173583984, 0.09712409973144531, 0.10107135772705078, 0.10501861572265625, 0.10896587371826172, 0.11291313171386719, 0.11686038970947266, 0.12080764770507812, 0.1247549057006836, 0.12870216369628906, 0.13264942169189453, 0.1365966796875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 6.0, 8.0, 7.0, 6.0, 12.0, 27.0, 34.0, 67.0, 79.0, 150.0, 164.0, 165.0, 112.0, 62.0, 37.0, 20.0, 13.0, 8.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.053558349609375, -0.052138328552246094, -0.05071830749511719, -0.04929828643798828, -0.047878265380859375, -0.04645824432373047, -0.04503822326660156, -0.043618202209472656, -0.04219818115234375, -0.040778160095214844, -0.03935813903808594, -0.03793811798095703, -0.036518096923828125, -0.03509807586669922, -0.03367805480957031, -0.032258033752441406, -0.0308380126953125, -0.029417991638183594, -0.027997970581054688, -0.02657794952392578, -0.025157928466796875, -0.02373790740966797, -0.022317886352539062, -0.020897865295410156, -0.01947784423828125, -0.018057823181152344, -0.016637802124023438, -0.015217781066894531, -0.013797760009765625, -0.012377738952636719, -0.010957717895507812, -0.009537696838378906, -0.00811767578125, -0.006697654724121094, -0.0052776336669921875, -0.0038576126098632812, -0.002437591552734375, -0.0010175704956054688, 0.0004024505615234375, 0.0018224716186523438, 0.00324249267578125, 0.004662513732910156, 0.0060825347900390625, 0.007502555847167969, 0.008922576904296875, 0.010342597961425781, 0.011762619018554688, 0.013182640075683594, 0.0146026611328125, 0.016022682189941406, 0.017442703247070312, 0.01886272430419922, 0.020282745361328125, 0.02170276641845703, 0.023122787475585938, 0.024542808532714844, 0.02596282958984375, 0.027382850646972656, 0.028802871704101562, 0.03022289276123047, 0.031642913818359375, 0.03306293487548828, 0.03448295593261719, 0.035902976989746094, 0.037322998046875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 11.0, 24.0, 66.0, 142.0, 426.0, 216.0, 50.0, 23.0, 16.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7422439455986023, -0.718874454498291, -0.6955050230026245, -0.6721355319023132, -0.648766040802002, -0.6253966093063354, -0.6020271182060242, -0.5786576271057129, -0.5552881956100464, -0.5319187045097351, -0.5085492730140686, -0.4851797819137573, -0.46181032061576843, -0.43844085931777954, -0.41507136821746826, -0.39170190691947937, -0.3683324456214905, -0.3449629843235016, -0.3215935230255127, -0.2982240319252014, -0.2748545706272125, -0.25148510932922363, -0.22811563313007355, -0.20474615693092346, -0.18137669563293457, -0.15800723433494568, -0.1346377581357956, -0.1112682893872261, -0.08789882063865662, -0.06452935189008713, -0.04115988314151764, -0.017790406942367554, 0.0055789947509765625, 0.02894846349954605, 0.05231793224811554, 0.07568740099668503, 0.09905686974525452, 0.122426338493824, 0.1457958072423935, 0.16916528344154358, 0.19253474473953247, 0.21590420603752136, 0.23927368223667145, 0.26264315843582153, 0.2860126197338104, 0.3093820810317993, 0.3327515721321106, 0.3561210334300995, 0.3794904947280884, 0.40285995602607727, 0.42622941732406616, 0.44959890842437744, 0.47296836972236633, 0.4963378310203552, 0.5197073221206665, 0.543076753616333, 0.5664462447166443, 0.5898157358169556, 0.6131851673126221, 0.6365546584129333, 0.6599241495132446, 0.6832935810089111, 0.7066630721092224, 0.7300325632095337, 0.7534019947052002]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 7.0, 5.0, 5.0, 10.0, 17.0, 23.0, 43.0, 57.0, 61.0, 93.0, 100.0, 122.0, 105.0, 72.0, 76.0, 58.0, 37.0, 22.0, 23.0, 17.0, 11.0, 10.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.34716975688934326, -0.3367721736431122, -0.3263745605945587, -0.31597697734832764, -0.30557939410209656, -0.2951818108558655, -0.284784197807312, -0.27438661456108093, -0.26398903131484985, -0.2535914480686188, -0.2431938499212265, -0.23279625177383423, -0.22239866852760315, -0.21200107038021088, -0.2016034722328186, -0.19120588898658752, -0.18080827593803406, -0.17041067779064178, -0.1600130945444107, -0.14961549639701843, -0.13921791315078735, -0.12882031500339508, -0.11842271685600281, -0.10802512615919113, -0.09762753546237946, -0.08722994476556778, -0.0768323540687561, -0.06643475592136383, -0.056037165224552155, -0.04563957452774048, -0.035241980105638504, -0.02484438568353653, -0.014446794986724854, -0.004049202427268028, 0.006348390132188797, 0.016745982691645622, 0.027143575251102448, 0.037541165947914124, 0.0479387603700161, 0.05833635479211807, 0.06873394548892975, 0.07913153618574142, 0.0895291268825531, 0.09992672502994537, 0.11032431572675705, 0.12072190642356873, 0.131119504570961, 0.14151710271835327, 0.15191468596458435, 0.16231228411197662, 0.1727098673582077, 0.18310746550559998, 0.19350504875183105, 0.20390264689922333, 0.2143002450466156, 0.22469782829284668, 0.23509542644023895, 0.24549302458763123, 0.2558906078338623, 0.2662881910800934, 0.27668580412864685, 0.28708338737487793, 0.297480970621109, 0.3078785836696625, 0.31827616691589355]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 7.0, 10.0, 9.0, 16.0, 33.0, 51.0, 238.0, 4917.0, 4186098.0, 2612.0, 146.0, 54.0, 22.0, 20.0, 13.0, 6.0, 6.0, 6.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.2265625, -7.0166015625, -6.806640625, -6.5966796875, -6.38671875, -6.1767578125, -5.966796875, -5.7568359375, -5.546875, -5.3369140625, -5.126953125, -4.9169921875, -4.70703125, -4.4970703125, -4.287109375, -4.0771484375, -3.8671875, -3.6572265625, -3.447265625, -3.2373046875, -3.02734375, -2.8173828125, -2.607421875, -2.3974609375, -2.1875, -1.9775390625, -1.767578125, -1.5576171875, -1.34765625, -1.1376953125, -0.927734375, -0.7177734375, -0.5078125, -0.2978515625, -0.087890625, 0.1220703125, 0.33203125, 0.5419921875, 0.751953125, 0.9619140625, 1.171875, 1.3818359375, 1.591796875, 1.8017578125, 2.01171875, 2.2216796875, 2.431640625, 2.6416015625, 2.8515625, 3.0615234375, 3.271484375, 3.4814453125, 3.69140625, 3.9013671875, 4.111328125, 4.3212890625, 4.53125, 4.7412109375, 4.951171875, 5.1611328125, 5.37109375, 5.5810546875, 5.791015625, 6.0009765625, 6.2109375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 9.0, 10.0, 6.0, 16.0, 26.0, 55.0, 54.0, 85.0, 102.0, 107.0, 99.0, 107.0, 83.0, 82.0, 40.0, 43.0, 22.0, 20.0, 7.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0037326812744140625, -0.003623664379119873, -0.0035146474838256836, -0.003405630588531494, -0.0032966136932373047, -0.0031875967979431152, -0.0030785799026489258, -0.0029695630073547363, -0.002860546112060547, -0.0027515292167663574, -0.002642512321472168, -0.0025334954261779785, -0.002424478530883789, -0.0023154616355895996, -0.00220644474029541, -0.0020974278450012207, -0.0019884109497070312, -0.0018793940544128418, -0.0017703771591186523, -0.0016613602638244629, -0.0015523433685302734, -0.001443326473236084, -0.0013343095779418945, -0.001225292682647705, -0.0011162757873535156, -0.0010072588920593262, -0.0008982419967651367, -0.0007892251014709473, -0.0006802082061767578, -0.0005711913108825684, -0.0004621744155883789, -0.00035315752029418945, -0.000244140625, -0.00013512372970581055, -2.6106834411621094e-05, 8.291006088256836e-05, 0.0001919269561767578, 0.00030094385147094727, 0.0004099607467651367, 0.0005189776420593262, 0.0006279945373535156, 0.0007370114326477051, 0.0008460283279418945, 0.000955045223236084, 0.0010640621185302734, 0.0011730790138244629, 0.0012820959091186523, 0.0013911128044128418, 0.0015001296997070312, 0.0016091465950012207, 0.0017181634902954102, 0.0018271803855895996, 0.001936197280883789, 0.0020452141761779785, 0.002154231071472168, 0.0022632479667663574, 0.002372264862060547, 0.0024812817573547363, 0.0025902986526489258, 0.0026993155479431152, 0.0028083324432373047, 0.002917349338531494, 0.0030263662338256836, 0.003135383129119873, 0.0032444000244140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 13.0, 24.0, 49.0, 142.0, 244.0, 513.0, 9983.0, 4182577.0, 501.0, 124.0, 40.0, 26.0, 20.0, 8.0, 13.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.8203125, -5.7066497802734375, -5.592987060546875, -5.4793243408203125, -5.36566162109375, -5.2519989013671875, -5.138336181640625, -5.0246734619140625, -4.9110107421875, -4.7973480224609375, -4.683685302734375, -4.5700225830078125, -4.45635986328125, -4.3426971435546875, -4.229034423828125, -4.1153717041015625, -4.001708984375, -3.8880462646484375, -3.774383544921875, -3.6607208251953125, -3.54705810546875, -3.4333953857421875, -3.319732666015625, -3.2060699462890625, -3.0924072265625, -2.9787445068359375, -2.865081787109375, -2.7514190673828125, -2.63775634765625, -2.5240936279296875, -2.410430908203125, -2.2967681884765625, -2.18310546875, -2.0694427490234375, -1.955780029296875, -1.8421173095703125, -1.72845458984375, -1.6147918701171875, -1.501129150390625, -1.3874664306640625, -1.2738037109375, -1.1601409912109375, -1.046478271484375, -0.9328155517578125, -0.81915283203125, -0.7054901123046875, -0.591827392578125, -0.4781646728515625, -0.364501953125, -0.2508392333984375, -0.137176513671875, -0.0235137939453125, 0.09014892578125, 0.2038116455078125, 0.317474365234375, 0.4311370849609375, 0.5447998046875, 0.6584625244140625, 0.772125244140625, 0.8857879638671875, 0.99945068359375, 1.1131134033203125, 1.226776123046875, 1.3404388427734375, 1.4541015625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 11.0, 11.0, 27.0, 67.0, 151.0, 318.0, 588.0, 1585.0, 773.0, 287.0, 124.0, 59.0, 32.0, 21.0, 12.0, 11.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.05120849609375, -0.05022120475769043, -0.04923391342163086, -0.04824662208557129, -0.04725933074951172, -0.04627203941345215, -0.04528474807739258, -0.04429745674133301, -0.04331016540527344, -0.04232287406921387, -0.0413355827331543, -0.04034829139709473, -0.039361000061035156, -0.038373708724975586, -0.037386417388916016, -0.036399126052856445, -0.035411834716796875, -0.034424543380737305, -0.033437252044677734, -0.032449960708618164, -0.031462669372558594, -0.030475378036499023, -0.029488086700439453, -0.028500795364379883, -0.027513504028320312, -0.026526212692260742, -0.025538921356201172, -0.0245516300201416, -0.02356433868408203, -0.02257704734802246, -0.02158975601196289, -0.02060246467590332, -0.01961517333984375, -0.01862788200378418, -0.01764059066772461, -0.01665329933166504, -0.01566600799560547, -0.014678716659545898, -0.013691425323486328, -0.012704133987426758, -0.011716842651367188, -0.010729551315307617, -0.009742259979248047, -0.008754968643188477, -0.007767677307128906, -0.006780385971069336, -0.005793094635009766, -0.004805803298950195, -0.003818511962890625, -0.0028312206268310547, -0.0018439292907714844, -0.0008566379547119141, 0.00013065338134765625, 0.0011179447174072266, 0.002105236053466797, 0.003092527389526367, 0.0040798187255859375, 0.005067110061645508, 0.006054401397705078, 0.0070416927337646484, 0.008028984069824219, 0.009016275405883789, 0.01000356674194336, 0.01099085807800293, 0.0119781494140625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 13.0, 115.0, 894.0], "bins": [-23.300260543823242, -22.931734085083008, -22.563209533691406, -22.194683074951172, -21.826156616210938, -21.457630157470703, -21.0891056060791, -20.720579147338867, -20.352052688598633, -19.9835262298584, -19.615001678466797, -19.246475219726562, -18.877948760986328, -18.509422302246094, -18.140897750854492, -17.772371292114258, -17.403846740722656, -17.035320281982422, -16.66679573059082, -16.298269271850586, -15.929742813110352, -15.561217308044434, -15.192691802978516, -14.824165344238281, -14.455638885498047, -14.087113380432129, -13.718586921691895, -13.350061416625977, -12.981534957885742, -12.613009452819824, -12.244483947753906, -11.875957489013672, -11.507431030273438, -11.13890552520752, -10.770379066467285, -10.401853561401367, -10.033327102661133, -9.664801597595215, -9.296276092529297, -8.927749633789062, -8.559224128723145, -8.190698623657227, -7.822172164916992, -7.453646659851074, -7.08512020111084, -6.716594696044922, -6.348068714141846, -5.9795427322387695, -5.611016273498535, -5.242490291595459, -4.873964309692383, -4.505438804626465, -4.1369123458862305, -3.7683866024017334, -3.3998608589172363, -3.03133487701416, -2.662808895111084, -2.294282913208008, -1.9257570505142212, -1.5572311878204346, -1.1887052059173584, -0.8201792240142822, -0.45165348052978516, -0.08312749862670898, 0.2853984534740448]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 7.0, 18.0, 33.0, 82.0, 162.0, 213.0, 222.0, 146.0, 63.0, 37.0, 18.0, 6.0, 3.0], "bins": [-1.6313228607177734, -1.6025618314743042, -1.573800802230835, -1.5450397729873657, -1.5162787437438965, -1.4875178337097168, -1.4587568044662476, -1.4299957752227783, -1.401234745979309, -1.3724737167358398, -1.3437126874923706, -1.3149516582489014, -1.2861907482147217, -1.2574297189712524, -1.2286686897277832, -1.199907660484314, -1.1711466312408447, -1.1423856019973755, -1.1136245727539062, -1.084863543510437, -1.0561025142669678, -1.027341604232788, -0.9985805749893188, -0.9698195457458496, -0.9410585165023804, -0.9122974872589111, -0.8835364580154419, -0.8547754883766174, -0.8260144591331482, -0.797253429889679, -0.7684924602508545, -0.7397314310073853, -0.7109704613685608, -0.6822094321250916, -0.6534484624862671, -0.6246874332427979, -0.5959264039993286, -0.5671653747558594, -0.5384043455123901, -0.5096433758735657, -0.48088234663009644, -0.4521213173866272, -0.42336031794548035, -0.3945993185043335, -0.36583828926086426, -0.337077260017395, -0.30831626057624817, -0.2795552611351013, -0.2507942318916321, -0.22203321754932404, -0.193272203207016, -0.16451118886470795, -0.1357501745223999, -0.10698916018009186, -0.07822814583778381, -0.04946713149547577, -0.020706117153167725, 0.00805489718914032, 0.036815911531448364, 0.06557692587375641, 0.09433794021606445, 0.1230989545583725, 0.15185996890068054, 0.1806209832429886, 0.20938199758529663]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 3.0, 4.0, 1.0, 8.0, 9.0, 9.0, 4.0, 13.0, 10.0, 19.0, 18.0, 31.0, 28.0, 50.0, 89.0, 186.0, 438.0, 1460.0, 7941.0, 96486.0, 889476.0, 45573.0, 4891.0, 1005.0, 348.0, 128.0, 83.0, 48.0, 32.0, 27.0, 24.0, 15.0, 16.0, 15.0, 7.0, 9.0, 6.0, 9.0, 3.0, 7.0, 8.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.272216796875, -0.2638092041015625, -0.255401611328125, -0.2469940185546875, -0.23858642578125, -0.2301788330078125, -0.221771240234375, -0.2133636474609375, -0.2049560546875, -0.1965484619140625, -0.188140869140625, -0.1797332763671875, -0.17132568359375, -0.1629180908203125, -0.154510498046875, -0.1461029052734375, -0.1376953125, -0.1292877197265625, -0.120880126953125, -0.1124725341796875, -0.10406494140625, -0.0956573486328125, -0.087249755859375, -0.0788421630859375, -0.0704345703125, -0.0620269775390625, -0.053619384765625, -0.0452117919921875, -0.03680419921875, -0.0283966064453125, -0.019989013671875, -0.0115814208984375, -0.003173828125, 0.0052337646484375, 0.013641357421875, 0.0220489501953125, 0.03045654296875, 0.0388641357421875, 0.047271728515625, 0.0556793212890625, 0.0640869140625, 0.0724945068359375, 0.080902099609375, 0.0893096923828125, 0.09771728515625, 0.1061248779296875, 0.114532470703125, 0.1229400634765625, 0.13134765625, 0.1397552490234375, 0.148162841796875, 0.1565704345703125, 0.16497802734375, 0.1733856201171875, 0.181793212890625, 0.1902008056640625, 0.1986083984375, 0.2070159912109375, 0.215423583984375, 0.2238311767578125, 0.23223876953125, 0.2406463623046875, 0.249053955078125, 0.2574615478515625, 0.265869140625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 30.0, 50.0, 129.0, 197.0, 264.0, 173.0, 87.0, 34.0, 22.0, 8.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0193328857421875, -0.01894831657409668, -0.01856374740600586, -0.01817917823791504, -0.01779460906982422, -0.0174100399017334, -0.017025470733642578, -0.016640901565551758, -0.016256332397460938, -0.015871763229370117, -0.015487194061279297, -0.015102624893188477, -0.014718055725097656, -0.014333486557006836, -0.013948917388916016, -0.013564348220825195, -0.013179779052734375, -0.012795209884643555, -0.012410640716552734, -0.012026071548461914, -0.011641502380371094, -0.011256933212280273, -0.010872364044189453, -0.010487794876098633, -0.010103225708007812, -0.009718656539916992, -0.009334087371826172, -0.008949518203735352, -0.008564949035644531, -0.008180379867553711, -0.007795810699462891, -0.00741124153137207, -0.00702667236328125, -0.00664210319519043, -0.006257534027099609, -0.005872964859008789, -0.005488395690917969, -0.0051038265228271484, -0.004719257354736328, -0.004334688186645508, -0.0039501190185546875, -0.003565549850463867, -0.003180980682373047, -0.0027964115142822266, -0.0024118423461914062, -0.002027273178100586, -0.0016427040100097656, -0.0012581348419189453, -0.000873565673828125, -0.0004889965057373047, -0.00010442733764648438, 0.00028014183044433594, 0.0006647109985351562, 0.0010492801666259766, 0.0014338493347167969, 0.0018184185028076172, 0.0022029876708984375, 0.002587556838989258, 0.002972126007080078, 0.0033566951751708984, 0.0037412643432617188, 0.004125833511352539, 0.004510402679443359, 0.00489497184753418, 0.005279541015625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 7.0, 3.0, 6.0, 5.0, 15.0, 22.0, 31.0, 33.0, 40.0, 63.0, 104.0, 330.0, 2846.0, 978767.0, 64731.0, 1058.0, 199.0, 79.0, 60.0, 39.0, 21.0, 19.0, 14.0, 15.0, 14.0, 6.0, 5.0, 2.0, 2.0, 6.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.51708984375, -0.501800537109375, -0.48651123046875, -0.471221923828125, -0.4559326171875, -0.440643310546875, -0.42535400390625, -0.410064697265625, -0.394775390625, -0.379486083984375, -0.36419677734375, -0.348907470703125, -0.3336181640625, -0.318328857421875, -0.30303955078125, -0.287750244140625, -0.2724609375, -0.257171630859375, -0.24188232421875, -0.226593017578125, -0.2113037109375, -0.196014404296875, -0.18072509765625, -0.165435791015625, -0.150146484375, -0.134857177734375, -0.11956787109375, -0.104278564453125, -0.0889892578125, -0.073699951171875, -0.05841064453125, -0.043121337890625, -0.02783203125, -0.012542724609375, 0.00274658203125, 0.018035888671875, 0.0333251953125, 0.048614501953125, 0.06390380859375, 0.079193115234375, 0.094482421875, 0.109771728515625, 0.12506103515625, 0.140350341796875, 0.1556396484375, 0.170928955078125, 0.18621826171875, 0.201507568359375, 0.216796875, 0.232086181640625, 0.24737548828125, 0.262664794921875, 0.2779541015625, 0.293243408203125, 0.30853271484375, 0.323822021484375, 0.339111328125, 0.354400634765625, 0.36968994140625, 0.384979248046875, 0.4002685546875, 0.415557861328125, 0.43084716796875, 0.446136474609375, 0.46142578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 1.0, 3.0, 7.0, 8.0, 8.0, 7.0, 17.0, 24.0, 21.0, 24.0, 38.0, 40.0, 31.0, 50.0, 45.0, 45.0, 46.0, 51.0, 59.0, 48.0, 44.0, 48.0, 56.0, 43.0, 41.0, 38.0, 29.0, 25.0, 18.0, 23.0, 16.0, 8.0, 8.0, 3.0, 9.0, 5.0, 4.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017852783203125, -0.017203569412231445, -0.01655435562133789, -0.015905141830444336, -0.015255928039550781, -0.014606714248657227, -0.013957500457763672, -0.013308286666870117, -0.012659072875976562, -0.012009859085083008, -0.011360645294189453, -0.010711431503295898, -0.010062217712402344, -0.009413003921508789, -0.008763790130615234, -0.00811457633972168, -0.007465362548828125, -0.00681614875793457, -0.006166934967041016, -0.005517721176147461, -0.004868507385253906, -0.0042192935943603516, -0.003570079803466797, -0.002920866012573242, -0.0022716522216796875, -0.0016224384307861328, -0.0009732246398925781, -0.00032401084899902344, 0.00032520294189453125, 0.0009744167327880859, 0.0016236305236816406, 0.0022728443145751953, 0.00292205810546875, 0.0035712718963623047, 0.004220485687255859, 0.004869699478149414, 0.005518913269042969, 0.0061681270599365234, 0.006817340850830078, 0.007466554641723633, 0.008115768432617188, 0.008764982223510742, 0.009414196014404297, 0.010063409805297852, 0.010712623596191406, 0.011361837387084961, 0.012011051177978516, 0.01266026496887207, 0.013309478759765625, 0.01395869255065918, 0.014607906341552734, 0.015257120132446289, 0.015906333923339844, 0.0165555477142334, 0.017204761505126953, 0.017853975296020508, 0.018503189086914062, 0.019152402877807617, 0.019801616668701172, 0.020450830459594727, 0.02110004425048828, 0.021749258041381836, 0.02239847183227539, 0.023047685623168945, 0.0236968994140625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 19.0, 21.0, 52.0, 98.0, 441.0, 12404.0, 1033973.0, 1251.0, 187.0, 53.0, 20.0, 9.0, 7.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.16015625, -2.1144180297851562, -2.0686798095703125, -2.0229415893554688, -1.977203369140625, -1.9314651489257812, -1.8857269287109375, -1.8399887084960938, -1.79425048828125, -1.7485122680664062, -1.7027740478515625, -1.6570358276367188, -1.611297607421875, -1.5655593872070312, -1.5198211669921875, -1.4740829467773438, -1.4283447265625, -1.3826065063476562, -1.3368682861328125, -1.2911300659179688, -1.245391845703125, -1.1996536254882812, -1.1539154052734375, -1.1081771850585938, -1.06243896484375, -1.0167007446289062, -0.9709625244140625, -0.9252243041992188, -0.879486083984375, -0.8337478637695312, -0.7880096435546875, -0.7422714233398438, -0.696533203125, -0.6507949829101562, -0.6050567626953125, -0.5593185424804688, -0.513580322265625, -0.46784210205078125, -0.4221038818359375, -0.37636566162109375, -0.33062744140625, -0.28488922119140625, -0.2391510009765625, -0.19341278076171875, -0.147674560546875, -0.10193634033203125, -0.0561981201171875, -0.01045989990234375, 0.0352783203125, 0.08101654052734375, 0.1267547607421875, 0.17249298095703125, 0.218231201171875, 0.26396942138671875, 0.3097076416015625, 0.35544586181640625, 0.40118408203125, 0.44692230224609375, 0.4926605224609375, 0.5383987426757812, 0.584136962890625, 0.6298751831054688, 0.6756134033203125, 0.7213516235351562, 0.76708984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 9.0, 14.0, 12.0, 25.0, 28.0, 36.0, 64.0, 132.0, 257.0, 120.0, 85.0, 58.0, 37.0, 29.0, 19.0, 16.0, 7.0, 12.0, 5.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011320114135742188, -0.0010859668254852295, -0.0010399222373962402, -0.000993877649307251, -0.0009478330612182617, -0.0009017884731292725, -0.0008557438850402832, -0.0008096992969512939, -0.0007636547088623047, -0.0007176101207733154, -0.0006715655326843262, -0.0006255209445953369, -0.0005794763565063477, -0.0005334317684173584, -0.00048738718032836914, -0.0004413425922393799, -0.0003952980041503906, -0.00034925341606140137, -0.0003032088279724121, -0.00025716423988342285, -0.0002111196517944336, -0.00016507506370544434, -0.00011903047561645508, -7.298588752746582e-05, -2.6941299438476562e-05, 1.9103288650512695e-05, 6.514787673950195e-05, 0.00011119246482849121, 0.00015723705291748047, 0.00020328164100646973, 0.000249326229095459, 0.00029537081718444824, 0.0003414154052734375, 0.00038745999336242676, 0.000433504581451416, 0.0004795491695404053, 0.0005255937576293945, 0.0005716383457183838, 0.000617682933807373, 0.0006637275218963623, 0.0007097721099853516, 0.0007558166980743408, 0.0008018612861633301, 0.0008479058742523193, 0.0008939504623413086, 0.0009399950504302979, 0.0009860396385192871, 0.0010320842266082764, 0.0010781288146972656, 0.0011241734027862549, 0.0011702179908752441, 0.0012162625789642334, 0.0012623071670532227, 0.001308351755142212, 0.0013543963432312012, 0.0014004409313201904, 0.0014464855194091797, 0.001492530107498169, 0.0015385746955871582, 0.0015846192836761475, 0.0016306638717651367, 0.001676708459854126, 0.0017227530479431152, 0.0017687976360321045, 0.0018148422241210938]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 1.0, 3.0, 10.0, 13.0, 28.0, 94.0, 564.0, 11023.0, 1023372.0, 12678.0, 585.0, 91.0, 35.0, 15.0, 7.0, 8.0, 10.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8701171875, -0.8425064086914062, -0.8148956298828125, -0.7872848510742188, -0.759674072265625, -0.7320632934570312, -0.7044525146484375, -0.6768417358398438, -0.64923095703125, -0.6216201782226562, -0.5940093994140625, -0.5663986206054688, -0.538787841796875, -0.5111770629882812, -0.4835662841796875, -0.45595550537109375, -0.4283447265625, -0.40073394775390625, -0.3731231689453125, -0.34551239013671875, -0.317901611328125, -0.29029083251953125, -0.2626800537109375, -0.23506927490234375, -0.20745849609375, -0.17984771728515625, -0.1522369384765625, -0.12462615966796875, -0.097015380859375, -0.06940460205078125, -0.0417938232421875, -0.01418304443359375, 0.013427734375, 0.04103851318359375, 0.0686492919921875, 0.09626007080078125, 0.123870849609375, 0.15148162841796875, 0.1790924072265625, 0.20670318603515625, 0.23431396484375, 0.26192474365234375, 0.2895355224609375, 0.31714630126953125, 0.344757080078125, 0.37236785888671875, 0.3999786376953125, 0.42758941650390625, 0.4552001953125, 0.48281097412109375, 0.5104217529296875, 0.5380325317382812, 0.565643310546875, 0.5932540893554688, 0.6208648681640625, 0.6484756469726562, 0.67608642578125, 0.7036972045898438, 0.7313079833984375, 0.7589187622070312, 0.786529541015625, 0.8141403198242188, 0.8417510986328125, 0.8693618774414062, 0.89697265625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 7.0, 8.0, 7.0, 9.0, 18.0, 25.0, 24.0, 52.0, 51.0, 119.0, 353.0, 119.0, 57.0, 36.0, 26.0, 21.0, 11.0, 10.0, 12.0, 1.0, 4.0, 2.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07647705078125, -0.07411766052246094, -0.07175827026367188, -0.06939888000488281, -0.06703948974609375, -0.06468009948730469, -0.062320709228515625, -0.05996131896972656, -0.0576019287109375, -0.05524253845214844, -0.052883148193359375, -0.05052375793457031, -0.04816436767578125, -0.04580497741699219, -0.043445587158203125, -0.04108619689941406, -0.038726806640625, -0.03636741638183594, -0.034008026123046875, -0.03164863586425781, -0.02928924560546875, -0.026929855346679688, -0.024570465087890625, -0.022211074829101562, -0.0198516845703125, -0.017492294311523438, -0.015132904052734375, -0.012773513793945312, -0.01041412353515625, -0.008054733276367188, -0.005695343017578125, -0.0033359527587890625, -0.0009765625, 0.0013828277587890625, 0.003742218017578125, 0.0061016082763671875, 0.00846099853515625, 0.010820388793945312, 0.013179779052734375, 0.015539169311523438, 0.0178985595703125, 0.020257949829101562, 0.022617340087890625, 0.024976730346679688, 0.02733612060546875, 0.029695510864257812, 0.032054901123046875, 0.03441429138183594, 0.036773681640625, 0.03913307189941406, 0.041492462158203125, 0.04385185241699219, 0.04621124267578125, 0.04857063293457031, 0.050930023193359375, 0.05328941345214844, 0.0556488037109375, 0.05800819396972656, 0.060367584228515625, 0.06272697448730469, 0.06508636474609375, 0.06744575500488281, 0.06980514526367188, 0.07216453552246094, 0.07452392578125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 8.0, 20.0, 66.0, 431.0, 376.0, 89.0, 16.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3513333201408386, -0.30708345770835876, -0.2628335654735565, -0.21858370304107666, -0.1743338257074356, -0.13008394837379456, -0.0858340859413147, -0.04158419370651245, 0.0026656687259674072, 0.04691554233431816, 0.09116541594266891, 0.13541528582572937, 0.17966516315937042, 0.22391504049301147, 0.26816490292549133, 0.3124147951602936, 0.35666465759277344, 0.4009145200252533, 0.44516441226005554, 0.4894142746925354, 0.5336641669273376, 0.5779139995574951, 0.6221638917922974, 0.6664137840270996, 0.7106636762619019, 0.7549135684967041, 0.7991634011268616, 0.8434132933616638, 0.8876631855964661, 0.9319130182266235, 0.9761629104614258, 1.020412802696228, 1.0646625757217407, 1.108912467956543, 1.1531623601913452, 1.1974122524261475, 1.2416620254516602, 1.2859119176864624, 1.3301618099212646, 1.374411702156067, 1.4186615943908691, 1.4629114866256714, 1.5071613788604736, 1.5514111518859863, 1.5956610441207886, 1.6399109363555908, 1.684160828590393, 1.7284107208251953, 1.772660493850708, 1.8169103860855103, 1.8611602783203125, 1.9054100513458252, 1.9496599435806274, 1.9939098358154297, 2.0381598472595215, 2.082409620285034, 2.126659631729126, 2.1709094047546387, 2.2151594161987305, 2.259409189224243, 2.303659200668335, 2.3479089736938477, 2.3921589851379395, 2.436408758163452, 2.480658531188965]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 10.0, 16.0, 13.0, 32.0, 45.0, 47.0, 54.0, 65.0, 79.0, 78.0, 74.0, 81.0, 81.0, 73.0, 58.0, 60.0, 22.0, 31.0, 15.0, 13.0, 13.0, 11.0, 6.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14363634586334229, -0.13680697977542877, -0.12997761368751526, -0.12314825505018234, -0.11631888896226883, -0.10948952287435532, -0.1026601642370224, -0.09583079814910889, -0.08900143206119537, -0.08217206597328186, -0.07534269988536835, -0.06851334124803543, -0.06168397516012192, -0.054854609072208405, -0.04802524670958519, -0.041195884346961975, -0.03436651825904846, -0.027537154033780098, -0.020707789808511734, -0.01387842558324337, -0.007049061357975006, -0.00021969527006149292, 0.006609667092561722, 0.013439029455184937, 0.02026839554309845, 0.027097759768366814, 0.03392712399363518, 0.04075648635625839, 0.047585852444171906, 0.05441521853208542, 0.06124458089470863, 0.06807394325733185, 0.07490330934524536, 0.08173267543315887, 0.08856204152107239, 0.0953914001584053, 0.10222076624631882, 0.10905013233423233, 0.11587949097156525, 0.12270885705947876, 0.12953822314739227, 0.1363675892353058, 0.1431969553232193, 0.1500263214111328, 0.15685567259788513, 0.16368505358695984, 0.17051440477371216, 0.17734377086162567, 0.18417313694953918, 0.1910025030374527, 0.1978318691253662, 0.20466123521327972, 0.21149060130119324, 0.21831995248794556, 0.22514931857585907, 0.23197868466377258, 0.2388080507516861, 0.2456374168395996, 0.25246676802635193, 0.25929614901542664, 0.26612550020217896, 0.27295488119125366, 0.279784232378006, 0.2866135835647583, 0.293442964553833]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 0.0, 0.0, 6.0, 10.0, 10.0, 14.0, 10.0, 18.0, 16.0, 22.0, 20.0, 52.0, 349.0, 4193323.0, 224.0, 48.0, 36.0, 24.0, 22.0, 10.0, 10.0, 8.0, 10.0, 10.0, 2.0, 6.0, 4.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.234375, -7.0303955078125, -6.826416015625, -6.6224365234375, -6.41845703125, -6.2144775390625, -6.010498046875, -5.8065185546875, -5.6025390625, -5.3985595703125, -5.194580078125, -4.9906005859375, -4.78662109375, -4.5826416015625, -4.378662109375, -4.1746826171875, -3.970703125, -3.7667236328125, -3.562744140625, -3.3587646484375, -3.15478515625, -2.9508056640625, -2.746826171875, -2.5428466796875, -2.3388671875, -2.1348876953125, -1.930908203125, -1.7269287109375, -1.52294921875, -1.3189697265625, -1.114990234375, -0.9110107421875, -0.70703125, -0.5030517578125, -0.299072265625, -0.0950927734375, 0.10888671875, 0.3128662109375, 0.516845703125, 0.7208251953125, 0.9248046875, 1.1287841796875, 1.332763671875, 1.5367431640625, 1.74072265625, 1.9447021484375, 2.148681640625, 2.3526611328125, 2.556640625, 2.7606201171875, 2.964599609375, 3.1685791015625, 3.37255859375, 3.5765380859375, 3.780517578125, 3.9844970703125, 4.1884765625, 4.3924560546875, 4.596435546875, 4.8004150390625, 5.00439453125, 5.2083740234375, 5.412353515625, 5.6163330078125, 5.8203125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 12.0, 20.0, 36.0, 50.0, 76.0, 114.0, 140.0, 128.0, 124.0, 90.0, 74.0, 53.0, 20.0, 18.0, 14.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01052093505859375, -0.010283112525939941, -0.010045289993286133, -0.009807467460632324, -0.009569644927978516, -0.009331822395324707, -0.009093999862670898, -0.00885617733001709, -0.008618354797363281, -0.008380532264709473, -0.008142709732055664, -0.007904887199401855, -0.007667064666748047, -0.007429242134094238, -0.00719141960144043, -0.006953597068786621, -0.0067157745361328125, -0.006477952003479004, -0.006240129470825195, -0.006002306938171387, -0.005764484405517578, -0.0055266618728637695, -0.005288839340209961, -0.005051016807556152, -0.004813194274902344, -0.004575371742248535, -0.0043375492095947266, -0.004099726676940918, -0.0038619041442871094, -0.0036240816116333008, -0.003386259078979492, -0.0031484365463256836, -0.002910614013671875, -0.0026727914810180664, -0.002434968948364258, -0.0021971464157104492, -0.0019593238830566406, -0.001721501350402832, -0.0014836788177490234, -0.0012458562850952148, -0.0010080337524414062, -0.0007702112197875977, -0.0005323886871337891, -0.00029456615447998047, -5.6743621826171875e-05, 0.00018107891082763672, 0.0004189014434814453, 0.0006567239761352539, 0.0008945465087890625, 0.001132369041442871, 0.0013701915740966797, 0.0016080141067504883, 0.0018458366394042969, 0.0020836591720581055, 0.002321481704711914, 0.0025593042373657227, 0.0027971267700195312, 0.00303494930267334, 0.0032727718353271484, 0.003510594367980957, 0.0037484169006347656, 0.003986239433288574, 0.004224061965942383, 0.004461884498596191, 0.00469970703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 13.0, 44.0, 90.0, 313.0, 4166956.0, 25142.0, 393.0, 301.0, 180.0, 112.0, 79.0, 76.0, 57.0, 55.0, 47.0, 42.0, 35.0, 41.0, 27.0, 32.0, 32.0, 15.0, 14.0, 19.0, 15.0, 21.0, 16.0, 13.0, 6.0, 13.0, 14.0, 14.0, 4.0, 7.0, 7.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.294921875, -2.140472412109375, -1.98602294921875, -1.831573486328125, -1.6771240234375, -1.522674560546875, -1.36822509765625, -1.213775634765625, -1.059326171875, -0.904876708984375, -0.75042724609375, -0.595977783203125, -0.4415283203125, -0.287078857421875, -0.13262939453125, 0.021820068359375, 0.17626953125, 0.330718994140625, 0.48516845703125, 0.639617919921875, 0.7940673828125, 0.948516845703125, 1.10296630859375, 1.257415771484375, 1.411865234375, 1.566314697265625, 1.72076416015625, 1.875213623046875, 2.0296630859375, 2.184112548828125, 2.33856201171875, 2.493011474609375, 2.6474609375, 2.801910400390625, 2.95635986328125, 3.110809326171875, 3.2652587890625, 3.419708251953125, 3.57415771484375, 3.728607177734375, 3.883056640625, 4.037506103515625, 4.19195556640625, 4.346405029296875, 4.5008544921875, 4.655303955078125, 4.80975341796875, 4.964202880859375, 5.11865234375, 5.273101806640625, 5.42755126953125, 5.582000732421875, 5.7364501953125, 5.890899658203125, 6.04534912109375, 6.199798583984375, 6.354248046875, 6.508697509765625, 6.66314697265625, 6.817596435546875, 6.9720458984375, 7.126495361328125, 7.28094482421875, 7.435394287109375, 7.58984375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 8.0, 11.0, 16.0, 32.0, 49.0, 60.0, 143.0, 280.0, 818.0, 766.0, 500.0, 343.0, 226.0, 139.0, 101.0, 89.0, 73.0, 57.0, 36.0, 41.0, 41.0, 32.0, 24.0, 20.0, 25.0, 20.0, 14.0, 19.0, 11.0, 7.0, 14.0, 8.0, 10.0, 4.0, 6.0, 4.0, 4.0, 8.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0233306884765625, -0.022351503372192383, -0.021372318267822266, -0.02039313316345215, -0.01941394805908203, -0.018434762954711914, -0.017455577850341797, -0.01647639274597168, -0.015497207641601562, -0.014518022537231445, -0.013538837432861328, -0.012559652328491211, -0.011580467224121094, -0.010601282119750977, -0.00962209701538086, -0.008642911911010742, -0.007663726806640625, -0.006684541702270508, -0.005705356597900391, -0.0047261714935302734, -0.0037469863891601562, -0.002767801284790039, -0.0017886161804199219, -0.0008094310760498047, 0.0001697540283203125, 0.0011489391326904297, 0.002128124237060547, 0.003107309341430664, 0.004086494445800781, 0.0050656795501708984, 0.006044864654541016, 0.007024049758911133, 0.00800323486328125, 0.008982419967651367, 0.009961605072021484, 0.010940790176391602, 0.011919975280761719, 0.012899160385131836, 0.013878345489501953, 0.01485753059387207, 0.015836715698242188, 0.016815900802612305, 0.017795085906982422, 0.01877427101135254, 0.019753456115722656, 0.020732641220092773, 0.02171182632446289, 0.022691011428833008, 0.023670196533203125, 0.024649381637573242, 0.02562856674194336, 0.026607751846313477, 0.027586936950683594, 0.02856612205505371, 0.029545307159423828, 0.030524492263793945, 0.03150367736816406, 0.03248286247253418, 0.0334620475769043, 0.034441232681274414, 0.03542041778564453, 0.03639960289001465, 0.037378787994384766, 0.03835797309875488, 0.039337158203125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 12.0, 445.0, 522.0, 34.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5375372171401978, -1.1506609916687012, -0.7637848854064941, -0.37690865993499756, 0.009967446327209473, 0.3968435525894165, 0.7837198972702026, 1.1705960035324097, 1.5574721097946167, 1.9443483352661133, 2.3312244415283203, 2.7181005477905273, 3.1049766540527344, 3.4918527603149414, 3.8787293434143066, 4.265605449676514, 4.652481555938721, 5.039357662200928, 5.426233768463135, 5.8131103515625, 6.199986457824707, 6.586862564086914, 6.973738670349121, 7.360614776611328, 7.747490882873535, 8.134366989135742, 8.52124309539795, 8.908119201660156, 9.294995307922363, 9.68187141418457, 10.068748474121094, 10.455623626708984, 10.842500686645508, 11.229376792907715, 11.616252899169922, 12.003129005432129, 12.390005111694336, 12.776881217956543, 13.16375732421875, 13.550634384155273, 13.937509536743164, 14.324385643005371, 14.711261749267578, 15.098137855529785, 15.485013961791992, 15.8718900680542, 16.258766174316406, 16.64564323425293, 17.032520294189453, 17.419397354125977, 17.806272506713867, 18.19314956665039, 18.58002471923828, 18.966901779174805, 19.353776931762695, 19.74065399169922, 20.12752914428711, 20.514406204223633, 20.901281356811523, 21.288158416748047, 21.675033569335938, 22.06191062927246, 22.44878578186035, 22.835662841796875, 23.222537994384766]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 1.0, 7.0, 8.0, 4.0, 11.0, 18.0, 20.0, 25.0, 16.0, 28.0, 33.0, 21.0, 41.0, 29.0, 31.0, 35.0, 43.0, 32.0, 31.0, 46.0, 34.0, 53.0, 44.0, 46.0, 35.0, 45.0, 32.0, 24.0, 35.0, 29.0, 22.0, 17.0, 18.0, 11.0, 12.0, 8.0, 10.0, 8.0, 11.0, 4.0, 1.0, 5.0, 1.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0331944227218628, -1.0024491548538208, -0.9717039465904236, -0.9409586787223816, -0.9102134108543396, -0.8794682025909424, -0.8487229347229004, -0.8179776668548584, -0.7872323989868164, -0.7564871311187744, -0.7257419228553772, -0.6949966549873352, -0.6642513871192932, -0.633506178855896, -0.602760910987854, -0.572015643119812, -0.54127037525177, -0.510525107383728, -0.4797798693180084, -0.4490346312522888, -0.4182893633842468, -0.3875441253185272, -0.3567988872528076, -0.3260536193847656, -0.2953084111213684, -0.2645631730556488, -0.2338179051876068, -0.2030726671218872, -0.17232739925384521, -0.1415821611881256, -0.11083690822124481, -0.08009165525436401, -0.04934638738632202, -0.018601136282086372, 0.012144114822149277, 0.04288936406373978, 0.07363461703062057, 0.10437986254692078, 0.13512511551380157, 0.16587036848068237, 0.19661562144756317, 0.22736087441444397, 0.2581061124801636, 0.28885138034820557, 0.31959661841392517, 0.3503418564796448, 0.38108712434768677, 0.41183239221572876, 0.44257763028144836, 0.47332286834716797, 0.50406813621521, 0.534813404083252, 0.5655586123466492, 0.5963038802146912, 0.6270491480827332, 0.6577943563461304, 0.6885396242141724, 0.7192848920822144, 0.7500301003456116, 0.7807753682136536, 0.8115206360816956, 0.8422658443450928, 0.8730111122131348, 0.9037563800811768, 0.9345016479492188]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 9.0, 5.0, 8.0, 7.0, 16.0, 24.0, 19.0, 23.0, 30.0, 28.0, 30.0, 35.0, 36.0, 45.0, 71.0, 583.0, 18681.0, 977695.0, 49667.0, 1097.0, 82.0, 44.0, 33.0, 42.0, 31.0, 32.0, 26.0, 22.0, 23.0, 19.0, 13.0, 17.0, 14.0, 10.0, 3.0, 4.0, 4.0, 10.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.40234375, -2.32867431640625, -2.2550048828125, -2.18133544921875, -2.107666015625, -2.03399658203125, -1.9603271484375, -1.88665771484375, -1.81298828125, -1.73931884765625, -1.6656494140625, -1.59197998046875, -1.518310546875, -1.44464111328125, -1.3709716796875, -1.29730224609375, -1.2236328125, -1.14996337890625, -1.0762939453125, -1.00262451171875, -0.928955078125, -0.85528564453125, -0.7816162109375, -0.70794677734375, -0.63427734375, -0.56060791015625, -0.4869384765625, -0.41326904296875, -0.339599609375, -0.26593017578125, -0.1922607421875, -0.11859130859375, -0.044921875, 0.02874755859375, 0.1024169921875, 0.17608642578125, 0.249755859375, 0.32342529296875, 0.3970947265625, 0.47076416015625, 0.54443359375, 0.61810302734375, 0.6917724609375, 0.76544189453125, 0.839111328125, 0.91278076171875, 0.9864501953125, 1.06011962890625, 1.1337890625, 1.20745849609375, 1.2811279296875, 1.35479736328125, 1.428466796875, 1.50213623046875, 1.5758056640625, 1.64947509765625, 1.72314453125, 1.79681396484375, 1.8704833984375, 1.94415283203125, 2.017822265625, 2.09149169921875, 2.1651611328125, 2.23883056640625, 2.3125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 17.0, 33.0, 70.0, 122.0, 161.0, 195.0, 190.0, 98.0, 68.0, 32.0, 13.0, 7.0, 2.0, 2.0, 1.0], "bins": [-0.255615234375, -0.2509164810180664, -0.2462177276611328, -0.24151897430419922, -0.23682022094726562, -0.23212146759033203, -0.22742271423339844, -0.22272396087646484, -0.21802520751953125, -0.21332645416259766, -0.20862770080566406, -0.20392894744873047, -0.19923019409179688, -0.19453144073486328, -0.1898326873779297, -0.1851339340209961, -0.1804351806640625, -0.1757364273071289, -0.1710376739501953, -0.16633892059326172, -0.16164016723632812, -0.15694141387939453, -0.15224266052246094, -0.14754390716552734, -0.14284515380859375, -0.13814640045166016, -0.13344764709472656, -0.12874889373779297, -0.12405014038085938, -0.11935138702392578, -0.11465263366699219, -0.1099538803100586, -0.105255126953125, -0.1005563735961914, -0.09585762023925781, -0.09115886688232422, -0.08646011352539062, -0.08176136016845703, -0.07706260681152344, -0.07236385345458984, -0.06766510009765625, -0.06296634674072266, -0.05826759338378906, -0.05356884002685547, -0.048870086669921875, -0.04417133331298828, -0.03947257995605469, -0.034773826599121094, -0.0300750732421875, -0.025376319885253906, -0.020677566528320312, -0.01597881317138672, -0.011280059814453125, -0.006581306457519531, -0.0018825531005859375, 0.0028162002563476562, 0.00751495361328125, 0.012213706970214844, 0.016912460327148438, 0.02161121368408203, 0.026309967041015625, 0.03100872039794922, 0.03570747375488281, 0.040406227111816406, 0.04510498046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 6.0, 8.0, 13.0, 28.0, 49.0, 86.0, 175.0, 426.0, 1308.0, 8277.0, 234174.0, 780345.0, 20413.0, 2223.0, 530.0, 233.0, 110.0, 61.0, 35.0, 26.0, 10.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8349609375, -1.776092529296875, -1.71722412109375, -1.658355712890625, -1.5994873046875, -1.540618896484375, -1.48175048828125, -1.422882080078125, -1.364013671875, -1.305145263671875, -1.24627685546875, -1.187408447265625, -1.1285400390625, -1.069671630859375, -1.01080322265625, -0.951934814453125, -0.89306640625, -0.834197998046875, -0.77532958984375, -0.716461181640625, -0.6575927734375, -0.598724365234375, -0.53985595703125, -0.480987548828125, -0.422119140625, -0.363250732421875, -0.30438232421875, -0.245513916015625, -0.1866455078125, -0.127777099609375, -0.06890869140625, -0.010040283203125, 0.048828125, 0.107696533203125, 0.16656494140625, 0.225433349609375, 0.2843017578125, 0.343170166015625, 0.40203857421875, 0.460906982421875, 0.519775390625, 0.578643798828125, 0.63751220703125, 0.696380615234375, 0.7552490234375, 0.814117431640625, 0.87298583984375, 0.931854248046875, 0.99072265625, 1.049591064453125, 1.10845947265625, 1.167327880859375, 1.2261962890625, 1.285064697265625, 1.34393310546875, 1.402801513671875, 1.461669921875, 1.520538330078125, 1.57940673828125, 1.638275146484375, 1.6971435546875, 1.756011962890625, 1.81488037109375, 1.873748779296875, 1.9326171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 5.0, 5.0, 11.0, 27.0, 25.0, 47.0, 69.0, 85.0, 103.0, 114.0, 127.0, 91.0, 101.0, 61.0, 46.0, 30.0, 23.0, 14.0, 8.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73681640625, -0.7168960571289062, -0.6969757080078125, -0.6770553588867188, -0.657135009765625, -0.6372146606445312, -0.6172943115234375, -0.5973739624023438, -0.57745361328125, -0.5575332641601562, -0.5376129150390625, -0.5176925659179688, -0.497772216796875, -0.47785186767578125, -0.4579315185546875, -0.43801116943359375, -0.4180908203125, -0.39817047119140625, -0.3782501220703125, -0.35832977294921875, -0.338409423828125, -0.31848907470703125, -0.2985687255859375, -0.27864837646484375, -0.25872802734375, -0.23880767822265625, -0.2188873291015625, -0.19896697998046875, -0.179046630859375, -0.15912628173828125, -0.1392059326171875, -0.11928558349609375, -0.099365234375, -0.07944488525390625, -0.0595245361328125, -0.03960418701171875, -0.019683837890625, 0.00023651123046875, 0.0201568603515625, 0.04007720947265625, 0.05999755859375, 0.07991790771484375, 0.0998382568359375, 0.11975860595703125, 0.139678955078125, 0.15959930419921875, 0.1795196533203125, 0.19944000244140625, 0.2193603515625, 0.23928070068359375, 0.2592010498046875, 0.27912139892578125, 0.299041748046875, 0.31896209716796875, 0.3388824462890625, 0.35880279541015625, 0.37872314453125, 0.39864349365234375, 0.4185638427734375, 0.43848419189453125, 0.458404541015625, 0.47832489013671875, 0.4982452392578125, 0.5181655883789062, 0.5380859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 12.0, 11.0, 10.0, 23.0, 48.0, 98.0, 176.0, 315.0, 710.0, 1726.0, 5696.0, 48046.0, 929468.0, 53025.0, 5916.0, 1811.0, 742.0, 332.0, 169.0, 78.0, 46.0, 37.0, 22.0, 16.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5078125, -1.45672607421875, -1.4056396484375, -1.35455322265625, -1.303466796875, -1.25238037109375, -1.2012939453125, -1.15020751953125, -1.09912109375, -1.04803466796875, -0.9969482421875, -0.94586181640625, -0.894775390625, -0.84368896484375, -0.7926025390625, -0.74151611328125, -0.6904296875, -0.63934326171875, -0.5882568359375, -0.53717041015625, -0.486083984375, -0.43499755859375, -0.3839111328125, -0.33282470703125, -0.28173828125, -0.23065185546875, -0.1795654296875, -0.12847900390625, -0.077392578125, -0.02630615234375, 0.0247802734375, 0.07586669921875, 0.126953125, 0.17803955078125, 0.2291259765625, 0.28021240234375, 0.331298828125, 0.38238525390625, 0.4334716796875, 0.48455810546875, 0.53564453125, 0.58673095703125, 0.6378173828125, 0.68890380859375, 0.739990234375, 0.79107666015625, 0.8421630859375, 0.89324951171875, 0.9443359375, 0.99542236328125, 1.0465087890625, 1.09759521484375, 1.148681640625, 1.19976806640625, 1.2508544921875, 1.30194091796875, 1.35302734375, 1.40411376953125, 1.4552001953125, 1.50628662109375, 1.557373046875, 1.60845947265625, 1.6595458984375, 1.71063232421875, 1.76171875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 8.0, 19.0, 10.0, 20.0, 26.0, 22.0, 22.0, 34.0, 52.0, 59.0, 59.0, 83.0, 86.0, 67.0, 79.0, 53.0, 50.0, 50.0, 40.0, 29.0, 32.0, 20.0, 21.0, 13.0, 11.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00020503997802734375, -0.00019964203238487244, -0.00019424408674240112, -0.0001888461410999298, -0.0001834481954574585, -0.00017805024981498718, -0.00017265230417251587, -0.00016725435853004456, -0.00016185641288757324, -0.00015645846724510193, -0.00015106052160263062, -0.0001456625759601593, -0.000140264630317688, -0.00013486668467521667, -0.00012946873903274536, -0.00012407079339027405, -0.00011867284774780273, -0.00011327490210533142, -0.00010787695646286011, -0.0001024790108203888, -9.708106517791748e-05, -9.168311953544617e-05, -8.628517389297485e-05, -8.088722825050354e-05, -7.548928260803223e-05, -7.009133696556091e-05, -6.46933913230896e-05, -5.9295445680618286e-05, -5.389750003814697e-05, -4.849955439567566e-05, -4.3101608753204346e-05, -3.770366311073303e-05, -3.230571746826172e-05, -2.6907771825790405e-05, -2.1509826183319092e-05, -1.611188054084778e-05, -1.0713934898376465e-05, -5.315989255905151e-06, 8.195638656616211e-08, 5.479902029037476e-06, 1.0877847671508789e-05, 1.6275793313980103e-05, 2.1673738956451416e-05, 2.707168459892273e-05, 3.246963024139404e-05, 3.7867575883865356e-05, 4.326552152633667e-05, 4.8663467168807983e-05, 5.40614128112793e-05, 5.945935845375061e-05, 6.485730409622192e-05, 7.025524973869324e-05, 7.565319538116455e-05, 8.105114102363586e-05, 8.644908666610718e-05, 9.184703230857849e-05, 9.72449779510498e-05, 0.00010264292359352112, 0.00010804086923599243, 0.00011343881487846375, 0.00011883676052093506, 0.00012423470616340637, 0.00012963265180587769, 0.000135030597448349, 0.0001404285430908203]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 12.0, 12.0, 15.0, 44.0, 157.0, 563.0, 5102.0, 887904.0, 151614.0, 2506.0, 401.0, 118.0, 39.0, 25.0, 10.0, 8.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.046875, -1.957366943359375, -1.86785888671875, -1.778350830078125, -1.6888427734375, -1.599334716796875, -1.50982666015625, -1.420318603515625, -1.330810546875, -1.241302490234375, -1.15179443359375, -1.062286376953125, -0.9727783203125, -0.883270263671875, -0.79376220703125, -0.704254150390625, -0.61474609375, -0.525238037109375, -0.43572998046875, -0.346221923828125, -0.2567138671875, -0.167205810546875, -0.07769775390625, 0.011810302734375, 0.101318359375, 0.190826416015625, 0.28033447265625, 0.369842529296875, 0.4593505859375, 0.548858642578125, 0.63836669921875, 0.727874755859375, 0.8173828125, 0.906890869140625, 0.99639892578125, 1.085906982421875, 1.1754150390625, 1.264923095703125, 1.35443115234375, 1.443939208984375, 1.533447265625, 1.622955322265625, 1.71246337890625, 1.801971435546875, 1.8914794921875, 1.980987548828125, 2.07049560546875, 2.160003662109375, 2.24951171875, 2.339019775390625, 2.42852783203125, 2.518035888671875, 2.6075439453125, 2.697052001953125, 2.78656005859375, 2.876068115234375, 2.965576171875, 3.055084228515625, 3.14459228515625, 3.234100341796875, 3.3236083984375, 3.413116455078125, 3.50262451171875, 3.592132568359375, 3.681640625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 3.0, 5.0, 8.0, 13.0, 18.0, 32.0, 44.0, 86.0, 168.0, 234.0, 134.0, 105.0, 55.0, 37.0, 19.0, 8.0, 12.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427490234375, -0.4093208312988281, -0.39115142822265625, -0.3729820251464844, -0.3548126220703125, -0.3366432189941406, -0.31847381591796875, -0.3003044128417969, -0.282135009765625, -0.2639656066894531, -0.24579620361328125, -0.22762680053710938, -0.2094573974609375, -0.19128799438476562, -0.17311859130859375, -0.15494918823242188, -0.13677978515625, -0.11861038208007812, -0.10044097900390625, -0.08227157592773438, -0.0641021728515625, -0.045932769775390625, -0.02776336669921875, -0.009593963623046875, 0.008575439453125, 0.026744842529296875, 0.04491424560546875, 0.06308364868164062, 0.0812530517578125, 0.09942245483398438, 0.11759185791015625, 0.13576126098632812, 0.1539306640625, 0.17210006713867188, 0.19026947021484375, 0.20843887329101562, 0.2266082763671875, 0.24477767944335938, 0.26294708251953125, 0.2811164855957031, 0.299285888671875, 0.3174552917480469, 0.33562469482421875, 0.3537940979003906, 0.3719635009765625, 0.3901329040527344, 0.40830230712890625, 0.4264717102050781, 0.44464111328125, 0.4628105163574219, 0.48097991943359375, 0.4991493225097656, 0.5173187255859375, 0.5354881286621094, 0.5536575317382812, 0.5718269348144531, 0.589996337890625, 0.6081657409667969, 0.6263351440429688, 0.6445045471191406, 0.6626739501953125, 0.6808433532714844, 0.6990127563476562, 0.7171821594238281, 0.7353515625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 8.0, 964.0, 44.0, 0.0, 1.0, 1.0], "bins": [-100.7710952758789, -99.08003997802734, -97.38897705078125, -95.69792175292969, -94.0068588256836, -92.31580352783203, -90.62474060058594, -88.93368530273438, -87.24263000488281, -85.55157470703125, -83.86051177978516, -82.1694564819336, -80.4783935546875, -78.78733825683594, -77.09628295898438, -75.40522003173828, -73.71415710449219, -72.02310180664062, -70.33203887939453, -68.64098358154297, -66.94992065429688, -65.25886535644531, -63.567806243896484, -61.876747131347656, -60.185691833496094, -58.494632720947266, -56.80357360839844, -55.112518310546875, -53.42145919799805, -51.73040008544922, -50.03934097290039, -48.34828186035156, -46.6572265625, -44.96616744995117, -43.275108337402344, -41.58405303955078, -39.89299392700195, -38.201934814453125, -36.5108757019043, -34.81981658935547, -33.12875747680664, -31.437698364257812, -29.746641159057617, -28.05558204650879, -26.364524841308594, -24.673465728759766, -22.982406616210938, -21.29134750366211, -19.600292205810547, -17.90923309326172, -16.218175888061523, -14.527116775512695, -12.836058616638184, -11.145000457763672, -9.453941345214844, -7.762883186340332, -6.071824550628662, -4.380765914916992, -2.6897077560424805, -0.9986491203308105, 0.6924090385437012, 2.383467197418213, 4.074526309967041, 5.765584468841553, 7.4566426277160645]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 13.0, 24.0, 43.0, 67.0, 91.0, 94.0, 110.0, 134.0, 104.0, 92.0, 86.0, 49.0, 38.0, 25.0, 12.0, 13.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.553884506225586, -7.3783369064331055, -7.202788829803467, -7.027241230010986, -6.851693153381348, -6.676145553588867, -6.5005974769592285, -6.325049877166748, -6.149501800537109, -5.973954200744629, -5.79840612411499, -5.62285852432251, -5.447310447692871, -5.271762847900391, -5.096214771270752, -4.9206671714782715, -4.745119094848633, -4.569571495056152, -4.394023418426514, -4.218475818634033, -4.0429277420043945, -3.867379903793335, -3.6918320655822754, -3.516284465789795, -3.3407368659973145, -3.165189027786255, -2.9896411895751953, -2.8140933513641357, -2.638545513153076, -2.4629976749420166, -2.287449836730957, -2.1119022369384766, -1.936354398727417, -1.7608065605163574, -1.5852587223052979, -1.4097108840942383, -1.2341630458831787, -1.0586152076721191, -0.8830674886703491, -0.7075196504592896, -0.53197181224823, -0.3564239740371704, -0.18087616562843323, -0.005328357219696045, 0.17021948099136353, 0.3457673192024231, 0.5213150978088379, 0.6968629360198975, 0.872410774230957, 1.0479586124420166, 1.2235064506530762, 1.3990542888641357, 1.5746021270751953, 1.7501499652862549, 1.925697684288025, 2.101245403289795, 2.2767934799194336, 2.452341318130493, 2.6278891563415527, 2.8034369945526123, 2.978984832763672, 3.1545326709747314, 3.330080509185791, 3.5056281089782715, 3.681175947189331]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 6.0, 3.0, 13.0, 20.0, 22.0, 26.0, 49.0, 93.0, 137.0, 303.0, 755.0, 17197.0, 4173110.0, 1891.0, 334.0, 169.0, 97.0, 45.0, 9.0, 10.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -11.124053955078125, -10.88873291015625, -10.653411865234375, -10.4180908203125, -10.182769775390625, -9.94744873046875, -9.712127685546875, -9.476806640625, -9.241485595703125, -9.00616455078125, -8.770843505859375, -8.5355224609375, -8.300201416015625, -8.06488037109375, -7.829559326171875, -7.59423828125, -7.358917236328125, -7.12359619140625, -6.888275146484375, -6.6529541015625, -6.417633056640625, -6.18231201171875, -5.946990966796875, -5.711669921875, -5.476348876953125, -5.24102783203125, -5.005706787109375, -4.7703857421875, -4.535064697265625, -4.29974365234375, -4.064422607421875, -3.8291015625, -3.593780517578125, -3.35845947265625, -3.123138427734375, -2.8878173828125, -2.652496337890625, -2.41717529296875, -2.181854248046875, -1.946533203125, -1.711212158203125, -1.47589111328125, -1.240570068359375, -1.0052490234375, -0.769927978515625, -0.53460693359375, -0.299285888671875, -0.06396484375, 0.171356201171875, 0.40667724609375, 0.641998291015625, 0.8773193359375, 1.112640380859375, 1.34796142578125, 1.583282470703125, 1.818603515625, 2.053924560546875, 2.28924560546875, 2.524566650390625, 2.7598876953125, 2.995208740234375, 3.23052978515625, 3.465850830078125, 3.701171875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 10.0, 19.0, 47.0, 129.0, 166.0, 194.0, 172.0, 128.0, 72.0, 40.0, 21.0, 8.0, 5.0, 3.0], "bins": [-0.292236328125, -0.2869887351989746, -0.2817411422729492, -0.27649354934692383, -0.27124595642089844, -0.26599836349487305, -0.26075077056884766, -0.25550317764282227, -0.2502555847167969, -0.24500799179077148, -0.2397603988647461, -0.2345128059387207, -0.2292652130126953, -0.22401762008666992, -0.21877002716064453, -0.21352243423461914, -0.20827484130859375, -0.20302724838256836, -0.19777965545654297, -0.19253206253051758, -0.1872844696044922, -0.1820368766784668, -0.1767892837524414, -0.17154169082641602, -0.16629409790039062, -0.16104650497436523, -0.15579891204833984, -0.15055131912231445, -0.14530372619628906, -0.14005613327026367, -0.13480854034423828, -0.1295609474182129, -0.1243133544921875, -0.11906576156616211, -0.11381816864013672, -0.10857057571411133, -0.10332298278808594, -0.09807538986206055, -0.09282779693603516, -0.08758020401000977, -0.08233261108398438, -0.07708501815795898, -0.0718374252319336, -0.0665898323059082, -0.06134223937988281, -0.05609464645385742, -0.05084705352783203, -0.04559946060180664, -0.04035186767578125, -0.03510427474975586, -0.02985668182373047, -0.024609088897705078, -0.019361495971679688, -0.014113903045654297, -0.008866310119628906, -0.0036187171936035156, 0.001628875732421875, 0.006876468658447266, 0.012124061584472656, 0.017371654510498047, 0.022619247436523438, 0.027866840362548828, 0.03311443328857422, 0.03836202621459961, 0.043609619140625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 16.0, 34.0, 64.0, 164.0, 396.0, 2799.0, 4185393.0, 4522.0, 536.0, 205.0, 95.0, 40.0, 11.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5625, -13.2103271484375, -12.858154296875, -12.5059814453125, -12.15380859375, -11.8016357421875, -11.449462890625, -11.0972900390625, -10.7451171875, -10.3929443359375, -10.040771484375, -9.6885986328125, -9.33642578125, -8.9842529296875, -8.632080078125, -8.2799072265625, -7.927734375, -7.5755615234375, -7.223388671875, -6.8712158203125, -6.51904296875, -6.1668701171875, -5.814697265625, -5.4625244140625, -5.1103515625, -4.7581787109375, -4.406005859375, -4.0538330078125, -3.70166015625, -3.3494873046875, -2.997314453125, -2.6451416015625, -2.29296875, -1.9407958984375, -1.588623046875, -1.2364501953125, -0.88427734375, -0.5321044921875, -0.179931640625, 0.1722412109375, 0.5244140625, 0.8765869140625, 1.228759765625, 1.5809326171875, 1.93310546875, 2.2852783203125, 2.637451171875, 2.9896240234375, 3.341796875, 3.6939697265625, 4.046142578125, 4.3983154296875, 4.75048828125, 5.1026611328125, 5.454833984375, 5.8070068359375, 6.1591796875, 6.5113525390625, 6.863525390625, 7.2156982421875, 7.56787109375, 7.9200439453125, 8.272216796875, 8.6243896484375, 8.9765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 9.0, 35.0, 187.0, 3186.0, 446.0, 113.0, 53.0, 27.0, 15.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5380859375, -0.5163040161132812, -0.4945220947265625, -0.47274017333984375, -0.450958251953125, -0.42917633056640625, -0.4073944091796875, -0.38561248779296875, -0.36383056640625, -0.34204864501953125, -0.3202667236328125, -0.29848480224609375, -0.276702880859375, -0.25492095947265625, -0.2331390380859375, -0.21135711669921875, -0.1895751953125, -0.16779327392578125, -0.1460113525390625, -0.12422943115234375, -0.102447509765625, -0.08066558837890625, -0.0588836669921875, -0.03710174560546875, -0.01531982421875, 0.00646209716796875, 0.0282440185546875, 0.05002593994140625, 0.071807861328125, 0.09358978271484375, 0.1153717041015625, 0.13715362548828125, 0.158935546875, 0.18071746826171875, 0.2024993896484375, 0.22428131103515625, 0.246063232421875, 0.26784515380859375, 0.2896270751953125, 0.31140899658203125, 0.33319091796875, 0.35497283935546875, 0.3767547607421875, 0.39853668212890625, 0.420318603515625, 0.44210052490234375, 0.4638824462890625, 0.48566436767578125, 0.5074462890625, 0.5292282104492188, 0.5510101318359375, 0.5727920532226562, 0.594573974609375, 0.6163558959960938, 0.6381378173828125, 0.6599197387695312, 0.68170166015625, 0.7034835815429688, 0.7252655029296875, 0.7470474243164062, 0.768829345703125, 0.7906112670898438, 0.8123931884765625, 0.8341751098632812, 0.85595703125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 10.0, 43.0, 204.0, 478.0, 186.0, 50.0, 21.0, 7.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9220210313796997, -1.6935627460479736, -1.4651044607162476, -1.2366461753845215, -1.008188009262085, -0.7797297239303589, -0.5512714385986328, -0.32281315326690674, -0.09435486793518066, 0.13410340249538422, 0.3625616729259491, 0.5910199284553528, 0.8194782137870789, 1.0479364395141602, 1.2763947248458862, 1.5048530101776123, 1.7333112955093384, 1.9617695808410645, 2.190227746963501, 2.4186861515045166, 2.647144317626953, 2.8756027221679688, 3.1040608882904053, 3.332519054412842, 3.5609774589538574, 3.789435625076294, 4.0178937911987305, 4.246352195739746, 4.474810600280762, 4.703269004821777, 4.931726932525635, 5.16018533706665, 5.388643741607666, 5.617102146148682, 5.845560073852539, 6.074018478393555, 6.30247688293457, 6.530935287475586, 6.759393215179443, 6.987851619720459, 7.216310024261475, 7.44476842880249, 7.673226356506348, 7.901684761047363, 8.130143165588379, 8.358601570129395, 8.58705997467041, 8.81551742553711, 9.043975830078125, 9.27243423461914, 9.500892639160156, 9.729351043701172, 9.957808494567871, 10.186266899108887, 10.414725303649902, 10.643183708190918, 10.871642112731934, 11.10010051727295, 11.328558921813965, 11.55701732635498, 11.78547477722168, 12.013933181762695, 12.242391586303711, 12.470849990844727, 12.699308395385742]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 6.0, 12.0, 16.0, 21.0, 33.0, 48.0, 71.0, 86.0, 92.0, 95.0, 94.0, 97.0, 94.0, 69.0, 54.0, 36.0, 26.0, 26.0, 12.0, 5.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.524693250656128, -2.453944683074951, -2.3831958770751953, -2.3124473094940186, -2.2416985034942627, -2.170949935913086, -2.10020112991333, -2.0294525623321533, -1.958703875541687, -1.8879551887512207, -1.8172065019607544, -1.746457815170288, -1.6757092475891113, -1.6049604415893555, -1.5342118740081787, -1.4634631872177124, -1.392714500427246, -1.3219658136367798, -1.2512171268463135, -1.1804684400558472, -1.1097197532653809, -1.038971185684204, -0.9682224988937378, -0.8974738121032715, -0.8267251253128052, -0.7559764385223389, -0.6852277517318726, -0.614479124546051, -0.5437304377555847, -0.4729817509651184, -0.4022330939769745, -0.33148443698883057, -0.26073551177978516, -0.18998683989048004, -0.11923816800117493, -0.04848949611186981, 0.022259175777435303, 0.09300786256790161, 0.16375651955604553, 0.23450517654418945, 0.30525386333465576, 0.37600255012512207, 0.446751207113266, 0.5174998641014099, 0.5882485508918762, 0.6589972376823425, 0.7297458648681641, 0.8004945516586304, 0.8712432384490967, 0.941991925239563, 1.0127406120300293, 1.0834892988204956, 1.154237985610962, 1.2249865531921387, 1.295735239982605, 1.3664839267730713, 1.4372326135635376, 1.507981300354004, 1.5787299871444702, 1.6494786739349365, 1.7202272415161133, 1.7909760475158691, 1.861724615097046, 1.9324733018875122, 2.0032219886779785]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 10.0, 12.0, 11.0, 8.0, 18.0, 11.0, 20.0, 23.0, 19.0, 27.0, 42.0, 56.0, 86.0, 164.0, 375.0, 1320.0, 7404.0, 81304.0, 772739.0, 169502.0, 12438.0, 1905.0, 517.0, 169.0, 85.0, 71.0, 34.0, 28.0, 22.0, 16.0, 21.0, 16.0, 15.0, 12.0, 12.0, 9.0, 6.0, 6.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.728515625, -1.6720733642578125, -1.615631103515625, -1.5591888427734375, -1.50274658203125, -1.4463043212890625, -1.389862060546875, -1.3334197998046875, -1.2769775390625, -1.2205352783203125, -1.164093017578125, -1.1076507568359375, -1.05120849609375, -0.9947662353515625, -0.938323974609375, -0.8818817138671875, -0.825439453125, -0.7689971923828125, -0.712554931640625, -0.6561126708984375, -0.59967041015625, -0.5432281494140625, -0.486785888671875, -0.4303436279296875, -0.3739013671875, -0.3174591064453125, -0.261016845703125, -0.2045745849609375, -0.14813232421875, -0.0916900634765625, -0.035247802734375, 0.0211944580078125, 0.07763671875, 0.1340789794921875, 0.190521240234375, 0.2469635009765625, 0.30340576171875, 0.3598480224609375, 0.416290283203125, 0.4727325439453125, 0.5291748046875, 0.5856170654296875, 0.642059326171875, 0.6985015869140625, 0.75494384765625, 0.8113861083984375, 0.867828369140625, 0.9242706298828125, 0.980712890625, 1.0371551513671875, 1.093597412109375, 1.1500396728515625, 1.20648193359375, 1.2629241943359375, 1.319366455078125, 1.3758087158203125, 1.4322509765625, 1.4886932373046875, 1.545135498046875, 1.6015777587890625, 1.65802001953125, 1.7144622802734375, 1.770904541015625, 1.8273468017578125, 1.8837890625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 7.0, 12.0, 21.0, 43.0, 62.0, 91.0, 123.0, 143.0, 130.0, 121.0, 105.0, 58.0, 42.0, 15.0, 13.0, 10.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.229736328125, -0.22474002838134766, -0.2197437286376953, -0.21474742889404297, -0.20975112915039062, -0.20475482940673828, -0.19975852966308594, -0.1947622299194336, -0.18976593017578125, -0.1847696304321289, -0.17977333068847656, -0.17477703094482422, -0.16978073120117188, -0.16478443145751953, -0.1597881317138672, -0.15479183197021484, -0.1497955322265625, -0.14479923248291016, -0.1398029327392578, -0.13480663299560547, -0.12981033325195312, -0.12481403350830078, -0.11981773376464844, -0.1148214340209961, -0.10982513427734375, -0.1048288345336914, -0.09983253479003906, -0.09483623504638672, -0.08983993530273438, -0.08484363555908203, -0.07984733581542969, -0.07485103607177734, -0.069854736328125, -0.06485843658447266, -0.05986213684082031, -0.05486583709716797, -0.049869537353515625, -0.04487323760986328, -0.03987693786621094, -0.034880638122558594, -0.02988433837890625, -0.024888038635253906, -0.019891738891601562, -0.014895439147949219, -0.009899139404296875, -0.004902839660644531, 9.34600830078125e-05, 0.005089759826660156, 0.0100860595703125, 0.015082359313964844, 0.020078659057617188, 0.02507495880126953, 0.030071258544921875, 0.03506755828857422, 0.04006385803222656, 0.045060157775878906, 0.05005645751953125, 0.055052757263183594, 0.06004905700683594, 0.06504535675048828, 0.07004165649414062, 0.07503795623779297, 0.08003425598144531, 0.08503055572509766, 0.09002685546875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 7.0, 2.0, 7.0, 18.0, 21.0, 20.0, 26.0, 31.0, 43.0, 75.0, 98.0, 173.0, 372.0, 931.0, 2429.0, 8932.0, 46871.0, 321153.0, 545034.0, 98985.0, 16856.0, 3950.0, 1322.0, 519.0, 251.0, 135.0, 84.0, 55.0, 22.0, 33.0, 20.0, 23.0, 14.0, 11.0, 9.0, 10.0, 6.0, 2.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.09765625, -1.06646728515625, -1.0352783203125, -1.00408935546875, -0.972900390625, -0.94171142578125, -0.9105224609375, -0.87933349609375, -0.84814453125, -0.81695556640625, -0.7857666015625, -0.75457763671875, -0.723388671875, -0.69219970703125, -0.6610107421875, -0.62982177734375, -0.5986328125, -0.56744384765625, -0.5362548828125, -0.50506591796875, -0.473876953125, -0.44268798828125, -0.4114990234375, -0.38031005859375, -0.34912109375, -0.31793212890625, -0.2867431640625, -0.25555419921875, -0.224365234375, -0.19317626953125, -0.1619873046875, -0.13079833984375, -0.099609375, -0.06842041015625, -0.0372314453125, -0.00604248046875, 0.025146484375, 0.05633544921875, 0.0875244140625, 0.11871337890625, 0.14990234375, 0.18109130859375, 0.2122802734375, 0.24346923828125, 0.274658203125, 0.30584716796875, 0.3370361328125, 0.36822509765625, 0.3994140625, 0.43060302734375, 0.4617919921875, 0.49298095703125, 0.524169921875, 0.55535888671875, 0.5865478515625, 0.61773681640625, 0.64892578125, 0.68011474609375, 0.7113037109375, 0.74249267578125, 0.773681640625, 0.80487060546875, 0.8360595703125, 0.86724853515625, 0.8984375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 9.0, 7.0, 11.0, 11.0, 18.0, 13.0, 14.0, 20.0, 32.0, 33.0, 36.0, 48.0, 34.0, 37.0, 46.0, 41.0, 44.0, 56.0, 48.0, 53.0, 51.0, 45.0, 37.0, 47.0, 31.0, 27.0, 28.0, 23.0, 10.0, 16.0, 11.0, 10.0, 10.0, 11.0, 12.0, 9.0, 6.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.422607421875, -0.41127777099609375, -0.3999481201171875, -0.38861846923828125, -0.377288818359375, -0.36595916748046875, -0.3546295166015625, -0.34329986572265625, -0.33197021484375, -0.32064056396484375, -0.3093109130859375, -0.29798126220703125, -0.286651611328125, -0.27532196044921875, -0.2639923095703125, -0.25266265869140625, -0.2413330078125, -0.23000335693359375, -0.2186737060546875, -0.20734405517578125, -0.196014404296875, -0.18468475341796875, -0.1733551025390625, -0.16202545166015625, -0.15069580078125, -0.13936614990234375, -0.1280364990234375, -0.11670684814453125, -0.105377197265625, -0.09404754638671875, -0.0827178955078125, -0.07138824462890625, -0.06005859375, -0.04872894287109375, -0.0373992919921875, -0.02606964111328125, -0.014739990234375, -0.00341033935546875, 0.0079193115234375, 0.01924896240234375, 0.03057861328125, 0.04190826416015625, 0.0532379150390625, 0.06456756591796875, 0.075897216796875, 0.08722686767578125, 0.0985565185546875, 0.10988616943359375, 0.1212158203125, 0.13254547119140625, 0.1438751220703125, 0.15520477294921875, 0.166534423828125, 0.17786407470703125, 0.1891937255859375, 0.20052337646484375, 0.21185302734375, 0.22318267822265625, 0.2345123291015625, 0.24584197998046875, 0.257171630859375, 0.26850128173828125, 0.2798309326171875, 0.29116058349609375, 0.302490234375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 9.0, 14.0, 28.0, 37.0, 33.0, 47.0, 91.0, 128.0, 229.0, 359.0, 716.0, 1374.0, 3542.0, 10640.0, 40840.0, 233824.0, 578585.0, 137971.0, 26940.0, 7737.0, 2715.0, 1208.0, 612.0, 329.0, 182.0, 108.0, 76.0, 50.0, 34.0, 13.0, 17.0, 16.0, 3.0, 15.0, 6.0, 4.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.7607421875, -0.739227294921875, -0.71771240234375, -0.696197509765625, -0.6746826171875, -0.653167724609375, -0.63165283203125, -0.610137939453125, -0.588623046875, -0.567108154296875, -0.54559326171875, -0.524078369140625, -0.5025634765625, -0.481048583984375, -0.45953369140625, -0.438018798828125, -0.41650390625, -0.394989013671875, -0.37347412109375, -0.351959228515625, -0.3304443359375, -0.308929443359375, -0.28741455078125, -0.265899658203125, -0.244384765625, -0.222869873046875, -0.20135498046875, -0.179840087890625, -0.1583251953125, -0.136810302734375, -0.11529541015625, -0.093780517578125, -0.072265625, -0.050750732421875, -0.02923583984375, -0.007720947265625, 0.0137939453125, 0.035308837890625, 0.05682373046875, 0.078338623046875, 0.099853515625, 0.121368408203125, 0.14288330078125, 0.164398193359375, 0.1859130859375, 0.207427978515625, 0.22894287109375, 0.250457763671875, 0.27197265625, 0.293487548828125, 0.31500244140625, 0.336517333984375, 0.3580322265625, 0.379547119140625, 0.40106201171875, 0.422576904296875, 0.444091796875, 0.465606689453125, 0.48712158203125, 0.508636474609375, 0.5301513671875, 0.551666259765625, 0.57318115234375, 0.594696044921875, 0.6162109375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 3.0, 8.0, 7.0, 4.0, 9.0, 15.0, 7.0, 13.0, 22.0, 17.0, 31.0, 35.0, 42.0, 55.0, 60.0, 72.0, 63.0, 81.0, 55.0, 65.0, 53.0, 51.0, 42.0, 35.0, 20.0, 21.0, 26.0, 14.0, 18.0, 12.0, 4.0, 8.0, 5.0, 8.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011867284774780273, -0.00011477340012788773, -0.00011087395250797272, -0.00010697450488805771, -0.0001030750572681427, -9.917560964822769e-05, -9.527616202831268e-05, -9.137671440839767e-05, -8.747726678848267e-05, -8.357781916856766e-05, -7.967837154865265e-05, -7.577892392873764e-05, -7.187947630882263e-05, -6.798002868890762e-05, -6.408058106899261e-05, -6.0181133449077606e-05, -5.62816858291626e-05, -5.238223820924759e-05, -4.848279058933258e-05, -4.458334296941757e-05, -4.0683895349502563e-05, -3.6784447729587555e-05, -3.2885000109672546e-05, -2.8985552489757538e-05, -2.508610486984253e-05, -2.118665724992752e-05, -1.7287209630012512e-05, -1.3387762010097504e-05, -9.488314390182495e-06, -5.5888667702674866e-06, -1.689419150352478e-06, 2.2100284695625305e-06, 6.109476089477539e-06, 1.0008923709392548e-05, 1.3908371329307556e-05, 1.7807818949222565e-05, 2.1707266569137573e-05, 2.5606714189052582e-05, 2.950616180896759e-05, 3.34056094288826e-05, 3.730505704879761e-05, 4.1204504668712616e-05, 4.5103952288627625e-05, 4.900339990854263e-05, 5.290284752845764e-05, 5.680229514837265e-05, 6.070174276828766e-05, 6.460119038820267e-05, 6.850063800811768e-05, 7.240008562803268e-05, 7.629953324794769e-05, 8.01989808678627e-05, 8.409842848777771e-05, 8.799787610769272e-05, 9.189732372760773e-05, 9.579677134752274e-05, 9.969621896743774e-05, 0.00010359566658735275, 0.00010749511420726776, 0.00011139456182718277, 0.00011529400944709778, 0.00011919345706701279, 0.0001230929046869278, 0.0001269923523068428, 0.0001308917999267578]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 8.0, 13.0, 19.0, 18.0, 35.0, 55.0, 120.0, 319.0, 715.0, 2518.0, 13561.0, 200174.0, 769814.0, 53022.0, 5872.0, 1416.0, 460.0, 201.0, 102.0, 54.0, 20.0, 14.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.123046875, -1.080322265625, -1.03759765625, -0.994873046875, -0.9521484375, -0.909423828125, -0.86669921875, -0.823974609375, -0.78125, -0.738525390625, -0.69580078125, -0.653076171875, -0.6103515625, -0.567626953125, -0.52490234375, -0.482177734375, -0.439453125, -0.396728515625, -0.35400390625, -0.311279296875, -0.2685546875, -0.225830078125, -0.18310546875, -0.140380859375, -0.09765625, -0.054931640625, -0.01220703125, 0.030517578125, 0.0732421875, 0.115966796875, 0.15869140625, 0.201416015625, 0.244140625, 0.286865234375, 0.32958984375, 0.372314453125, 0.4150390625, 0.457763671875, 0.50048828125, 0.543212890625, 0.5859375, 0.628662109375, 0.67138671875, 0.714111328125, 0.7568359375, 0.799560546875, 0.84228515625, 0.885009765625, 0.927734375, 0.970458984375, 1.01318359375, 1.055908203125, 1.0986328125, 1.141357421875, 1.18408203125, 1.226806640625, 1.26953125, 1.312255859375, 1.35498046875, 1.397705078125, 1.4404296875, 1.483154296875, 1.52587890625, 1.568603515625, 1.611328125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 7.0, 3.0, 2.0, 5.0, 11.0, 10.0, 16.0, 16.0, 35.0, 40.0, 67.0, 85.0, 75.0, 109.0, 111.0, 102.0, 81.0, 65.0, 49.0, 41.0, 19.0, 24.0, 9.0, 11.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3388671875, -0.3264732360839844, -0.31407928466796875, -0.3016853332519531, -0.2892913818359375, -0.2768974304199219, -0.26450347900390625, -0.2521095275878906, -0.239715576171875, -0.22732162475585938, -0.21492767333984375, -0.20253372192382812, -0.1901397705078125, -0.17774581909179688, -0.16535186767578125, -0.15295791625976562, -0.14056396484375, -0.12817001342773438, -0.11577606201171875, -0.10338211059570312, -0.0909881591796875, -0.07859420776367188, -0.06620025634765625, -0.053806304931640625, -0.041412353515625, -0.029018402099609375, -0.01662445068359375, -0.004230499267578125, 0.0081634521484375, 0.020557403564453125, 0.03295135498046875, 0.045345306396484375, 0.0577392578125, 0.07013320922851562, 0.08252716064453125, 0.09492111206054688, 0.1073150634765625, 0.11970901489257812, 0.13210296630859375, 0.14449691772460938, 0.156890869140625, 0.16928482055664062, 0.18167877197265625, 0.19407272338867188, 0.2064666748046875, 0.21886062622070312, 0.23125457763671875, 0.24364852905273438, 0.25604248046875, 0.2684364318847656, 0.28083038330078125, 0.2932243347167969, 0.3056182861328125, 0.3180122375488281, 0.33040618896484375, 0.3428001403808594, 0.355194091796875, 0.3675880432128906, 0.37998199462890625, 0.3923759460449219, 0.4047698974609375, 0.4171638488769531, 0.42955780029296875, 0.4419517517089844, 0.454345703125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 11.0, 88.0, 613.0, 280.0, 19.0, 7.0], "bins": [-49.956626892089844, -49.134239196777344, -48.31185531616211, -47.48946762084961, -46.66707992553711, -45.844696044921875, -45.022308349609375, -44.199920654296875, -43.377532958984375, -42.555145263671875, -41.73276138305664, -40.91037368774414, -40.08798599243164, -39.265602111816406, -38.443214416503906, -37.620826721191406, -36.79844284057617, -35.97605514526367, -35.15367126464844, -34.33128356933594, -33.50889587402344, -32.68650817871094, -31.864124298095703, -31.041736602783203, -30.219348907470703, -29.396963119506836, -28.574575424194336, -27.75218963623047, -26.92980194091797, -26.1074161529541, -25.285030364990234, -24.462642669677734, -23.640256881713867, -22.81787109375, -21.9954833984375, -21.173097610473633, -20.350709915161133, -19.528324127197266, -18.705936431884766, -17.8835506439209, -17.06116485595703, -16.238779067993164, -15.416391372680664, -14.594005584716797, -13.771618843078613, -12.94923210144043, -12.126845359802246, -11.304458618164062, -10.482071876525879, -9.659685134887695, -8.837298393249512, -8.014911651611328, -7.192525863647461, -6.370139122009277, -5.547752380371094, -4.725366115570068, -3.9029793739318848, -3.0805928707122803, -2.258206367492676, -1.4358196258544922, -0.6134331226348877, 0.2089533805847168, 1.0313401222229004, 1.8537263870239258, 2.6761131286621094]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 9.0, 8.0, 8.0, 18.0, 15.0, 21.0, 26.0, 33.0, 43.0, 47.0, 53.0, 47.0, 62.0, 42.0, 68.0, 64.0, 62.0, 52.0, 42.0, 55.0, 36.0, 40.0, 34.0, 17.0, 24.0, 17.0, 14.0, 7.0, 14.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8702404499053955, -2.770172595977783, -2.670104503631592, -2.5700366497039795, -2.469968795776367, -2.369900703430176, -2.2698328495025635, -2.169764995574951, -2.0696969032287598, -1.969628930091858, -1.869560956954956, -1.7694931030273438, -1.669425129890442, -1.56935715675354, -1.4692893028259277, -1.3692213296890259, -1.269153356552124, -1.1690853834152222, -1.0690174102783203, -0.968949556350708, -0.8688815832138062, -0.7688136100769043, -0.6687456965446472, -0.5686777830123901, -0.4686098098754883, -0.3685418665409088, -0.26847392320632935, -0.16840597987174988, -0.06833803653717041, 0.031729936599731445, 0.13179785013198853, 0.2318657636642456, 0.33193349838256836, 0.4320014417171478, 0.5320693850517273, 0.6321372985839844, 0.7322052717208862, 0.8322732448577881, 0.9323411583900452, 1.0324090719223022, 1.132477045059204, 1.232545018196106, 1.3326129913330078, 1.4326808452606201, 1.532748818397522, 1.6328167915344238, 1.7328846454620361, 1.832952618598938, 1.9330205917358398, 2.033088445663452, 2.1331565380096436, 2.233224391937256, 2.3332924842834473, 2.4333603382110596, 2.533428192138672, 2.6334962844848633, 2.7335641384124756, 2.833631992340088, 2.9337000846862793, 3.0337679386138916, 3.133835792541504, 3.2339038848876953, 3.3339717388153076, 3.43403959274292, 3.5341076850891113]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 5.0, 6.0, 5.0, 8.0, 16.0, 23.0, 26.0, 20.0, 57.0, 78.0, 122.0, 240.0, 523.0, 1664.0, 10252.0, 267427.0, 3879888.0, 28910.0, 3494.0, 862.0, 317.0, 144.0, 75.0, 46.0, 27.0, 13.0, 11.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.513671875, -2.430450439453125, -2.34722900390625, -2.264007568359375, -2.1807861328125, -2.097564697265625, -2.01434326171875, -1.931121826171875, -1.847900390625, -1.764678955078125, -1.68145751953125, -1.598236083984375, -1.5150146484375, -1.431793212890625, -1.34857177734375, -1.265350341796875, -1.18212890625, -1.098907470703125, -1.01568603515625, -0.932464599609375, -0.8492431640625, -0.766021728515625, -0.68280029296875, -0.599578857421875, -0.516357421875, -0.433135986328125, -0.34991455078125, -0.266693115234375, -0.1834716796875, -0.100250244140625, -0.01702880859375, 0.066192626953125, 0.1494140625, 0.232635498046875, 0.31585693359375, 0.399078369140625, 0.4822998046875, 0.565521240234375, 0.64874267578125, 0.731964111328125, 0.815185546875, 0.898406982421875, 0.98162841796875, 1.064849853515625, 1.1480712890625, 1.231292724609375, 1.31451416015625, 1.397735595703125, 1.48095703125, 1.564178466796875, 1.64739990234375, 1.730621337890625, 1.8138427734375, 1.897064208984375, 1.98028564453125, 2.063507080078125, 2.146728515625, 2.229949951171875, 2.31317138671875, 2.396392822265625, 2.4796142578125, 2.562835693359375, 2.64605712890625, 2.729278564453125, 2.8125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 17.0, 29.0, 30.0, 62.0, 72.0, 98.0, 104.0, 135.0, 134.0, 102.0, 73.0, 50.0, 39.0, 27.0, 17.0, 12.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2396240234375, -0.23412322998046875, -0.2286224365234375, -0.22312164306640625, -0.217620849609375, -0.21212005615234375, -0.2066192626953125, -0.20111846923828125, -0.19561767578125, -0.19011688232421875, -0.1846160888671875, -0.17911529541015625, -0.173614501953125, -0.16811370849609375, -0.1626129150390625, -0.15711212158203125, -0.151611328125, -0.14611053466796875, -0.1406097412109375, -0.13510894775390625, -0.129608154296875, -0.12410736083984375, -0.1186065673828125, -0.11310577392578125, -0.10760498046875, -0.10210418701171875, -0.0966033935546875, -0.09110260009765625, -0.085601806640625, -0.08010101318359375, -0.0746002197265625, -0.06909942626953125, -0.0635986328125, -0.05809783935546875, -0.0525970458984375, -0.04709625244140625, -0.041595458984375, -0.03609466552734375, -0.0305938720703125, -0.02509307861328125, -0.01959228515625, -0.01409149169921875, -0.0085906982421875, -0.00308990478515625, 0.002410888671875, 0.00791168212890625, 0.0134124755859375, 0.01891326904296875, 0.0244140625, 0.02991485595703125, 0.0354156494140625, 0.04091644287109375, 0.046417236328125, 0.05191802978515625, 0.0574188232421875, 0.06291961669921875, 0.06842041015625, 0.07392120361328125, 0.0794219970703125, 0.08492279052734375, 0.090423583984375, 0.09592437744140625, 0.1014251708984375, 0.10692596435546875, 0.1124267578125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 12.0, 11.0, 19.0, 23.0, 35.0, 39.0, 54.0, 79.0, 92.0, 161.0, 278.0, 662.0, 3266.0, 73918.0, 4091649.0, 21013.0, 1861.0, 479.0, 207.0, 129.0, 88.0, 68.0, 50.0, 27.0, 13.0, 12.0, 5.0, 6.0, 4.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.833984375, -2.701263427734375, -2.56854248046875, -2.435821533203125, -2.3031005859375, -2.170379638671875, -2.03765869140625, -1.904937744140625, -1.772216796875, -1.639495849609375, -1.50677490234375, -1.374053955078125, -1.2413330078125, -1.108612060546875, -0.97589111328125, -0.843170166015625, -0.71044921875, -0.577728271484375, -0.44500732421875, -0.312286376953125, -0.1795654296875, -0.046844482421875, 0.08587646484375, 0.218597412109375, 0.351318359375, 0.484039306640625, 0.61676025390625, 0.749481201171875, 0.8822021484375, 1.014923095703125, 1.14764404296875, 1.280364990234375, 1.4130859375, 1.545806884765625, 1.67852783203125, 1.811248779296875, 1.9439697265625, 2.076690673828125, 2.20941162109375, 2.342132568359375, 2.474853515625, 2.607574462890625, 2.74029541015625, 2.873016357421875, 3.0057373046875, 3.138458251953125, 3.27117919921875, 3.403900146484375, 3.53662109375, 3.669342041015625, 3.80206298828125, 3.934783935546875, 4.0675048828125, 4.200225830078125, 4.33294677734375, 4.465667724609375, 4.598388671875, 4.731109619140625, 4.86383056640625, 4.996551513671875, 5.1292724609375, 5.261993408203125, 5.39471435546875, 5.527435302734375, 5.66015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 6.0, 15.0, 45.0, 109.0, 370.0, 2619.0, 642.0, 162.0, 58.0, 30.0, 11.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.15625, -1.1324958801269531, -1.1087417602539062, -1.0849876403808594, -1.0612335205078125, -1.0374794006347656, -1.0137252807617188, -0.9899711608886719, -0.966217041015625, -0.9424629211425781, -0.9187088012695312, -0.8949546813964844, -0.8712005615234375, -0.8474464416503906, -0.8236923217773438, -0.7999382019042969, -0.77618408203125, -0.7524299621582031, -0.7286758422851562, -0.7049217224121094, -0.6811676025390625, -0.6574134826660156, -0.6336593627929688, -0.6099052429199219, -0.586151123046875, -0.5623970031738281, -0.5386428833007812, -0.5148887634277344, -0.4911346435546875, -0.4673805236816406, -0.44362640380859375, -0.4198722839355469, -0.3961181640625, -0.3723640441894531, -0.34860992431640625, -0.3248558044433594, -0.3011016845703125, -0.2773475646972656, -0.25359344482421875, -0.22983932495117188, -0.206085205078125, -0.18233108520507812, -0.15857696533203125, -0.13482284545898438, -0.1110687255859375, -0.08731460571289062, -0.06356048583984375, -0.039806365966796875, -0.01605224609375, 0.007701873779296875, 0.03145599365234375, 0.055210113525390625, 0.0789642333984375, 0.10271835327148438, 0.12647247314453125, 0.15022659301757812, 0.173980712890625, 0.19773483276367188, 0.22148895263671875, 0.24524307250976562, 0.2689971923828125, 0.2927513122558594, 0.31650543212890625, 0.3402595520019531, 0.364013671875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 13.0, 84.0, 259.0, 389.0, 180.0, 57.0, 19.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7279052734375, -8.543503761291504, -8.359102249145508, -8.174701690673828, -7.990300178527832, -7.805898666381836, -7.621497631072998, -7.437096118927002, -7.252695083618164, -7.068293571472168, -6.88389253616333, -6.699491024017334, -6.515089988708496, -6.3306884765625, -6.146287441253662, -5.961885929107666, -5.777484893798828, -5.593083381652832, -5.408682346343994, -5.224280834197998, -5.03987979888916, -4.855478286743164, -4.671077251434326, -4.48667573928833, -4.302274227142334, -4.117872714996338, -3.9334716796875, -3.749070405960083, -3.564669132232666, -3.380267858505249, -3.195866584777832, -3.011465072631836, -2.827063798904419, -2.642662525177002, -2.458261251449585, -2.273859977722168, -2.089458703994751, -1.905057430267334, -1.7206560373306274, -1.5362547636032104, -1.3518534898757935, -1.1674522161483765, -0.9830509424209595, -0.7986496090888977, -0.6142483353614807, -0.4298470616340637, -0.24544572830200195, -0.06104445457458496, 0.12335681915283203, 0.307758092880249, 0.4921593964099884, 0.6765606999397278, 0.8609619736671448, 1.045363187789917, 1.2297645807266235, 1.4141658544540405, 1.5985671281814575, 1.7829684019088745, 1.9673696756362915, 2.151771068572998, 2.336172342300415, 2.520573616027832, 2.704974889755249, 2.889376163482666, 3.073777437210083]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 17.0, 11.0, 24.0, 30.0, 45.0, 49.0, 67.0, 73.0, 96.0, 77.0, 87.0, 78.0, 67.0, 75.0, 49.0, 35.0, 41.0, 28.0, 19.0, 13.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0495362281799316, -1.9921149015426636, -1.9346935749053955, -1.877272367477417, -1.819851040840149, -1.7624297142028809, -1.7050083875656128, -1.6475870609283447, -1.5901657342910767, -1.5327444076538086, -1.4753230810165405, -1.4179017543792725, -1.360480546951294, -1.3030592203140259, -1.2456378936767578, -1.1882165670394897, -1.1307952404022217, -1.0733739137649536, -1.0159525871276855, -0.9585313200950623, -0.9011099934577942, -0.8436887264251709, -0.7862673997879028, -0.7288460731506348, -0.6714248657226562, -0.6140035390853882, -0.5565822720527649, -0.4991609454154968, -0.44173961877822876, -0.3843183219432831, -0.3268970251083374, -0.26947569847106934, -0.21205437183380127, -0.1546330600976944, -0.09721175581216812, -0.039790451526641846, 0.017630860209465027, 0.0750521719455719, 0.13247346878051758, 0.18989479541778564, 0.24731609225273132, 0.304737389087677, 0.36215871572494507, 0.41958001255989075, 0.4770013093948364, 0.5344226360321045, 0.5918439626693726, 0.6492652893066406, 0.7066865563392639, 0.764107882976532, 0.8215291500091553, 0.8789504766464233, 0.9363718032836914, 0.9937931299209595, 1.0512144565582275, 1.108635663986206, 1.1660569906234741, 1.2234783172607422, 1.2808996438980103, 1.3383209705352783, 1.3957421779632568, 1.453163504600525, 1.510584831237793, 1.568006157875061, 1.625427484512329]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 5.0, 1.0, 3.0, 8.0, 11.0, 17.0, 22.0, 18.0, 27.0, 30.0, 47.0, 64.0, 105.0, 172.0, 305.0, 744.0, 1950.0, 5828.0, 21038.0, 98667.0, 472006.0, 357999.0, 66902.0, 15233.0, 4452.0, 1519.0, 599.0, 299.0, 168.0, 90.0, 59.0, 47.0, 28.0, 25.0, 15.0, 16.0, 7.0, 3.0, 3.0, 5.0, 4.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.09375, -1.0583343505859375, -1.022918701171875, -0.9875030517578125, -0.95208740234375, -0.9166717529296875, -0.881256103515625, -0.8458404541015625, -0.8104248046875, -0.7750091552734375, -0.739593505859375, -0.7041778564453125, -0.66876220703125, -0.6333465576171875, -0.597930908203125, -0.5625152587890625, -0.527099609375, -0.4916839599609375, -0.456268310546875, -0.4208526611328125, -0.38543701171875, -0.3500213623046875, -0.314605712890625, -0.2791900634765625, -0.2437744140625, -0.2083587646484375, -0.172943115234375, -0.1375274658203125, -0.10211181640625, -0.0666961669921875, -0.031280517578125, 0.0041351318359375, 0.03955078125, 0.0749664306640625, 0.110382080078125, 0.1457977294921875, 0.18121337890625, 0.2166290283203125, 0.252044677734375, 0.2874603271484375, 0.3228759765625, 0.3582916259765625, 0.393707275390625, 0.4291229248046875, 0.46453857421875, 0.4999542236328125, 0.535369873046875, 0.5707855224609375, 0.606201171875, 0.6416168212890625, 0.677032470703125, 0.7124481201171875, 0.74786376953125, 0.7832794189453125, 0.818695068359375, 0.8541107177734375, 0.8895263671875, 0.9249420166015625, 0.960357666015625, 0.9957733154296875, 1.03118896484375, 1.0666046142578125, 1.102020263671875, 1.1374359130859375, 1.1728515625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 12.0, 10.0, 23.0, 27.0, 24.0, 21.0, 44.0, 49.0, 56.0, 68.0, 75.0, 73.0, 83.0, 63.0, 69.0, 64.0, 48.0, 46.0, 34.0, 33.0, 25.0, 18.0, 12.0, 11.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.133056640625, -0.12927627563476562, -0.12549591064453125, -0.12171554565429688, -0.1179351806640625, -0.11415481567382812, -0.11037445068359375, -0.10659408569335938, -0.102813720703125, -0.09903335571289062, -0.09525299072265625, -0.09147262573242188, -0.0876922607421875, -0.08391189575195312, -0.08013153076171875, -0.07635116577148438, -0.07257080078125, -0.06879043579101562, -0.06501007080078125, -0.061229705810546875, -0.0574493408203125, -0.053668975830078125, -0.04988861083984375, -0.046108245849609375, -0.042327880859375, -0.038547515869140625, -0.03476715087890625, -0.030986785888671875, -0.0272064208984375, -0.023426055908203125, -0.01964569091796875, -0.015865325927734375, -0.0120849609375, -0.008304595947265625, -0.00452423095703125, -0.000743865966796875, 0.0030364990234375, 0.006816864013671875, 0.01059722900390625, 0.014377593994140625, 0.018157958984375, 0.021938323974609375, 0.02571868896484375, 0.029499053955078125, 0.0332794189453125, 0.037059783935546875, 0.04084014892578125, 0.044620513916015625, 0.04840087890625, 0.052181243896484375, 0.05596160888671875, 0.059741973876953125, 0.0635223388671875, 0.06730270385742188, 0.07108306884765625, 0.07486343383789062, 0.078643798828125, 0.08242416381835938, 0.08620452880859375, 0.08998489379882812, 0.0937652587890625, 0.09754562377929688, 0.10132598876953125, 0.10510635375976562, 0.10888671875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 8.0, 6.0, 11.0, 11.0, 15.0, 32.0, 37.0, 50.0, 83.0, 101.0, 171.0, 260.0, 397.0, 622.0, 1047.0, 1867.0, 3354.0, 6664.0, 14307.0, 32782.0, 82705.0, 205645.0, 327931.0, 216780.0, 88209.0, 34845.0, 15034.0, 6992.0, 3589.0, 1977.0, 1136.0, 633.0, 405.0, 255.0, 179.0, 116.0, 80.0, 50.0, 47.0, 36.0, 20.0, 10.0, 13.0, 8.0, 6.0, 7.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.55029296875, -0.5333786010742188, -0.5164642333984375, -0.49954986572265625, -0.482635498046875, -0.46572113037109375, -0.4488067626953125, -0.43189239501953125, -0.41497802734375, -0.39806365966796875, -0.3811492919921875, -0.36423492431640625, -0.347320556640625, -0.33040618896484375, -0.3134918212890625, -0.29657745361328125, -0.2796630859375, -0.26274871826171875, -0.2458343505859375, -0.22891998291015625, -0.212005615234375, -0.19509124755859375, -0.1781768798828125, -0.16126251220703125, -0.14434814453125, -0.12743377685546875, -0.1105194091796875, -0.09360504150390625, -0.076690673828125, -0.05977630615234375, -0.0428619384765625, -0.02594757080078125, -0.009033203125, 0.00788116455078125, 0.0247955322265625, 0.04170989990234375, 0.058624267578125, 0.07553863525390625, 0.0924530029296875, 0.10936737060546875, 0.12628173828125, 0.14319610595703125, 0.1601104736328125, 0.17702484130859375, 0.193939208984375, 0.21085357666015625, 0.2277679443359375, 0.24468231201171875, 0.2615966796875, 0.27851104736328125, 0.2954254150390625, 0.31233978271484375, 0.329254150390625, 0.34616851806640625, 0.3630828857421875, 0.37999725341796875, 0.39691162109375, 0.41382598876953125, 0.4307403564453125, 0.44765472412109375, 0.464569091796875, 0.48148345947265625, 0.4983978271484375, 0.5153121948242188, 0.5322265625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 3.0, 3.0, 8.0, 7.0, 14.0, 6.0, 16.0, 18.0, 12.0, 15.0, 31.0, 27.0, 27.0, 18.0, 21.0, 33.0, 28.0, 36.0, 36.0, 47.0, 45.0, 35.0, 37.0, 34.0, 38.0, 29.0, 36.0, 38.0, 27.0, 38.0, 25.0, 22.0, 28.0, 25.0, 23.0, 20.0, 14.0, 21.0, 12.0, 11.0, 8.0, 7.0, 3.0, 4.0, 8.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.33984375, -0.3278236389160156, -0.31580352783203125, -0.3037834167480469, -0.2917633056640625, -0.2797431945800781, -0.26772308349609375, -0.2557029724121094, -0.243682861328125, -0.23166275024414062, -0.21964263916015625, -0.20762252807617188, -0.1956024169921875, -0.18358230590820312, -0.17156219482421875, -0.15954208374023438, -0.14752197265625, -0.13550186157226562, -0.12348175048828125, -0.11146163940429688, -0.0994415283203125, -0.08742141723632812, -0.07540130615234375, -0.06338119506835938, -0.051361083984375, -0.039340972900390625, -0.02732086181640625, -0.015300750732421875, -0.0032806396484375, 0.008739471435546875, 0.02075958251953125, 0.032779693603515625, 0.0447998046875, 0.056819915771484375, 0.06884002685546875, 0.08086013793945312, 0.0928802490234375, 0.10490036010742188, 0.11692047119140625, 0.12894058227539062, 0.140960693359375, 0.15298080444335938, 0.16500091552734375, 0.17702102661132812, 0.1890411376953125, 0.20106124877929688, 0.21308135986328125, 0.22510147094726562, 0.23712158203125, 0.24914169311523438, 0.26116180419921875, 0.2731819152832031, 0.2852020263671875, 0.2972221374511719, 0.30924224853515625, 0.3212623596191406, 0.333282470703125, 0.3453025817871094, 0.35732269287109375, 0.3693428039550781, 0.3813629150390625, 0.3933830261230469, 0.40540313720703125, 0.4174232482910156, 0.429443359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 9.0, 10.0, 12.0, 21.0, 18.0, 48.0, 44.0, 97.0, 150.0, 252.0, 489.0, 891.0, 1757.0, 4261.0, 11894.0, 48164.0, 370483.0, 515082.0, 70003.0, 15147.0, 5163.0, 2235.0, 1051.0, 517.0, 264.0, 173.0, 107.0, 71.0, 41.0, 28.0, 23.0, 16.0, 12.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.8056640625, -0.7813262939453125, -0.756988525390625, -0.7326507568359375, -0.70831298828125, -0.6839752197265625, -0.659637451171875, -0.6352996826171875, -0.6109619140625, -0.5866241455078125, -0.562286376953125, -0.5379486083984375, -0.51361083984375, -0.4892730712890625, -0.464935302734375, -0.4405975341796875, -0.416259765625, -0.3919219970703125, -0.367584228515625, -0.3432464599609375, -0.31890869140625, -0.2945709228515625, -0.270233154296875, -0.2458953857421875, -0.2215576171875, -0.1972198486328125, -0.172882080078125, -0.1485443115234375, -0.12420654296875, -0.0998687744140625, -0.075531005859375, -0.0511932373046875, -0.02685546875, -0.0025177001953125, 0.021820068359375, 0.0461578369140625, 0.07049560546875, 0.0948333740234375, 0.119171142578125, 0.1435089111328125, 0.1678466796875, 0.1921844482421875, 0.216522216796875, 0.2408599853515625, 0.26519775390625, 0.2895355224609375, 0.313873291015625, 0.3382110595703125, 0.362548828125, 0.3868865966796875, 0.411224365234375, 0.4355621337890625, 0.45989990234375, 0.4842376708984375, 0.508575439453125, 0.5329132080078125, 0.5572509765625, 0.5815887451171875, 0.605926513671875, 0.6302642822265625, 0.65460205078125, 0.6789398193359375, 0.703277587890625, 0.7276153564453125, 0.751953125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 12.0, 11.0, 17.0, 21.0, 15.0, 25.0, 37.0, 56.0, 70.0, 73.0, 87.0, 98.0, 92.0, 58.0, 76.0, 66.0, 34.0, 34.0, 24.0, 20.0, 6.0, 11.0, 13.0, 11.0, 4.0, 3.0, 9.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013828277587890625, -0.00013374164700508118, -0.0001292005181312561, -0.00012465938925743103, -0.00012011826038360596, -0.00011557713150978088, -0.00011103600263595581, -0.00010649487376213074, -0.00010195374488830566, -9.741261601448059e-05, -9.287148714065552e-05, -8.833035826683044e-05, -8.378922939300537e-05, -7.92481005191803e-05, -7.470697164535522e-05, -7.016584277153015e-05, -6.562471389770508e-05, -6.108358502388e-05, -5.654245615005493e-05, -5.200132727622986e-05, -4.7460198402404785e-05, -4.291906952857971e-05, -3.837794065475464e-05, -3.3836811780929565e-05, -2.9295682907104492e-05, -2.475455403327942e-05, -2.0213425159454346e-05, -1.5672296285629272e-05, -1.11311674118042e-05, -6.590038537979126e-06, -2.0489096641540527e-06, 2.4922192096710205e-06, 7.033348083496094e-06, 1.1574476957321167e-05, 1.611560583114624e-05, 2.0656734704971313e-05, 2.5197863578796387e-05, 2.973899245262146e-05, 3.428012132644653e-05, 3.8821250200271606e-05, 4.336237907409668e-05, 4.790350794792175e-05, 5.2444636821746826e-05, 5.69857656955719e-05, 6.152689456939697e-05, 6.606802344322205e-05, 7.060915231704712e-05, 7.515028119087219e-05, 7.969141006469727e-05, 8.423253893852234e-05, 8.877366781234741e-05, 9.331479668617249e-05, 9.785592555999756e-05, 0.00010239705443382263, 0.0001069381833076477, 0.00011147931218147278, 0.00011602044105529785, 0.00012056156992912292, 0.000125102698802948, 0.00012964382767677307, 0.00013418495655059814, 0.00013872608542442322, 0.0001432672142982483, 0.00014780834317207336, 0.00015234947204589844]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 17.0, 17.0, 25.0, 58.0, 72.0, 95.0, 199.0, 371.0, 748.0, 1715.0, 4688.0, 17579.0, 198331.0, 758646.0, 51742.0, 9051.0, 2855.0, 1164.0, 519.0, 239.0, 156.0, 89.0, 63.0, 29.0, 23.0, 22.0, 12.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.34375, -1.3021087646484375, -1.260467529296875, -1.2188262939453125, -1.17718505859375, -1.1355438232421875, -1.093902587890625, -1.0522613525390625, -1.0106201171875, -0.9689788818359375, -0.927337646484375, -0.8856964111328125, -0.84405517578125, -0.8024139404296875, -0.760772705078125, -0.7191314697265625, -0.677490234375, -0.6358489990234375, -0.594207763671875, -0.5525665283203125, -0.51092529296875, -0.4692840576171875, -0.427642822265625, -0.3860015869140625, -0.3443603515625, -0.3027191162109375, -0.261077880859375, -0.2194366455078125, -0.17779541015625, -0.1361541748046875, -0.094512939453125, -0.0528717041015625, -0.01123046875, 0.0304107666015625, 0.072052001953125, 0.1136932373046875, 0.15533447265625, 0.1969757080078125, 0.238616943359375, 0.2802581787109375, 0.3218994140625, 0.3635406494140625, 0.405181884765625, 0.4468231201171875, 0.48846435546875, 0.5301055908203125, 0.571746826171875, 0.6133880615234375, 0.655029296875, 0.6966705322265625, 0.738311767578125, 0.7799530029296875, 0.82159423828125, 0.8632354736328125, 0.904876708984375, 0.9465179443359375, 0.9881591796875, 1.0298004150390625, 1.071441650390625, 1.1130828857421875, 1.15472412109375, 1.1963653564453125, 1.238006591796875, 1.2796478271484375, 1.3212890625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 8.0, 8.0, 22.0, 46.0, 68.0, 128.0, 209.0, 197.0, 157.0, 64.0, 48.0, 21.0, 10.0, 7.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9951171875, -0.9675827026367188, -0.9400482177734375, -0.9125137329101562, -0.884979248046875, -0.8574447631835938, -0.8299102783203125, -0.8023757934570312, -0.77484130859375, -0.7473068237304688, -0.7197723388671875, -0.6922378540039062, -0.664703369140625, -0.6371688842773438, -0.6096343994140625, -0.5820999145507812, -0.5545654296875, -0.5270309448242188, -0.4994964599609375, -0.47196197509765625, -0.444427490234375, -0.41689300537109375, -0.3893585205078125, -0.36182403564453125, -0.33428955078125, -0.30675506591796875, -0.2792205810546875, -0.25168609619140625, -0.224151611328125, -0.19661712646484375, -0.1690826416015625, -0.14154815673828125, -0.114013671875, -0.08647918701171875, -0.0589447021484375, -0.03141021728515625, -0.003875732421875, 0.02365875244140625, 0.0511932373046875, 0.07872772216796875, 0.10626220703125, 0.13379669189453125, 0.1613311767578125, 0.18886566162109375, 0.216400146484375, 0.24393463134765625, 0.2714691162109375, 0.29900360107421875, 0.3265380859375, 0.35407257080078125, 0.3816070556640625, 0.40914154052734375, 0.436676025390625, 0.46421051025390625, 0.4917449951171875, 0.5192794799804688, 0.54681396484375, 0.5743484497070312, 0.6018829345703125, 0.6294174194335938, 0.656951904296875, 0.6844863891601562, 0.7120208740234375, 0.7395553588867188, 0.76708984375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 9.0, 9.0, 14.0, 19.0, 34.0, 78.0, 100.0, 142.0, 170.0, 168.0, 106.0, 67.0, 34.0, 19.0, 16.0, 10.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.451545715332031, -8.247920989990234, -8.044296264648438, -7.840670585632324, -7.637045860290527, -7.4334211349487305, -7.229795932769775, -7.02617073059082, -6.822546005249023, -6.618921279907227, -6.4152960777282715, -6.211670875549316, -6.0080461502075195, -5.804421424865723, -5.600796222686768, -5.3971710205078125, -5.193546295166016, -4.989921569824219, -4.786296367645264, -4.582671165466309, -4.379046440124512, -4.175421714782715, -3.9717965126037598, -3.768171548843384, -3.564546585083008, -3.360921621322632, -3.157296657562256, -2.95367169380188, -2.750046730041504, -2.546421766281128, -2.342796802520752, -2.139171838760376, -1.9355473518371582, -1.7319223880767822, -1.5282974243164062, -1.3246724605560303, -1.1210474967956543, -0.9174225330352783, -0.7137975692749023, -0.5101726055145264, -0.3065476417541504, -0.10292267799377441, 0.10070228576660156, 0.30432724952697754, 0.5079522132873535, 0.7115771770477295, 0.9152021408081055, 1.1188271045684814, 1.3224520683288574, 1.5260770320892334, 1.7297019958496094, 1.9333269596099854, 2.1369519233703613, 2.3405768871307373, 2.5442018508911133, 2.7478268146514893, 2.9514517784118652, 3.155076742172241, 3.358701705932617, 3.562326669692993, 3.765951633453369, 3.969576597213745, 4.173201560974121, 4.376826286315918, 4.580451488494873]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 2.0, 9.0, 11.0, 14.0, 26.0, 26.0, 34.0, 59.0, 53.0, 62.0, 93.0, 72.0, 80.0, 78.0, 82.0, 67.0, 56.0, 48.0, 36.0, 25.0, 29.0, 12.0, 10.0, 11.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8772807121276855, -5.716360569000244, -5.555440902709961, -5.3945207595825195, -5.233600616455078, -5.072680473327637, -4.911760330200195, -4.750840663909912, -4.589920520782471, -4.429000377655029, -4.268080711364746, -4.107160568237305, -3.9462404251098633, -3.785320281982422, -3.6244003772735596, -3.4634804725646973, -3.302560329437256, -3.1416401863098145, -2.980720281600952, -2.81980037689209, -2.6588802337646484, -2.497960090637207, -2.3370401859283447, -2.1761202812194824, -2.015200138092041, -1.8542801141738892, -1.6933600902557373, -1.5324400663375854, -1.3715200424194336, -1.2106000185012817, -1.0496799945831299, -0.888759970664978, -0.7278404235839844, -0.5669203996658325, -0.40600037574768066, -0.2450803518295288, -0.08416032791137695, 0.0767596960067749, 0.23767971992492676, 0.3985997438430786, 0.5595197677612305, 0.7204397916793823, 0.8813598155975342, 1.042279839515686, 1.203199863433838, 1.3641198873519897, 1.5250399112701416, 1.6859599351882935, 1.8468799591064453, 2.0078001022338867, 2.168720006942749, 2.3296399116516113, 2.4905600547790527, 2.651480197906494, 2.8124001026153564, 2.9733200073242188, 3.13424015045166, 3.2951602935791016, 3.456080198287964, 3.617000102996826, 3.7779202461242676, 3.938840389251709, 4.099760055541992, 4.260680198669434, 4.421600341796875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 9.0, 12.0, 24.0, 32.0, 63.0, 77.0, 153.0, 273.0, 668.0, 2103.0, 11260.0, 494782.0, 3659904.0, 20650.0, 2920.0, 769.0, 292.0, 125.0, 60.0, 46.0, 17.0, 11.0, 2.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.392578125, -3.3156890869140625, -3.238800048828125, -3.1619110107421875, -3.08502197265625, -3.0081329345703125, -2.931243896484375, -2.8543548583984375, -2.7774658203125, -2.7005767822265625, -2.623687744140625, -2.5467987060546875, -2.46990966796875, -2.3930206298828125, -2.316131591796875, -2.2392425537109375, -2.162353515625, -2.0854644775390625, -2.008575439453125, -1.9316864013671875, -1.85479736328125, -1.7779083251953125, -1.701019287109375, -1.6241302490234375, -1.5472412109375, -1.4703521728515625, -1.393463134765625, -1.3165740966796875, -1.23968505859375, -1.1627960205078125, -1.085906982421875, -1.0090179443359375, -0.93212890625, -0.8552398681640625, -0.778350830078125, -0.7014617919921875, -0.62457275390625, -0.5476837158203125, -0.470794677734375, -0.3939056396484375, -0.3170166015625, -0.2401275634765625, -0.163238525390625, -0.0863494873046875, -0.00946044921875, 0.0674285888671875, 0.144317626953125, 0.2212066650390625, 0.298095703125, 0.3749847412109375, 0.451873779296875, 0.5287628173828125, 0.60565185546875, 0.6825408935546875, 0.759429931640625, 0.8363189697265625, 0.9132080078125, 0.9900970458984375, 1.066986083984375, 1.1438751220703125, 1.22076416015625, 1.2976531982421875, 1.374542236328125, 1.4514312744140625, 1.5283203125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 13.0, 13.0, 29.0, 37.0, 46.0, 63.0, 72.0, 90.0, 111.0, 102.0, 95.0, 90.0, 98.0, 44.0, 37.0, 17.0, 17.0, 8.0, 6.0, 2.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.27099609375, -0.2652320861816406, -0.25946807861328125, -0.2537040710449219, -0.2479400634765625, -0.24217605590820312, -0.23641204833984375, -0.23064804077148438, -0.224884033203125, -0.21912002563476562, -0.21335601806640625, -0.20759201049804688, -0.2018280029296875, -0.19606399536132812, -0.19029998779296875, -0.18453598022460938, -0.17877197265625, -0.17300796508789062, -0.16724395751953125, -0.16147994995117188, -0.1557159423828125, -0.14995193481445312, -0.14418792724609375, -0.13842391967773438, -0.132659912109375, -0.12689590454101562, -0.12113189697265625, -0.11536788940429688, -0.1096038818359375, -0.10383987426757812, -0.09807586669921875, -0.09231185913085938, -0.0865478515625, -0.08078384399414062, -0.07501983642578125, -0.06925582885742188, -0.0634918212890625, -0.057727813720703125, -0.05196380615234375, -0.046199798583984375, -0.040435791015625, -0.034671783447265625, -0.02890777587890625, -0.023143768310546875, -0.0173797607421875, -0.011615753173828125, -0.00585174560546875, -8.7738037109375e-05, 0.00567626953125, 0.011440277099609375, 0.01720428466796875, 0.022968292236328125, 0.0287322998046875, 0.034496307373046875, 0.04026031494140625, 0.046024322509765625, 0.051788330078125, 0.057552337646484375, 0.06331634521484375, 0.06908035278320312, 0.0748443603515625, 0.08060836791992188, 0.08637237548828125, 0.09213638305664062, 0.097900390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 13.0, 8.0, 9.0, 13.0, 22.0, 31.0, 20.0, 26.0, 41.0, 66.0, 55.0, 94.0, 256.0, 879.0, 3947.0, 35635.0, 3859687.0, 280671.0, 10290.0, 1678.0, 448.0, 155.0, 64.0, 32.0, 39.0, 23.0, 22.0, 13.0, 13.0, 10.0, 11.0, 6.0, 5.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-3.845703125, -3.7513427734375, -3.656982421875, -3.5626220703125, -3.46826171875, -3.3739013671875, -3.279541015625, -3.1851806640625, -3.0908203125, -2.9964599609375, -2.902099609375, -2.8077392578125, -2.71337890625, -2.6190185546875, -2.524658203125, -2.4302978515625, -2.3359375, -2.2415771484375, -2.147216796875, -2.0528564453125, -1.95849609375, -1.8641357421875, -1.769775390625, -1.6754150390625, -1.5810546875, -1.4866943359375, -1.392333984375, -1.2979736328125, -1.20361328125, -1.1092529296875, -1.014892578125, -0.9205322265625, -0.826171875, -0.7318115234375, -0.637451171875, -0.5430908203125, -0.44873046875, -0.3543701171875, -0.260009765625, -0.1656494140625, -0.0712890625, 0.0230712890625, 0.117431640625, 0.2117919921875, 0.30615234375, 0.4005126953125, 0.494873046875, 0.5892333984375, 0.68359375, 0.7779541015625, 0.872314453125, 0.9666748046875, 1.06103515625, 1.1553955078125, 1.249755859375, 1.3441162109375, 1.4384765625, 1.5328369140625, 1.627197265625, 1.7215576171875, 1.81591796875, 1.9102783203125, 2.004638671875, 2.0989990234375, 2.193359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 7.0, 7.0, 6.0, 22.0, 41.0, 78.0, 215.0, 807.0, 2188.0, 443.0, 144.0, 52.0, 30.0, 20.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.0654296875, -1.0438270568847656, -1.0222244262695312, -1.0006217956542969, -0.9790191650390625, -0.9574165344238281, -0.9358139038085938, -0.9142112731933594, -0.892608642578125, -0.8710060119628906, -0.8494033813476562, -0.8278007507324219, -0.8061981201171875, -0.7845954895019531, -0.7629928588867188, -0.7413902282714844, -0.71978759765625, -0.6981849670410156, -0.6765823364257812, -0.6549797058105469, -0.6333770751953125, -0.6117744445800781, -0.5901718139648438, -0.5685691833496094, -0.546966552734375, -0.5253639221191406, -0.5037612915039062, -0.4821586608886719, -0.4605560302734375, -0.4389533996582031, -0.41735076904296875, -0.3957481384277344, -0.3741455078125, -0.3525428771972656, -0.33094024658203125, -0.3093376159667969, -0.2877349853515625, -0.2661323547363281, -0.24452972412109375, -0.22292709350585938, -0.201324462890625, -0.17972183227539062, -0.15811920166015625, -0.13651657104492188, -0.1149139404296875, -0.09331130981445312, -0.07170867919921875, -0.050106048583984375, -0.02850341796875, -0.006900787353515625, 0.01470184326171875, 0.036304473876953125, 0.0579071044921875, 0.07950973510742188, 0.10111236572265625, 0.12271499633789062, 0.144317626953125, 0.16592025756835938, 0.18752288818359375, 0.20912551879882812, 0.2307281494140625, 0.2523307800292969, 0.27393341064453125, 0.2955360412597656, 0.317138671875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 9.0, 32.0, 109.0, 262.0, 373.0, 164.0, 37.0, 12.0, 3.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8736884593963623, -3.672372817993164, -3.4710569381713867, -3.2697412967681885, -3.0684256553649902, -2.867109775543213, -2.6657941341400146, -2.4644784927368164, -2.263162612915039, -2.061846971511841, -1.8605310916900635, -1.6592154502868652, -1.4578996896743774, -1.2565839290618896, -1.0552682876586914, -0.8539525270462036, -0.6526367664337158, -0.4513210356235504, -0.250005304813385, -0.04868960380554199, 0.1526261568069458, 0.3539419174194336, 0.5552575588226318, 0.7565733194351196, 0.9578890800476074, 1.1592048406600952, 1.360520601272583, 1.5618362426757812, 1.763152003288269, 1.9644677639007568, 2.165783405303955, 2.3670992851257324, 2.5684146881103516, 2.76973032951355, 2.971046209335327, 3.1723618507385254, 3.3736777305603027, 3.574993371963501, 3.776309013366699, 3.9776248931884766, 4.178940773010254, 4.380256652832031, 4.58157205581665, 4.782887935638428, 4.984203815460205, 5.185519218444824, 5.386835098266602, 5.588150978088379, 5.789466381072998, 5.990782260894775, 6.1920976638793945, 6.393413543701172, 6.594729423522949, 6.796045303344727, 6.997360706329346, 7.198676586151123, 7.399991989135742, 7.6013078689575195, 7.802623271942139, 8.003938674926758, 8.205254554748535, 8.406570434570312, 8.60788631439209, 8.809202194213867, 9.010518074035645]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 5.0, 18.0, 28.0, 44.0, 57.0, 75.0, 84.0, 98.0, 95.0, 105.0, 79.0, 90.0, 66.0, 56.0, 30.0, 30.0, 12.0, 15.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.057626485824585, -1.9663258790969849, -1.8750253915786743, -1.7837247848510742, -1.6924242973327637, -1.6011236906051636, -1.5098230838775635, -1.418522596359253, -1.3272219896316528, -1.2359213829040527, -1.1446208953857422, -1.053320288658142, -0.9620197415351868, -0.8707191944122314, -0.7794185876846313, -0.688118040561676, -0.5968174934387207, -0.5055169463157654, -0.41421636939048767, -0.32291579246520996, -0.23161524534225464, -0.14031469821929932, -0.04901409149169922, 0.042286455631256104, 0.13358700275421143, 0.22488756477832794, 0.31618812680244446, 0.40748870372772217, 0.4987892508506775, 0.5900897979736328, 0.6813904047012329, 0.7726909518241882, 0.8639912605285645, 0.9552918076515198, 1.046592354774475, 1.1378929615020752, 1.2291934490203857, 1.3204940557479858, 1.411794662475586, 1.5030951499938965, 1.5943957567214966, 1.6856963634490967, 1.7769968509674072, 1.8682974576950073, 1.9595980644226074, 2.050898551940918, 2.1421990394592285, 2.233499765396118, 2.3248002529144287, 2.4161007404327393, 2.507401466369629, 2.5987019538879395, 2.69000244140625, 2.7813029289245605, 2.87260365486145, 2.9639041423797607, 3.0552048683166504, 3.146505355834961, 3.2378060817718506, 3.329106569290161, 3.4204070568084717, 3.5117077827453613, 3.603008270263672, 3.6943087577819824, 3.785609245300293]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 4.0, 3.0, 7.0, 5.0, 10.0, 16.0, 15.0, 9.0, 19.0, 23.0, 34.0, 49.0, 84.0, 178.0, 303.0, 765.0, 2218.0, 6892.0, 24699.0, 97450.0, 329589.0, 397665.0, 139297.0, 34951.0, 9371.0, 2999.0, 997.0, 386.0, 192.0, 96.0, 54.0, 33.0, 27.0, 13.0, 16.0, 15.0, 17.0, 15.0, 9.0, 9.0, 7.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.814453125, -0.7874221801757812, -0.7603912353515625, -0.7333602905273438, -0.706329345703125, -0.6792984008789062, -0.6522674560546875, -0.6252365112304688, -0.59820556640625, -0.5711746215820312, -0.5441436767578125, -0.5171127319335938, -0.490081787109375, -0.46305084228515625, -0.4360198974609375, -0.40898895263671875, -0.3819580078125, -0.35492706298828125, -0.3278961181640625, -0.30086517333984375, -0.273834228515625, -0.24680328369140625, -0.2197723388671875, -0.19274139404296875, -0.16571044921875, -0.13867950439453125, -0.1116485595703125, -0.08461761474609375, -0.057586669921875, -0.03055572509765625, -0.0035247802734375, 0.02350616455078125, 0.050537109375, 0.07756805419921875, 0.1045989990234375, 0.13162994384765625, 0.158660888671875, 0.18569183349609375, 0.2127227783203125, 0.23975372314453125, 0.26678466796875, 0.29381561279296875, 0.3208465576171875, 0.34787750244140625, 0.374908447265625, 0.40193939208984375, 0.4289703369140625, 0.45600128173828125, 0.4830322265625, 0.5100631713867188, 0.5370941162109375, 0.5641250610351562, 0.591156005859375, 0.6181869506835938, 0.6452178955078125, 0.6722488403320312, 0.69927978515625, 0.7263107299804688, 0.7533416748046875, 0.7803726196289062, 0.807403564453125, 0.8344345092773438, 0.8614654541015625, 0.8884963989257812, 0.91552734375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 9.0, 8.0, 15.0, 7.0, 19.0, 26.0, 26.0, 41.0, 46.0, 55.0, 40.0, 76.0, 72.0, 65.0, 71.0, 59.0, 84.0, 65.0, 48.0, 48.0, 34.0, 27.0, 14.0, 14.0, 11.0, 11.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1962890625, -0.19159317016601562, -0.18689727783203125, -0.18220138549804688, -0.1775054931640625, -0.17280960083007812, -0.16811370849609375, -0.16341781616210938, -0.158721923828125, -0.15402603149414062, -0.14933013916015625, -0.14463424682617188, -0.1399383544921875, -0.13524246215820312, -0.13054656982421875, -0.12585067749023438, -0.12115478515625, -0.11645889282226562, -0.11176300048828125, -0.10706710815429688, -0.1023712158203125, -0.09767532348632812, -0.09297943115234375, -0.08828353881835938, -0.083587646484375, -0.07889175415039062, -0.07419586181640625, -0.06949996948242188, -0.0648040771484375, -0.060108184814453125, -0.05541229248046875, -0.050716400146484375, -0.0460205078125, -0.041324615478515625, -0.03662872314453125, -0.031932830810546875, -0.0272369384765625, -0.022541046142578125, -0.01784515380859375, -0.013149261474609375, -0.008453369140625, -0.003757476806640625, 0.00093841552734375, 0.005634307861328125, 0.0103302001953125, 0.015026092529296875, 0.01972198486328125, 0.024417877197265625, 0.02911376953125, 0.033809661865234375, 0.03850555419921875, 0.043201446533203125, 0.0478973388671875, 0.052593231201171875, 0.05728912353515625, 0.061985015869140625, 0.066680908203125, 0.07137680053710938, 0.07607269287109375, 0.08076858520507812, 0.0854644775390625, 0.09016036987304688, 0.09485626220703125, 0.09955215454101562, 0.104248046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 6.0, 8.0, 10.0, 17.0, 17.0, 28.0, 48.0, 44.0, 75.0, 112.0, 137.0, 231.0, 321.0, 487.0, 830.0, 1423.0, 2681.0, 5701.0, 13929.0, 38349.0, 110500.0, 288275.0, 344242.0, 154373.0, 52575.0, 18882.0, 7351.0, 3410.0, 1714.0, 965.0, 620.0, 354.0, 272.0, 173.0, 99.0, 103.0, 62.0, 40.0, 24.0, 19.0, 11.0, 9.0, 4.0, 2.0, 9.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.646484375, -0.6250457763671875, -0.603607177734375, -0.5821685791015625, -0.56072998046875, -0.5392913818359375, -0.517852783203125, -0.4964141845703125, -0.4749755859375, -0.4535369873046875, -0.432098388671875, -0.4106597900390625, -0.38922119140625, -0.3677825927734375, -0.346343994140625, -0.3249053955078125, -0.303466796875, -0.2820281982421875, -0.260589599609375, -0.2391510009765625, -0.21771240234375, -0.1962738037109375, -0.174835205078125, -0.1533966064453125, -0.1319580078125, -0.1105194091796875, -0.089080810546875, -0.0676422119140625, -0.04620361328125, -0.0247650146484375, -0.003326416015625, 0.0181121826171875, 0.03955078125, 0.0609893798828125, 0.082427978515625, 0.1038665771484375, 0.12530517578125, 0.1467437744140625, 0.168182373046875, 0.1896209716796875, 0.2110595703125, 0.2324981689453125, 0.253936767578125, 0.2753753662109375, 0.29681396484375, 0.3182525634765625, 0.339691162109375, 0.3611297607421875, 0.382568359375, 0.4040069580078125, 0.425445556640625, 0.4468841552734375, 0.46832275390625, 0.4897613525390625, 0.511199951171875, 0.5326385498046875, 0.5540771484375, 0.5755157470703125, 0.596954345703125, 0.6183929443359375, 0.63983154296875, 0.6612701416015625, 0.682708740234375, 0.7041473388671875, 0.7255859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 9.0, 3.0, 4.0, 8.0, 10.0, 6.0, 9.0, 13.0, 12.0, 12.0, 20.0, 18.0, 19.0, 28.0, 27.0, 29.0, 29.0, 53.0, 34.0, 45.0, 34.0, 54.0, 58.0, 35.0, 50.0, 39.0, 41.0, 30.0, 30.0, 42.0, 22.0, 21.0, 24.0, 26.0, 21.0, 15.0, 14.0, 18.0, 14.0, 9.0, 5.0, 7.0, 7.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.51513671875, -0.49600982666015625, -0.4768829345703125, -0.45775604248046875, -0.438629150390625, -0.41950225830078125, -0.4003753662109375, -0.38124847412109375, -0.36212158203125, -0.34299468994140625, -0.3238677978515625, -0.30474090576171875, -0.285614013671875, -0.26648712158203125, -0.2473602294921875, -0.22823333740234375, -0.2091064453125, -0.18997955322265625, -0.1708526611328125, -0.15172576904296875, -0.132598876953125, -0.11347198486328125, -0.0943450927734375, -0.07521820068359375, -0.05609130859375, -0.03696441650390625, -0.0178375244140625, 0.00128936767578125, 0.020416259765625, 0.03954315185546875, 0.0586700439453125, 0.07779693603515625, 0.096923828125, 0.11605072021484375, 0.1351776123046875, 0.15430450439453125, 0.173431396484375, 0.19255828857421875, 0.2116851806640625, 0.23081207275390625, 0.24993896484375, 0.26906585693359375, 0.2881927490234375, 0.30731964111328125, 0.326446533203125, 0.34557342529296875, 0.3647003173828125, 0.38382720947265625, 0.4029541015625, 0.42208099365234375, 0.4412078857421875, 0.46033477783203125, 0.479461669921875, 0.49858856201171875, 0.5177154541015625, 0.5368423461914062, 0.55596923828125, 0.5750961303710938, 0.5942230224609375, 0.6133499145507812, 0.632476806640625, 0.6516036987304688, 0.6707305908203125, 0.6898574829101562, 0.708984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 9.0, 11.0, 16.0, 23.0, 38.0, 49.0, 82.0, 136.0, 249.0, 506.0, 863.0, 1794.0, 4164.0, 10624.0, 31791.0, 126179.0, 515833.0, 270101.0, 57351.0, 17328.0, 6198.0, 2575.0, 1144.0, 638.0, 321.0, 192.0, 116.0, 77.0, 55.0, 29.0, 25.0, 15.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58203125, -0.5624542236328125, -0.542877197265625, -0.5233001708984375, -0.50372314453125, -0.4841461181640625, -0.464569091796875, -0.4449920654296875, -0.4254150390625, -0.4058380126953125, -0.386260986328125, -0.3666839599609375, -0.34710693359375, -0.3275299072265625, -0.307952880859375, -0.2883758544921875, -0.268798828125, -0.2492218017578125, -0.229644775390625, -0.2100677490234375, -0.19049072265625, -0.1709136962890625, -0.151336669921875, -0.1317596435546875, -0.1121826171875, -0.0926055908203125, -0.073028564453125, -0.0534515380859375, -0.03387451171875, -0.0142974853515625, 0.005279541015625, 0.0248565673828125, 0.04443359375, 0.0640106201171875, 0.083587646484375, 0.1031646728515625, 0.12274169921875, 0.1423187255859375, 0.161895751953125, 0.1814727783203125, 0.2010498046875, 0.2206268310546875, 0.240203857421875, 0.2597808837890625, 0.27935791015625, 0.2989349365234375, 0.318511962890625, 0.3380889892578125, 0.357666015625, 0.3772430419921875, 0.396820068359375, 0.4163970947265625, 0.43597412109375, 0.4555511474609375, 0.475128173828125, 0.4947052001953125, 0.5142822265625, 0.5338592529296875, 0.553436279296875, 0.5730133056640625, 0.59259033203125, 0.6121673583984375, 0.631744384765625, 0.6513214111328125, 0.6708984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 12.0, 5.0, 14.0, 14.0, 23.0, 24.0, 21.0, 24.0, 45.0, 38.0, 45.0, 51.0, 60.0, 85.0, 69.0, 60.0, 57.0, 60.0, 45.0, 38.0, 28.0, 26.0, 30.0, 33.0, 25.0, 16.0, 8.0, 10.0, 2.0, 9.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.165836334228516e-05, -7.87610188126564e-05, -7.586367428302765e-05, -7.29663297533989e-05, -7.006898522377014e-05, -6.717164069414139e-05, -6.427429616451263e-05, -6.137695163488388e-05, -5.847960710525513e-05, -5.558226257562637e-05, -5.268491804599762e-05, -4.9787573516368866e-05, -4.689022898674011e-05, -4.399288445711136e-05, -4.1095539927482605e-05, -3.819819539785385e-05, -3.53008508682251e-05, -3.2403506338596344e-05, -2.950616180896759e-05, -2.6608817279338837e-05, -2.3711472749710083e-05, -2.081412822008133e-05, -1.7916783690452576e-05, -1.5019439160823822e-05, -1.2122094631195068e-05, -9.224750101566315e-06, -6.327405571937561e-06, -3.4300610423088074e-06, -5.327165126800537e-07, 2.3646280169487e-06, 5.261972546577454e-06, 8.159317076206207e-06, 1.1056661605834961e-05, 1.3954006135463715e-05, 1.6851350665092468e-05, 1.9748695194721222e-05, 2.2646039724349976e-05, 2.554338425397873e-05, 2.8440728783607483e-05, 3.1338073313236237e-05, 3.423541784286499e-05, 3.7132762372493744e-05, 4.00301069021225e-05, 4.292745143175125e-05, 4.5824795961380005e-05, 4.872214049100876e-05, 5.161948502063751e-05, 5.4516829550266266e-05, 5.741417407989502e-05, 6.031151860952377e-05, 6.320886313915253e-05, 6.610620766878128e-05, 6.900355219841003e-05, 7.190089672803879e-05, 7.479824125766754e-05, 7.76955857872963e-05, 8.059293031692505e-05, 8.34902748465538e-05, 8.638761937618256e-05, 8.928496390581131e-05, 9.218230843544006e-05, 9.507965296506882e-05, 9.797699749469757e-05, 0.00010087434202432632, 0.00010377168655395508]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 6.0, 6.0, 8.0, 22.0, 25.0, 45.0, 45.0, 94.0, 147.0, 256.0, 394.0, 698.0, 1467.0, 3263.0, 8685.0, 27823.0, 125386.0, 571204.0, 242561.0, 44914.0, 12832.0, 4551.0, 1948.0, 918.0, 513.0, 274.0, 146.0, 110.0, 66.0, 49.0, 28.0, 22.0, 23.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.74609375, -0.724578857421875, -0.70306396484375, -0.681549072265625, -0.6600341796875, -0.638519287109375, -0.61700439453125, -0.595489501953125, -0.573974609375, -0.552459716796875, -0.53094482421875, -0.509429931640625, -0.4879150390625, -0.466400146484375, -0.44488525390625, -0.423370361328125, -0.40185546875, -0.380340576171875, -0.35882568359375, -0.337310791015625, -0.3157958984375, -0.294281005859375, -0.27276611328125, -0.251251220703125, -0.229736328125, -0.208221435546875, -0.18670654296875, -0.165191650390625, -0.1436767578125, -0.122161865234375, -0.10064697265625, -0.079132080078125, -0.0576171875, -0.036102294921875, -0.01458740234375, 0.006927490234375, 0.0284423828125, 0.049957275390625, 0.07147216796875, 0.092987060546875, 0.114501953125, 0.136016845703125, 0.15753173828125, 0.179046630859375, 0.2005615234375, 0.222076416015625, 0.24359130859375, 0.265106201171875, 0.28662109375, 0.308135986328125, 0.32965087890625, 0.351165771484375, 0.3726806640625, 0.394195556640625, 0.41571044921875, 0.437225341796875, 0.458740234375, 0.480255126953125, 0.50177001953125, 0.523284912109375, 0.5447998046875, 0.566314697265625, 0.58782958984375, 0.609344482421875, 0.630859375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 13.0, 9.0, 16.0, 11.0, 15.0, 28.0, 38.0, 61.0, 63.0, 100.0, 114.0, 127.0, 105.0, 82.0, 47.0, 50.0, 21.0, 20.0, 16.0, 15.0, 10.0, 5.0, 7.0, 6.0, 4.0, 1.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48779296875, -0.4705810546875, -0.453369140625, -0.4361572265625, -0.4189453125, -0.4017333984375, -0.384521484375, -0.3673095703125, -0.35009765625, -0.3328857421875, -0.315673828125, -0.2984619140625, -0.28125, -0.2640380859375, -0.246826171875, -0.2296142578125, -0.21240234375, -0.1951904296875, -0.177978515625, -0.1607666015625, -0.1435546875, -0.1263427734375, -0.109130859375, -0.0919189453125, -0.07470703125, -0.0574951171875, -0.040283203125, -0.0230712890625, -0.005859375, 0.0113525390625, 0.028564453125, 0.0457763671875, 0.06298828125, 0.0802001953125, 0.097412109375, 0.1146240234375, 0.1318359375, 0.1490478515625, 0.166259765625, 0.1834716796875, 0.20068359375, 0.2178955078125, 0.235107421875, 0.2523193359375, 0.26953125, 0.2867431640625, 0.303955078125, 0.3211669921875, 0.33837890625, 0.3555908203125, 0.372802734375, 0.3900146484375, 0.4072265625, 0.4244384765625, 0.441650390625, 0.4588623046875, 0.47607421875, 0.4932861328125, 0.510498046875, 0.5277099609375, 0.544921875, 0.5621337890625, 0.579345703125, 0.5965576171875, 0.61376953125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 6.0, 10.0, 6.0, 14.0, 22.0, 31.0, 49.0, 84.0, 100.0, 112.0, 132.0, 125.0, 116.0, 57.0, 45.0, 29.0, 22.0, 16.0, 10.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.677496433258057, -5.491958141326904, -5.306419849395752, -5.1208815574646, -4.935343265533447, -4.749804973602295, -4.564266204833984, -4.378727912902832, -4.19318962097168, -4.007651329040527, -3.822113037109375, -3.6365747451782227, -3.4510364532470703, -3.265498161315918, -3.0799596309661865, -2.894421339035034, -2.708883285522461, -2.5233449935913086, -2.3378067016601562, -2.152268409729004, -1.966729998588562, -1.7811917066574097, -1.5956532955169678, -1.4101150035858154, -1.224576711654663, -1.0390384197235107, -0.8535000681877136, -0.6679617166519165, -0.48242342472076416, -0.2968851327896118, -0.11134672164916992, 0.07419157028198242, 0.25973033905029297, 0.4452686607837677, 0.6308069825172424, 0.8163453340530396, 1.001883625984192, 1.1874219179153442, 1.3729603290557861, 1.5584986209869385, 1.7440369129180908, 1.9295752048492432, 2.1151134967803955, 2.300652027130127, 2.4861903190612793, 2.6717286109924316, 2.857266902923584, 3.0428051948547363, 3.2283434867858887, 3.413881778717041, 3.5994200706481934, 3.7849583625793457, 3.970496654510498, 4.15603494644165, 4.341573715209961, 4.527112007141113, 4.712650299072266, 4.898188591003418, 5.08372688293457, 5.269265174865723, 5.454803466796875, 5.640341758728027, 5.82588005065918, 6.011418342590332, 6.196956634521484]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 11.0, 9.0, 7.0, 11.0, 16.0, 10.0, 15.0, 31.0, 37.0, 41.0, 37.0, 54.0, 48.0, 67.0, 88.0, 62.0, 76.0, 54.0, 58.0, 43.0, 46.0, 35.0, 25.0, 25.0, 16.0, 17.0, 11.0, 14.0, 8.0, 7.0, 7.0, 1.0, 1.0, 1.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.148832321166992, -4.973106384277344, -4.797380447387695, -4.621654033660889, -4.44592809677124, -4.270202159881592, -4.094476222991943, -3.918750047683716, -3.7430238723754883, -3.56729793548584, -3.3915717601776123, -3.215845823287964, -3.0401196479797363, -2.864393711090088, -2.6886677742004395, -2.512941598892212, -2.3372156620025635, -2.161489725112915, -1.9857635498046875, -1.810037612915039, -1.6343114376068115, -1.458585500717163, -1.282859444618225, -1.107133388519287, -0.9314073324203491, -0.7556812763214111, -0.5799552202224731, -0.40422922372817993, -0.22850316762924194, -0.052777111530303955, 0.12294888496398926, 0.29867494106292725, 0.47440099716186523, 0.6501270532608032, 0.8258531093597412, 1.0015790462493896, 1.1773052215576172, 1.3530311584472656, 1.5287572145462036, 1.7044832706451416, 1.8802093267440796, 2.0559353828430176, 2.231661319732666, 2.4073874950408936, 2.583113431930542, 2.7588396072387695, 2.934565544128418, 3.1102914810180664, 3.286017656326294, 3.4617435932159424, 3.63746976852417, 3.8131957054138184, 3.988921880722046, 4.164648056030273, 4.340373992919922, 4.51609992980957, 4.691825866699219, 4.867551803588867, 5.043277740478516, 5.219004154205322, 5.394730091094971, 5.570456027984619, 5.746181964874268, 5.921908378601074, 6.097634315490723]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 8.0, 6.0, 7.0, 5.0, 9.0, 8.0, 13.0, 17.0, 19.0, 37.0, 64.0, 111.0, 220.0, 494.0, 1171.0, 3040.0, 9535.0, 41134.0, 391703.0, 3526187.0, 182206.0, 26649.0, 7178.0, 2413.0, 1041.0, 476.0, 239.0, 129.0, 59.0, 46.0, 21.0, 12.0, 9.0, 5.0, 1.0, 3.0, 2.0], "bins": [-1.6328125, -1.59759521484375, -1.5623779296875, -1.52716064453125, -1.491943359375, -1.45672607421875, -1.4215087890625, -1.38629150390625, -1.35107421875, -1.31585693359375, -1.2806396484375, -1.24542236328125, -1.210205078125, -1.17498779296875, -1.1397705078125, -1.10455322265625, -1.0693359375, -1.03411865234375, -0.9989013671875, -0.96368408203125, -0.928466796875, -0.89324951171875, -0.8580322265625, -0.82281494140625, -0.78759765625, -0.75238037109375, -0.7171630859375, -0.68194580078125, -0.646728515625, -0.61151123046875, -0.5762939453125, -0.54107666015625, -0.505859375, -0.47064208984375, -0.4354248046875, -0.40020751953125, -0.364990234375, -0.32977294921875, -0.2945556640625, -0.25933837890625, -0.22412109375, -0.18890380859375, -0.1536865234375, -0.11846923828125, -0.083251953125, -0.04803466796875, -0.0128173828125, 0.02239990234375, 0.0576171875, 0.09283447265625, 0.1280517578125, 0.16326904296875, 0.198486328125, 0.23370361328125, 0.2689208984375, 0.30413818359375, 0.33935546875, 0.37457275390625, 0.4097900390625, 0.44500732421875, 0.480224609375, 0.51544189453125, 0.5506591796875, 0.58587646484375, 0.62109375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 15.0, 26.0, 26.0, 35.0, 49.0, 54.0, 63.0, 72.0, 63.0, 75.0, 59.0, 74.0, 64.0, 83.0, 66.0, 43.0, 33.0, 23.0, 22.0, 16.0, 9.0, 3.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.202392578125, -0.19707870483398438, -0.19176483154296875, -0.18645095825195312, -0.1811370849609375, -0.17582321166992188, -0.17050933837890625, -0.16519546508789062, -0.159881591796875, -0.15456771850585938, -0.14925384521484375, -0.14393997192382812, -0.1386260986328125, -0.13331222534179688, -0.12799835205078125, -0.12268447875976562, -0.11737060546875, -0.11205673217773438, -0.10674285888671875, -0.10142898559570312, -0.0961151123046875, -0.09080123901367188, -0.08548736572265625, -0.08017349243164062, -0.074859619140625, -0.06954574584960938, -0.06423187255859375, -0.058917999267578125, -0.0536041259765625, -0.048290252685546875, -0.04297637939453125, -0.037662506103515625, -0.0323486328125, -0.027034759521484375, -0.02172088623046875, -0.016407012939453125, -0.0110931396484375, -0.005779266357421875, -0.00046539306640625, 0.004848480224609375, 0.010162353515625, 0.015476226806640625, 0.02079010009765625, 0.026103973388671875, 0.0314178466796875, 0.036731719970703125, 0.04204559326171875, 0.047359466552734375, 0.05267333984375, 0.057987213134765625, 0.06330108642578125, 0.06861495971679688, 0.0739288330078125, 0.07924270629882812, 0.08455657958984375, 0.08987045288085938, 0.095184326171875, 0.10049819946289062, 0.10581207275390625, 0.11112594604492188, 0.1164398193359375, 0.12175369262695312, 0.12706756591796875, 0.13238143920898438, 0.1376953125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 19.0, 30.0, 54.0, 86.0, 182.0, 481.0, 2355.0, 21856.0, 2947219.0, 1204239.0, 15266.0, 1674.0, 428.0, 171.0, 93.0, 56.0, 29.0, 20.0, 9.0, 8.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.013702392578125, -1.92193603515625, -1.830169677734375, -1.7384033203125, -1.646636962890625, -1.55487060546875, -1.463104248046875, -1.371337890625, -1.279571533203125, -1.18780517578125, -1.096038818359375, -1.0042724609375, -0.912506103515625, -0.82073974609375, -0.728973388671875, -0.63720703125, -0.545440673828125, -0.45367431640625, -0.361907958984375, -0.2701416015625, -0.178375244140625, -0.08660888671875, 0.005157470703125, 0.096923828125, 0.188690185546875, 0.28045654296875, 0.372222900390625, 0.4639892578125, 0.555755615234375, 0.64752197265625, 0.739288330078125, 0.8310546875, 0.922821044921875, 1.01458740234375, 1.106353759765625, 1.1981201171875, 1.289886474609375, 1.38165283203125, 1.473419189453125, 1.565185546875, 1.656951904296875, 1.74871826171875, 1.840484619140625, 1.9322509765625, 2.024017333984375, 2.11578369140625, 2.207550048828125, 2.29931640625, 2.391082763671875, 2.48284912109375, 2.574615478515625, 2.6663818359375, 2.758148193359375, 2.84991455078125, 2.941680908203125, 3.033447265625, 3.125213623046875, 3.21697998046875, 3.308746337890625, 3.4005126953125, 3.492279052734375, 3.58404541015625, 3.675811767578125, 3.767578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 2.0, 7.0, 9.0, 20.0, 16.0, 26.0, 40.0, 77.0, 152.0, 309.0, 811.0, 1487.0, 614.0, 225.0, 114.0, 69.0, 35.0, 25.0, 17.0, 4.0, 6.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.382080078125, -0.3623619079589844, -0.34264373779296875, -0.3229255676269531, -0.3032073974609375, -0.2834892272949219, -0.26377105712890625, -0.24405288696289062, -0.224334716796875, -0.20461654663085938, -0.18489837646484375, -0.16518020629882812, -0.1454620361328125, -0.12574386596679688, -0.10602569580078125, -0.08630752563476562, -0.06658935546875, -0.046871185302734375, -0.02715301513671875, -0.007434844970703125, 0.0122833251953125, 0.032001495361328125, 0.05171966552734375, 0.07143783569335938, 0.091156005859375, 0.11087417602539062, 0.13059234619140625, 0.15031051635742188, 0.1700286865234375, 0.18974685668945312, 0.20946502685546875, 0.22918319702148438, 0.2489013671875, 0.2686195373535156, 0.28833770751953125, 0.3080558776855469, 0.3277740478515625, 0.3474922180175781, 0.36721038818359375, 0.3869285583496094, 0.406646728515625, 0.4263648986816406, 0.44608306884765625, 0.4658012390136719, 0.4855194091796875, 0.5052375793457031, 0.5249557495117188, 0.5446739196777344, 0.56439208984375, 0.5841102600097656, 0.6038284301757812, 0.6235466003417969, 0.6432647705078125, 0.6629829406738281, 0.6827011108398438, 0.7024192810058594, 0.722137451171875, 0.7418556213378906, 0.7615737915039062, 0.7812919616699219, 0.8010101318359375, 0.8207283020019531, 0.8404464721679688, 0.8601646423339844, 0.8798828125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 9.0, 27.0, 50.0, 117.0, 226.0, 272.0, 168.0, 86.0, 33.0, 8.0, 6.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1158366203308105, -4.904696941375732, -4.693556785583496, -4.482417106628418, -4.27127742767334, -4.0601372718811035, -3.8489975929260254, -3.637857675552368, -3.426717758178711, -3.2155778408050537, -3.0044379234313965, -2.7932982444763184, -2.582158327102661, -2.371018409729004, -2.159878730773926, -1.9487388134002686, -1.7375988960266113, -1.526458978652954, -1.3153191804885864, -1.1041793823242188, -0.8930394649505615, -0.6818995475769043, -0.4707597494125366, -0.25961995124816895, -0.04848003387451172, 0.16265982389450073, 0.3737996816635132, 0.5849395394325256, 0.7960793972015381, 1.0072193145751953, 1.218359112739563, 1.4294989109039307, 1.6406383514404297, 1.851778268814087, 2.062918186187744, 2.2740578651428223, 2.4851977825164795, 2.6963376998901367, 2.907477378845215, 3.118617296218872, 3.3297572135925293, 3.5408971309661865, 3.7520370483398438, 3.963176727294922, 4.17431640625, 4.385456562042236, 4.5965962409973145, 4.807736396789551, 5.018876075744629, 5.230015754699707, 5.441155910491943, 5.6522955894470215, 5.863435745239258, 6.074575424194336, 6.285715103149414, 6.496854782104492, 6.7079949378967285, 6.919134616851807, 7.130274772644043, 7.341414451599121, 7.552554130554199, 7.7636942863464355, 7.974833965301514, 8.18597412109375, 8.397113800048828]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 4.0, 3.0, 6.0, 6.0, 7.0, 6.0, 19.0, 19.0, 25.0, 16.0, 33.0, 28.0, 54.0, 43.0, 47.0, 50.0, 61.0, 59.0, 48.0, 57.0, 53.0, 60.0, 49.0, 45.0, 42.0, 33.0, 30.0, 20.0, 21.0, 14.0, 12.0, 11.0, 12.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.4121780395507812, -2.345191478729248, -2.278204917907715, -2.2112183570861816, -2.1442317962646484, -2.0772452354431152, -2.010258674621582, -1.9432719945907593, -1.876285433769226, -1.8092988729476929, -1.7423123121261597, -1.6753257513046265, -1.6083390712738037, -1.5413525104522705, -1.4743659496307373, -1.407379388809204, -1.340392827987671, -1.2734062671661377, -1.2064197063446045, -1.1394331455230713, -1.072446584701538, -1.0054600238800049, -0.9384733438491821, -0.8714867830276489, -0.8045002222061157, -0.7375136613845825, -0.6705271005630493, -0.6035404801368713, -0.5365539193153381, -0.46956735849380493, -0.40258076786994934, -0.33559417724609375, -0.26860737800598145, -0.20162080228328705, -0.13463422656059265, -0.06764765083789825, -0.0006610751152038574, 0.06632548570632935, 0.13331207633018494, 0.20029866695404053, 0.26728522777557373, 0.33427178859710693, 0.4012583792209625, 0.4682449698448181, 0.5352315306663513, 0.6022180914878845, 0.6692047119140625, 0.7361912727355957, 0.8031778335571289, 0.8701643943786621, 0.9371509552001953, 1.0041375160217285, 1.0711240768432617, 1.138110637664795, 1.2050973176956177, 1.2720838785171509, 1.339070439338684, 1.4060570001602173, 1.4730435609817505, 1.5400301218032837, 1.6070168018341064, 1.6740033626556396, 1.7409899234771729, 1.807976484298706, 1.8749630451202393]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 10.0, 6.0, 14.0, 20.0, 21.0, 45.0, 48.0, 79.0, 142.0, 244.0, 460.0, 1016.0, 2392.0, 6447.0, 18441.0, 61223.0, 208773.0, 430495.0, 222378.0, 64845.0, 19882.0, 6668.0, 2641.0, 1059.0, 499.0, 245.0, 175.0, 85.0, 62.0, 36.0, 29.0, 11.0, 10.0, 10.0, 12.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.86279296875, -0.8354263305664062, -0.8080596923828125, -0.7806930541992188, -0.753326416015625, -0.7259597778320312, -0.6985931396484375, -0.6712265014648438, -0.64385986328125, -0.6164932250976562, -0.5891265869140625, -0.5617599487304688, -0.534393310546875, -0.5070266723632812, -0.4796600341796875, -0.45229339599609375, -0.4249267578125, -0.39756011962890625, -0.3701934814453125, -0.34282684326171875, -0.315460205078125, -0.28809356689453125, -0.2607269287109375, -0.23336029052734375, -0.20599365234375, -0.17862701416015625, -0.1512603759765625, -0.12389373779296875, -0.096527099609375, -0.06916046142578125, -0.0417938232421875, -0.01442718505859375, 0.012939453125, 0.04030609130859375, 0.0676727294921875, 0.09503936767578125, 0.122406005859375, 0.14977264404296875, 0.1771392822265625, 0.20450592041015625, 0.23187255859375, 0.25923919677734375, 0.2866058349609375, 0.31397247314453125, 0.341339111328125, 0.36870574951171875, 0.3960723876953125, 0.42343902587890625, 0.4508056640625, 0.47817230224609375, 0.5055389404296875, 0.5329055786132812, 0.560272216796875, 0.5876388549804688, 0.6150054931640625, 0.6423721313476562, 0.66973876953125, 0.6971054077148438, 0.7244720458984375, 0.7518386840820312, 0.779205322265625, 0.8065719604492188, 0.8339385986328125, 0.8613052368164062, 0.888671875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 4.0, 2.0, 2.0, 5.0, 9.0, 12.0, 15.0, 20.0, 26.0, 34.0, 46.0, 31.0, 57.0, 76.0, 56.0, 65.0, 71.0, 63.0, 65.0, 69.0, 62.0, 44.0, 46.0, 25.0, 26.0, 18.0, 16.0, 14.0, 14.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.186279296875, -0.18073272705078125, -0.1751861572265625, -0.16963958740234375, -0.164093017578125, -0.15854644775390625, -0.1529998779296875, -0.14745330810546875, -0.14190673828125, -0.13636016845703125, -0.1308135986328125, -0.12526702880859375, -0.119720458984375, -0.11417388916015625, -0.1086273193359375, -0.10308074951171875, -0.0975341796875, -0.09198760986328125, -0.0864410400390625, -0.08089447021484375, -0.075347900390625, -0.06980133056640625, -0.0642547607421875, -0.05870819091796875, -0.05316162109375, -0.04761505126953125, -0.0420684814453125, -0.03652191162109375, -0.030975341796875, -0.02542877197265625, -0.0198822021484375, -0.01433563232421875, -0.0087890625, -0.00324249267578125, 0.0023040771484375, 0.00785064697265625, 0.013397216796875, 0.01894378662109375, 0.0244903564453125, 0.03003692626953125, 0.03558349609375, 0.04113006591796875, 0.0466766357421875, 0.05222320556640625, 0.057769775390625, 0.06331634521484375, 0.0688629150390625, 0.07440948486328125, 0.0799560546875, 0.08550262451171875, 0.0910491943359375, 0.09659576416015625, 0.102142333984375, 0.10768890380859375, 0.1132354736328125, 0.11878204345703125, 0.12432861328125, 0.12987518310546875, 0.1354217529296875, 0.14096832275390625, 0.146514892578125, 0.15206146240234375, 0.1576080322265625, 0.16315460205078125, 0.168701171875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 8.0, 10.0, 14.0, 12.0, 21.0, 41.0, 32.0, 74.0, 111.0, 156.0, 233.0, 406.0, 756.0, 1539.0, 3610.0, 8945.0, 25486.0, 82316.0, 267108.0, 413880.0, 166647.0, 49660.0, 16414.0, 5915.0, 2497.0, 1125.0, 631.0, 308.0, 198.0, 112.0, 89.0, 54.0, 32.0, 31.0, 20.0, 23.0, 8.0, 15.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.015625, -0.989776611328125, -0.96392822265625, -0.938079833984375, -0.9122314453125, -0.886383056640625, -0.86053466796875, -0.834686279296875, -0.808837890625, -0.782989501953125, -0.75714111328125, -0.731292724609375, -0.7054443359375, -0.679595947265625, -0.65374755859375, -0.627899169921875, -0.60205078125, -0.576202392578125, -0.55035400390625, -0.524505615234375, -0.4986572265625, -0.472808837890625, -0.44696044921875, -0.421112060546875, -0.395263671875, -0.369415283203125, -0.34356689453125, -0.317718505859375, -0.2918701171875, -0.266021728515625, -0.24017333984375, -0.214324951171875, -0.1884765625, -0.162628173828125, -0.13677978515625, -0.110931396484375, -0.0850830078125, -0.059234619140625, -0.03338623046875, -0.007537841796875, 0.018310546875, 0.044158935546875, 0.07000732421875, 0.095855712890625, 0.1217041015625, 0.147552490234375, 0.17340087890625, 0.199249267578125, 0.22509765625, 0.250946044921875, 0.27679443359375, 0.302642822265625, 0.3284912109375, 0.354339599609375, 0.38018798828125, 0.406036376953125, 0.431884765625, 0.457733154296875, 0.48358154296875, 0.509429931640625, 0.5352783203125, 0.561126708984375, 0.58697509765625, 0.612823486328125, 0.638671875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 7.0, 10.0, 9.0, 13.0, 13.0, 10.0, 17.0, 26.0, 32.0, 32.0, 35.0, 37.0, 62.0, 50.0, 53.0, 56.0, 48.0, 46.0, 53.0, 39.0, 34.0, 30.0, 46.0, 25.0, 27.0, 26.0, 15.0, 15.0, 27.0, 17.0, 17.0, 13.0, 12.0, 8.0, 7.0, 3.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62744140625, -0.6051101684570312, -0.5827789306640625, -0.5604476928710938, -0.538116455078125, -0.5157852172851562, -0.4934539794921875, -0.47112274169921875, -0.44879150390625, -0.42646026611328125, -0.4041290283203125, -0.38179779052734375, -0.359466552734375, -0.33713531494140625, -0.3148040771484375, -0.29247283935546875, -0.2701416015625, -0.24781036376953125, -0.2254791259765625, -0.20314788818359375, -0.180816650390625, -0.15848541259765625, -0.1361541748046875, -0.11382293701171875, -0.09149169921875, -0.06916046142578125, -0.0468292236328125, -0.02449798583984375, -0.002166748046875, 0.02016448974609375, 0.0424957275390625, 0.06482696533203125, 0.087158203125, 0.10948944091796875, 0.1318206787109375, 0.15415191650390625, 0.176483154296875, 0.19881439208984375, 0.2211456298828125, 0.24347686767578125, 0.26580810546875, 0.28813934326171875, 0.3104705810546875, 0.33280181884765625, 0.355133056640625, 0.37746429443359375, 0.3997955322265625, 0.42212677001953125, 0.4444580078125, 0.46678924560546875, 0.4891204833984375, 0.5114517211914062, 0.533782958984375, 0.5561141967773438, 0.5784454345703125, 0.6007766723632812, 0.62310791015625, 0.6454391479492188, 0.6677703857421875, 0.6901016235351562, 0.712432861328125, 0.7347640991210938, 0.7570953369140625, 0.7794265747070312, 0.8017578125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 1.0, 7.0, 4.0, 9.0, 17.0, 33.0, 51.0, 84.0, 180.0, 348.0, 708.0, 1691.0, 4647.0, 23387.0, 749801.0, 249430.0, 12452.0, 3215.0, 1309.0, 559.0, 282.0, 135.0, 78.0, 50.0, 23.0, 16.0, 12.0, 15.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7646484375, -1.7055206298828125, -1.646392822265625, -1.5872650146484375, -1.52813720703125, -1.4690093994140625, -1.409881591796875, -1.3507537841796875, -1.2916259765625, -1.2324981689453125, -1.173370361328125, -1.1142425537109375, -1.05511474609375, -0.9959869384765625, -0.936859130859375, -0.8777313232421875, -0.818603515625, -0.7594757080078125, -0.700347900390625, -0.6412200927734375, -0.58209228515625, -0.5229644775390625, -0.463836669921875, -0.4047088623046875, -0.3455810546875, -0.2864532470703125, -0.227325439453125, -0.1681976318359375, -0.10906982421875, -0.0499420166015625, 0.009185791015625, 0.0683135986328125, 0.12744140625, 0.1865692138671875, 0.245697021484375, 0.3048248291015625, 0.36395263671875, 0.4230804443359375, 0.482208251953125, 0.5413360595703125, 0.6004638671875, 0.6595916748046875, 0.718719482421875, 0.7778472900390625, 0.83697509765625, 0.8961029052734375, 0.955230712890625, 1.0143585205078125, 1.073486328125, 1.1326141357421875, 1.191741943359375, 1.2508697509765625, 1.30999755859375, 1.3691253662109375, 1.428253173828125, 1.4873809814453125, 1.5465087890625, 1.6056365966796875, 1.664764404296875, 1.7238922119140625, 1.78302001953125, 1.8421478271484375, 1.901275634765625, 1.9604034423828125, 2.01953125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 10.0, 9.0, 15.0, 12.0, 19.0, 21.0, 27.0, 38.0, 37.0, 58.0, 69.0, 93.0, 105.0, 104.0, 87.0, 64.0, 42.0, 45.0, 31.0, 21.0, 22.0, 10.0, 11.0, 8.0, 9.0, 6.0, 3.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.429454803466797e-05, -9.112898260354996e-05, -8.796341717243195e-05, -8.479785174131393e-05, -8.163228631019592e-05, -7.846672087907791e-05, -7.53011554479599e-05, -7.213559001684189e-05, -6.897002458572388e-05, -6.580445915460587e-05, -6.263889372348785e-05, -5.947332829236984e-05, -5.630776286125183e-05, -5.314219743013382e-05, -4.997663199901581e-05, -4.68110665678978e-05, -4.3645501136779785e-05, -4.0479935705661774e-05, -3.731437027454376e-05, -3.414880484342575e-05, -3.098323941230774e-05, -2.7817673981189728e-05, -2.4652108550071716e-05, -2.1486543118953705e-05, -1.8320977687835693e-05, -1.5155412256717682e-05, -1.198984682559967e-05, -8.824281394481659e-06, -5.6587159633636475e-06, -2.493150532245636e-06, 6.724148988723755e-07, 3.837980329990387e-06, 7.0035457611083984e-06, 1.016911119222641e-05, 1.3334676623344421e-05, 1.6500242054462433e-05, 1.9665807485580444e-05, 2.2831372916698456e-05, 2.5996938347816467e-05, 2.916250377893448e-05, 3.232806921005249e-05, 3.54936346411705e-05, 3.865920007228851e-05, 4.1824765503406525e-05, 4.4990330934524536e-05, 4.815589636564255e-05, 5.132146179676056e-05, 5.448702722787857e-05, 5.765259265899658e-05, 6.0818158090114594e-05, 6.39837235212326e-05, 6.714928895235062e-05, 7.031485438346863e-05, 7.348041981458664e-05, 7.664598524570465e-05, 7.981155067682266e-05, 8.297711610794067e-05, 8.614268153905869e-05, 8.93082469701767e-05, 9.247381240129471e-05, 9.563937783241272e-05, 9.880494326353073e-05, 0.00010197050869464874, 0.00010513607412576675, 0.00010830163955688477]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 3.0, 5.0, 12.0, 24.0, 49.0, 58.0, 95.0, 121.0, 244.0, 540.0, 1452.0, 5174.0, 44689.0, 927130.0, 60018.0, 6117.0, 1617.0, 564.0, 239.0, 141.0, 89.0, 59.0, 43.0, 26.0, 13.0, 11.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.25, -2.18292236328125, -2.1158447265625, -2.04876708984375, -1.981689453125, -1.91461181640625, -1.8475341796875, -1.78045654296875, -1.71337890625, -1.64630126953125, -1.5792236328125, -1.51214599609375, -1.445068359375, -1.37799072265625, -1.3109130859375, -1.24383544921875, -1.1767578125, -1.10968017578125, -1.0426025390625, -0.97552490234375, -0.908447265625, -0.84136962890625, -0.7742919921875, -0.70721435546875, -0.64013671875, -0.57305908203125, -0.5059814453125, -0.43890380859375, -0.371826171875, -0.30474853515625, -0.2376708984375, -0.17059326171875, -0.103515625, -0.03643798828125, 0.0306396484375, 0.09771728515625, 0.164794921875, 0.23187255859375, 0.2989501953125, 0.36602783203125, 0.43310546875, 0.50018310546875, 0.5672607421875, 0.63433837890625, 0.701416015625, 0.76849365234375, 0.8355712890625, 0.90264892578125, 0.9697265625, 1.03680419921875, 1.1038818359375, 1.17095947265625, 1.238037109375, 1.30511474609375, 1.3721923828125, 1.43927001953125, 1.50634765625, 1.57342529296875, 1.6405029296875, 1.70758056640625, 1.774658203125, 1.84173583984375, 1.9088134765625, 1.97589111328125, 2.04296875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 22.0, 48.0, 138.0, 229.0, 265.0, 152.0, 71.0, 27.0, 19.0, 6.0, 7.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90380859375, -0.8589096069335938, -0.8140106201171875, -0.7691116333007812, -0.724212646484375, -0.6793136596679688, -0.6344146728515625, -0.5895156860351562, -0.54461669921875, -0.49971771240234375, -0.4548187255859375, -0.40991973876953125, -0.365020751953125, -0.32012176513671875, -0.2752227783203125, -0.23032379150390625, -0.1854248046875, -0.14052581787109375, -0.0956268310546875, -0.05072784423828125, -0.005828857421875, 0.03907012939453125, 0.0839691162109375, 0.12886810302734375, 0.17376708984375, 0.21866607666015625, 0.2635650634765625, 0.30846405029296875, 0.353363037109375, 0.39826202392578125, 0.4431610107421875, 0.48805999755859375, 0.532958984375, 0.5778579711914062, 0.6227569580078125, 0.6676559448242188, 0.712554931640625, 0.7574539184570312, 0.8023529052734375, 0.8472518920898438, 0.89215087890625, 0.9370498657226562, 0.9819488525390625, 1.0268478393554688, 1.071746826171875, 1.1166458129882812, 1.1615447998046875, 1.2064437866210938, 1.2513427734375, 1.2962417602539062, 1.3411407470703125, 1.3860397338867188, 1.430938720703125, 1.4758377075195312, 1.5207366943359375, 1.5656356811523438, 1.61053466796875, 1.6554336547851562, 1.7003326416015625, 1.7452316284179688, 1.790130615234375, 1.8350296020507812, 1.8799285888671875, 1.9248275756835938, 1.9697265625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 8.0, 17.0, 25.0, 44.0, 74.0, 117.0, 125.0, 136.0, 120.0, 116.0, 74.0, 48.0, 35.0, 21.0, 14.0, 11.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.143497467041016, -3.9068915843963623, -3.670285701751709, -3.4336800575256348, -3.1970741748809814, -2.960468292236328, -2.723862409591675, -2.4872565269470215, -2.2506508827209473, -2.014045000076294, -1.7774392366409302, -1.5408333539962769, -1.304227590560913, -1.0676217079162598, -0.8310158252716064, -0.5944100618362427, -0.3578040599822998, -0.12119822204113007, 0.11540761590003967, 0.3520134687423706, 0.5886192917823792, 0.8252251148223877, 1.061830997467041, 1.2984367609024048, 1.535042643547058, 1.7716485261917114, 2.008254289627075, 2.2448601722717285, 2.481466054916382, 2.718071937561035, 2.9546775817871094, 3.1912834644317627, 3.427889347076416, 3.6644952297210693, 3.9011011123657227, 4.137706756591797, 4.374312877655029, 4.6109185218811035, 4.847524642944336, 5.08413028717041, 5.320735931396484, 5.557341575622559, 5.793947696685791, 6.030553340911865, 6.267159461975098, 6.503765106201172, 6.740370750427246, 6.9769768714904785, 7.213582992553711, 7.450188636779785, 7.686794757843018, 7.923400402069092, 8.160006523132324, 8.396612167358398, 8.633217811584473, 8.869823455810547, 9.106429100036621, 9.343034744262695, 9.57964038848877, 9.81624698638916, 10.052852630615234, 10.289458274841309, 10.526063919067383, 10.762669563293457, 10.999276161193848]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 11.0, 12.0, 7.0, 12.0, 11.0, 26.0, 18.0, 23.0, 30.0, 26.0, 46.0, 49.0, 33.0, 43.0, 40.0, 62.0, 50.0, 50.0, 52.0, 52.0, 48.0, 38.0, 39.0, 30.0, 25.0, 31.0, 30.0, 15.0, 18.0, 10.0, 14.0, 7.0, 5.0, 7.0, 6.0, 1.0, 5.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91196346282959, -4.769279956817627, -4.626596450805664, -4.483913421630859, -4.3412299156188965, -4.198546409606934, -4.055862903594971, -3.913179636001587, -3.770496368408203, -3.6278128623962402, -3.4851295948028564, -3.3424460887908936, -3.1997628211975098, -3.057079315185547, -2.914395809173584, -2.7717125415802, -2.6290290355682373, -2.4863455295562744, -2.3436622619628906, -2.2009787559509277, -2.058295488357544, -1.915611982345581, -1.7729285955429077, -1.6302452087402344, -1.487561821937561, -1.3448784351348877, -1.2021950483322144, -1.059511661529541, -0.9168282151222229, -0.7741448283195496, -0.6314613819122314, -0.4887779951095581, -0.34609460830688477, -0.20341120660305023, -0.0607278048992157, 0.08195561170578003, 0.22463899850845337, 0.3673223853111267, 0.5100058317184448, 0.6526892185211182, 0.7953726053237915, 0.9380559921264648, 1.0807393789291382, 1.2234227657318115, 1.3661062717437744, 1.5087895393371582, 1.651473045349121, 1.7941564321517944, 1.9368398189544678, 2.0795233249664307, 2.2222065925598145, 2.3648900985717773, 2.507573366165161, 2.650256872177124, 2.792940139770508, 2.9356236457824707, 3.0783071517944336, 3.2209906578063965, 3.3636739253997803, 3.506357431411743, 3.649040699005127, 3.79172420501709, 3.9344077110290527, 4.077091217041016, 4.21977424621582]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 8.0, 6.0, 15.0, 14.0, 22.0, 37.0, 42.0, 68.0, 108.0, 173.0, 279.0, 475.0, 893.0, 1821.0, 4436.0, 12798.0, 53116.0, 712878.0, 3276388.0, 99609.0, 19693.0, 6386.0, 2475.0, 1172.0, 544.0, 301.0, 181.0, 112.0, 68.0, 49.0, 38.0, 27.0, 19.0, 9.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3212890625, -1.2866668701171875, -1.252044677734375, -1.2174224853515625, -1.18280029296875, -1.1481781005859375, -1.113555908203125, -1.0789337158203125, -1.0443115234375, -1.0096893310546875, -0.975067138671875, -0.9404449462890625, -0.90582275390625, -0.8712005615234375, -0.836578369140625, -0.8019561767578125, -0.767333984375, -0.7327117919921875, -0.698089599609375, -0.6634674072265625, -0.62884521484375, -0.5942230224609375, -0.559600830078125, -0.5249786376953125, -0.4903564453125, -0.4557342529296875, -0.421112060546875, -0.3864898681640625, -0.35186767578125, -0.3172454833984375, -0.282623291015625, -0.2480010986328125, -0.21337890625, -0.1787567138671875, -0.144134521484375, -0.1095123291015625, -0.07489013671875, -0.0402679443359375, -0.005645751953125, 0.0289764404296875, 0.0635986328125, 0.0982208251953125, 0.132843017578125, 0.1674652099609375, 0.20208740234375, 0.2367095947265625, 0.271331787109375, 0.3059539794921875, 0.340576171875, 0.3751983642578125, 0.409820556640625, 0.4444427490234375, 0.47906494140625, 0.5136871337890625, 0.548309326171875, 0.5829315185546875, 0.6175537109375, 0.6521759033203125, 0.686798095703125, 0.7214202880859375, 0.75604248046875, 0.7906646728515625, 0.825286865234375, 0.8599090576171875, 0.89453125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 6.0, 8.0, 13.0, 20.0, 17.0, 25.0, 33.0, 38.0, 47.0, 39.0, 55.0, 60.0, 52.0, 50.0, 66.0, 58.0, 71.0, 54.0, 53.0, 43.0, 32.0, 31.0, 31.0, 16.0, 23.0, 12.0, 10.0, 10.0, 3.0, 6.0, 4.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171875, -0.1667156219482422, -0.16155624389648438, -0.15639686584472656, -0.15123748779296875, -0.14607810974121094, -0.14091873168945312, -0.1357593536376953, -0.1305999755859375, -0.1254405975341797, -0.12028121948242188, -0.11512184143066406, -0.10996246337890625, -0.10480308532714844, -0.09964370727539062, -0.09448432922363281, -0.089324951171875, -0.08416557312011719, -0.07900619506835938, -0.07384681701660156, -0.06868743896484375, -0.06352806091308594, -0.058368682861328125, -0.05320930480957031, -0.0480499267578125, -0.04289054870605469, -0.037731170654296875, -0.03257179260253906, -0.02741241455078125, -0.022253036499023438, -0.017093658447265625, -0.011934280395507812, -0.00677490234375, -0.0016155242919921875, 0.003543853759765625, 0.008703231811523438, 0.01386260986328125, 0.019021987915039062, 0.024181365966796875, 0.029340744018554688, 0.0345001220703125, 0.03965950012207031, 0.044818878173828125, 0.04997825622558594, 0.05513763427734375, 0.06029701232910156, 0.06545639038085938, 0.07061576843261719, 0.075775146484375, 0.08093452453613281, 0.08609390258789062, 0.09125328063964844, 0.09641265869140625, 0.10157203674316406, 0.10673141479492188, 0.11189079284667969, 0.1170501708984375, 0.12220954895019531, 0.12736892700195312, 0.13252830505371094, 0.13768768310546875, 0.14284706115722656, 0.14800643920898438, 0.1531658172607422, 0.1583251953125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 8.0, 11.0, 8.0, 16.0, 27.0, 42.0, 51.0, 97.0, 170.0, 352.0, 789.0, 2710.0, 12930.0, 115894.0, 3588038.0, 435826.0, 29697.0, 5099.0, 1315.0, 508.0, 242.0, 146.0, 108.0, 56.0, 39.0, 25.0, 24.0, 14.0, 16.0, 10.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3271484375, -1.2711639404296875, -1.215179443359375, -1.1591949462890625, -1.10321044921875, -1.0472259521484375, -0.991241455078125, -0.9352569580078125, -0.8792724609375, -0.8232879638671875, -0.767303466796875, -0.7113189697265625, -0.65533447265625, -0.5993499755859375, -0.543365478515625, -0.4873809814453125, -0.431396484375, -0.3754119873046875, -0.319427490234375, -0.2634429931640625, -0.20745849609375, -0.1514739990234375, -0.095489501953125, -0.0395050048828125, 0.0164794921875, 0.0724639892578125, 0.128448486328125, 0.1844329833984375, 0.24041748046875, 0.2964019775390625, 0.352386474609375, 0.4083709716796875, 0.46435546875, 0.5203399658203125, 0.576324462890625, 0.6323089599609375, 0.68829345703125, 0.7442779541015625, 0.800262451171875, 0.8562469482421875, 0.9122314453125, 0.9682159423828125, 1.024200439453125, 1.0801849365234375, 1.13616943359375, 1.1921539306640625, 1.248138427734375, 1.3041229248046875, 1.360107421875, 1.4160919189453125, 1.472076416015625, 1.5280609130859375, 1.58404541015625, 1.6400299072265625, 1.696014404296875, 1.7519989013671875, 1.8079833984375, 1.8639678955078125, 1.919952392578125, 1.9759368896484375, 2.03192138671875, 2.0879058837890625, 2.143890380859375, 2.1998748779296875, 2.255859375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 15.0, 19.0, 31.0, 42.0, 75.0, 130.0, 284.0, 625.0, 1552.0, 696.0, 252.0, 134.0, 64.0, 33.0, 37.0, 33.0, 16.0, 8.0, 9.0, 8.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34521484375, -0.329193115234375, -0.31317138671875, -0.297149658203125, -0.2811279296875, -0.265106201171875, -0.24908447265625, -0.233062744140625, -0.217041015625, -0.201019287109375, -0.18499755859375, -0.168975830078125, -0.1529541015625, -0.136932373046875, -0.12091064453125, -0.104888916015625, -0.0888671875, -0.072845458984375, -0.05682373046875, -0.040802001953125, -0.0247802734375, -0.008758544921875, 0.00726318359375, 0.023284912109375, 0.039306640625, 0.055328369140625, 0.07135009765625, 0.087371826171875, 0.1033935546875, 0.119415283203125, 0.13543701171875, 0.151458740234375, 0.16748046875, 0.183502197265625, 0.19952392578125, 0.215545654296875, 0.2315673828125, 0.247589111328125, 0.26361083984375, 0.279632568359375, 0.295654296875, 0.311676025390625, 0.32769775390625, 0.343719482421875, 0.3597412109375, 0.375762939453125, 0.39178466796875, 0.407806396484375, 0.423828125, 0.439849853515625, 0.45587158203125, 0.471893310546875, 0.4879150390625, 0.503936767578125, 0.51995849609375, 0.535980224609375, 0.552001953125, 0.568023681640625, 0.58404541015625, 0.600067138671875, 0.6160888671875, 0.632110595703125, 0.64813232421875, 0.664154052734375, 0.68017578125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 3.0, 13.0, 18.0, 20.0, 33.0, 54.0, 70.0, 78.0, 85.0, 113.0, 106.0, 106.0, 81.0, 53.0, 44.0, 34.0, 29.0, 12.0, 14.0, 6.0, 10.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9665902853012085, -1.8962568044662476, -1.825923204421997, -1.7555897235870361, -1.6852561235427856, -1.6149226427078247, -1.5445890426635742, -1.4742555618286133, -1.4039220809936523, -1.3335886001586914, -1.263255000114441, -1.19292151927948, -1.1225879192352295, -1.0522544384002686, -0.9819208979606628, -0.9115873575210571, -0.8412537574768066, -0.7709202170372009, -0.7005866765975952, -0.6302531957626343, -0.5599195957183838, -0.48958608508110046, -0.41925257444381714, -0.3489190340042114, -0.2785854935646057, -0.208251953125, -0.13791842758655548, -0.06758490204811096, 0.002748638391494751, 0.07308217883110046, 0.1434156894683838, 0.2137492299079895, 0.28408265113830566, 0.3544161915779114, 0.4247497320175171, 0.4950832426548004, 0.5654168128967285, 0.6357502937316895, 0.7060838341712952, 0.7764173746109009, 0.8467509150505066, 0.9170844554901123, 0.987417995929718, 1.0577515363693237, 1.1280850172042847, 1.1984186172485352, 1.268752098083496, 1.339085578918457, 1.4094191789627075, 1.4797526597976685, 1.550086259841919, 1.6204197406768799, 1.6907533407211304, 1.7610868215560913, 1.8314204216003418, 1.9017539024353027, 1.9720873832702637, 2.0424208641052246, 2.1127543449401855, 2.1830880641937256, 2.2534215450286865, 2.3237550258636475, 2.3940885066986084, 2.4644222259521484, 2.5347557067871094]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 2.0, 3.0, 2.0, 4.0, 9.0, 5.0, 9.0, 13.0, 17.0, 21.0, 16.0, 18.0, 18.0, 30.0, 27.0, 40.0, 37.0, 36.0, 34.0, 37.0, 40.0, 55.0, 48.0, 48.0, 47.0, 41.0, 42.0, 46.0, 34.0, 37.0, 33.0, 24.0, 21.0, 21.0, 20.0, 15.0, 10.0, 12.0, 5.0, 10.0, 0.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4828131198883057, -1.4383490085601807, -1.3938850164413452, -1.3494209051132202, -1.3049569129943848, -1.2604928016662598, -1.2160286903381348, -1.1715645790100098, -1.1271005868911743, -1.0826364755630493, -1.0381724834442139, -0.9937083721160889, -0.9492443203926086, -0.9047802686691284, -0.8603161573410034, -0.8158521056175232, -0.771388053894043, -0.7269240021705627, -0.6824599504470825, -0.6379958391189575, -0.5935317873954773, -0.5490677356719971, -0.5046036243438721, -0.46013957262039185, -0.4156755208969116, -0.3712114691734314, -0.3267473876476288, -0.28228330612182617, -0.23781925439834595, -0.19335518777370453, -0.1488911211490631, -0.1044270396232605, -0.05996298789978027, -0.015498921275138855, 0.028965145349502563, 0.07342921197414398, 0.1178932785987854, 0.16235734522342682, 0.20682141184806824, 0.25128549337387085, 0.2957495450973511, 0.3402135968208313, 0.3846776783466339, 0.4291417598724365, 0.47360581159591675, 0.518069863319397, 0.562533974647522, 0.6069980263710022, 0.6514620780944824, 0.6959261298179626, 0.7403901815414429, 0.7848542928695679, 0.8293183445930481, 0.8737823963165283, 0.9182465076446533, 0.9627105593681335, 1.0071746110916138, 1.0516387224197388, 1.0961027145385742, 1.1405668258666992, 1.1850309371948242, 1.2294949293136597, 1.2739590406417847, 1.3184230327606201, 1.3628871440887451]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 10.0, 9.0, 14.0, 24.0, 26.0, 51.0, 84.0, 126.0, 198.0, 374.0, 691.0, 1172.0, 2308.0, 4492.0, 9268.0, 19950.0, 45921.0, 109261.0, 237860.0, 307116.0, 174413.0, 75366.0, 31723.0, 14285.0, 6607.0, 3251.0, 1765.0, 916.0, 476.0, 298.0, 174.0, 101.0, 76.0, 43.0, 31.0, 24.0, 11.0, 13.0, 7.0, 3.0, 7.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.693359375, -0.6704635620117188, -0.6475677490234375, -0.6246719360351562, -0.601776123046875, -0.5788803100585938, -0.5559844970703125, -0.5330886840820312, -0.51019287109375, -0.48729705810546875, -0.4644012451171875, -0.44150543212890625, -0.418609619140625, -0.39571380615234375, -0.3728179931640625, -0.34992218017578125, -0.3270263671875, -0.30413055419921875, -0.2812347412109375, -0.25833892822265625, -0.235443115234375, -0.21254730224609375, -0.1896514892578125, -0.16675567626953125, -0.14385986328125, -0.12096405029296875, -0.0980682373046875, -0.07517242431640625, -0.052276611328125, -0.02938079833984375, -0.0064849853515625, 0.01641082763671875, 0.039306640625, 0.06220245361328125, 0.0850982666015625, 0.10799407958984375, 0.130889892578125, 0.15378570556640625, 0.1766815185546875, 0.19957733154296875, 0.22247314453125, 0.24536895751953125, 0.2682647705078125, 0.29116058349609375, 0.314056396484375, 0.33695220947265625, 0.3598480224609375, 0.38274383544921875, 0.4056396484375, 0.42853546142578125, 0.4514312744140625, 0.47432708740234375, 0.497222900390625, 0.5201187133789062, 0.5430145263671875, 0.5659103393554688, 0.58880615234375, 0.6117019653320312, 0.6345977783203125, 0.6574935913085938, 0.680389404296875, 0.7032852172851562, 0.7261810302734375, 0.7490768432617188, 0.77197265625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 5.0, 10.0, 9.0, 10.0, 19.0, 27.0, 19.0, 29.0, 27.0, 33.0, 34.0, 47.0, 38.0, 42.0, 45.0, 47.0, 57.0, 59.0, 58.0, 43.0, 45.0, 30.0, 46.0, 37.0, 28.0, 30.0, 21.0, 16.0, 21.0, 14.0, 12.0, 8.0, 8.0, 6.0, 6.0, 8.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15869140625, -0.15372657775878906, -0.14876174926757812, -0.1437969207763672, -0.13883209228515625, -0.1338672637939453, -0.12890243530273438, -0.12393760681152344, -0.1189727783203125, -0.11400794982910156, -0.10904312133789062, -0.10407829284667969, -0.09911346435546875, -0.09414863586425781, -0.08918380737304688, -0.08421897888183594, -0.079254150390625, -0.07428932189941406, -0.06932449340820312, -0.06435966491699219, -0.05939483642578125, -0.05443000793457031, -0.049465179443359375, -0.04450035095214844, -0.0395355224609375, -0.03457069396972656, -0.029605865478515625, -0.024641036987304688, -0.01967620849609375, -0.014711380004882812, -0.009746551513671875, -0.0047817230224609375, 0.00018310546875, 0.0051479339599609375, 0.010112762451171875, 0.015077590942382812, 0.02004241943359375, 0.025007247924804688, 0.029972076416015625, 0.03493690490722656, 0.0399017333984375, 0.04486656188964844, 0.049831390380859375, 0.05479621887207031, 0.05976104736328125, 0.06472587585449219, 0.06969070434570312, 0.07465553283691406, 0.079620361328125, 0.08458518981933594, 0.08955001831054688, 0.09451484680175781, 0.09947967529296875, 0.10444450378417969, 0.10940933227539062, 0.11437416076660156, 0.1193389892578125, 0.12430381774902344, 0.12926864624023438, 0.1342334747314453, 0.13919830322265625, 0.1441631317138672, 0.14912796020507812, 0.15409278869628906, 0.1590576171875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 13.0, 8.0, 15.0, 22.0, 50.0, 59.0, 86.0, 195.0, 326.0, 655.0, 1587.0, 4656.0, 18038.0, 101502.0, 512882.0, 337210.0, 54551.0, 11115.0, 3220.0, 1177.0, 524.0, 281.0, 152.0, 86.0, 58.0, 40.0, 19.0, 14.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4052734375, -1.3624725341796875, -1.319671630859375, -1.2768707275390625, -1.23406982421875, -1.1912689208984375, -1.148468017578125, -1.1056671142578125, -1.0628662109375, -1.0200653076171875, -0.977264404296875, -0.9344635009765625, -0.89166259765625, -0.8488616943359375, -0.806060791015625, -0.7632598876953125, -0.720458984375, -0.6776580810546875, -0.634857177734375, -0.5920562744140625, -0.54925537109375, -0.5064544677734375, -0.463653564453125, -0.4208526611328125, -0.3780517578125, -0.3352508544921875, -0.292449951171875, -0.2496490478515625, -0.20684814453125, -0.1640472412109375, -0.121246337890625, -0.0784454345703125, -0.03564453125, 0.0071563720703125, 0.049957275390625, 0.0927581787109375, 0.13555908203125, 0.1783599853515625, 0.221160888671875, 0.2639617919921875, 0.3067626953125, 0.3495635986328125, 0.392364501953125, 0.4351654052734375, 0.47796630859375, 0.5207672119140625, 0.563568115234375, 0.6063690185546875, 0.649169921875, 0.6919708251953125, 0.734771728515625, 0.7775726318359375, 0.82037353515625, 0.8631744384765625, 0.905975341796875, 0.9487762451171875, 0.9915771484375, 1.0343780517578125, 1.077178955078125, 1.1199798583984375, 1.16278076171875, 1.2055816650390625, 1.248382568359375, 1.2911834716796875, 1.333984375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 8.0, 8.0, 11.0, 14.0, 19.0, 20.0, 30.0, 38.0, 39.0, 53.0, 61.0, 54.0, 59.0, 71.0, 72.0, 57.0, 65.0, 63.0, 47.0, 47.0, 22.0, 29.0, 31.0, 21.0, 14.0, 13.0, 11.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.05078125, -1.01617431640625, -0.9815673828125, -0.94696044921875, -0.912353515625, -0.87774658203125, -0.8431396484375, -0.80853271484375, -0.77392578125, -0.73931884765625, -0.7047119140625, -0.67010498046875, -0.635498046875, -0.60089111328125, -0.5662841796875, -0.53167724609375, -0.4970703125, -0.46246337890625, -0.4278564453125, -0.39324951171875, -0.358642578125, -0.32403564453125, -0.2894287109375, -0.25482177734375, -0.22021484375, -0.18560791015625, -0.1510009765625, -0.11639404296875, -0.081787109375, -0.04718017578125, -0.0125732421875, 0.02203369140625, 0.056640625, 0.09124755859375, 0.1258544921875, 0.16046142578125, 0.195068359375, 0.22967529296875, 0.2642822265625, 0.29888916015625, 0.33349609375, 0.36810302734375, 0.4027099609375, 0.43731689453125, 0.471923828125, 0.50653076171875, 0.5411376953125, 0.57574462890625, 0.6103515625, 0.64495849609375, 0.6795654296875, 0.71417236328125, 0.748779296875, 0.78338623046875, 0.8179931640625, 0.85260009765625, 0.88720703125, 0.92181396484375, 0.9564208984375, 0.99102783203125, 1.025634765625, 1.06024169921875, 1.0948486328125, 1.12945556640625, 1.1640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 3.0, 8.0, 7.0, 9.0, 18.0, 16.0, 29.0, 72.0, 102.0, 242.0, 635.0, 2084.0, 8587.0, 58708.0, 791858.0, 164406.0, 16587.0, 3407.0, 1049.0, 364.0, 150.0, 78.0, 48.0, 20.0, 15.0, 15.0, 8.0, 8.0, 5.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5869140625, -1.5398101806640625, -1.492706298828125, -1.4456024169921875, -1.39849853515625, -1.3513946533203125, -1.304290771484375, -1.2571868896484375, -1.2100830078125, -1.1629791259765625, -1.115875244140625, -1.0687713623046875, -1.02166748046875, -0.9745635986328125, -0.927459716796875, -0.8803558349609375, -0.833251953125, -0.7861480712890625, -0.739044189453125, -0.6919403076171875, -0.64483642578125, -0.5977325439453125, -0.550628662109375, -0.5035247802734375, -0.4564208984375, -0.4093170166015625, -0.362213134765625, -0.3151092529296875, -0.26800537109375, -0.2209014892578125, -0.173797607421875, -0.1266937255859375, -0.07958984375, -0.0324859619140625, 0.014617919921875, 0.0617218017578125, 0.10882568359375, 0.1559295654296875, 0.203033447265625, 0.2501373291015625, 0.2972412109375, 0.3443450927734375, 0.391448974609375, 0.4385528564453125, 0.48565673828125, 0.5327606201171875, 0.579864501953125, 0.6269683837890625, 0.674072265625, 0.7211761474609375, 0.768280029296875, 0.8153839111328125, 0.86248779296875, 0.9095916748046875, 0.956695556640625, 1.0037994384765625, 1.0509033203125, 1.0980072021484375, 1.145111083984375, 1.1922149658203125, 1.23931884765625, 1.2864227294921875, 1.333526611328125, 1.3806304931640625, 1.427734375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 6.0, 9.0, 10.0, 19.0, 32.0, 48.0, 60.0, 85.0, 123.0, 145.0, 141.0, 80.0, 65.0, 47.0, 30.0, 31.0, 12.0, 17.0, 11.0, 11.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00017583370208740234, -0.00017076916992664337, -0.0001657046377658844, -0.00016064010560512543, -0.00015557557344436646, -0.00015051104128360748, -0.0001454465091228485, -0.00014038197696208954, -0.00013531744480133057, -0.0001302529126405716, -0.00012518838047981262, -0.00012012384831905365, -0.00011505931615829468, -0.0001099947839975357, -0.00010493025183677673, -9.986571967601776e-05, -9.480118751525879e-05, -8.973665535449982e-05, -8.467212319374084e-05, -7.960759103298187e-05, -7.45430588722229e-05, -6.947852671146393e-05, -6.441399455070496e-05, -5.9349462389945984e-05, -5.428493022918701e-05, -4.922039806842804e-05, -4.415586590766907e-05, -3.9091333746910095e-05, -3.402680158615112e-05, -2.896226942539215e-05, -2.389773726463318e-05, -1.8833205103874207e-05, -1.3768672943115234e-05, -8.704140782356262e-06, -3.63960862159729e-06, 1.4249235391616821e-06, 6.489455699920654e-06, 1.1553987860679626e-05, 1.66185200214386e-05, 2.168305218219757e-05, 2.6747584342956543e-05, 3.1812116503715515e-05, 3.687664866447449e-05, 4.194118082523346e-05, 4.700571298599243e-05, 5.2070245146751404e-05, 5.7134777307510376e-05, 6.219930946826935e-05, 6.726384162902832e-05, 7.232837378978729e-05, 7.739290595054626e-05, 8.245743811130524e-05, 8.752197027206421e-05, 9.258650243282318e-05, 9.765103459358215e-05, 0.00010271556675434113, 0.0001077800989151001, 0.00011284463107585907, 0.00011790916323661804, 0.00012297369539737701, 0.00012803822755813599, 0.00013310275971889496, 0.00013816729187965393, 0.0001432318240404129, 0.00014829635620117188]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 13.0, 11.0, 7.0, 18.0, 38.0, 39.0, 60.0, 109.0, 184.0, 290.0, 514.0, 894.0, 2034.0, 5571.0, 24018.0, 576072.0, 408880.0, 20760.0, 5102.0, 1816.0, 911.0, 516.0, 270.0, 137.0, 95.0, 80.0, 43.0, 18.0, 13.0, 11.0, 11.0, 6.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.93359375, -1.8668212890625, -1.800048828125, -1.7332763671875, -1.66650390625, -1.5997314453125, -1.532958984375, -1.4661865234375, -1.3994140625, -1.3326416015625, -1.265869140625, -1.1990966796875, -1.13232421875, -1.0655517578125, -0.998779296875, -0.9320068359375, -0.865234375, -0.7984619140625, -0.731689453125, -0.6649169921875, -0.59814453125, -0.5313720703125, -0.464599609375, -0.3978271484375, -0.3310546875, -0.2642822265625, -0.197509765625, -0.1307373046875, -0.06396484375, 0.0028076171875, 0.069580078125, 0.1363525390625, 0.203125, 0.2698974609375, 0.336669921875, 0.4034423828125, 0.47021484375, 0.5369873046875, 0.603759765625, 0.6705322265625, 0.7373046875, 0.8040771484375, 0.870849609375, 0.9376220703125, 1.00439453125, 1.0711669921875, 1.137939453125, 1.2047119140625, 1.271484375, 1.3382568359375, 1.405029296875, 1.4718017578125, 1.53857421875, 1.6053466796875, 1.672119140625, 1.7388916015625, 1.8056640625, 1.8724365234375, 1.939208984375, 2.0059814453125, 2.07275390625, 2.1395263671875, 2.206298828125, 2.2730712890625, 2.33984375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 6.0, 6.0, 7.0, 14.0, 17.0, 45.0, 76.0, 168.0, 227.0, 202.0, 90.0, 56.0, 16.0, 9.0, 7.0, 11.0, 7.0, 6.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.302734375, -1.2614288330078125, -1.220123291015625, -1.1788177490234375, -1.13751220703125, -1.0962066650390625, -1.054901123046875, -1.0135955810546875, -0.9722900390625, -0.9309844970703125, -0.889678955078125, -0.8483734130859375, -0.80706787109375, -0.7657623291015625, -0.724456787109375, -0.6831512451171875, -0.641845703125, -0.6005401611328125, -0.559234619140625, -0.5179290771484375, -0.47662353515625, -0.4353179931640625, -0.394012451171875, -0.3527069091796875, -0.3114013671875, -0.2700958251953125, -0.228790283203125, -0.1874847412109375, -0.14617919921875, -0.1048736572265625, -0.063568115234375, -0.0222625732421875, 0.01904296875, 0.0603485107421875, 0.101654052734375, 0.1429595947265625, 0.18426513671875, 0.2255706787109375, 0.266876220703125, 0.3081817626953125, 0.3494873046875, 0.3907928466796875, 0.432098388671875, 0.4734039306640625, 0.51470947265625, 0.5560150146484375, 0.597320556640625, 0.6386260986328125, 0.679931640625, 0.7212371826171875, 0.762542724609375, 0.8038482666015625, 0.84515380859375, 0.8864593505859375, 0.927764892578125, 0.9690704345703125, 1.0103759765625, 1.0516815185546875, 1.092987060546875, 1.1342926025390625, 1.17559814453125, 1.2169036865234375, 1.258209228515625, 1.2995147705078125, 1.3408203125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 10.0, 42.0, 73.0, 162.0, 219.0, 217.0, 136.0, 80.0, 23.0, 21.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.345518112182617, -9.9116792678833, -9.477840423583984, -9.044001579284668, -8.610162734985352, -8.176323890686035, -7.7424845695495605, -7.308645725250244, -6.874806880950928, -6.440968036651611, -6.007129192352295, -5.57328987121582, -5.139451026916504, -4.7056121826171875, -4.271773338317871, -3.8379344940185547, -3.4040956497192383, -2.970256805419922, -2.5364179611206055, -2.10257887840271, -1.6687400341033936, -1.2349011898040771, -0.8010621070861816, -0.36722326278686523, 0.06661558151245117, 0.5004544854164124, 0.9342933893203735, 1.3681323528289795, 1.801971197128296, 2.2358100414276123, 2.669649124145508, 3.103487968444824, 3.5373268127441406, 3.971165657043457, 4.405004501342773, 4.83884334564209, 5.272682189941406, 5.706521034240723, 6.140360355377197, 6.574199199676514, 7.00803804397583, 7.4418768882751465, 7.875715732574463, 8.309555053710938, 8.743393898010254, 9.17723274230957, 9.611071586608887, 10.044910430908203, 10.47874927520752, 10.912588119506836, 11.346426963806152, 11.780265808105469, 12.214104652404785, 12.647943496704102, 13.081783294677734, 13.515621185302734, 13.949460983276367, 14.383299827575684, 14.817138671875, 15.250977516174316, 15.684816360473633, 16.118656158447266, 16.552494049072266, 16.9863338470459, 17.4201717376709]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 6.0, 4.0, 13.0, 7.0, 9.0, 16.0, 16.0, 12.0, 21.0, 29.0, 21.0, 28.0, 34.0, 38.0, 33.0, 38.0, 43.0, 48.0, 45.0, 40.0, 46.0, 31.0, 40.0, 41.0, 43.0, 40.0, 33.0, 28.0, 32.0, 22.0, 18.0, 11.0, 23.0, 17.0, 14.0, 11.0, 16.0, 5.0, 6.0, 2.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4974141120910645, -4.351196765899658, -4.204978942871094, -4.0587615966796875, -3.9125442504882812, -3.766326904296875, -3.6201093196868896, -3.4738917350769043, -3.327674388885498, -3.181457042694092, -3.0352394580841064, -2.889021873474121, -2.742804527282715, -2.5965871810913086, -2.4503695964813232, -2.304152011871338, -2.1579346656799316, -2.0117173194885254, -1.86549973487854, -1.7192822694778442, -1.5730648040771484, -1.4268473386764526, -1.2806298732757568, -1.134412407875061, -0.9881949424743652, -0.8419774770736694, -0.6957600116729736, -0.5495425462722778, -0.40332508087158203, -0.25710761547088623, -0.11089015007019043, 0.03532731533050537, 0.18154478073120117, 0.327762246131897, 0.4739797115325928, 0.6201971769332886, 0.7664146423339844, 0.9126321077346802, 1.058849573135376, 1.2050670385360718, 1.3512845039367676, 1.4975019693374634, 1.6437194347381592, 1.789936900138855, 1.9361543655395508, 2.082371711730957, 2.2285892963409424, 2.3748068809509277, 2.521024227142334, 2.6672415733337402, 2.8134591579437256, 2.959676742553711, 3.105894088745117, 3.2521114349365234, 3.398329019546509, 3.544546604156494, 3.6907639503479004, 3.8369812965393066, 3.983198881149292, 4.129416465759277, 4.275633811950684, 4.42185115814209, 4.568068504333496, 4.7142863273620605, 4.860503673553467]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 2.0, 5.0, 8.0, 12.0, 12.0, 19.0, 32.0, 39.0, 64.0, 102.0, 155.0, 296.0, 475.0, 956.0, 1831.0, 4195.0, 10385.0, 32069.0, 154338.0, 3197173.0, 687024.0, 72720.0, 19385.0, 6835.0, 2984.0, 1445.0, 745.0, 406.0, 214.0, 147.0, 85.0, 46.0, 30.0, 21.0, 6.0, 6.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.27734375, -1.2452392578125, -1.213134765625, -1.1810302734375, -1.14892578125, -1.1168212890625, -1.084716796875, -1.0526123046875, -1.0205078125, -0.9884033203125, -0.956298828125, -0.9241943359375, -0.89208984375, -0.8599853515625, -0.827880859375, -0.7957763671875, -0.763671875, -0.7315673828125, -0.699462890625, -0.6673583984375, -0.63525390625, -0.6031494140625, -0.571044921875, -0.5389404296875, -0.5068359375, -0.4747314453125, -0.442626953125, -0.4105224609375, -0.37841796875, -0.3463134765625, -0.314208984375, -0.2821044921875, -0.25, -0.2178955078125, -0.185791015625, -0.1536865234375, -0.12158203125, -0.0894775390625, -0.057373046875, -0.0252685546875, 0.0068359375, 0.0389404296875, 0.071044921875, 0.1031494140625, 0.13525390625, 0.1673583984375, 0.199462890625, 0.2315673828125, 0.263671875, 0.2957763671875, 0.327880859375, 0.3599853515625, 0.39208984375, 0.4241943359375, 0.456298828125, 0.4884033203125, 0.5205078125, 0.5526123046875, 0.584716796875, 0.6168212890625, 0.64892578125, 0.6810302734375, 0.713134765625, 0.7452392578125, 0.77734375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 7.0, 9.0, 13.0, 19.0, 25.0, 22.0, 31.0, 42.0, 45.0, 48.0, 58.0, 65.0, 62.0, 56.0, 78.0, 61.0, 48.0, 58.0, 46.0, 37.0, 27.0, 31.0, 16.0, 23.0, 18.0, 13.0, 12.0, 9.0, 7.0, 2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.218505859375, -0.21187591552734375, -0.2052459716796875, -0.19861602783203125, -0.191986083984375, -0.18535614013671875, -0.1787261962890625, -0.17209625244140625, -0.16546630859375, -0.15883636474609375, -0.1522064208984375, -0.14557647705078125, -0.138946533203125, -0.13231658935546875, -0.1256866455078125, -0.11905670166015625, -0.1124267578125, -0.10579681396484375, -0.0991668701171875, -0.09253692626953125, -0.085906982421875, -0.07927703857421875, -0.0726470947265625, -0.06601715087890625, -0.05938720703125, -0.05275726318359375, -0.0461273193359375, -0.03949737548828125, -0.032867431640625, -0.02623748779296875, -0.0196075439453125, -0.01297760009765625, -0.00634765625, 0.00028228759765625, 0.0069122314453125, 0.01354217529296875, 0.020172119140625, 0.02680206298828125, 0.0334320068359375, 0.04006195068359375, 0.04669189453125, 0.05332183837890625, 0.0599517822265625, 0.06658172607421875, 0.073211669921875, 0.07984161376953125, 0.0864715576171875, 0.09310150146484375, 0.0997314453125, 0.10636138916015625, 0.1129913330078125, 0.11962127685546875, 0.126251220703125, 0.13288116455078125, 0.1395111083984375, 0.14614105224609375, 0.15277099609375, 0.15940093994140625, 0.1660308837890625, 0.17266082763671875, 0.179290771484375, 0.18592071533203125, 0.1925506591796875, 0.19918060302734375, 0.205810546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 8.0, 10.0, 17.0, 16.0, 30.0, 53.0, 106.0, 199.0, 424.0, 991.0, 2297.0, 6339.0, 19085.0, 78463.0, 783028.0, 3083074.0, 171268.0, 33141.0, 9764.0, 3417.0, 1368.0, 600.0, 268.0, 123.0, 74.0, 38.0, 25.0, 15.0, 10.0, 6.0, 2.0, 3.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2275390625, -1.18243408203125, -1.1373291015625, -1.09222412109375, -1.047119140625, -1.00201416015625, -0.9569091796875, -0.91180419921875, -0.86669921875, -0.82159423828125, -0.7764892578125, -0.73138427734375, -0.686279296875, -0.64117431640625, -0.5960693359375, -0.55096435546875, -0.505859375, -0.46075439453125, -0.4156494140625, -0.37054443359375, -0.325439453125, -0.28033447265625, -0.2352294921875, -0.19012451171875, -0.14501953125, -0.09991455078125, -0.0548095703125, -0.00970458984375, 0.035400390625, 0.08050537109375, 0.1256103515625, 0.17071533203125, 0.2158203125, 0.26092529296875, 0.3060302734375, 0.35113525390625, 0.396240234375, 0.44134521484375, 0.4864501953125, 0.53155517578125, 0.57666015625, 0.62176513671875, 0.6668701171875, 0.71197509765625, 0.757080078125, 0.80218505859375, 0.8472900390625, 0.89239501953125, 0.9375, 0.98260498046875, 1.0277099609375, 1.07281494140625, 1.117919921875, 1.16302490234375, 1.2081298828125, 1.25323486328125, 1.29833984375, 1.34344482421875, 1.3885498046875, 1.43365478515625, 1.478759765625, 1.52386474609375, 1.5689697265625, 1.61407470703125, 1.6591796875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 15.0, 6.0, 8.0, 16.0, 18.0, 18.0, 21.0, 34.0, 48.0, 63.0, 95.0, 127.0, 193.0, 361.0, 778.0, 1034.0, 492.0, 246.0, 137.0, 91.0, 70.0, 42.0, 28.0, 32.0, 17.0, 15.0, 12.0, 8.0, 12.0, 9.0, 2.0, 4.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.465087890625, -0.45066070556640625, -0.4362335205078125, -0.42180633544921875, -0.407379150390625, -0.39295196533203125, -0.3785247802734375, -0.36409759521484375, -0.34967041015625, -0.33524322509765625, -0.3208160400390625, -0.30638885498046875, -0.291961669921875, -0.27753448486328125, -0.2631072998046875, -0.24868011474609375, -0.2342529296875, -0.21982574462890625, -0.2053985595703125, -0.19097137451171875, -0.176544189453125, -0.16211700439453125, -0.1476898193359375, -0.13326263427734375, -0.11883544921875, -0.10440826416015625, -0.0899810791015625, -0.07555389404296875, -0.061126708984375, -0.04669952392578125, -0.0322723388671875, -0.01784515380859375, -0.00341796875, 0.01100921630859375, 0.0254364013671875, 0.03986358642578125, 0.054290771484375, 0.06871795654296875, 0.0831451416015625, 0.09757232666015625, 0.11199951171875, 0.12642669677734375, 0.1408538818359375, 0.15528106689453125, 0.169708251953125, 0.18413543701171875, 0.1985626220703125, 0.21298980712890625, 0.2274169921875, 0.24184417724609375, 0.2562713623046875, 0.27069854736328125, 0.285125732421875, 0.29955291748046875, 0.3139801025390625, 0.32840728759765625, 0.34283447265625, 0.35726165771484375, 0.3716888427734375, 0.38611602783203125, 0.400543212890625, 0.41497039794921875, 0.4293975830078125, 0.44382476806640625, 0.458251953125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 18.0, 24.0, 68.0, 124.0, 181.0, 214.0, 199.0, 85.0, 53.0, 17.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.230403900146484, -10.001459121704102, -9.772514343261719, -9.543569564819336, -9.314624786376953, -9.085679054260254, -8.856734275817871, -8.627789497375488, -8.398844718933105, -8.169899940490723, -7.94095516204834, -7.712009906768799, -7.483065128326416, -7.254120349884033, -7.025175094604492, -6.796230316162109, -6.567285537719727, -6.338340759277344, -6.109395980834961, -5.88045072555542, -5.651505947113037, -5.422561168670654, -5.193615913391113, -4.9646711349487305, -4.735726356506348, -4.506781578063965, -4.277836799621582, -4.048891544342041, -3.819946765899658, -3.5910019874572754, -3.3620569705963135, -3.1331119537353516, -2.9041671752929688, -2.675222396850586, -2.446277379989624, -2.217332363128662, -1.9883875846862793, -1.759442687034607, -1.5304977893829346, -1.3015528917312622, -1.0726079940795898, -0.8436630964279175, -0.6147181987762451, -0.38577330112457275, -0.1568284034729004, 0.07211649417877197, 0.30106139183044434, 0.5300062894821167, 0.7589511871337891, 0.9878960847854614, 1.2168409824371338, 1.4457858800888062, 1.6747307777404785, 1.9036756753921509, 2.1326205730438232, 2.361565589904785, 2.590510368347168, 2.819455146789551, 3.0484001636505127, 3.2773451805114746, 3.5062899589538574, 3.7352347373962402, 3.964179754257202, 4.193124771118164, 4.422069549560547]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 16.0, 8.0, 8.0, 19.0, 27.0, 23.0, 33.0, 41.0, 48.0, 46.0, 48.0, 49.0, 56.0, 54.0, 65.0, 57.0, 54.0, 66.0, 40.0, 54.0, 43.0, 20.0, 22.0, 32.0, 19.0, 14.0, 11.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.029204845428467, -2.9394326210021973, -2.8496601581573486, -2.759887933731079, -2.6701154708862305, -2.580343246459961, -2.4905710220336914, -2.400798797607422, -2.3110263347625732, -2.2212541103363037, -2.131481647491455, -2.0417094230651855, -1.9519370794296265, -1.8621647357940674, -1.7723925113677979, -1.6826201677322388, -1.5928478240966797, -1.5030754804611206, -1.4133031368255615, -1.323530912399292, -1.233758568763733, -1.1439862251281738, -1.0542140007019043, -0.9644416570663452, -0.8746693134307861, -0.784896969795227, -0.6951246857643127, -0.6053524017333984, -0.5155800580978394, -0.42580774426460266, -0.33603543043136597, -0.24626314640045166, -0.15649080276489258, -0.06671848893165588, 0.02305382490158081, 0.1128261387348175, 0.2025984525680542, 0.2923707664012909, 0.3821430802345276, 0.4719153642654419, 0.561687707901001, 0.6514600515365601, 0.7412323355674744, 0.8310046195983887, 0.9207769632339478, 1.0105493068695068, 1.1003215312957764, 1.1900938749313354, 1.2798662185668945, 1.3696385622024536, 1.4594109058380127, 1.5491831302642822, 1.6389554738998413, 1.7287278175354004, 1.81850004196167, 1.908272385597229, 1.998044729232788, 2.0878169536590576, 2.1775894165039062, 2.267361640930176, 2.3571338653564453, 2.446906328201294, 2.5366785526275635, 2.626451015472412, 2.7162232398986816]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 10.0, 12.0, 11.0, 32.0, 27.0, 45.0, 65.0, 102.0, 141.0, 225.0, 306.0, 520.0, 881.0, 1484.0, 3074.0, 5766.0, 12786.0, 30021.0, 77750.0, 225365.0, 390697.0, 186199.0, 65271.0, 25314.0, 10966.0, 5279.0, 2571.0, 1384.0, 765.0, 510.0, 316.0, 231.0, 143.0, 85.0, 56.0, 39.0, 33.0, 16.0, 15.0, 9.0, 0.0, 9.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.92724609375, -0.900299072265625, -0.87335205078125, -0.846405029296875, -0.8194580078125, -0.792510986328125, -0.76556396484375, -0.738616943359375, -0.711669921875, -0.684722900390625, -0.65777587890625, -0.630828857421875, -0.6038818359375, -0.576934814453125, -0.54998779296875, -0.523040771484375, -0.49609375, -0.469146728515625, -0.44219970703125, -0.415252685546875, -0.3883056640625, -0.361358642578125, -0.33441162109375, -0.307464599609375, -0.280517578125, -0.253570556640625, -0.22662353515625, -0.199676513671875, -0.1727294921875, -0.145782470703125, -0.11883544921875, -0.091888427734375, -0.06494140625, -0.037994384765625, -0.01104736328125, 0.015899658203125, 0.0428466796875, 0.069793701171875, 0.09674072265625, 0.123687744140625, 0.150634765625, 0.177581787109375, 0.20452880859375, 0.231475830078125, 0.2584228515625, 0.285369873046875, 0.31231689453125, 0.339263916015625, 0.3662109375, 0.393157958984375, 0.42010498046875, 0.447052001953125, 0.4739990234375, 0.500946044921875, 0.52789306640625, 0.554840087890625, 0.581787109375, 0.608734130859375, 0.63568115234375, 0.662628173828125, 0.6895751953125, 0.716522216796875, 0.74346923828125, 0.770416259765625, 0.79736328125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 12.0, 7.0, 12.0, 14.0, 31.0, 28.0, 34.0, 33.0, 41.0, 45.0, 56.0, 48.0, 62.0, 59.0, 50.0, 53.0, 63.0, 48.0, 37.0, 37.0, 42.0, 35.0, 34.0, 24.0, 16.0, 22.0, 11.0, 9.0, 10.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.239013671875, -0.23206329345703125, -0.2251129150390625, -0.21816253662109375, -0.211212158203125, -0.20426177978515625, -0.1973114013671875, -0.19036102294921875, -0.18341064453125, -0.17646026611328125, -0.1695098876953125, -0.16255950927734375, -0.155609130859375, -0.14865875244140625, -0.1417083740234375, -0.13475799560546875, -0.1278076171875, -0.12085723876953125, -0.1139068603515625, -0.10695648193359375, -0.100006103515625, -0.09305572509765625, -0.0861053466796875, -0.07915496826171875, -0.07220458984375, -0.06525421142578125, -0.0583038330078125, -0.05135345458984375, -0.044403076171875, -0.03745269775390625, -0.0305023193359375, -0.02355194091796875, -0.0166015625, -0.00965118408203125, -0.0027008056640625, 0.00424957275390625, 0.011199951171875, 0.01815032958984375, 0.0251007080078125, 0.03205108642578125, 0.03900146484375, 0.04595184326171875, 0.0529022216796875, 0.05985260009765625, 0.066802978515625, 0.07375335693359375, 0.0807037353515625, 0.08765411376953125, 0.0946044921875, 0.10155487060546875, 0.1085052490234375, 0.11545562744140625, 0.122406005859375, 0.12935638427734375, 0.1363067626953125, 0.14325714111328125, 0.15020751953125, 0.15715789794921875, 0.1641082763671875, 0.17105865478515625, 0.178009033203125, 0.18495941162109375, 0.1919097900390625, 0.19886016845703125, 0.205810546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 6.0, 4.0, 14.0, 15.0, 16.0, 16.0, 44.0, 82.0, 123.0, 160.0, 300.0, 526.0, 1105.0, 2430.0, 6691.0, 22630.0, 99226.0, 485541.0, 340950.0, 64076.0, 15593.0, 5061.0, 1917.0, 889.0, 452.0, 247.0, 170.0, 89.0, 58.0, 35.0, 25.0, 22.0, 8.0, 11.0, 2.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3125, -1.2699737548828125, -1.227447509765625, -1.1849212646484375, -1.14239501953125, -1.0998687744140625, -1.057342529296875, -1.0148162841796875, -0.9722900390625, -0.9297637939453125, -0.887237548828125, -0.8447113037109375, -0.80218505859375, -0.7596588134765625, -0.717132568359375, -0.6746063232421875, -0.632080078125, -0.5895538330078125, -0.547027587890625, -0.5045013427734375, -0.46197509765625, -0.4194488525390625, -0.376922607421875, -0.3343963623046875, -0.2918701171875, -0.2493438720703125, -0.206817626953125, -0.1642913818359375, -0.12176513671875, -0.0792388916015625, -0.036712646484375, 0.0058135986328125, 0.04833984375, 0.0908660888671875, 0.133392333984375, 0.1759185791015625, 0.21844482421875, 0.2609710693359375, 0.303497314453125, 0.3460235595703125, 0.3885498046875, 0.4310760498046875, 0.473602294921875, 0.5161285400390625, 0.55865478515625, 0.6011810302734375, 0.643707275390625, 0.6862335205078125, 0.728759765625, 0.7712860107421875, 0.813812255859375, 0.8563385009765625, 0.89886474609375, 0.9413909912109375, 0.983917236328125, 1.0264434814453125, 1.0689697265625, 1.1114959716796875, 1.154022216796875, 1.1965484619140625, 1.23907470703125, 1.2816009521484375, 1.324127197265625, 1.3666534423828125, 1.4091796875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 6.0, 6.0, 6.0, 11.0, 11.0, 22.0, 20.0, 23.0, 27.0, 32.0, 38.0, 52.0, 58.0, 61.0, 68.0, 59.0, 52.0, 56.0, 52.0, 53.0, 43.0, 49.0, 42.0, 29.0, 32.0, 23.0, 15.0, 12.0, 12.0, 9.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1435546875, -1.1079559326171875, -1.072357177734375, -1.0367584228515625, -1.00115966796875, -0.9655609130859375, -0.929962158203125, -0.8943634033203125, -0.8587646484375, -0.8231658935546875, -0.787567138671875, -0.7519683837890625, -0.71636962890625, -0.6807708740234375, -0.645172119140625, -0.6095733642578125, -0.573974609375, -0.5383758544921875, -0.502777099609375, -0.4671783447265625, -0.43157958984375, -0.3959808349609375, -0.360382080078125, -0.3247833251953125, -0.2891845703125, -0.2535858154296875, -0.217987060546875, -0.1823883056640625, -0.14678955078125, -0.1111907958984375, -0.075592041015625, -0.0399932861328125, -0.00439453125, 0.0312042236328125, 0.066802978515625, 0.1024017333984375, 0.13800048828125, 0.1735992431640625, 0.209197998046875, 0.2447967529296875, 0.2803955078125, 0.3159942626953125, 0.351593017578125, 0.3871917724609375, 0.42279052734375, 0.4583892822265625, 0.493988037109375, 0.5295867919921875, 0.565185546875, 0.6007843017578125, 0.636383056640625, 0.6719818115234375, 0.70758056640625, 0.7431793212890625, 0.778778076171875, 0.8143768310546875, 0.8499755859375, 0.8855743408203125, 0.921173095703125, 0.9567718505859375, 0.99237060546875, 1.0279693603515625, 1.063568115234375, 1.0991668701171875, 1.134765625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 6.0, 9.0, 25.0, 22.0, 44.0, 61.0, 97.0, 153.0, 302.0, 711.0, 2197.0, 8429.0, 51957.0, 813986.0, 149236.0, 15720.0, 3513.0, 1159.0, 408.0, 183.0, 112.0, 75.0, 50.0, 27.0, 16.0, 5.0, 11.0, 7.0, 7.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1904296875, -1.1474456787109375, -1.104461669921875, -1.0614776611328125, -1.01849365234375, -0.9755096435546875, -0.932525634765625, -0.8895416259765625, -0.8465576171875, -0.8035736083984375, -0.760589599609375, -0.7176055908203125, -0.67462158203125, -0.6316375732421875, -0.588653564453125, -0.5456695556640625, -0.502685546875, -0.4597015380859375, -0.416717529296875, -0.3737335205078125, -0.33074951171875, -0.2877655029296875, -0.244781494140625, -0.2017974853515625, -0.1588134765625, -0.1158294677734375, -0.072845458984375, -0.0298614501953125, 0.01312255859375, 0.0561065673828125, 0.099090576171875, 0.1420745849609375, 0.18505859375, 0.2280426025390625, 0.271026611328125, 0.3140106201171875, 0.35699462890625, 0.3999786376953125, 0.442962646484375, 0.4859466552734375, 0.5289306640625, 0.5719146728515625, 0.614898681640625, 0.6578826904296875, 0.70086669921875, 0.7438507080078125, 0.786834716796875, 0.8298187255859375, 0.872802734375, 0.9157867431640625, 0.958770751953125, 1.0017547607421875, 1.04473876953125, 1.0877227783203125, 1.130706787109375, 1.1736907958984375, 1.2166748046875, 1.2596588134765625, 1.302642822265625, 1.3456268310546875, 1.38861083984375, 1.4315948486328125, 1.474578857421875, 1.5175628662109375, 1.560546875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 9.0, 7.0, 11.0, 16.0, 23.0, 33.0, 79.0, 223.0, 325.0, 145.0, 39.0, 29.0, 21.0, 15.0, 6.0, 5.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002880096435546875, -0.00028135813772678375, -0.00027470663189888, -0.00026805512607097626, -0.0002614036202430725, -0.00025475211441516876, -0.000248100608587265, -0.00024144910275936127, -0.00023479759693145752, -0.00022814609110355377, -0.00022149458527565002, -0.00021484307944774628, -0.00020819157361984253, -0.00020154006779193878, -0.00019488856196403503, -0.0001882370561361313, -0.00018158555030822754, -0.0001749340444803238, -0.00016828253865242004, -0.0001616310328245163, -0.00015497952699661255, -0.0001483280211687088, -0.00014167651534080505, -0.0001350250095129013, -0.00012837350368499756, -0.00012172199785709381, -0.00011507049202919006, -0.00010841898620128632, -0.00010176748037338257, -9.511597454547882e-05, -8.846446871757507e-05, -8.181296288967133e-05, -7.516145706176758e-05, -6.850995123386383e-05, -6.185844540596008e-05, -5.5206939578056335e-05, -4.855543375015259e-05, -4.190392792224884e-05, -3.525242209434509e-05, -2.8600916266441345e-05, -2.1949410438537598e-05, -1.529790461063385e-05, -8.646398782730103e-06, -1.994892954826355e-06, 4.656612873077393e-06, 1.130811870098114e-05, 1.7959624528884888e-05, 2.4611130356788635e-05, 3.126263618469238e-05, 3.791414201259613e-05, 4.456564784049988e-05, 5.1217153668403625e-05, 5.786865949630737e-05, 6.452016532421112e-05, 7.117167115211487e-05, 7.782317698001862e-05, 8.447468280792236e-05, 9.112618863582611e-05, 9.777769446372986e-05, 0.0001044292002916336, 0.00011108070611953735, 0.0001177322119474411, 0.00012438371777534485, 0.0001310352236032486, 0.00013768672943115234]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 2.0, 11.0, 15.0, 17.0, 24.0, 23.0, 43.0, 70.0, 124.0, 202.0, 389.0, 759.0, 1712.0, 4331.0, 12415.0, 47752.0, 710823.0, 229063.0, 26836.0, 8068.0, 3112.0, 1320.0, 624.0, 334.0, 200.0, 94.0, 68.0, 38.0, 26.0, 20.0, 12.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2578125, -1.2169952392578125, -1.176177978515625, -1.1353607177734375, -1.09454345703125, -1.0537261962890625, -1.012908935546875, -0.9720916748046875, -0.9312744140625, -0.8904571533203125, -0.849639892578125, -0.8088226318359375, -0.76800537109375, -0.7271881103515625, -0.686370849609375, -0.6455535888671875, -0.604736328125, -0.5639190673828125, -0.523101806640625, -0.4822845458984375, -0.44146728515625, -0.4006500244140625, -0.359832763671875, -0.3190155029296875, -0.2781982421875, -0.2373809814453125, -0.196563720703125, -0.1557464599609375, -0.11492919921875, -0.0741119384765625, -0.033294677734375, 0.0075225830078125, 0.04833984375, 0.0891571044921875, 0.129974365234375, 0.1707916259765625, 0.21160888671875, 0.2524261474609375, 0.293243408203125, 0.3340606689453125, 0.3748779296875, 0.4156951904296875, 0.456512451171875, 0.4973297119140625, 0.53814697265625, 0.5789642333984375, 0.619781494140625, 0.6605987548828125, 0.701416015625, 0.7422332763671875, 0.783050537109375, 0.8238677978515625, 0.86468505859375, 0.9055023193359375, 0.946319580078125, 0.9871368408203125, 1.0279541015625, 1.0687713623046875, 1.109588623046875, 1.1504058837890625, 1.19122314453125, 1.2320404052734375, 1.272857666015625, 1.3136749267578125, 1.3544921875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 5.0, 5.0, 7.0, 7.0, 8.0, 4.0, 5.0, 13.0, 15.0, 22.0, 21.0, 33.0, 75.0, 86.0, 159.0, 160.0, 122.0, 72.0, 50.0, 29.0, 20.0, 13.0, 14.0, 9.0, 4.0, 2.0, 6.0, 4.0, 4.0, 2.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.60546875, -0.5839462280273438, -0.5624237060546875, -0.5409011840820312, -0.519378662109375, -0.49785614013671875, -0.4763336181640625, -0.45481109619140625, -0.43328857421875, -0.41176605224609375, -0.3902435302734375, -0.36872100830078125, -0.347198486328125, -0.32567596435546875, -0.3041534423828125, -0.28263092041015625, -0.2611083984375, -0.23958587646484375, -0.2180633544921875, -0.19654083251953125, -0.175018310546875, -0.15349578857421875, -0.1319732666015625, -0.11045074462890625, -0.08892822265625, -0.06740570068359375, -0.0458831787109375, -0.02436065673828125, -0.002838134765625, 0.01868438720703125, 0.0402069091796875, 0.06172943115234375, 0.083251953125, 0.10477447509765625, 0.1262969970703125, 0.14781951904296875, 0.169342041015625, 0.19086456298828125, 0.2123870849609375, 0.23390960693359375, 0.25543212890625, 0.27695465087890625, 0.2984771728515625, 0.31999969482421875, 0.341522216796875, 0.36304473876953125, 0.3845672607421875, 0.40608978271484375, 0.4276123046875, 0.44913482666015625, 0.4706573486328125, 0.49217987060546875, 0.513702392578125, 0.5352249145507812, 0.5567474365234375, 0.5782699584960938, 0.59979248046875, 0.6213150024414062, 0.6428375244140625, 0.6643600463867188, 0.685882568359375, 0.7074050903320312, 0.7289276123046875, 0.7504501342773438, 0.77197265625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 11.0, 23.0, 43.0, 82.0, 119.0, 175.0, 198.0, 126.0, 95.0, 59.0, 35.0, 16.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.37704849243164, -7.999728679656982, -7.622408390045166, -7.245088577270508, -6.867768287658691, -6.490448474884033, -6.113128662109375, -5.735808372497559, -5.358488082885742, -4.981168270111084, -4.603847980499268, -4.226528167724609, -3.849207878112793, -3.4718880653381348, -3.0945680141448975, -2.71724796295166, -2.339928150177002, -1.9626080989837646, -1.5852880477905273, -1.2079681158065796, -0.8306480646133423, -0.453328013420105, -0.07600808143615723, 0.3013119697570801, 0.6786320209503174, 1.0559520721435547, 1.433272123336792, 1.8105920553207397, 2.1879119873046875, 2.565232276916504, 2.942552089691162, 3.3198721408843994, 3.6971921920776367, 4.074512004852295, 4.451832294464111, 4.8291521072387695, 5.206472396850586, 5.583792209625244, 5.961112022399902, 6.338432312011719, 6.715752601623535, 7.093072414398193, 7.47039270401001, 7.847712516784668, 8.225032806396484, 8.6023530960083, 8.9796724319458, 9.356992721557617, 9.734312057495117, 10.111632347106934, 10.488951683044434, 10.86627197265625, 11.243592262268066, 11.620912551879883, 11.998231887817383, 12.3755521774292, 12.752872467041016, 13.130192756652832, 13.507512092590332, 13.884832382202148, 14.262152671813965, 14.639472961425781, 15.016792297363281, 15.394112586975098, 15.771432876586914]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 14.0, 17.0, 16.0, 16.0, 19.0, 34.0, 28.0, 24.0, 27.0, 38.0, 38.0, 41.0, 33.0, 43.0, 46.0, 52.0, 47.0, 51.0, 43.0, 46.0, 44.0, 40.0, 33.0, 32.0, 26.0, 19.0, 31.0, 17.0, 17.0, 12.0, 17.0, 4.0, 7.0, 5.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.870394229888916, -4.711970329284668, -4.55354642868042, -4.395122051239014, -4.236698150634766, -4.078274250030518, -3.9198503494262695, -3.7614264488220215, -3.6030023097991943, -3.4445784091949463, -3.286154270172119, -3.127730369567871, -2.969306468963623, -2.810882329940796, -2.652458429336548, -2.4940342903137207, -2.3356103897094727, -2.1771864891052246, -2.0187623500823975, -1.8603384494781494, -1.7019144296646118, -1.5434904098510742, -1.3850665092468262, -1.2266424894332886, -1.068218469619751, -0.9097944498062134, -0.7513704895973206, -0.5929465293884277, -0.43452250957489014, -0.27609848976135254, -0.11767452955245972, 0.040749430656433105, 0.1991729736328125, 0.3575969636440277, 0.5160209536552429, 0.6744449138641357, 0.8328689336776733, 0.9912929534912109, 1.149716854095459, 1.3081408739089966, 1.4665648937225342, 1.6249889135360718, 1.7834129333496094, 1.9418368339538574, 2.1002607345581055, 2.2586848735809326, 2.4171087741851807, 2.575532913208008, 2.733956813812256, 2.892380714416504, 3.050804853439331, 3.209228754043579, 3.3676528930664062, 3.5260767936706543, 3.6845006942749023, 3.8429245948791504, 4.001348495483398, 4.1597723960876465, 4.3181962966918945, 4.476620674133301, 4.635044574737549, 4.793468475341797, 4.951892375946045, 5.110316276550293, 5.268740653991699]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 5.0, 9.0, 14.0, 12.0, 27.0, 32.0, 68.0, 92.0, 174.0, 289.0, 488.0, 879.0, 1601.0, 3112.0, 6304.0, 14850.0, 44908.0, 243965.0, 3445110.0, 345971.0, 54309.0, 17609.0, 6966.0, 3453.0, 1715.0, 942.0, 504.0, 311.0, 205.0, 122.0, 68.0, 39.0, 28.0, 32.0, 13.0, 10.0, 13.0, 7.0, 4.0, 3.0, 9.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.88916015625, -0.8580398559570312, -0.8269195556640625, -0.7957992553710938, -0.764678955078125, -0.7335586547851562, -0.7024383544921875, -0.6713180541992188, -0.64019775390625, -0.6090774536132812, -0.5779571533203125, -0.5468368530273438, -0.515716552734375, -0.48459625244140625, -0.4534759521484375, -0.42235565185546875, -0.3912353515625, -0.36011505126953125, -0.3289947509765625, -0.29787445068359375, -0.266754150390625, -0.23563385009765625, -0.2045135498046875, -0.17339324951171875, -0.14227294921875, -0.11115264892578125, -0.0800323486328125, -0.04891204833984375, -0.017791748046875, 0.01332855224609375, 0.0444488525390625, 0.07556915283203125, 0.106689453125, 0.13780975341796875, 0.1689300537109375, 0.20005035400390625, 0.231170654296875, 0.26229095458984375, 0.2934112548828125, 0.32453155517578125, 0.35565185546875, 0.38677215576171875, 0.4178924560546875, 0.44901275634765625, 0.480133056640625, 0.5112533569335938, 0.5423736572265625, 0.5734939575195312, 0.6046142578125, 0.6357345581054688, 0.6668548583984375, 0.6979751586914062, 0.729095458984375, 0.7602157592773438, 0.7913360595703125, 0.8224563598632812, 0.85357666015625, 0.8846969604492188, 0.9158172607421875, 0.9469375610351562, 0.978057861328125, 1.0091781616210938, 1.0402984619140625, 1.0714187622070312, 1.1025390625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 4.0, 6.0, 11.0, 11.0, 18.0, 23.0, 29.0, 23.0, 33.0, 42.0, 52.0, 62.0, 63.0, 48.0, 57.0, 54.0, 65.0, 44.0, 53.0, 52.0, 53.0, 37.0, 32.0, 28.0, 26.0, 15.0, 18.0, 9.0, 18.0, 7.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.194580078125, -0.18628311157226562, -0.17798614501953125, -0.16968917846679688, -0.1613922119140625, -0.15309524536132812, -0.14479827880859375, -0.13650131225585938, -0.128204345703125, -0.11990737915039062, -0.11161041259765625, -0.10331344604492188, -0.0950164794921875, -0.08671951293945312, -0.07842254638671875, -0.07012557983398438, -0.06182861328125, -0.053531646728515625, -0.04523468017578125, -0.036937713623046875, -0.0286407470703125, -0.020343780517578125, -0.01204681396484375, -0.003749847412109375, 0.004547119140625, 0.012844085693359375, 0.02114105224609375, 0.029438018798828125, 0.0377349853515625, 0.046031951904296875, 0.05432891845703125, 0.06262588500976562, 0.0709228515625, 0.07921981811523438, 0.08751678466796875, 0.09581375122070312, 0.1041107177734375, 0.11240768432617188, 0.12070465087890625, 0.12900161743164062, 0.137298583984375, 0.14559555053710938, 0.15389251708984375, 0.16218948364257812, 0.1704864501953125, 0.17878341674804688, 0.18708038330078125, 0.19537734985351562, 0.20367431640625, 0.21197128295898438, 0.22026824951171875, 0.22856521606445312, 0.2368621826171875, 0.24515914916992188, 0.25345611572265625, 0.2617530822753906, 0.270050048828125, 0.2783470153808594, 0.28664398193359375, 0.2949409484863281, 0.3032379150390625, 0.3115348815917969, 0.31983184814453125, 0.3281288146972656, 0.33642578125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 11.0, 21.0, 40.0, 96.0, 195.0, 378.0, 724.0, 1552.0, 4015.0, 12433.0, 62652.0, 1744639.0, 2278784.0, 67989.0, 13454.0, 4178.0, 1694.0, 706.0, 355.0, 153.0, 88.0, 42.0, 28.0, 18.0, 7.0, 6.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9267578125, -1.8646392822265625, -1.802520751953125, -1.7404022216796875, -1.67828369140625, -1.6161651611328125, -1.554046630859375, -1.4919281005859375, -1.4298095703125, -1.3676910400390625, -1.305572509765625, -1.2434539794921875, -1.18133544921875, -1.1192169189453125, -1.057098388671875, -0.9949798583984375, -0.932861328125, -0.8707427978515625, -0.808624267578125, -0.7465057373046875, -0.68438720703125, -0.6222686767578125, -0.560150146484375, -0.4980316162109375, -0.4359130859375, -0.3737945556640625, -0.311676025390625, -0.2495574951171875, -0.18743896484375, -0.1253204345703125, -0.063201904296875, -0.0010833740234375, 0.06103515625, 0.1231536865234375, 0.185272216796875, 0.2473907470703125, 0.30950927734375, 0.3716278076171875, 0.433746337890625, 0.4958648681640625, 0.5579833984375, 0.6201019287109375, 0.682220458984375, 0.7443389892578125, 0.80645751953125, 0.8685760498046875, 0.930694580078125, 0.9928131103515625, 1.054931640625, 1.1170501708984375, 1.179168701171875, 1.2412872314453125, 1.30340576171875, 1.3655242919921875, 1.427642822265625, 1.4897613525390625, 1.5518798828125, 1.6139984130859375, 1.676116943359375, 1.7382354736328125, 1.80035400390625, 1.8624725341796875, 1.924591064453125, 1.9867095947265625, 2.048828125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 11.0, 7.0, 9.0, 11.0, 17.0, 21.0, 36.0, 59.0, 96.0, 166.0, 319.0, 671.0, 1348.0, 582.0, 243.0, 150.0, 89.0, 56.0, 41.0, 29.0, 21.0, 11.0, 19.0, 13.0, 4.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.5517578125, -0.5361824035644531, -0.5206069946289062, -0.5050315856933594, -0.4894561767578125, -0.4738807678222656, -0.45830535888671875, -0.4427299499511719, -0.427154541015625, -0.4115791320800781, -0.39600372314453125, -0.3804283142089844, -0.3648529052734375, -0.3492774963378906, -0.33370208740234375, -0.3181266784667969, -0.30255126953125, -0.2869758605957031, -0.27140045166015625, -0.2558250427246094, -0.2402496337890625, -0.22467422485351562, -0.20909881591796875, -0.19352340698242188, -0.177947998046875, -0.16237258911132812, -0.14679718017578125, -0.13122177124023438, -0.1156463623046875, -0.10007095336914062, -0.08449554443359375, -0.06892013549804688, -0.0533447265625, -0.037769317626953125, -0.02219390869140625, -0.006618499755859375, 0.0089569091796875, 0.024532318115234375, 0.04010772705078125, 0.055683135986328125, 0.071258544921875, 0.08683395385742188, 0.10240936279296875, 0.11798477172851562, 0.1335601806640625, 0.14913558959960938, 0.16471099853515625, 0.18028640747070312, 0.19586181640625, 0.21143722534179688, 0.22701263427734375, 0.24258804321289062, 0.2581634521484375, 0.2737388610839844, 0.28931427001953125, 0.3048896789550781, 0.320465087890625, 0.3360404968261719, 0.35161590576171875, 0.3671913146972656, 0.3827667236328125, 0.3983421325683594, 0.41391754150390625, 0.4294929504394531, 0.445068359375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 2.0, 3.0, 7.0, 15.0, 30.0, 36.0, 35.0, 52.0, 86.0, 93.0, 92.0, 83.0, 96.0, 73.0, 74.0, 62.0, 40.0, 44.0, 18.0, 14.0, 17.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.122608184814453, -3.031907796859741, -2.9412074089050293, -2.8505070209503174, -2.7598066329956055, -2.6691062450408936, -2.5784058570861816, -2.4877052307128906, -2.397005081176758, -2.306304693222046, -2.215604305267334, -2.124903917312622, -2.03420352935791, -1.9435031414031982, -1.8528026342391968, -1.7621022462844849, -1.6714017391204834, -1.5807013511657715, -1.4900009632110596, -1.3993005752563477, -1.3086001873016357, -1.2178997993469238, -1.1271992921829224, -1.0364989042282104, -0.9457985162734985, -0.8550981283187866, -0.7643977403640747, -0.673697292804718, -0.5829969048500061, -0.4922965168952942, -0.4015960693359375, -0.3108956813812256, -0.22019529342651367, -0.12949489057064056, -0.038794487714767456, 0.051905930042266846, 0.14260631799697876, 0.23330670595169067, 0.32400715351104736, 0.4147075414657593, 0.5054079294204712, 0.5961083173751831, 0.686808705329895, 0.7775091528892517, 0.8682095408439636, 0.9589099287986755, 1.0496103763580322, 1.1403107643127441, 1.231011152267456, 1.321711540222168, 1.4124119281768799, 1.5031123161315918, 1.5938127040863037, 1.6845130920410156, 1.775213599205017, 1.865913987159729, 1.956614375114441, 2.0473148822784424, 2.1380152702331543, 2.228715658187866, 2.319416046142578, 2.41011643409729, 2.500816822052002, 2.591517210006714, 2.682217597961426]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 11.0, 6.0, 12.0, 9.0, 14.0, 13.0, 13.0, 21.0, 24.0, 20.0, 29.0, 26.0, 39.0, 45.0, 35.0, 47.0, 43.0, 48.0, 33.0, 39.0, 47.0, 49.0, 42.0, 41.0, 42.0, 34.0, 39.0, 23.0, 29.0, 23.0, 9.0, 16.0, 15.0, 11.0, 10.0, 11.0, 4.0, 3.0, 8.0, 6.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9211729764938354, -1.863569974899292, -1.805967092514038, -1.7483640909194946, -1.6907612085342407, -1.6331582069396973, -1.5755553245544434, -1.5179523229599, -1.4603493213653564, -1.402746319770813, -1.345143437385559, -1.2875404357910156, -1.2299375534057617, -1.1723345518112183, -1.1147315502166748, -1.057128667831421, -0.999525785446167, -0.9419228434562683, -0.8843199014663696, -0.8267168998718262, -0.7691140174865723, -0.7115110158920288, -0.6539080739021301, -0.5963051319122314, -0.5387021899223328, -0.4810992479324341, -0.4234963059425354, -0.36589333415031433, -0.30829039216041565, -0.25068745017051697, -0.1930844783782959, -0.13548153638839722, -0.07787847518920898, -0.020275525748729706, 0.03732742369174957, 0.09493038058280945, 0.15253332257270813, 0.2101362645626068, 0.2677392363548279, 0.32534217834472656, 0.38294512033462524, 0.4405480623245239, 0.4981510043144226, 0.5557539463043213, 0.6133569478988647, 0.6709598302841187, 0.7285628318786621, 0.7861657738685608, 0.8437687158584595, 0.9013716578483582, 0.9589745998382568, 1.0165776014328003, 1.0741804838180542, 1.1317834854125977, 1.1893863677978516, 1.246989369392395, 1.3045923709869385, 1.362195372581482, 1.4197982549667358, 1.4774012565612793, 1.5350041389465332, 1.5926071405410767, 1.6502101421356201, 1.707813024520874, 1.765415906906128]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 9.0, 1.0, 7.0, 16.0, 30.0, 52.0, 60.0, 92.0, 136.0, 227.0, 427.0, 791.0, 1320.0, 2797.0, 5568.0, 12007.0, 26667.0, 64034.0, 166653.0, 346716.0, 250660.0, 98026.0, 39422.0, 16919.0, 7806.0, 3841.0, 1883.0, 1043.0, 556.0, 297.0, 176.0, 101.0, 56.0, 57.0, 36.0, 19.0, 11.0, 9.0, 10.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.89892578125, -0.8737640380859375, -0.848602294921875, -0.8234405517578125, -0.79827880859375, -0.7731170654296875, -0.747955322265625, -0.7227935791015625, -0.6976318359375, -0.6724700927734375, -0.647308349609375, -0.6221466064453125, -0.59698486328125, -0.5718231201171875, -0.546661376953125, -0.5214996337890625, -0.496337890625, -0.4711761474609375, -0.446014404296875, -0.4208526611328125, -0.39569091796875, -0.3705291748046875, -0.345367431640625, -0.3202056884765625, -0.2950439453125, -0.2698822021484375, -0.244720458984375, -0.2195587158203125, -0.19439697265625, -0.1692352294921875, -0.144073486328125, -0.1189117431640625, -0.09375, -0.0685882568359375, -0.043426513671875, -0.0182647705078125, 0.00689697265625, 0.0320587158203125, 0.057220458984375, 0.0823822021484375, 0.1075439453125, 0.1327056884765625, 0.157867431640625, 0.1830291748046875, 0.20819091796875, 0.2333526611328125, 0.258514404296875, 0.2836761474609375, 0.308837890625, 0.3339996337890625, 0.359161376953125, 0.3843231201171875, 0.40948486328125, 0.4346466064453125, 0.459808349609375, 0.4849700927734375, 0.5101318359375, 0.5352935791015625, 0.560455322265625, 0.5856170654296875, 0.61077880859375, 0.6359405517578125, 0.661102294921875, 0.6862640380859375, 0.71142578125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 0.0, 5.0, 16.0, 8.0, 4.0, 15.0, 9.0, 19.0, 20.0, 19.0, 25.0, 27.0, 29.0, 36.0, 25.0, 42.0, 37.0, 47.0, 48.0, 45.0, 34.0, 49.0, 49.0, 38.0, 33.0, 43.0, 37.0, 34.0, 18.0, 30.0, 28.0, 22.0, 18.0, 21.0, 8.0, 11.0, 9.0, 11.0, 7.0, 6.0, 4.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.2041015625, -0.197662353515625, -0.19122314453125, -0.184783935546875, -0.1783447265625, -0.171905517578125, -0.16546630859375, -0.159027099609375, -0.152587890625, -0.146148681640625, -0.13970947265625, -0.133270263671875, -0.1268310546875, -0.120391845703125, -0.11395263671875, -0.107513427734375, -0.10107421875, -0.094635009765625, -0.08819580078125, -0.081756591796875, -0.0753173828125, -0.068878173828125, -0.06243896484375, -0.055999755859375, -0.049560546875, -0.043121337890625, -0.03668212890625, -0.030242919921875, -0.0238037109375, -0.017364501953125, -0.01092529296875, -0.004486083984375, 0.001953125, 0.008392333984375, 0.01483154296875, 0.021270751953125, 0.0277099609375, 0.034149169921875, 0.04058837890625, 0.047027587890625, 0.053466796875, 0.059906005859375, 0.06634521484375, 0.072784423828125, 0.0792236328125, 0.085662841796875, 0.09210205078125, 0.098541259765625, 0.10498046875, 0.111419677734375, 0.11785888671875, 0.124298095703125, 0.1307373046875, 0.137176513671875, 0.14361572265625, 0.150054931640625, 0.156494140625, 0.162933349609375, 0.16937255859375, 0.175811767578125, 0.1822509765625, 0.188690185546875, 0.19512939453125, 0.201568603515625, 0.2080078125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 5.0, 7.0, 10.0, 13.0, 16.0, 21.0, 39.0, 60.0, 110.0, 180.0, 351.0, 705.0, 1583.0, 4369.0, 13759.0, 53981.0, 275436.0, 532381.0, 125120.0, 27694.0, 7749.0, 2760.0, 1096.0, 490.0, 248.0, 137.0, 70.0, 59.0, 30.0, 30.0, 13.0, 7.0, 8.0, 4.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2529296875, -1.2086029052734375, -1.164276123046875, -1.1199493408203125, -1.07562255859375, -1.0312957763671875, -0.986968994140625, -0.9426422119140625, -0.8983154296875, -0.8539886474609375, -0.809661865234375, -0.7653350830078125, -0.72100830078125, -0.6766815185546875, -0.632354736328125, -0.5880279541015625, -0.543701171875, -0.4993743896484375, -0.455047607421875, -0.4107208251953125, -0.36639404296875, -0.3220672607421875, -0.277740478515625, -0.2334136962890625, -0.1890869140625, -0.1447601318359375, -0.100433349609375, -0.0561065673828125, -0.01177978515625, 0.0325469970703125, 0.076873779296875, 0.1212005615234375, 0.16552734375, 0.2098541259765625, 0.254180908203125, 0.2985076904296875, 0.34283447265625, 0.3871612548828125, 0.431488037109375, 0.4758148193359375, 0.5201416015625, 0.5644683837890625, 0.608795166015625, 0.6531219482421875, 0.69744873046875, 0.7417755126953125, 0.786102294921875, 0.8304290771484375, 0.874755859375, 0.9190826416015625, 0.963409423828125, 1.0077362060546875, 1.05206298828125, 1.0963897705078125, 1.140716552734375, 1.1850433349609375, 1.2293701171875, 1.2736968994140625, 1.318023681640625, 1.3623504638671875, 1.40667724609375, 1.4510040283203125, 1.495330810546875, 1.5396575927734375, 1.583984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 11.0, 13.0, 8.0, 17.0, 18.0, 19.0, 18.0, 26.0, 34.0, 31.0, 27.0, 49.0, 52.0, 57.0, 37.0, 55.0, 48.0, 53.0, 68.0, 39.0, 53.0, 38.0, 35.0, 34.0, 28.0, 22.0, 20.0, 12.0, 17.0, 9.0, 10.0, 6.0, 3.0, 7.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.060546875, -1.0254974365234375, -0.990447998046875, -0.9553985595703125, -0.92034912109375, -0.8852996826171875, -0.850250244140625, -0.8152008056640625, -0.7801513671875, -0.7451019287109375, -0.710052490234375, -0.6750030517578125, -0.63995361328125, -0.6049041748046875, -0.569854736328125, -0.5348052978515625, -0.499755859375, -0.4647064208984375, -0.429656982421875, -0.3946075439453125, -0.35955810546875, -0.3245086669921875, -0.289459228515625, -0.2544097900390625, -0.2193603515625, -0.1843109130859375, -0.149261474609375, -0.1142120361328125, -0.07916259765625, -0.0441131591796875, -0.009063720703125, 0.0259857177734375, 0.06103515625, 0.0960845947265625, 0.131134033203125, 0.1661834716796875, 0.20123291015625, 0.2362823486328125, 0.271331787109375, 0.3063812255859375, 0.3414306640625, 0.3764801025390625, 0.411529541015625, 0.4465789794921875, 0.48162841796875, 0.5166778564453125, 0.551727294921875, 0.5867767333984375, 0.621826171875, 0.6568756103515625, 0.691925048828125, 0.7269744873046875, 0.76202392578125, 0.7970733642578125, 0.832122802734375, 0.8671722412109375, 0.9022216796875, 0.9372711181640625, 0.972320556640625, 1.0073699951171875, 1.04241943359375, 1.0774688720703125, 1.112518310546875, 1.1475677490234375, 1.1826171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 11.0, 5.0, 12.0, 17.0, 22.0, 47.0, 84.0, 132.0, 247.0, 563.0, 1381.0, 3765.0, 13257.0, 65951.0, 504103.0, 391214.0, 51215.0, 10989.0, 3218.0, 1231.0, 521.0, 264.0, 141.0, 57.0, 40.0, 18.0, 16.0, 7.0, 7.0, 5.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.681640625, -0.6636695861816406, -0.6456985473632812, -0.6277275085449219, -0.6097564697265625, -0.5917854309082031, -0.5738143920898438, -0.5558433532714844, -0.537872314453125, -0.5199012756347656, -0.5019302368164062, -0.4839591979980469, -0.4659881591796875, -0.4480171203613281, -0.43004608154296875, -0.4120750427246094, -0.39410400390625, -0.3761329650878906, -0.35816192626953125, -0.3401908874511719, -0.3222198486328125, -0.3042488098144531, -0.28627777099609375, -0.2683067321777344, -0.250335693359375, -0.23236465454101562, -0.21439361572265625, -0.19642257690429688, -0.1784515380859375, -0.16048049926757812, -0.14250946044921875, -0.12453842163085938, -0.1065673828125, -0.08859634399414062, -0.07062530517578125, -0.052654266357421875, -0.0346832275390625, -0.016712188720703125, 0.00125885009765625, 0.019229888916015625, 0.037200927734375, 0.055171966552734375, 0.07314300537109375, 0.09111404418945312, 0.1090850830078125, 0.12705612182617188, 0.14502716064453125, 0.16299819946289062, 0.18096923828125, 0.19894027709960938, 0.21691131591796875, 0.23488235473632812, 0.2528533935546875, 0.2708244323730469, 0.28879547119140625, 0.3067665100097656, 0.324737548828125, 0.3427085876464844, 0.36067962646484375, 0.3786506652832031, 0.3966217041015625, 0.4145927429199219, 0.43256378173828125, 0.4505348205566406, 0.468505859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 6.0, 4.0, 6.0, 4.0, 2.0, 4.0, 11.0, 7.0, 13.0, 9.0, 17.0, 8.0, 22.0, 43.0, 49.0, 68.0, 81.0, 118.0, 124.0, 104.0, 81.0, 53.0, 35.0, 26.0, 18.0, 16.0, 15.0, 13.0, 6.0, 6.0, 5.0, 2.0, 10.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.568431854248047e-05, -6.356928497552872e-05, -6.145425140857697e-05, -5.9339217841625214e-05, -5.722418427467346e-05, -5.510915070772171e-05, -5.299411714076996e-05, -5.087908357381821e-05, -4.8764050006866455e-05, -4.66490164399147e-05, -4.453398287296295e-05, -4.24189493060112e-05, -4.030391573905945e-05, -3.8188882172107697e-05, -3.6073848605155945e-05, -3.395881503820419e-05, -3.184378147125244e-05, -2.972874790430069e-05, -2.7613714337348938e-05, -2.5498680770397186e-05, -2.3383647203445435e-05, -2.1268613636493683e-05, -1.915358006954193e-05, -1.703854650259018e-05, -1.4923512935638428e-05, -1.2808479368686676e-05, -1.0693445801734924e-05, -8.578412234783173e-06, -6.463378667831421e-06, -4.348345100879669e-06, -2.2333115339279175e-06, -1.1827796697616577e-07, 1.996755599975586e-06, 4.111789166927338e-06, 6.226822733879089e-06, 8.341856300830841e-06, 1.0456889867782593e-05, 1.2571923434734344e-05, 1.4686957001686096e-05, 1.6801990568637848e-05, 1.89170241355896e-05, 2.103205770254135e-05, 2.3147091269493103e-05, 2.5262124836444855e-05, 2.7377158403396606e-05, 2.9492191970348358e-05, 3.160722553730011e-05, 3.372225910425186e-05, 3.583729267120361e-05, 3.7952326238155365e-05, 4.006735980510712e-05, 4.218239337205887e-05, 4.429742693901062e-05, 4.641246050596237e-05, 4.8527494072914124e-05, 5.0642527639865875e-05, 5.275756120681763e-05, 5.487259477376938e-05, 5.698762834072113e-05, 5.910266190767288e-05, 6.121769547462463e-05, 6.333272904157639e-05, 6.544776260852814e-05, 6.756279617547989e-05, 6.967782974243164e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 10.0, 8.0, 12.0, 15.0, 22.0, 38.0, 44.0, 77.0, 161.0, 257.0, 537.0, 1162.0, 3014.0, 9449.0, 37026.0, 204217.0, 621224.0, 132838.0, 26784.0, 7229.0, 2466.0, 940.0, 428.0, 246.0, 133.0, 78.0, 46.0, 41.0, 19.0, 14.0, 10.0, 5.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.57177734375, -0.5564842224121094, -0.5411911010742188, -0.5258979797363281, -0.5106048583984375, -0.4953117370605469, -0.48001861572265625, -0.4647254943847656, -0.449432373046875, -0.4341392517089844, -0.41884613037109375, -0.4035530090332031, -0.3882598876953125, -0.3729667663574219, -0.35767364501953125, -0.3423805236816406, -0.32708740234375, -0.3117942810058594, -0.29650115966796875, -0.2812080383300781, -0.2659149169921875, -0.2506217956542969, -0.23532867431640625, -0.22003555297851562, -0.204742431640625, -0.18944931030273438, -0.17415618896484375, -0.15886306762695312, -0.1435699462890625, -0.12827682495117188, -0.11298370361328125, -0.09769058227539062, -0.0823974609375, -0.06710433959960938, -0.05181121826171875, -0.036518096923828125, -0.0212249755859375, -0.005931854248046875, 0.00936126708984375, 0.024654388427734375, 0.039947509765625, 0.055240631103515625, 0.07053375244140625, 0.08582687377929688, 0.1011199951171875, 0.11641311645507812, 0.13170623779296875, 0.14699935913085938, 0.16229248046875, 0.17758560180664062, 0.19287872314453125, 0.20817184448242188, 0.2234649658203125, 0.23875808715820312, 0.25405120849609375, 0.2693443298339844, 0.284637451171875, 0.2999305725097656, 0.31522369384765625, 0.3305168151855469, 0.3458099365234375, 0.3611030578613281, 0.37639617919921875, 0.3916893005371094, 0.406982421875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 10.0, 8.0, 10.0, 5.0, 7.0, 10.0, 18.0, 16.0, 32.0, 53.0, 65.0, 71.0, 110.0, 122.0, 107.0, 100.0, 67.0, 52.0, 30.0, 25.0, 10.0, 17.0, 16.0, 16.0, 6.0, 5.0, 7.0, 5.0, 0.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4462890625, -0.43268585205078125, -0.4190826416015625, -0.40547943115234375, -0.391876220703125, -0.37827301025390625, -0.3646697998046875, -0.35106658935546875, -0.33746337890625, -0.32386016845703125, -0.3102569580078125, -0.29665374755859375, -0.283050537109375, -0.26944732666015625, -0.2558441162109375, -0.24224090576171875, -0.2286376953125, -0.21503448486328125, -0.2014312744140625, -0.18782806396484375, -0.174224853515625, -0.16062164306640625, -0.1470184326171875, -0.13341522216796875, -0.11981201171875, -0.10620880126953125, -0.0926055908203125, -0.07900238037109375, -0.065399169921875, -0.05179595947265625, -0.0381927490234375, -0.02458953857421875, -0.010986328125, 0.00261688232421875, 0.0162200927734375, 0.02982330322265625, 0.043426513671875, 0.05702972412109375, 0.0706329345703125, 0.08423614501953125, 0.09783935546875, 0.11144256591796875, 0.1250457763671875, 0.13864898681640625, 0.152252197265625, 0.16585540771484375, 0.1794586181640625, 0.19306182861328125, 0.2066650390625, 0.22026824951171875, 0.2338714599609375, 0.24747467041015625, 0.261077880859375, 0.27468109130859375, 0.2882843017578125, 0.30188751220703125, 0.31549072265625, 0.32909393310546875, 0.3426971435546875, 0.35630035400390625, 0.369903564453125, 0.38350677490234375, 0.3971099853515625, 0.41071319580078125, 0.42431640625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 20.0, 25.0, 41.0, 66.0, 122.0, 139.0, 159.0, 156.0, 97.0, 89.0, 42.0, 16.0, 19.0, 8.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.260943412780762, -3.969271183013916, -3.6775989532470703, -3.3859269618988037, -3.094254732131958, -2.8025825023651123, -2.5109105110168457, -2.21923828125, -1.9275660514831543, -1.6358938217163086, -1.3442217111587524, -1.0525496006011963, -0.7608773708343506, -0.4692051410675049, -0.17753303050994873, 0.11413908004760742, 0.4058113098144531, 0.697483479976654, 0.989155650138855, 1.2808277606964111, 1.5724999904632568, 1.8641722202301025, 2.155844211578369, 2.447516441345215, 2.7391886711120605, 3.0308609008789062, 3.322533130645752, 3.6142051219940186, 3.9058773517608643, 4.197549819946289, 4.489221572875977, 4.780893802642822, 5.072565078735352, 5.364237308502197, 5.655909538269043, 5.947581768035889, 6.239253997802734, 6.530925750732422, 6.822597980499268, 7.114270210266113, 7.405942440032959, 7.697614669799805, 7.98928689956665, 8.280959129333496, 8.572630882263184, 8.864303588867188, 9.155975341796875, 9.447647094726562, 9.739319801330566, 10.030991554260254, 10.322664260864258, 10.614336013793945, 10.90600872039795, 11.197680473327637, 11.48935317993164, 11.781024932861328, 12.072696685791016, 12.364368438720703, 12.656041145324707, 12.947712898254395, 13.239385604858398, 13.531057357788086, 13.82273006439209, 14.114401817321777, 14.406074523925781]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 10.0, 6.0, 10.0, 13.0, 17.0, 23.0, 18.0, 34.0, 29.0, 32.0, 33.0, 42.0, 38.0, 45.0, 31.0, 49.0, 47.0, 49.0, 49.0, 51.0, 51.0, 46.0, 34.0, 30.0, 43.0, 21.0, 20.0, 22.0, 28.0, 15.0, 12.0, 17.0, 12.0, 3.0, 5.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.874125003814697, -4.705986022949219, -4.537846565246582, -4.369707107543945, -4.201568126678467, -4.033429145812988, -3.8652896881103516, -3.697150468826294, -3.5290112495422363, -3.3608720302581787, -3.192732810974121, -3.0245935916900635, -2.856454372406006, -2.6883151531219482, -2.5201759338378906, -2.352036714553833, -2.1838974952697754, -2.0157582759857178, -1.8476190567016602, -1.6794798374176025, -1.511340618133545, -1.3432013988494873, -1.1750621795654297, -1.006922960281372, -0.8387837409973145, -0.6706445217132568, -0.5025053024291992, -0.3343660831451416, -0.16622686386108398, 0.0019123554229736328, 0.17005157470703125, 0.33819079399108887, 0.5063295364379883, 0.6744687557220459, 0.8426079750061035, 1.0107471942901611, 1.1788864135742188, 1.3470256328582764, 1.515164852142334, 1.6833040714263916, 1.8514432907104492, 2.019582509994507, 2.1877217292785645, 2.355860948562622, 2.5240001678466797, 2.6921393871307373, 2.860278606414795, 3.0284178256988525, 3.19655704498291, 3.3646962642669678, 3.5328354835510254, 3.700974702835083, 3.8691139221191406, 4.037253379821777, 4.205392360687256, 4.373531341552734, 4.541670799255371, 4.709810256958008, 4.877949237823486, 5.046088218688965, 5.214227676391602, 5.382367134094238, 5.550506114959717, 5.718645095825195, 5.886784553527832]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 17.0, 8.0, 12.0, 11.0, 21.0, 37.0, 48.0, 62.0, 86.0, 112.0, 168.0, 233.0, 329.0, 508.0, 773.0, 1210.0, 2102.0, 3585.0, 6872.0, 15471.0, 49673.0, 700933.0, 3310456.0, 65527.0, 18245.0, 7554.0, 3901.0, 2084.0, 1410.0, 935.0, 585.0, 383.0, 262.0, 191.0, 132.0, 88.0, 59.0, 47.0, 34.0, 27.0, 17.0, 14.0, 13.0, 10.0, 10.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0], "bins": [-1.494140625, -1.446075439453125, -1.39801025390625, -1.349945068359375, -1.3018798828125, -1.253814697265625, -1.20574951171875, -1.157684326171875, -1.109619140625, -1.061553955078125, -1.01348876953125, -0.965423583984375, -0.9173583984375, -0.869293212890625, -0.82122802734375, -0.773162841796875, -0.72509765625, -0.677032470703125, -0.62896728515625, -0.580902099609375, -0.5328369140625, -0.484771728515625, -0.43670654296875, -0.388641357421875, -0.340576171875, -0.292510986328125, -0.24444580078125, -0.196380615234375, -0.1483154296875, -0.100250244140625, -0.05218505859375, -0.004119873046875, 0.0439453125, 0.092010498046875, 0.14007568359375, 0.188140869140625, 0.2362060546875, 0.284271240234375, 0.33233642578125, 0.380401611328125, 0.428466796875, 0.476531982421875, 0.52459716796875, 0.572662353515625, 0.6207275390625, 0.668792724609375, 0.71685791015625, 0.764923095703125, 0.81298828125, 0.861053466796875, 0.90911865234375, 0.957183837890625, 1.0052490234375, 1.053314208984375, 1.10137939453125, 1.149444580078125, 1.197509765625, 1.245574951171875, 1.29364013671875, 1.341705322265625, 1.3897705078125, 1.437835693359375, 1.48590087890625, 1.533966064453125, 1.58203125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 8.0, 5.0, 6.0, 14.0, 9.0, 9.0, 12.0, 23.0, 16.0, 31.0, 25.0, 30.0, 27.0, 37.0, 41.0, 33.0, 35.0, 57.0, 54.0, 41.0, 26.0, 41.0, 48.0, 37.0, 50.0, 30.0, 32.0, 39.0, 28.0, 29.0, 20.0, 15.0, 15.0, 14.0, 9.0, 10.0, 9.0, 7.0, 7.0, 9.0, 1.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.20654296875, -0.19970703125, -0.19287109375, -0.18603515625, -0.17919921875, -0.17236328125, -0.16552734375, -0.15869140625, -0.15185546875, -0.14501953125, -0.13818359375, -0.13134765625, -0.12451171875, -0.11767578125, -0.11083984375, -0.10400390625, -0.09716796875, -0.09033203125, -0.08349609375, -0.07666015625, -0.06982421875, -0.06298828125, -0.05615234375, -0.04931640625, -0.04248046875, -0.03564453125, -0.02880859375, -0.02197265625, -0.01513671875, -0.00830078125, -0.00146484375, 0.00537109375, 0.01220703125, 0.01904296875, 0.02587890625, 0.03271484375, 0.03955078125, 0.04638671875, 0.05322265625, 0.06005859375, 0.06689453125, 0.07373046875, 0.08056640625, 0.08740234375, 0.09423828125, 0.10107421875, 0.10791015625, 0.11474609375, 0.12158203125, 0.12841796875, 0.13525390625, 0.14208984375, 0.14892578125, 0.15576171875, 0.16259765625, 0.16943359375, 0.17626953125, 0.18310546875, 0.18994140625, 0.19677734375, 0.20361328125, 0.21044921875, 0.21728515625, 0.22412109375, 0.23095703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 6.0, 10.0, 24.0, 26.0, 51.0, 85.0, 153.0, 270.0, 561.0, 981.0, 1878.0, 4139.0, 9807.0, 27969.0, 125170.0, 3647041.0, 308349.0, 43402.0, 13748.0, 5477.0, 2534.0, 1226.0, 631.0, 332.0, 157.0, 102.0, 58.0, 44.0, 21.0, 14.0, 9.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3017578125, -1.252960205078125, -1.20416259765625, -1.155364990234375, -1.1065673828125, -1.057769775390625, -1.00897216796875, -0.960174560546875, -0.911376953125, -0.862579345703125, -0.81378173828125, -0.764984130859375, -0.7161865234375, -0.667388916015625, -0.61859130859375, -0.569793701171875, -0.52099609375, -0.472198486328125, -0.42340087890625, -0.374603271484375, -0.3258056640625, -0.277008056640625, -0.22821044921875, -0.179412841796875, -0.130615234375, -0.081817626953125, -0.03302001953125, 0.015777587890625, 0.0645751953125, 0.113372802734375, 0.16217041015625, 0.210968017578125, 0.259765625, 0.308563232421875, 0.35736083984375, 0.406158447265625, 0.4549560546875, 0.503753662109375, 0.55255126953125, 0.601348876953125, 0.650146484375, 0.698944091796875, 0.74774169921875, 0.796539306640625, 0.8453369140625, 0.894134521484375, 0.94293212890625, 0.991729736328125, 1.04052734375, 1.089324951171875, 1.13812255859375, 1.186920166015625, 1.2357177734375, 1.284515380859375, 1.33331298828125, 1.382110595703125, 1.430908203125, 1.479705810546875, 1.52850341796875, 1.577301025390625, 1.6260986328125, 1.674896240234375, 1.72369384765625, 1.772491455078125, 1.8212890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 2.0, 5.0, 5.0, 3.0, 2.0, 9.0, 9.0, 11.0, 21.0, 16.0, 22.0, 31.0, 54.0, 111.0, 224.0, 787.0, 2000.0, 347.0, 142.0, 80.0, 53.0, 21.0, 26.0, 19.0, 13.0, 15.0, 6.0, 10.0, 4.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5078125, -0.4929656982421875, -0.478118896484375, -0.4632720947265625, -0.44842529296875, -0.4335784912109375, -0.418731689453125, -0.4038848876953125, -0.3890380859375, -0.3741912841796875, -0.359344482421875, -0.3444976806640625, -0.32965087890625, -0.3148040771484375, -0.299957275390625, -0.2851104736328125, -0.270263671875, -0.2554168701171875, -0.240570068359375, -0.2257232666015625, -0.21087646484375, -0.1960296630859375, -0.181182861328125, -0.1663360595703125, -0.1514892578125, -0.1366424560546875, -0.121795654296875, -0.1069488525390625, -0.09210205078125, -0.0772552490234375, -0.062408447265625, -0.0475616455078125, -0.03271484375, -0.0178680419921875, -0.003021240234375, 0.0118255615234375, 0.02667236328125, 0.0415191650390625, 0.056365966796875, 0.0712127685546875, 0.0860595703125, 0.1009063720703125, 0.115753173828125, 0.1305999755859375, 0.14544677734375, 0.1602935791015625, 0.175140380859375, 0.1899871826171875, 0.204833984375, 0.2196807861328125, 0.234527587890625, 0.2493743896484375, 0.26422119140625, 0.2790679931640625, 0.293914794921875, 0.3087615966796875, 0.3236083984375, 0.3384552001953125, 0.353302001953125, 0.3681488037109375, 0.38299560546875, 0.3978424072265625, 0.412689208984375, 0.4275360107421875, 0.4423828125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 15.0, 24.0, 56.0, 122.0, 182.0, 224.0, 199.0, 93.0, 51.0, 22.0, 11.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.217823505401611, -5.082035064697266, -4.946246147155762, -4.810457706451416, -4.67466926574707, -4.538880348205566, -4.403091907501221, -4.267303466796875, -4.131514549255371, -3.9957258701324463, -3.8599374294281006, -3.724148750305176, -3.58836030960083, -3.4525716304779053, -3.3167829513549805, -3.1809945106506348, -3.045206069946289, -2.9094173908233643, -2.7736289501190186, -2.6378402709960938, -2.502051830291748, -2.3662631511688232, -2.2304744720458984, -2.0946860313415527, -1.958897352218628, -1.8231087923049927, -1.6873202323913574, -1.5515315532684326, -1.4157429933547974, -1.279954433441162, -1.1441657543182373, -1.008377194404602, -0.8725886344909668, -0.7368000745773315, -0.6010114550590515, -0.46522286534309387, -0.32943427562713623, -0.19364571571350098, -0.05785709619522095, 0.07793152332305908, 0.21372008323669434, 0.349508672952652, 0.4852972626686096, 0.6210858821868896, 0.7568744421005249, 0.8926630020141602, 1.028451681137085, 1.1642402410507202, 1.3000288009643555, 1.4358173608779907, 1.571605920791626, 1.7073945999145508, 1.843183159828186, 1.9789717197418213, 2.114760398864746, 2.250548839569092, 2.3863375186920166, 2.5221261978149414, 2.657914638519287, 2.793703317642212, 2.9294919967651367, 3.0652804374694824, 3.2010691165924072, 3.336857795715332, 3.4726462364196777]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 1.0, 4.0, 2.0, 0.0, 5.0, 4.0, 11.0, 14.0, 7.0, 18.0, 15.0, 18.0, 24.0, 28.0, 26.0, 22.0, 27.0, 32.0, 27.0, 43.0, 43.0, 40.0, 41.0, 44.0, 43.0, 39.0, 47.0, 25.0, 31.0, 36.0, 32.0, 27.0, 29.0, 24.0, 20.0, 22.0, 20.0, 22.0, 11.0, 11.0, 11.0, 9.0, 12.0, 6.0, 4.0, 6.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0], "bins": [-1.1953881978988647, -1.1608850955963135, -1.1263819932937622, -1.091878890991211, -1.0573757886886597, -1.0228726863861084, -0.9883695840835571, -0.9538664817810059, -0.9193633794784546, -0.8848602771759033, -0.850357174873352, -0.8158540725708008, -0.7813509702682495, -0.7468478679656982, -0.712344765663147, -0.6778416633605957, -0.6433386206626892, -0.6088355183601379, -0.5743324160575867, -0.5398293137550354, -0.5053262114524841, -0.47082310914993286, -0.436320036649704, -0.4018169343471527, -0.36731383204460144, -0.33281072974205017, -0.2983076274394989, -0.26380455493927, -0.22930143773555756, -0.1947983354330063, -0.1602952480316162, -0.12579214572906494, -0.09128904342651367, -0.0567859448492527, -0.02228284627199173, 0.012220248579978943, 0.04672335088253021, 0.08122645318508148, 0.11572954058647156, 0.15023264288902283, 0.1847357451915741, 0.21923884749412537, 0.25374194979667664, 0.2882450222969055, 0.3227481245994568, 0.35725122690200806, 0.3917543292045593, 0.4262574315071106, 0.46076053380966187, 0.49526363611221313, 0.5297667384147644, 0.5642698407173157, 0.5987729430198669, 0.6332760453224182, 0.6677790880203247, 0.702282190322876, 0.7367852926254272, 0.7712883949279785, 0.8057914972305298, 0.840294599533081, 0.8747977018356323, 0.9093008041381836, 0.9438039064407349, 0.9783070087432861, 1.0128101110458374]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 11.0, 10.0, 18.0, 22.0, 32.0, 43.0, 63.0, 87.0, 122.0, 147.0, 246.0, 390.0, 583.0, 950.0, 1453.0, 2350.0, 4175.0, 7670.0, 15005.0, 32641.0, 77469.0, 193332.0, 342901.0, 211547.0, 85790.0, 35553.0, 16507.0, 8139.0, 4393.0, 2556.0, 1467.0, 948.0, 585.0, 413.0, 267.0, 176.0, 138.0, 110.0, 81.0, 46.0, 32.0, 28.0, 16.0, 12.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.107421875, -1.0744171142578125, -1.041412353515625, -1.0084075927734375, -0.97540283203125, -0.9423980712890625, -0.909393310546875, -0.8763885498046875, -0.8433837890625, -0.8103790283203125, -0.777374267578125, -0.7443695068359375, -0.71136474609375, -0.6783599853515625, -0.645355224609375, -0.6123504638671875, -0.579345703125, -0.5463409423828125, -0.513336181640625, -0.4803314208984375, -0.44732666015625, -0.4143218994140625, -0.381317138671875, -0.3483123779296875, -0.3153076171875, -0.2823028564453125, -0.249298095703125, -0.2162933349609375, -0.18328857421875, -0.1502838134765625, -0.117279052734375, -0.0842742919921875, -0.05126953125, -0.0182647705078125, 0.014739990234375, 0.0477447509765625, 0.08074951171875, 0.1137542724609375, 0.146759033203125, 0.1797637939453125, 0.2127685546875, 0.2457733154296875, 0.278778076171875, 0.3117828369140625, 0.34478759765625, 0.3777923583984375, 0.410797119140625, 0.4438018798828125, 0.476806640625, 0.5098114013671875, 0.542816162109375, 0.5758209228515625, 0.60882568359375, 0.6418304443359375, 0.674835205078125, 0.7078399658203125, 0.7408447265625, 0.7738494873046875, 0.806854248046875, 0.8398590087890625, 0.87286376953125, 0.9058685302734375, 0.938873291015625, 0.9718780517578125, 1.0048828125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 1.0, 13.0, 7.0, 5.0, 15.0, 11.0, 16.0, 19.0, 18.0, 19.0, 33.0, 32.0, 24.0, 38.0, 45.0, 45.0, 46.0, 46.0, 37.0, 41.0, 48.0, 49.0, 47.0, 36.0, 36.0, 42.0, 38.0, 28.0, 24.0, 24.0, 17.0, 19.0, 13.0, 15.0, 9.0, 9.0, 4.0, 6.0, 10.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20654296875, -0.1995868682861328, -0.19263076782226562, -0.18567466735839844, -0.17871856689453125, -0.17176246643066406, -0.16480636596679688, -0.1578502655029297, -0.1508941650390625, -0.1439380645751953, -0.13698196411132812, -0.13002586364746094, -0.12306976318359375, -0.11611366271972656, -0.10915756225585938, -0.10220146179199219, -0.095245361328125, -0.08828926086425781, -0.08133316040039062, -0.07437705993652344, -0.06742095947265625, -0.06046485900878906, -0.053508758544921875, -0.04655265808105469, -0.0395965576171875, -0.03264045715332031, -0.025684356689453125, -0.018728256225585938, -0.01177215576171875, -0.0048160552978515625, 0.002140045166015625, 0.009096145629882812, 0.01605224609375, 0.023008346557617188, 0.029964447021484375, 0.03692054748535156, 0.04387664794921875, 0.05083274841308594, 0.057788848876953125, 0.06474494934082031, 0.0717010498046875, 0.07865715026855469, 0.08561325073242188, 0.09256935119628906, 0.09952545166015625, 0.10648155212402344, 0.11343765258789062, 0.12039375305175781, 0.127349853515625, 0.1343059539794922, 0.14126205444335938, 0.14821815490722656, 0.15517425537109375, 0.16213035583496094, 0.16908645629882812, 0.1760425567626953, 0.1829986572265625, 0.1899547576904297, 0.19691085815429688, 0.20386695861816406, 0.21082305908203125, 0.21777915954589844, 0.22473526000976562, 0.2316913604736328, 0.2386474609375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 11.0, 12.0, 13.0, 7.0, 27.0, 41.0, 39.0, 99.0, 151.0, 262.0, 459.0, 813.0, 1708.0, 3859.0, 9054.0, 24770.0, 77354.0, 255317.0, 424764.0, 169660.0, 50968.0, 16860.0, 6578.0, 2836.0, 1290.0, 688.0, 355.0, 231.0, 106.0, 72.0, 48.0, 33.0, 15.0, 15.0, 13.0, 7.0, 6.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0205078125, -0.9889373779296875, -0.957366943359375, -0.9257965087890625, -0.89422607421875, -0.8626556396484375, -0.831085205078125, -0.7995147705078125, -0.7679443359375, -0.7363739013671875, -0.704803466796875, -0.6732330322265625, -0.64166259765625, -0.6100921630859375, -0.578521728515625, -0.5469512939453125, -0.515380859375, -0.4838104248046875, -0.452239990234375, -0.4206695556640625, -0.38909912109375, -0.3575286865234375, -0.325958251953125, -0.2943878173828125, -0.2628173828125, -0.2312469482421875, -0.199676513671875, -0.1681060791015625, -0.13653564453125, -0.1049652099609375, -0.073394775390625, -0.0418243408203125, -0.01025390625, 0.0213165283203125, 0.052886962890625, 0.0844573974609375, 0.11602783203125, 0.1475982666015625, 0.179168701171875, 0.2107391357421875, 0.2423095703125, 0.2738800048828125, 0.305450439453125, 0.3370208740234375, 0.36859130859375, 0.4001617431640625, 0.431732177734375, 0.4633026123046875, 0.494873046875, 0.5264434814453125, 0.558013916015625, 0.5895843505859375, 0.62115478515625, 0.6527252197265625, 0.684295654296875, 0.7158660888671875, 0.7474365234375, 0.7790069580078125, 0.810577392578125, 0.8421478271484375, 0.87371826171875, 0.9052886962890625, 0.936859130859375, 0.9684295654296875, 1.0]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 8.0, 13.0, 16.0, 16.0, 18.0, 15.0, 15.0, 24.0, 37.0, 30.0, 39.0, 32.0, 34.0, 52.0, 47.0, 32.0, 41.0, 51.0, 49.0, 38.0, 44.0, 27.0, 43.0, 41.0, 31.0, 24.0, 30.0, 10.0, 23.0, 21.0, 17.0, 6.0, 14.0, 5.0, 8.0, 5.0, 2.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.0751953125, -1.0428543090820312, -1.0105133056640625, -0.9781723022460938, -0.945831298828125, -0.9134902954101562, -0.8811492919921875, -0.8488082885742188, -0.81646728515625, -0.7841262817382812, -0.7517852783203125, -0.7194442749023438, -0.687103271484375, -0.6547622680664062, -0.6224212646484375, -0.5900802612304688, -0.5577392578125, -0.5253982543945312, -0.4930572509765625, -0.46071624755859375, -0.428375244140625, -0.39603424072265625, -0.3636932373046875, -0.33135223388671875, -0.29901123046875, -0.26667022705078125, -0.2343292236328125, -0.20198822021484375, -0.169647216796875, -0.13730621337890625, -0.1049652099609375, -0.07262420654296875, -0.040283203125, -0.00794219970703125, 0.0243988037109375, 0.05673980712890625, 0.089080810546875, 0.12142181396484375, 0.1537628173828125, 0.18610382080078125, 0.21844482421875, 0.25078582763671875, 0.2831268310546875, 0.31546783447265625, 0.347808837890625, 0.38014984130859375, 0.4124908447265625, 0.44483184814453125, 0.4771728515625, 0.5095138549804688, 0.5418548583984375, 0.5741958618164062, 0.606536865234375, 0.6388778686523438, 0.6712188720703125, 0.7035598754882812, 0.73590087890625, 0.7682418823242188, 0.8005828857421875, 0.8329238891601562, 0.865264892578125, 0.8976058959960938, 0.9299468994140625, 0.9622879028320312, 0.99462890625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 12.0, 27.0, 47.0, 64.0, 156.0, 316.0, 966.0, 3733.0, 18702.0, 167037.0, 746052.0, 94927.0, 12520.0, 2671.0, 770.0, 268.0, 125.0, 63.0, 24.0, 19.0, 16.0, 6.0, 9.0, 9.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.28125, -1.243988037109375, -1.20672607421875, -1.169464111328125, -1.1322021484375, -1.094940185546875, -1.05767822265625, -1.020416259765625, -0.983154296875, -0.945892333984375, -0.90863037109375, -0.871368408203125, -0.8341064453125, -0.796844482421875, -0.75958251953125, -0.722320556640625, -0.68505859375, -0.647796630859375, -0.61053466796875, -0.573272705078125, -0.5360107421875, -0.498748779296875, -0.46148681640625, -0.424224853515625, -0.386962890625, -0.349700927734375, -0.31243896484375, -0.275177001953125, -0.2379150390625, -0.200653076171875, -0.16339111328125, -0.126129150390625, -0.0888671875, -0.051605224609375, -0.01434326171875, 0.022918701171875, 0.0601806640625, 0.097442626953125, 0.13470458984375, 0.171966552734375, 0.209228515625, 0.246490478515625, 0.28375244140625, 0.321014404296875, 0.3582763671875, 0.395538330078125, 0.43280029296875, 0.470062255859375, 0.50732421875, 0.544586181640625, 0.58184814453125, 0.619110107421875, 0.6563720703125, 0.693634033203125, 0.73089599609375, 0.768157958984375, 0.805419921875, 0.842681884765625, 0.87994384765625, 0.917205810546875, 0.9544677734375, 0.991729736328125, 1.02899169921875, 1.066253662109375, 1.103515625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 0.0, 2.0, 4.0, 4.0, 6.0, 7.0, 11.0, 5.0, 7.0, 15.0, 8.0, 16.0, 16.0, 19.0, 26.0, 28.0, 37.0, 54.0, 71.0, 85.0, 99.0, 112.0, 83.0, 50.0, 44.0, 34.0, 30.0, 21.0, 26.0, 23.0, 9.0, 16.0, 11.0, 9.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.262561798095703e-05, -8.995179086923599e-05, -8.727796375751495e-05, -8.460413664579391e-05, -8.193030953407288e-05, -7.925648242235184e-05, -7.65826553106308e-05, -7.390882819890976e-05, -7.123500108718872e-05, -6.856117397546768e-05, -6.588734686374664e-05, -6.32135197520256e-05, -6.0539692640304565e-05, -5.7865865528583527e-05, -5.519203841686249e-05, -5.251821130514145e-05, -4.984438419342041e-05, -4.717055708169937e-05, -4.449672996997833e-05, -4.1822902858257294e-05, -3.9149075746536255e-05, -3.6475248634815216e-05, -3.380142152309418e-05, -3.112759441137314e-05, -2.84537672996521e-05, -2.577994018793106e-05, -2.3106113076210022e-05, -2.0432285964488983e-05, -1.7758458852767944e-05, -1.5084631741046906e-05, -1.2410804629325867e-05, -9.736977517604828e-06, -7.063150405883789e-06, -4.38932329416275e-06, -1.7154961824417114e-06, 9.583309292793274e-07, 3.632158041000366e-06, 6.305985152721405e-06, 8.979812264442444e-06, 1.1653639376163483e-05, 1.4327466487884521e-05, 1.700129359960556e-05, 1.96751207113266e-05, 2.2348947823047638e-05, 2.5022774934768677e-05, 2.7696602046489716e-05, 3.0370429158210754e-05, 3.304425626993179e-05, 3.571808338165283e-05, 3.839191049337387e-05, 4.106573760509491e-05, 4.373956471681595e-05, 4.641339182853699e-05, 4.9087218940258026e-05, 5.1761046051979065e-05, 5.4434873163700104e-05, 5.710870027542114e-05, 5.978252738714218e-05, 6.245635449886322e-05, 6.513018161058426e-05, 6.78040087223053e-05, 7.047783583402634e-05, 7.315166294574738e-05, 7.582549005746841e-05, 7.849931716918945e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 6.0, 12.0, 17.0, 18.0, 34.0, 50.0, 102.0, 155.0, 307.0, 646.0, 1404.0, 3007.0, 7986.0, 25096.0, 104599.0, 517939.0, 300643.0, 60560.0, 15974.0, 5521.0, 2323.0, 1077.0, 491.0, 259.0, 116.0, 75.0, 61.0, 22.0, 18.0, 16.0, 4.0, 6.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66259765625, -0.636932373046875, -0.61126708984375, -0.585601806640625, -0.5599365234375, -0.534271240234375, -0.50860595703125, -0.482940673828125, -0.457275390625, -0.431610107421875, -0.40594482421875, -0.380279541015625, -0.3546142578125, -0.328948974609375, -0.30328369140625, -0.277618408203125, -0.251953125, -0.226287841796875, -0.20062255859375, -0.174957275390625, -0.1492919921875, -0.123626708984375, -0.09796142578125, -0.072296142578125, -0.046630859375, -0.020965576171875, 0.00469970703125, 0.030364990234375, 0.0560302734375, 0.081695556640625, 0.10736083984375, 0.133026123046875, 0.15869140625, 0.184356689453125, 0.21002197265625, 0.235687255859375, 0.2613525390625, 0.287017822265625, 0.31268310546875, 0.338348388671875, 0.364013671875, 0.389678955078125, 0.41534423828125, 0.441009521484375, 0.4666748046875, 0.492340087890625, 0.51800537109375, 0.543670654296875, 0.5693359375, 0.595001220703125, 0.62066650390625, 0.646331787109375, 0.6719970703125, 0.697662353515625, 0.72332763671875, 0.748992919921875, 0.774658203125, 0.800323486328125, 0.82598876953125, 0.851654052734375, 0.8773193359375, 0.902984619140625, 0.92864990234375, 0.954315185546875, 0.97998046875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 1.0, 3.0, 3.0, 10.0, 7.0, 12.0, 16.0, 17.0, 17.0, 26.0, 34.0, 49.0, 61.0, 79.0, 110.0, 117.0, 96.0, 71.0, 58.0, 46.0, 25.0, 37.0, 21.0, 17.0, 10.0, 16.0, 6.0, 9.0, 5.0, 2.0, 6.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70556640625, -0.6823272705078125, -0.659088134765625, -0.6358489990234375, -0.61260986328125, -0.5893707275390625, -0.566131591796875, -0.5428924560546875, -0.5196533203125, -0.4964141845703125, -0.473175048828125, -0.4499359130859375, -0.42669677734375, -0.4034576416015625, -0.380218505859375, -0.3569793701171875, -0.333740234375, -0.3105010986328125, -0.287261962890625, -0.2640228271484375, -0.24078369140625, -0.2175445556640625, -0.194305419921875, -0.1710662841796875, -0.1478271484375, -0.1245880126953125, -0.101348876953125, -0.0781097412109375, -0.05487060546875, -0.0316314697265625, -0.008392333984375, 0.0148468017578125, 0.0380859375, 0.0613250732421875, 0.084564208984375, 0.1078033447265625, 0.13104248046875, 0.1542816162109375, 0.177520751953125, 0.2007598876953125, 0.2239990234375, 0.2472381591796875, 0.270477294921875, 0.2937164306640625, 0.31695556640625, 0.3401947021484375, 0.363433837890625, 0.3866729736328125, 0.409912109375, 0.4331512451171875, 0.456390380859375, 0.4796295166015625, 0.50286865234375, 0.5261077880859375, 0.549346923828125, 0.5725860595703125, 0.5958251953125, 0.6190643310546875, 0.642303466796875, 0.6655426025390625, 0.68878173828125, 0.7120208740234375, 0.735260009765625, 0.7584991455078125, 0.78173828125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 13.0, 12.0, 30.0, 60.0, 83.0, 112.0, 210.0, 180.0, 116.0, 80.0, 51.0, 32.0, 17.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.012384414672852, -11.609152793884277, -11.205920219421387, -10.802688598632812, -10.399456024169922, -9.996224403381348, -9.592992782592773, -9.189760208129883, -8.786528587341309, -8.383296966552734, -7.980064392089844, -7.5768327713012695, -7.173600673675537, -6.770368576049805, -6.367136478424072, -5.96390438079834, -5.560672283172607, -5.157440185546875, -4.754208087921143, -4.35097599029541, -3.947744369506836, -3.5445122718811035, -3.141280174255371, -2.7380483150482178, -2.3348162174224854, -1.9315842390060425, -1.5283522605895996, -1.1251201629638672, -0.7218881845474243, -0.31865620613098145, 0.08457589149475098, 0.4878077507019043, 0.8910398483276367, 1.2942718267440796, 1.6975038051605225, 2.100735902786255, 2.503967761993408, 2.9071998596191406, 3.310431957244873, 3.7136638164520264, 4.11689567565918, 4.520127773284912, 4.9233598709106445, 5.326591491699219, 5.729823589324951, 6.133055686950684, 6.536287784576416, 6.939519882202148, 7.342751979827881, 7.745984077453613, 8.149215698242188, 8.552448272705078, 8.955679893493652, 9.358911514282227, 9.762144088745117, 10.165375709533691, 10.568608283996582, 10.971839904785156, 11.375072479248047, 11.778304100036621, 12.181536674499512, 12.584768295288086, 12.988000869750977, 13.39123249053955, 13.794464111328125]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 2.0, 7.0, 10.0, 5.0, 16.0, 17.0, 16.0, 21.0, 20.0, 23.0, 24.0, 21.0, 33.0, 36.0, 34.0, 33.0, 49.0, 59.0, 51.0, 42.0, 56.0, 48.0, 41.0, 45.0, 35.0, 39.0, 23.0, 24.0, 30.0, 30.0, 27.0, 23.0, 14.0, 7.0, 12.0, 6.0, 4.0, 5.0, 3.0, 5.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.212226867675781, -5.007685661315918, -4.8031439781188965, -4.598602771759033, -4.39406156539917, -4.189519882202148, -3.984978675842285, -3.780437469482422, -3.5758960247039795, -3.371354579925537, -3.166813373565674, -2.9622719287872314, -2.757730484008789, -2.553189277648926, -2.3486478328704834, -2.144106388092041, -1.9395651817321777, -1.735023856163025, -1.530482530593872, -1.3259410858154297, -1.1213997602462769, -0.916858434677124, -0.7123169898986816, -0.5077756643295288, -0.303234338760376, -0.09869298338890076, 0.10584837198257446, 0.31038975715637207, 0.5149310827255249, 0.7194724082946777, 0.9240138530731201, 1.128555178642273, 1.3330965042114258, 1.5376378297805786, 1.7421791553497314, 1.9467206001281738, 2.151261806488037, 2.3558032512664795, 2.560344696044922, 2.764885902404785, 2.9694273471832275, 3.17396879196167, 3.378509998321533, 3.5830514430999756, 3.787592887878418, 3.9921340942382812, 4.1966753005981445, 4.401216983795166, 4.605758190155029, 4.810299396514893, 5.014841079711914, 5.219382286071777, 5.423923492431641, 5.628464698791504, 5.833006381988525, 6.037547588348389, 6.24208927154541, 6.446630477905273, 6.651172161102295, 6.855713367462158, 7.0602545738220215, 7.264796257019043, 7.469337463378906, 7.6738786697387695, 7.878419876098633]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 8.0, 11.0, 11.0, 20.0, 36.0, 50.0, 75.0, 142.0, 188.0, 333.0, 575.0, 1008.0, 1911.0, 3793.0, 8379.0, 19637.0, 56445.0, 245986.0, 3005655.0, 691053.0, 103864.0, 31374.0, 12343.0, 5410.0, 2642.0, 1397.0, 783.0, 418.0, 243.0, 160.0, 91.0, 60.0, 55.0, 34.0, 27.0, 15.0, 23.0, 7.0, 10.0, 3.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.001953125, -0.9614410400390625, -0.920928955078125, -0.8804168701171875, -0.83990478515625, -0.7993927001953125, -0.758880615234375, -0.7183685302734375, -0.6778564453125, -0.6373443603515625, -0.596832275390625, -0.5563201904296875, -0.51580810546875, -0.4752960205078125, -0.434783935546875, -0.3942718505859375, -0.353759765625, -0.3132476806640625, -0.272735595703125, -0.2322235107421875, -0.19171142578125, -0.1511993408203125, -0.110687255859375, -0.0701751708984375, -0.0296630859375, 0.0108489990234375, 0.051361083984375, 0.0918731689453125, 0.13238525390625, 0.1728973388671875, 0.213409423828125, 0.2539215087890625, 0.29443359375, 0.3349456787109375, 0.375457763671875, 0.4159698486328125, 0.45648193359375, 0.4969940185546875, 0.537506103515625, 0.5780181884765625, 0.6185302734375, 0.6590423583984375, 0.699554443359375, 0.7400665283203125, 0.78057861328125, 0.8210906982421875, 0.861602783203125, 0.9021148681640625, 0.942626953125, 0.9831390380859375, 1.023651123046875, 1.0641632080078125, 1.10467529296875, 1.1451873779296875, 1.185699462890625, 1.2262115478515625, 1.2667236328125, 1.3072357177734375, 1.347747802734375, 1.3882598876953125, 1.42877197265625, 1.4692840576171875, 1.509796142578125, 1.5503082275390625, 1.5908203125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 8.0, 10.0, 8.0, 24.0, 13.0, 26.0, 26.0, 34.0, 36.0, 40.0, 45.0, 58.0, 51.0, 64.0, 58.0, 57.0, 59.0, 54.0, 55.0, 41.0, 53.0, 42.0, 32.0, 20.0, 17.0, 14.0, 14.0, 12.0, 7.0, 8.0, 8.0, 3.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2291259765625, -0.21923255920410156, -0.20933914184570312, -0.1994457244873047, -0.18955230712890625, -0.1796588897705078, -0.16976547241210938, -0.15987205505371094, -0.1499786376953125, -0.14008522033691406, -0.13019180297851562, -0.12029838562011719, -0.11040496826171875, -0.10051155090332031, -0.09061813354492188, -0.08072471618652344, -0.070831298828125, -0.06093788146972656, -0.051044464111328125, -0.04115104675292969, -0.03125762939453125, -0.021364212036132812, -0.011470794677734375, -0.0015773773193359375, 0.0083160400390625, 0.018209457397460938, 0.028102874755859375, 0.03799629211425781, 0.04788970947265625, 0.05778312683105469, 0.06767654418945312, 0.07756996154785156, 0.08746337890625, 0.09735679626464844, 0.10725021362304688, 0.11714363098144531, 0.12703704833984375, 0.1369304656982422, 0.14682388305664062, 0.15671730041503906, 0.1666107177734375, 0.17650413513183594, 0.18639755249023438, 0.1962909698486328, 0.20618438720703125, 0.2160778045654297, 0.22597122192382812, 0.23586463928222656, 0.245758056640625, 0.25565147399902344, 0.2655448913574219, 0.2754383087158203, 0.28533172607421875, 0.2952251434326172, 0.3051185607910156, 0.31501197814941406, 0.3249053955078125, 0.33479881286621094, 0.3446922302246094, 0.3545856475830078, 0.36447906494140625, 0.3743724822998047, 0.3842658996582031, 0.39415931701660156, 0.404052734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 4.0, 9.0, 14.0, 19.0, 30.0, 42.0, 92.0, 129.0, 226.0, 417.0, 858.0, 1972.0, 5530.0, 19323.0, 99330.0, 1382571.0, 2515471.0, 133481.0, 23926.0, 6538.0, 2275.0, 966.0, 460.0, 254.0, 148.0, 77.0, 42.0, 28.0, 20.0, 10.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.337890625, -1.2799072265625, -1.221923828125, -1.1639404296875, -1.10595703125, -1.0479736328125, -0.989990234375, -0.9320068359375, -0.8740234375, -0.8160400390625, -0.758056640625, -0.7000732421875, -0.64208984375, -0.5841064453125, -0.526123046875, -0.4681396484375, -0.41015625, -0.3521728515625, -0.294189453125, -0.2362060546875, -0.17822265625, -0.1202392578125, -0.062255859375, -0.0042724609375, 0.0537109375, 0.1116943359375, 0.169677734375, 0.2276611328125, 0.28564453125, 0.3436279296875, 0.401611328125, 0.4595947265625, 0.517578125, 0.5755615234375, 0.633544921875, 0.6915283203125, 0.74951171875, 0.8074951171875, 0.865478515625, 0.9234619140625, 0.9814453125, 1.0394287109375, 1.097412109375, 1.1553955078125, 1.21337890625, 1.2713623046875, 1.329345703125, 1.3873291015625, 1.4453125, 1.5032958984375, 1.561279296875, 1.6192626953125, 1.67724609375, 1.7352294921875, 1.793212890625, 1.8511962890625, 1.9091796875, 1.9671630859375, 2.025146484375, 2.0831298828125, 2.14111328125, 2.1990966796875, 2.257080078125, 2.3150634765625, 2.373046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 6.0, 3.0, 3.0, 1.0, 6.0, 9.0, 10.0, 11.0, 19.0, 15.0, 41.0, 40.0, 58.0, 83.0, 125.0, 186.0, 329.0, 565.0, 1105.0, 567.0, 306.0, 193.0, 107.0, 81.0, 56.0, 38.0, 21.0, 23.0, 18.0, 10.0, 12.0, 9.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.47607421875, -0.4548797607421875, -0.433685302734375, -0.4124908447265625, -0.39129638671875, -0.3701019287109375, -0.348907470703125, -0.3277130126953125, -0.3065185546875, -0.2853240966796875, -0.264129638671875, -0.2429351806640625, -0.22174072265625, -0.2005462646484375, -0.179351806640625, -0.1581573486328125, -0.136962890625, -0.1157684326171875, -0.094573974609375, -0.0733795166015625, -0.05218505859375, -0.0309906005859375, -0.009796142578125, 0.0113983154296875, 0.0325927734375, 0.0537872314453125, 0.074981689453125, 0.0961761474609375, 0.11737060546875, 0.1385650634765625, 0.159759521484375, 0.1809539794921875, 0.2021484375, 0.2233428955078125, 0.244537353515625, 0.2657318115234375, 0.28692626953125, 0.3081207275390625, 0.329315185546875, 0.3505096435546875, 0.3717041015625, 0.3928985595703125, 0.414093017578125, 0.4352874755859375, 0.45648193359375, 0.4776763916015625, 0.498870849609375, 0.5200653076171875, 0.541259765625, 0.5624542236328125, 0.583648681640625, 0.6048431396484375, 0.62603759765625, 0.6472320556640625, 0.668426513671875, 0.6896209716796875, 0.7108154296875, 0.7320098876953125, 0.753204345703125, 0.7743988037109375, 0.79559326171875, 0.8167877197265625, 0.837982177734375, 0.8591766357421875, 0.88037109375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 12.0, 10.0, 15.0, 33.0, 68.0, 88.0, 107.0, 152.0, 133.0, 111.0, 90.0, 78.0, 38.0, 19.0, 19.0, 11.0, 5.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0810368061065674, -1.8784935474395752, -1.6759504079818726, -1.4734071493148804, -1.2708640098571777, -1.0683207511901855, -0.8657774925231934, -0.6632343530654907, -0.46069109439849854, -0.2581478953361511, -0.05560466647148132, 0.14693856239318848, 0.3494817614555359, 0.5520249605178833, 0.7545682191848755, 0.9571113586425781, 1.1596546173095703, 1.3621978759765625, 1.5647410154342651, 1.7672842741012573, 1.96982741355896, 2.172370672225952, 2.3749139308929443, 2.5774569511413574, 2.7800002098083496, 2.982543468475342, 3.185086727142334, 3.387629985809326, 3.5901730060577393, 3.7927162647247314, 3.9952595233917236, 4.197802543640137, 4.400346279144287, 4.602889537811279, 4.8054327964782715, 5.007976055145264, 5.210519313812256, 5.41306209564209, 5.615605354309082, 5.818148612976074, 6.020691871643066, 6.223235130310059, 6.425778388977051, 6.628321647644043, 6.830864906311035, 7.033408164978027, 7.2359514236450195, 7.4384942054748535, 7.641037940979004, 7.843581199645996, 8.046124458312988, 8.24866771697998, 8.451210975646973, 8.653754234313965, 8.856297492980957, 9.05884075164795, 9.261383056640625, 9.463926315307617, 9.66646957397461, 9.869012832641602, 10.071556091308594, 10.274099349975586, 10.476642608642578, 10.67918586730957, 10.881729125976562]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 11.0, 8.0, 9.0, 8.0, 14.0, 18.0, 13.0, 12.0, 23.0, 26.0, 25.0, 40.0, 30.0, 33.0, 38.0, 32.0, 40.0, 36.0, 31.0, 38.0, 50.0, 49.0, 33.0, 49.0, 37.0, 41.0, 27.0, 29.0, 25.0, 27.0, 12.0, 25.0, 23.0, 16.0, 8.0, 9.0, 11.0, 6.0, 10.0, 4.0, 9.0, 0.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-3.620591640472412, -3.5141234397888184, -3.4076550006866455, -3.3011868000030518, -3.194718360900879, -3.088250160217285, -2.9817819595336914, -2.8753137588500977, -2.768845319747925, -2.662377119064331, -2.555908679962158, -2.4494404792785645, -2.3429722785949707, -2.236503839492798, -2.130035638809204, -2.0235671997070312, -1.9170989990234375, -1.8106306791305542, -1.704162359237671, -1.5976941585540771, -1.4912258386611938, -1.3847575187683105, -1.2782893180847168, -1.1718209981918335, -1.0653526782989502, -0.9588843584060669, -0.8524160981178284, -0.7459478378295898, -0.6394795179367065, -0.5330111980438232, -0.4265429377555847, -0.3200746774673462, -0.2136063575744629, -0.10713806748390198, -0.0006697773933410645, 0.10579851269721985, 0.21226680278778076, 0.31873512268066406, 0.4252033829689026, 0.5316716432571411, 0.6381399631500244, 0.7446082830429077, 0.8510765433311462, 0.9575448036193848, 1.064013123512268, 1.1704814434051514, 1.2769496440887451, 1.3834179639816284, 1.4898862838745117, 1.596354603767395, 1.7028229236602783, 1.809291124343872, 1.9157594442367554, 2.0222277641296387, 2.1286959648132324, 2.235164165496826, 2.341632604598999, 2.4481008052825928, 2.5545692443847656, 2.6610374450683594, 2.767505645751953, 2.873974084854126, 2.9804422855377197, 3.0869107246398926, 3.1933789253234863]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 11.0, 17.0, 16.0, 35.0, 50.0, 71.0, 98.0, 176.0, 234.0, 394.0, 612.0, 943.0, 1617.0, 2666.0, 4625.0, 8287.0, 14945.0, 28748.0, 55324.0, 105372.0, 178576.0, 223299.0, 184513.0, 111823.0, 59139.0, 30349.0, 15863.0, 8445.0, 4800.0, 2954.0, 1710.0, 1032.0, 633.0, 403.0, 264.0, 182.0, 98.0, 76.0, 46.0, 37.0, 14.0, 16.0, 15.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.70751953125, -0.684356689453125, -0.66119384765625, -0.638031005859375, -0.6148681640625, -0.591705322265625, -0.56854248046875, -0.545379638671875, -0.522216796875, -0.499053955078125, -0.47589111328125, -0.452728271484375, -0.4295654296875, -0.406402587890625, -0.38323974609375, -0.360076904296875, -0.3369140625, -0.313751220703125, -0.29058837890625, -0.267425537109375, -0.2442626953125, -0.221099853515625, -0.19793701171875, -0.174774169921875, -0.151611328125, -0.128448486328125, -0.10528564453125, -0.082122802734375, -0.0589599609375, -0.035797119140625, -0.01263427734375, 0.010528564453125, 0.03369140625, 0.056854248046875, 0.08001708984375, 0.103179931640625, 0.1263427734375, 0.149505615234375, 0.17266845703125, 0.195831298828125, 0.218994140625, 0.242156982421875, 0.26531982421875, 0.288482666015625, 0.3116455078125, 0.334808349609375, 0.35797119140625, 0.381134033203125, 0.404296875, 0.427459716796875, 0.45062255859375, 0.473785400390625, 0.4969482421875, 0.520111083984375, 0.54327392578125, 0.566436767578125, 0.589599609375, 0.612762451171875, 0.63592529296875, 0.659088134765625, 0.6822509765625, 0.705413818359375, 0.72857666015625, 0.751739501953125, 0.77490234375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 7.0, 10.0, 9.0, 9.0, 13.0, 19.0, 19.0, 23.0, 23.0, 28.0, 24.0, 26.0, 41.0, 40.0, 40.0, 44.0, 45.0, 40.0, 47.0, 43.0, 47.0, 45.0, 34.0, 34.0, 37.0, 32.0, 31.0, 31.0, 25.0, 22.0, 21.0, 18.0, 16.0, 11.0, 10.0, 10.0, 8.0, 5.0, 3.0, 5.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.3447265625, -0.33455657958984375, -0.3243865966796875, -0.31421661376953125, -0.304046630859375, -0.29387664794921875, -0.2837066650390625, -0.27353668212890625, -0.26336669921875, -0.25319671630859375, -0.2430267333984375, -0.23285675048828125, -0.222686767578125, -0.21251678466796875, -0.2023468017578125, -0.19217681884765625, -0.1820068359375, -0.17183685302734375, -0.1616668701171875, -0.15149688720703125, -0.141326904296875, -0.13115692138671875, -0.1209869384765625, -0.11081695556640625, -0.10064697265625, -0.09047698974609375, -0.0803070068359375, -0.07013702392578125, -0.059967041015625, -0.04979705810546875, -0.0396270751953125, -0.02945709228515625, -0.019287109375, -0.00911712646484375, 0.0010528564453125, 0.01122283935546875, 0.021392822265625, 0.03156280517578125, 0.0417327880859375, 0.05190277099609375, 0.06207275390625, 0.07224273681640625, 0.0824127197265625, 0.09258270263671875, 0.102752685546875, 0.11292266845703125, 0.1230926513671875, 0.13326263427734375, 0.1434326171875, 0.15360260009765625, 0.1637725830078125, 0.17394256591796875, 0.184112548828125, 0.19428253173828125, 0.2044525146484375, 0.21462249755859375, 0.22479248046875, 0.23496246337890625, 0.2451324462890625, 0.25530242919921875, 0.265472412109375, 0.27564239501953125, 0.2858123779296875, 0.29598236083984375, 0.30615234375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 5.0, 5.0, 9.0, 12.0, 10.0, 27.0, 32.0, 54.0, 91.0, 130.0, 231.0, 425.0, 797.0, 1683.0, 3951.0, 11245.0, 38135.0, 167165.0, 500554.0, 245105.0, 54475.0, 15012.0, 5206.0, 2045.0, 938.0, 500.0, 282.0, 168.0, 91.0, 53.0, 48.0, 22.0, 20.0, 7.0, 13.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8310546875, -1.773162841796875, -1.71527099609375, -1.657379150390625, -1.5994873046875, -1.541595458984375, -1.48370361328125, -1.425811767578125, -1.367919921875, -1.310028076171875, -1.25213623046875, -1.194244384765625, -1.1363525390625, -1.078460693359375, -1.02056884765625, -0.962677001953125, -0.90478515625, -0.846893310546875, -0.78900146484375, -0.731109619140625, -0.6732177734375, -0.615325927734375, -0.55743408203125, -0.499542236328125, -0.441650390625, -0.383758544921875, -0.32586669921875, -0.267974853515625, -0.2100830078125, -0.152191162109375, -0.09429931640625, -0.036407470703125, 0.021484375, 0.079376220703125, 0.13726806640625, 0.195159912109375, 0.2530517578125, 0.310943603515625, 0.36883544921875, 0.426727294921875, 0.484619140625, 0.542510986328125, 0.60040283203125, 0.658294677734375, 0.7161865234375, 0.774078369140625, 0.83197021484375, 0.889862060546875, 0.94775390625, 1.005645751953125, 1.06353759765625, 1.121429443359375, 1.1793212890625, 1.237213134765625, 1.29510498046875, 1.352996826171875, 1.410888671875, 1.468780517578125, 1.52667236328125, 1.584564208984375, 1.6424560546875, 1.700347900390625, 1.75823974609375, 1.816131591796875, 1.8740234375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 7.0, 9.0, 11.0, 14.0, 15.0, 20.0, 23.0, 30.0, 32.0, 44.0, 50.0, 47.0, 55.0, 48.0, 52.0, 49.0, 57.0, 47.0, 50.0, 53.0, 50.0, 39.0, 27.0, 29.0, 19.0, 21.0, 20.0, 15.0, 20.0, 11.0, 8.0, 5.0, 4.0, 2.0, 8.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.337890625, -3.25225830078125, -3.1666259765625, -3.08099365234375, -2.995361328125, -2.90972900390625, -2.8240966796875, -2.73846435546875, -2.65283203125, -2.56719970703125, -2.4815673828125, -2.39593505859375, -2.310302734375, -2.22467041015625, -2.1390380859375, -2.05340576171875, -1.9677734375, -1.88214111328125, -1.7965087890625, -1.71087646484375, -1.625244140625, -1.53961181640625, -1.4539794921875, -1.36834716796875, -1.28271484375, -1.19708251953125, -1.1114501953125, -1.02581787109375, -0.940185546875, -0.85455322265625, -0.7689208984375, -0.68328857421875, -0.59765625, -0.51202392578125, -0.4263916015625, -0.34075927734375, -0.255126953125, -0.16949462890625, -0.0838623046875, 0.00177001953125, 0.08740234375, 0.17303466796875, 0.2586669921875, 0.34429931640625, 0.429931640625, 0.51556396484375, 0.6011962890625, 0.68682861328125, 0.7724609375, 0.85809326171875, 0.9437255859375, 1.02935791015625, 1.114990234375, 1.20062255859375, 1.2862548828125, 1.37188720703125, 1.45751953125, 1.54315185546875, 1.6287841796875, 1.71441650390625, 1.800048828125, 1.88568115234375, 1.9713134765625, 2.05694580078125, 2.142578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 9.0, 16.0, 26.0, 42.0, 59.0, 67.0, 135.0, 269.0, 528.0, 1224.0, 3378.0, 11446.0, 50866.0, 308387.0, 532516.0, 109381.0, 21085.0, 5608.0, 1884.0, 780.0, 347.0, 198.0, 96.0, 50.0, 42.0, 31.0, 20.0, 15.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.025390625, -0.991455078125, -0.95751953125, -0.923583984375, -0.8896484375, -0.855712890625, -0.82177734375, -0.787841796875, -0.75390625, -0.719970703125, -0.68603515625, -0.652099609375, -0.6181640625, -0.584228515625, -0.55029296875, -0.516357421875, -0.482421875, -0.448486328125, -0.41455078125, -0.380615234375, -0.3466796875, -0.312744140625, -0.27880859375, -0.244873046875, -0.2109375, -0.177001953125, -0.14306640625, -0.109130859375, -0.0751953125, -0.041259765625, -0.00732421875, 0.026611328125, 0.060546875, 0.094482421875, 0.12841796875, 0.162353515625, 0.1962890625, 0.230224609375, 0.26416015625, 0.298095703125, 0.33203125, 0.365966796875, 0.39990234375, 0.433837890625, 0.4677734375, 0.501708984375, 0.53564453125, 0.569580078125, 0.603515625, 0.637451171875, 0.67138671875, 0.705322265625, 0.7392578125, 0.773193359375, 0.80712890625, 0.841064453125, 0.875, 0.908935546875, 0.94287109375, 0.976806640625, 1.0107421875, 1.044677734375, 1.07861328125, 1.112548828125, 1.146484375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 1.0, 5.0, 9.0, 11.0, 22.0, 24.0, 33.0, 22.0, 41.0, 45.0, 62.0, 59.0, 71.0, 77.0, 69.0, 67.0, 76.0, 55.0, 42.0, 53.0, 33.0, 38.0, 15.0, 10.0, 16.0, 14.0, 7.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.092952728271484e-05, -6.818585097789764e-05, -6.544217467308044e-05, -6.269849836826324e-05, -5.9954822063446045e-05, -5.7211145758628845e-05, -5.4467469453811646e-05, -5.1723793148994446e-05, -4.8980116844177246e-05, -4.6236440539360046e-05, -4.349276423454285e-05, -4.074908792972565e-05, -3.800541162490845e-05, -3.526173532009125e-05, -3.251805901527405e-05, -2.9774382710456848e-05, -2.703070640563965e-05, -2.428703010082245e-05, -2.154335379600525e-05, -1.879967749118805e-05, -1.605600118637085e-05, -1.331232488155365e-05, -1.056864857673645e-05, -7.82497227191925e-06, -5.081295967102051e-06, -2.337619662284851e-06, 4.0605664253234863e-07, 3.1497329473495483e-06, 5.893409252166748e-06, 8.637085556983948e-06, 1.1380761861801147e-05, 1.4124438166618347e-05, 1.6868114471435547e-05, 1.9611790776252747e-05, 2.2355467081069946e-05, 2.5099143385887146e-05, 2.7842819690704346e-05, 3.0586495995521545e-05, 3.3330172300338745e-05, 3.6073848605155945e-05, 3.8817524909973145e-05, 4.1561201214790344e-05, 4.4304877519607544e-05, 4.7048553824424744e-05, 4.979223012924194e-05, 5.253590643405914e-05, 5.527958273887634e-05, 5.802325904369354e-05, 6.076693534851074e-05, 6.351061165332794e-05, 6.625428795814514e-05, 6.899796426296234e-05, 7.174164056777954e-05, 7.448531687259674e-05, 7.722899317741394e-05, 7.997266948223114e-05, 8.271634578704834e-05, 8.546002209186554e-05, 8.820369839668274e-05, 9.094737470149994e-05, 9.369105100631714e-05, 9.643472731113434e-05, 9.917840361595154e-05, 0.00010192207992076874, 0.00010466575622558594]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 10.0, 16.0, 23.0, 24.0, 48.0, 102.0, 170.0, 323.0, 837.0, 2135.0, 7736.0, 42891.0, 440723.0, 492893.0, 48314.0, 8502.0, 2146.0, 883.0, 372.0, 178.0, 94.0, 54.0, 37.0, 18.0, 8.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6474609375, -1.5960235595703125, -1.544586181640625, -1.4931488037109375, -1.44171142578125, -1.3902740478515625, -1.338836669921875, -1.2873992919921875, -1.2359619140625, -1.1845245361328125, -1.133087158203125, -1.0816497802734375, -1.03021240234375, -0.9787750244140625, -0.927337646484375, -0.8759002685546875, -0.824462890625, -0.7730255126953125, -0.721588134765625, -0.6701507568359375, -0.61871337890625, -0.5672760009765625, -0.515838623046875, -0.4644012451171875, -0.4129638671875, -0.3615264892578125, -0.310089111328125, -0.2586517333984375, -0.20721435546875, -0.1557769775390625, -0.104339599609375, -0.0529022216796875, -0.00146484375, 0.0499725341796875, 0.101409912109375, 0.1528472900390625, 0.20428466796875, 0.2557220458984375, 0.307159423828125, 0.3585968017578125, 0.4100341796875, 0.4614715576171875, 0.512908935546875, 0.5643463134765625, 0.61578369140625, 0.6672210693359375, 0.718658447265625, 0.7700958251953125, 0.821533203125, 0.8729705810546875, 0.924407958984375, 0.9758453369140625, 1.02728271484375, 1.0787200927734375, 1.130157470703125, 1.1815948486328125, 1.2330322265625, 1.2844696044921875, 1.335906982421875, 1.3873443603515625, 1.43878173828125, 1.4902191162109375, 1.541656494140625, 1.5930938720703125, 1.64453125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 12.0, 18.0, 20.0, 25.0, 43.0, 57.0, 83.0, 100.0, 109.0, 121.0, 104.0, 104.0, 58.0, 42.0, 28.0, 19.0, 10.0, 14.0, 3.0, 6.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0576171875, -1.0094146728515625, -0.961212158203125, -0.9130096435546875, -0.86480712890625, -0.8166046142578125, -0.768402099609375, -0.7201995849609375, -0.6719970703125, -0.6237945556640625, -0.575592041015625, -0.5273895263671875, -0.47918701171875, -0.4309844970703125, -0.382781982421875, -0.3345794677734375, -0.286376953125, -0.2381744384765625, -0.189971923828125, -0.1417694091796875, -0.09356689453125, -0.0453643798828125, 0.002838134765625, 0.0510406494140625, 0.0992431640625, 0.1474456787109375, 0.195648193359375, 0.2438507080078125, 0.29205322265625, 0.3402557373046875, 0.388458251953125, 0.4366607666015625, 0.48486328125, 0.5330657958984375, 0.581268310546875, 0.6294708251953125, 0.67767333984375, 0.7258758544921875, 0.774078369140625, 0.8222808837890625, 0.8704833984375, 0.9186859130859375, 0.966888427734375, 1.0150909423828125, 1.06329345703125, 1.1114959716796875, 1.159698486328125, 1.2079010009765625, 1.256103515625, 1.3043060302734375, 1.352508544921875, 1.4007110595703125, 1.44891357421875, 1.4971160888671875, 1.545318603515625, 1.5935211181640625, 1.6417236328125, 1.6899261474609375, 1.738128662109375, 1.7863311767578125, 1.83453369140625, 1.8827362060546875, 1.930938720703125, 1.9791412353515625, 2.02734375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 49.0, 231.0, 466.0, 193.0, 46.0, 17.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390380859375, -14.646133422851562, -12.901885032653809, -11.157637596130371, -9.413389205932617, -7.66914176940918, -5.924894332885742, -4.180645942687988, -2.436398506164551, -0.6921507120132446, 1.0520970821380615, 2.796344757080078, 4.540592670440674, 6.2848405838012695, 8.029088020324707, 9.773336410522461, 11.517583847045898, 13.261831283569336, 15.00607967376709, 16.750328063964844, 18.49457550048828, 20.23882293701172, 21.983070373535156, 23.727317810058594, 25.47156524658203, 27.21581268310547, 28.960060119628906, 30.704307556152344, 32.44855499267578, 34.19280242919922, 35.937049865722656, 37.68130111694336, 39.4255485534668, 41.169795989990234, 42.91404342651367, 44.65829086303711, 46.40253829956055, 48.14678955078125, 49.89103698730469, 51.635284423828125, 53.37953186035156, 55.123779296875, 56.86802673339844, 58.612274169921875, 60.35652160644531, 62.10076904296875, 63.84501647949219, 65.58926391601562, 67.33351135253906, 69.0777587890625, 70.82200622558594, 72.56625366210938, 74.31050109863281, 76.05474853515625, 77.79899597167969, 79.54324340820312, 81.2874984741211, 83.03174591064453, 84.77599334716797, 86.5202407836914, 88.26448822021484, 90.00873565673828, 91.75298309326172, 93.49723052978516, 95.2414779663086]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 8.0, 8.0, 8.0, 8.0, 9.0, 17.0, 19.0, 19.0, 22.0, 30.0, 44.0, 43.0, 37.0, 48.0, 62.0, 63.0, 58.0, 49.0, 61.0, 61.0, 38.0, 48.0, 37.0, 32.0, 36.0, 17.0, 22.0, 13.0, 21.0, 10.0, 11.0, 17.0, 4.0, 4.0, 6.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.327043533325195, -14.821370124816895, -14.315696716308594, -13.810022354125977, -13.304348945617676, -12.798675537109375, -12.293001174926758, -11.787327766418457, -11.281654357910156, -10.775980949401855, -10.270307540893555, -9.764633178710938, -9.258959770202637, -8.753286361694336, -8.247611999511719, -7.741938591003418, -7.236265182495117, -6.730591773986816, -6.224917888641357, -5.719244003295898, -5.213570594787598, -4.707897186279297, -4.202223300933838, -3.696549654006958, -3.190876007080078, -2.6852023601531982, -2.1795287132263184, -1.6738550662994385, -1.1681814193725586, -0.6625077724456787, -0.15683412551879883, 0.34883952140808105, 0.8545150756835938, 1.3601887226104736, 1.8658623695373535, 2.3715360164642334, 2.8772096633911133, 3.382883310317993, 3.888556957244873, 4.394230842590332, 4.899904251098633, 5.405577659606934, 5.911251544952393, 6.416925430297852, 6.922598838806152, 7.428272247314453, 7.933946132659912, 8.439620018005371, 8.945293426513672, 9.450966835021973, 9.956640243530273, 10.46231460571289, 10.967988014221191, 11.473661422729492, 11.97933578491211, 12.48500919342041, 12.990682601928711, 13.496356010437012, 14.002029418945312, 14.50770378112793, 15.01337718963623, 15.519050598144531, 16.02472496032715, 16.530397415161133, 17.03607177734375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 11.0, 7.0, 19.0, 29.0, 37.0, 62.0, 91.0, 157.0, 289.0, 524.0, 1163.0, 2956.0, 11633.0, 202341.0, 3945030.0, 22460.0, 4366.0, 1569.0, 668.0, 345.0, 196.0, 132.0, 57.0, 53.0, 33.0, 20.0, 13.0, 7.0, 6.0, 8.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.66015625, -1.58172607421875, -1.5032958984375, -1.42486572265625, -1.346435546875, -1.26800537109375, -1.1895751953125, -1.11114501953125, -1.03271484375, -0.95428466796875, -0.8758544921875, -0.79742431640625, -0.718994140625, -0.64056396484375, -0.5621337890625, -0.48370361328125, -0.4052734375, -0.32684326171875, -0.2484130859375, -0.16998291015625, -0.091552734375, -0.01312255859375, 0.0653076171875, 0.14373779296875, 0.22216796875, 0.30059814453125, 0.3790283203125, 0.45745849609375, 0.535888671875, 0.61431884765625, 0.6927490234375, 0.77117919921875, 0.849609375, 0.92803955078125, 1.0064697265625, 1.08489990234375, 1.163330078125, 1.24176025390625, 1.3201904296875, 1.39862060546875, 1.47705078125, 1.55548095703125, 1.6339111328125, 1.71234130859375, 1.790771484375, 1.86920166015625, 1.9476318359375, 2.02606201171875, 2.1044921875, 2.18292236328125, 2.2613525390625, 2.33978271484375, 2.418212890625, 2.49664306640625, 2.5750732421875, 2.65350341796875, 2.73193359375, 2.81036376953125, 2.8887939453125, 2.96722412109375, 3.045654296875, 3.12408447265625, 3.2025146484375, 3.28094482421875, 3.359375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 13.0, 6.0, 22.0, 23.0, 23.0, 31.0, 40.0, 44.0, 48.0, 58.0, 51.0, 53.0, 65.0, 55.0, 69.0, 66.0, 46.0, 51.0, 46.0, 28.0, 31.0, 20.0, 21.0, 11.0, 15.0, 10.0, 7.0, 4.0, 5.0, 6.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66796875, -0.6471023559570312, -0.6262359619140625, -0.6053695678710938, -0.584503173828125, -0.5636367797851562, -0.5427703857421875, -0.5219039916992188, -0.50103759765625, -0.48017120361328125, -0.4593048095703125, -0.43843841552734375, -0.417572021484375, -0.39670562744140625, -0.3758392333984375, -0.35497283935546875, -0.3341064453125, -0.31324005126953125, -0.2923736572265625, -0.27150726318359375, -0.250640869140625, -0.22977447509765625, -0.2089080810546875, -0.18804168701171875, -0.16717529296875, -0.14630889892578125, -0.1254425048828125, -0.10457611083984375, -0.083709716796875, -0.06284332275390625, -0.0419769287109375, -0.02111053466796875, -0.000244140625, 0.02062225341796875, 0.0414886474609375, 0.06235504150390625, 0.083221435546875, 0.10408782958984375, 0.1249542236328125, 0.14582061767578125, 0.16668701171875, 0.18755340576171875, 0.2084197998046875, 0.22928619384765625, 0.250152587890625, 0.27101898193359375, 0.2918853759765625, 0.31275177001953125, 0.3336181640625, 0.35448455810546875, 0.3753509521484375, 0.39621734619140625, 0.417083740234375, 0.43795013427734375, 0.4588165283203125, 0.47968292236328125, 0.50054931640625, 0.5214157104492188, 0.5422821044921875, 0.5631484985351562, 0.584014892578125, 0.6048812866210938, 0.6257476806640625, 0.6466140747070312, 0.66748046875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 5.0, 4.0, 9.0, 12.0, 22.0, 27.0, 29.0, 39.0, 69.0, 86.0, 104.0, 157.0, 256.0, 337.0, 530.0, 868.0, 1480.0, 2594.0, 5135.0, 12350.0, 52707.0, 3750160.0, 321133.0, 27776.0, 8599.0, 4031.0, 2133.0, 1225.0, 784.0, 509.0, 335.0, 214.0, 137.0, 109.0, 74.0, 61.0, 43.0, 32.0, 19.0, 20.0, 17.0, 12.0, 4.0, 7.0, 8.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.7578125, -1.704254150390625, -1.65069580078125, -1.597137451171875, -1.5435791015625, -1.490020751953125, -1.43646240234375, -1.382904052734375, -1.329345703125, -1.275787353515625, -1.22222900390625, -1.168670654296875, -1.1151123046875, -1.061553955078125, -1.00799560546875, -0.954437255859375, -0.90087890625, -0.847320556640625, -0.79376220703125, -0.740203857421875, -0.6866455078125, -0.633087158203125, -0.57952880859375, -0.525970458984375, -0.472412109375, -0.418853759765625, -0.36529541015625, -0.311737060546875, -0.2581787109375, -0.204620361328125, -0.15106201171875, -0.097503662109375, -0.0439453125, 0.009613037109375, 0.06317138671875, 0.116729736328125, 0.1702880859375, 0.223846435546875, 0.27740478515625, 0.330963134765625, 0.384521484375, 0.438079833984375, 0.49163818359375, 0.545196533203125, 0.5987548828125, 0.652313232421875, 0.70587158203125, 0.759429931640625, 0.81298828125, 0.866546630859375, 0.92010498046875, 0.973663330078125, 1.0272216796875, 1.080780029296875, 1.13433837890625, 1.187896728515625, 1.241455078125, 1.295013427734375, 1.34857177734375, 1.402130126953125, 1.4556884765625, 1.509246826171875, 1.56280517578125, 1.616363525390625, 1.669921875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 4.0, 9.0, 9.0, 8.0, 26.0, 50.0, 109.0, 357.0, 3131.0, 233.0, 54.0, 19.0, 16.0, 12.0, 9.0, 5.0, 2.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.289794921875, -0.2756309509277344, -0.26146697998046875, -0.24730300903320312, -0.2331390380859375, -0.21897506713867188, -0.20481109619140625, -0.19064712524414062, -0.176483154296875, -0.16231918334960938, -0.14815521240234375, -0.13399124145507812, -0.1198272705078125, -0.10566329956054688, -0.09149932861328125, -0.07733535766601562, -0.06317138671875, -0.049007415771484375, -0.03484344482421875, -0.020679473876953125, -0.0065155029296875, 0.007648468017578125, 0.02181243896484375, 0.035976409912109375, 0.050140380859375, 0.06430435180664062, 0.07846832275390625, 0.09263229370117188, 0.1067962646484375, 0.12096023559570312, 0.13512420654296875, 0.14928817749023438, 0.1634521484375, 0.17761611938476562, 0.19178009033203125, 0.20594406127929688, 0.2201080322265625, 0.23427200317382812, 0.24843597412109375, 0.2625999450683594, 0.276763916015625, 0.2909278869628906, 0.30509185791015625, 0.3192558288574219, 0.3334197998046875, 0.3475837707519531, 0.36174774169921875, 0.3759117126464844, 0.39007568359375, 0.4042396545410156, 0.41840362548828125, 0.4325675964355469, 0.4467315673828125, 0.4608955383300781, 0.47505950927734375, 0.4892234802246094, 0.503387451171875, 0.5175514221191406, 0.5317153930664062, 0.5458793640136719, 0.5600433349609375, 0.5742073059082031, 0.5883712768554688, 0.6025352478027344, 0.61669921875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 27.0, 75.0, 144.0, 242.0, 283.0, 149.0, 59.0, 20.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4405779838562012, -1.3168010711669922, -1.1930242776870728, -1.0692473649978638, -0.9454705715179443, -0.8216936588287354, -0.6979168057441711, -0.5741399526596069, -0.4503630995750427, -0.3265862464904785, -0.2028093785047531, -0.07903251051902771, 0.0447443425655365, 0.1685212254524231, 0.2922980785369873, 0.4160749316215515, 0.5398517847061157, 0.6636286377906799, 0.7874054908752441, 0.9111824035644531, 1.0349591970443726, 1.1587361097335815, 1.282512903213501, 1.40628981590271, 1.530066728591919, 1.653843641281128, 1.7776204347610474, 1.9013973474502563, 2.025174140930176, 2.1489510536193848, 2.2727279663085938, 2.3965048789978027, 2.5202815532684326, 2.6440584659576416, 2.7678353786468506, 2.8916120529174805, 3.0153889656066895, 3.1391658782958984, 3.2629427909851074, 3.3867197036743164, 3.5104963779449463, 3.6342732906341553, 3.7580502033233643, 3.881826877593994, 4.005603790283203, 4.129380702972412, 4.253157615661621, 4.37693452835083, 4.500711441040039, 4.624488353729248, 4.748265266418457, 4.872042179107666, 4.995819091796875, 5.119595527648926, 5.243372440338135, 5.367149353027344, 5.490926265716553, 5.614703178405762, 5.738480091094971, 5.86225700378418, 5.986033916473389, 6.109810829162598, 6.233587265014648, 6.357364177703857, 6.481141090393066]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 11.0, 13.0, 18.0, 18.0, 19.0, 14.0, 21.0, 27.0, 28.0, 27.0, 31.0, 29.0, 30.0, 43.0, 32.0, 41.0, 36.0, 37.0, 40.0, 35.0, 37.0, 45.0, 28.0, 33.0, 25.0, 31.0, 29.0, 32.0, 31.0, 23.0, 21.0, 22.0, 21.0, 6.0, 13.0, 10.0, 8.0, 10.0, 5.0, 6.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.018538475036621, -0.9814477562904358, -0.9443570375442505, -0.9072663187980652, -0.8701756000518799, -0.8330848217010498, -0.7959941029548645, -0.7589033842086792, -0.7218126654624939, -0.6847219467163086, -0.6476312279701233, -0.610540509223938, -0.5734497308731079, -0.5363590717315674, -0.4992682933807373, -0.462177574634552, -0.4250868558883667, -0.3879961371421814, -0.3509054183959961, -0.3138146698474884, -0.2767239511013031, -0.2396332323551178, -0.2025424987077713, -0.1654517650604248, -0.1283610463142395, -0.0912703201174736, -0.0541795939207077, -0.017088867723941803, 0.020001858472824097, 0.0570925772190094, 0.0941833108663559, 0.1312740445137024, 0.1683647632598877, 0.205455482006073, 0.2425462156534195, 0.279636949300766, 0.3167276680469513, 0.3538183867931366, 0.3909091353416443, 0.4279998540878296, 0.4650905728340149, 0.5021812915802002, 0.5392720103263855, 0.5763627290725708, 0.6134535074234009, 0.6505441665649414, 0.6876349449157715, 0.7247256636619568, 0.7618163824081421, 0.7989071011543274, 0.8359978199005127, 0.873088538646698, 0.9101792573928833, 0.9472700357437134, 0.9843607544898987, 1.021451473236084, 1.058542251586914, 1.0956330299377441, 1.1327236890792847, 1.1698144674301147, 1.2069051265716553, 1.2439959049224854, 1.2810865640640259, 1.318177342414856, 1.3552680015563965]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 6.0, 6.0, 5.0, 6.0, 13.0, 21.0, 20.0, 30.0, 34.0, 58.0, 69.0, 115.0, 168.0, 249.0, 504.0, 953.0, 2056.0, 4845.0, 13068.0, 38078.0, 126459.0, 345651.0, 336954.0, 121229.0, 36801.0, 12324.0, 4697.0, 1924.0, 922.0, 500.0, 251.0, 178.0, 103.0, 75.0, 46.0, 37.0, 28.0, 20.0, 14.0, 9.0, 10.0, 12.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.4990234375, -1.4549102783203125, -1.410797119140625, -1.3666839599609375, -1.32257080078125, -1.2784576416015625, -1.234344482421875, -1.1902313232421875, -1.1461181640625, -1.1020050048828125, -1.057891845703125, -1.0137786865234375, -0.96966552734375, -0.9255523681640625, -0.881439208984375, -0.8373260498046875, -0.793212890625, -0.7490997314453125, -0.704986572265625, -0.6608734130859375, -0.61676025390625, -0.5726470947265625, -0.528533935546875, -0.4844207763671875, -0.4403076171875, -0.3961944580078125, -0.352081298828125, -0.3079681396484375, -0.26385498046875, -0.2197418212890625, -0.175628662109375, -0.1315155029296875, -0.08740234375, -0.0432891845703125, 0.000823974609375, 0.0449371337890625, 0.08905029296875, 0.1331634521484375, 0.177276611328125, 0.2213897705078125, 0.2655029296875, 0.3096160888671875, 0.353729248046875, 0.3978424072265625, 0.44195556640625, 0.4860687255859375, 0.530181884765625, 0.5742950439453125, 0.618408203125, 0.6625213623046875, 0.706634521484375, 0.7507476806640625, 0.79486083984375, 0.8389739990234375, 0.883087158203125, 0.9272003173828125, 0.9713134765625, 1.0154266357421875, 1.059539794921875, 1.1036529541015625, 1.14776611328125, 1.1918792724609375, 1.235992431640625, 1.2801055908203125, 1.32421875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 6.0, 8.0, 9.0, 12.0, 10.0, 12.0, 16.0, 20.0, 27.0, 31.0, 49.0, 39.0, 43.0, 49.0, 58.0, 59.0, 63.0, 73.0, 66.0, 61.0, 47.0, 37.0, 27.0, 37.0, 23.0, 21.0, 16.0, 23.0, 16.0, 12.0, 5.0, 7.0, 10.0, 5.0, 0.0, 3.0, 0.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6494140625, -0.6289291381835938, -0.6084442138671875, -0.5879592895507812, -0.567474365234375, -0.5469894409179688, -0.5265045166015625, -0.5060195922851562, -0.48553466796875, -0.46504974365234375, -0.4445648193359375, -0.42407989501953125, -0.403594970703125, -0.38311004638671875, -0.3626251220703125, -0.34214019775390625, -0.3216552734375, -0.30117034912109375, -0.2806854248046875, -0.26020050048828125, -0.239715576171875, -0.21923065185546875, -0.1987457275390625, -0.17826080322265625, -0.15777587890625, -0.13729095458984375, -0.1168060302734375, -0.09632110595703125, -0.075836181640625, -0.05535125732421875, -0.0348663330078125, -0.01438140869140625, 0.006103515625, 0.02658843994140625, 0.0470733642578125, 0.06755828857421875, 0.088043212890625, 0.10852813720703125, 0.1290130615234375, 0.14949798583984375, 0.16998291015625, 0.19046783447265625, 0.2109527587890625, 0.23143768310546875, 0.251922607421875, 0.27240753173828125, 0.2928924560546875, 0.31337738037109375, 0.3338623046875, 0.35434722900390625, 0.3748321533203125, 0.39531707763671875, 0.415802001953125, 0.43628692626953125, 0.4567718505859375, 0.47725677490234375, 0.49774169921875, 0.5182266235351562, 0.5387115478515625, 0.5591964721679688, 0.579681396484375, 0.6001663208007812, 0.6206512451171875, 0.6411361694335938, 0.66162109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 6.0, 7.0, 14.0, 15.0, 28.0, 32.0, 60.0, 75.0, 156.0, 277.0, 528.0, 1101.0, 2691.0, 7821.0, 27325.0, 133030.0, 562294.0, 248235.0, 46124.0, 11842.0, 3899.0, 1493.0, 665.0, 363.0, 188.0, 117.0, 54.0, 35.0, 21.0, 16.0, 8.0, 5.0, 8.0, 8.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.1206512451171875, -2.055755615234375, -1.9908599853515625, -1.92596435546875, -1.8610687255859375, -1.796173095703125, -1.7312774658203125, -1.6663818359375, -1.6014862060546875, -1.536590576171875, -1.4716949462890625, -1.40679931640625, -1.3419036865234375, -1.277008056640625, -1.2121124267578125, -1.147216796875, -1.0823211669921875, -1.017425537109375, -0.9525299072265625, -0.88763427734375, -0.8227386474609375, -0.757843017578125, -0.6929473876953125, -0.6280517578125, -0.5631561279296875, -0.498260498046875, -0.4333648681640625, -0.36846923828125, -0.3035736083984375, -0.238677978515625, -0.1737823486328125, -0.10888671875, -0.0439910888671875, 0.020904541015625, 0.0858001708984375, 0.15069580078125, 0.2155914306640625, 0.280487060546875, 0.3453826904296875, 0.4102783203125, 0.4751739501953125, 0.540069580078125, 0.6049652099609375, 0.66986083984375, 0.7347564697265625, 0.799652099609375, 0.8645477294921875, 0.929443359375, 0.9943389892578125, 1.059234619140625, 1.1241302490234375, 1.18902587890625, 1.2539215087890625, 1.318817138671875, 1.3837127685546875, 1.4486083984375, 1.5135040283203125, 1.578399658203125, 1.6432952880859375, 1.70819091796875, 1.7730865478515625, 1.837982177734375, 1.9028778076171875, 1.9677734375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 10.0, 3.0, 10.0, 15.0, 13.0, 11.0, 17.0, 29.0, 31.0, 27.0, 44.0, 28.0, 52.0, 50.0, 63.0, 49.0, 37.0, 43.0, 49.0, 47.0, 36.0, 55.0, 43.0, 44.0, 32.0, 22.0, 20.0, 33.0, 14.0, 15.0, 14.0, 9.0, 4.0, 8.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.4375, -3.326873779296875, -3.21624755859375, -3.105621337890625, -2.9949951171875, -2.884368896484375, -2.77374267578125, -2.663116455078125, -2.552490234375, -2.441864013671875, -2.33123779296875, -2.220611572265625, -2.1099853515625, -1.999359130859375, -1.88873291015625, -1.778106689453125, -1.66748046875, -1.556854248046875, -1.44622802734375, -1.335601806640625, -1.2249755859375, -1.114349365234375, -1.00372314453125, -0.893096923828125, -0.782470703125, -0.671844482421875, -0.56121826171875, -0.450592041015625, -0.3399658203125, -0.229339599609375, -0.11871337890625, -0.008087158203125, 0.1025390625, 0.213165283203125, 0.32379150390625, 0.434417724609375, 0.5450439453125, 0.655670166015625, 0.76629638671875, 0.876922607421875, 0.987548828125, 1.098175048828125, 1.20880126953125, 1.319427490234375, 1.4300537109375, 1.540679931640625, 1.65130615234375, 1.761932373046875, 1.87255859375, 1.983184814453125, 2.09381103515625, 2.204437255859375, 2.3150634765625, 2.425689697265625, 2.53631591796875, 2.646942138671875, 2.757568359375, 2.868194580078125, 2.97882080078125, 3.089447021484375, 3.2000732421875, 3.310699462890625, 3.42132568359375, 3.531951904296875, 3.642578125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 11.0, 16.0, 34.0, 50.0, 106.0, 261.0, 1298.0, 16133.0, 902038.0, 124067.0, 3665.0, 574.0, 158.0, 52.0, 39.0, 26.0, 8.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.466796875, -3.37493896484375, -3.2830810546875, -3.19122314453125, -3.099365234375, -3.00750732421875, -2.9156494140625, -2.82379150390625, -2.73193359375, -2.64007568359375, -2.5482177734375, -2.45635986328125, -2.364501953125, -2.27264404296875, -2.1807861328125, -2.08892822265625, -1.9970703125, -1.90521240234375, -1.8133544921875, -1.72149658203125, -1.629638671875, -1.53778076171875, -1.4459228515625, -1.35406494140625, -1.26220703125, -1.17034912109375, -1.0784912109375, -0.98663330078125, -0.894775390625, -0.80291748046875, -0.7110595703125, -0.61920166015625, -0.52734375, -0.43548583984375, -0.3436279296875, -0.25177001953125, -0.159912109375, -0.06805419921875, 0.0238037109375, 0.11566162109375, 0.20751953125, 0.29937744140625, 0.3912353515625, 0.48309326171875, 0.574951171875, 0.66680908203125, 0.7586669921875, 0.85052490234375, 0.9423828125, 1.03424072265625, 1.1260986328125, 1.21795654296875, 1.309814453125, 1.40167236328125, 1.4935302734375, 1.58538818359375, 1.67724609375, 1.76910400390625, 1.8609619140625, 1.95281982421875, 2.044677734375, 2.13653564453125, 2.2283935546875, 2.32025146484375, 2.412109375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 10.0, 13.0, 13.0, 27.0, 20.0, 38.0, 48.0, 63.0, 64.0, 78.0, 92.0, 91.0, 88.0, 69.0, 63.0, 52.0, 40.0, 34.0, 25.0, 19.0, 9.0, 13.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00010877847671508789, -0.00010554958134889603, -0.00010232068598270416, -9.90917906165123e-05, -9.586289525032043e-05, -9.263399988412857e-05, -8.94051045179367e-05, -8.617620915174484e-05, -8.294731378555298e-05, -7.971841841936111e-05, -7.648952305316925e-05, -7.326062768697739e-05, -7.003173232078552e-05, -6.680283695459366e-05, -6.35739415884018e-05, -6.034504622220993e-05, -5.7116150856018066e-05, -5.38872554898262e-05, -5.065836012363434e-05, -4.7429464757442474e-05, -4.420056939125061e-05, -4.0971674025058746e-05, -3.774277865886688e-05, -3.451388329267502e-05, -3.1284987926483154e-05, -2.805609256029129e-05, -2.4827197194099426e-05, -2.1598301827907562e-05, -1.8369406461715698e-05, -1.5140511095523834e-05, -1.191161572933197e-05, -8.682720363140106e-06, -5.453824996948242e-06, -2.224929630756378e-06, 1.0039657354354858e-06, 4.23286110162735e-06, 7.461756467819214e-06, 1.0690651834011078e-05, 1.3919547200202942e-05, 1.7148442566394806e-05, 2.037733793258667e-05, 2.3606233298778534e-05, 2.6835128664970398e-05, 3.0064024031162262e-05, 3.3292919397354126e-05, 3.652181476354599e-05, 3.9750710129737854e-05, 4.297960549592972e-05, 4.620850086212158e-05, 4.9437396228313446e-05, 5.266629159450531e-05, 5.5895186960697174e-05, 5.912408232688904e-05, 6.23529776930809e-05, 6.558187305927277e-05, 6.881076842546463e-05, 7.20396637916565e-05, 7.526855915784836e-05, 7.849745452404022e-05, 8.172634989023209e-05, 8.495524525642395e-05, 8.818414062261581e-05, 9.141303598880768e-05, 9.464193135499954e-05, 9.78708267211914e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 10.0, 19.0, 17.0, 40.0, 44.0, 66.0, 107.0, 163.0, 247.0, 479.0, 924.0, 2116.0, 5597.0, 19305.0, 102266.0, 575485.0, 281982.0, 42842.0, 10462.0, 3392.0, 1350.0, 698.0, 348.0, 183.0, 149.0, 91.0, 40.0, 39.0, 17.0, 18.0, 18.0, 9.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0537109375, -1.02154541015625, -0.9893798828125, -0.95721435546875, -0.925048828125, -0.89288330078125, -0.8607177734375, -0.82855224609375, -0.79638671875, -0.76422119140625, -0.7320556640625, -0.69989013671875, -0.667724609375, -0.63555908203125, -0.6033935546875, -0.57122802734375, -0.5390625, -0.50689697265625, -0.4747314453125, -0.44256591796875, -0.410400390625, -0.37823486328125, -0.3460693359375, -0.31390380859375, -0.28173828125, -0.24957275390625, -0.2174072265625, -0.18524169921875, -0.153076171875, -0.12091064453125, -0.0887451171875, -0.05657958984375, -0.0244140625, 0.00775146484375, 0.0399169921875, 0.07208251953125, 0.104248046875, 0.13641357421875, 0.1685791015625, 0.20074462890625, 0.23291015625, 0.26507568359375, 0.2972412109375, 0.32940673828125, 0.361572265625, 0.39373779296875, 0.4259033203125, 0.45806884765625, 0.490234375, 0.52239990234375, 0.5545654296875, 0.58673095703125, 0.618896484375, 0.65106201171875, 0.6832275390625, 0.71539306640625, 0.74755859375, 0.77972412109375, 0.8118896484375, 0.84405517578125, 0.876220703125, 0.90838623046875, 0.9405517578125, 0.97271728515625, 1.0048828125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 11.0, 10.0, 28.0, 23.0, 29.0, 59.0, 84.0, 114.0, 139.0, 156.0, 106.0, 79.0, 62.0, 20.0, 29.0, 11.0, 11.0, 11.0, 3.0, 9.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8203125, -1.7612152099609375, -1.702117919921875, -1.6430206298828125, -1.58392333984375, -1.5248260498046875, -1.465728759765625, -1.4066314697265625, -1.3475341796875, -1.2884368896484375, -1.229339599609375, -1.1702423095703125, -1.11114501953125, -1.0520477294921875, -0.992950439453125, -0.9338531494140625, -0.874755859375, -0.8156585693359375, -0.756561279296875, -0.6974639892578125, -0.63836669921875, -0.5792694091796875, -0.520172119140625, -0.4610748291015625, -0.4019775390625, -0.3428802490234375, -0.283782958984375, -0.2246856689453125, -0.16558837890625, -0.1064910888671875, -0.047393798828125, 0.0117034912109375, 0.07080078125, 0.1298980712890625, 0.188995361328125, 0.2480926513671875, 0.30718994140625, 0.3662872314453125, 0.425384521484375, 0.4844818115234375, 0.5435791015625, 0.6026763916015625, 0.661773681640625, 0.7208709716796875, 0.77996826171875, 0.8390655517578125, 0.898162841796875, 0.9572601318359375, 1.016357421875, 1.0754547119140625, 1.134552001953125, 1.1936492919921875, 1.25274658203125, 1.3118438720703125, 1.370941162109375, 1.4300384521484375, 1.4891357421875, 1.5482330322265625, 1.607330322265625, 1.6664276123046875, 1.72552490234375, 1.7846221923828125, 1.843719482421875, 1.9028167724609375, 1.9619140625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 9.0, 14.0, 69.0, 172.0, 335.0, 272.0, 99.0, 29.0, 7.0, 3.0, 1.0, 1.0, 1.0], "bins": [-75.50756072998047, -74.15337371826172, -72.79917907714844, -71.44499206542969, -70.0907974243164, -68.73661041259766, -67.38241577148438, -66.02822875976562, -64.67404174804688, -63.31985092163086, -61.965660095214844, -60.61146926879883, -59.25727844238281, -57.90309143066406, -56.54890060424805, -55.19470977783203, -53.84051513671875, -52.486324310302734, -51.13213348388672, -49.7779426574707, -48.42375183105469, -47.06956481933594, -45.71537399291992, -44.361183166503906, -43.00699234008789, -41.652801513671875, -40.29861068725586, -38.944419860839844, -37.590232849121094, -36.23604202270508, -34.88185119628906, -33.52766036987305, -32.17346954345703, -30.819278717041016, -29.465087890625, -28.110898971557617, -26.7567081451416, -25.402517318725586, -24.048328399658203, -22.694137573242188, -21.33994483947754, -19.985754013061523, -18.63156509399414, -17.277374267578125, -15.92318344116211, -14.568992614746094, -13.214802742004395, -11.860612869262695, -10.50642204284668, -9.152231216430664, -7.798041343688965, -6.443850994110107, -5.08966064453125, -3.7354702949523926, -2.381279945373535, -1.027090072631836, 0.3271007537841797, 1.681291103363037, 3.0354814529418945, 4.389671802520752, 5.743862152099609, 7.098052501678467, 8.452242851257324, 9.806432723999023, 11.160623550415039]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 6.0, 8.0, 4.0, 5.0, 3.0, 11.0, 17.0, 16.0, 21.0, 26.0, 25.0, 28.0, 36.0, 36.0, 38.0, 52.0, 46.0, 36.0, 61.0, 42.0, 52.0, 53.0, 44.0, 41.0, 28.0, 35.0, 26.0, 33.0, 21.0, 25.0, 23.0, 20.0, 22.0, 15.0, 5.0, 14.0, 8.0, 6.0, 9.0, 4.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.37482452392578, -15.857985496520996, -15.341147422790527, -14.824308395385742, -14.307470321655273, -13.790631294250488, -13.273792266845703, -12.756954193115234, -12.24011516571045, -11.723276138305664, -11.206438064575195, -10.68959903717041, -10.172760009765625, -9.655921936035156, -9.139082908630371, -8.622243881225586, -8.105405807495117, -7.58856725692749, -7.071728706359863, -6.554889678955078, -6.038051128387451, -5.521212577819824, -5.004373550415039, -4.487534999847412, -3.970696449279785, -3.453857898712158, -2.937019109725952, -2.420180320739746, -1.9033417701721191, -1.3865032196044922, -0.8696644306182861, -0.3528256416320801, 0.16401290893554688, 0.6808515787124634, 1.1976902484893799, 1.7145289182662964, 2.231367588043213, 2.74820613861084, 3.265044927597046, 3.781883716583252, 4.298722267150879, 4.815560817718506, 5.332399368286133, 5.849238395690918, 6.366076946258545, 6.882915496826172, 7.399754524230957, 7.916593074798584, 8.433431625366211, 8.950270652770996, 9.467108726501465, 9.98394775390625, 10.500785827636719, 11.017624855041504, 11.534463882446289, 12.051301956176758, 12.568140983581543, 13.084980010986328, 13.601818084716797, 14.118657112121582, 14.635496139526367, 15.152334213256836, 15.669173240661621, 16.186012268066406, 16.702850341796875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 12.0, 9.0, 13.0, 28.0, 19.0, 44.0, 82.0, 113.0, 166.0, 301.0, 548.0, 940.0, 1944.0, 5051.0, 24520.0, 3765689.0, 370651.0, 16468.0, 3916.0, 1632.0, 866.0, 464.0, 289.0, 188.0, 124.0, 79.0, 42.0, 33.0, 20.0, 9.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7958984375, -1.7237701416015625, -1.651641845703125, -1.5795135498046875, -1.50738525390625, -1.4352569580078125, -1.363128662109375, -1.2910003662109375, -1.2188720703125, -1.1467437744140625, -1.074615478515625, -1.0024871826171875, -0.93035888671875, -0.8582305908203125, -0.786102294921875, -0.7139739990234375, -0.641845703125, -0.5697174072265625, -0.497589111328125, -0.4254608154296875, -0.35333251953125, -0.2812042236328125, -0.209075927734375, -0.1369476318359375, -0.0648193359375, 0.0073089599609375, 0.079437255859375, 0.1515655517578125, 0.22369384765625, 0.2958221435546875, 0.367950439453125, 0.4400787353515625, 0.51220703125, 0.5843353271484375, 0.656463623046875, 0.7285919189453125, 0.80072021484375, 0.8728485107421875, 0.944976806640625, 1.0171051025390625, 1.0892333984375, 1.1613616943359375, 1.233489990234375, 1.3056182861328125, 1.37774658203125, 1.4498748779296875, 1.522003173828125, 1.5941314697265625, 1.666259765625, 1.7383880615234375, 1.810516357421875, 1.8826446533203125, 1.95477294921875, 2.0269012451171875, 2.099029541015625, 2.1711578369140625, 2.2432861328125, 2.3154144287109375, 2.387542724609375, 2.4596710205078125, 2.53179931640625, 2.6039276123046875, 2.676055908203125, 2.7481842041015625, 2.8203125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 4.0, 3.0, 7.0, 13.0, 10.0, 11.0, 31.0, 31.0, 40.0, 44.0, 62.0, 62.0, 70.0, 90.0, 83.0, 73.0, 68.0, 62.0, 50.0, 40.0, 34.0, 22.0, 25.0, 14.0, 12.0, 10.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97119140625, -0.9444122314453125, -0.917633056640625, -0.8908538818359375, -0.86407470703125, -0.8372955322265625, -0.810516357421875, -0.7837371826171875, -0.7569580078125, -0.7301788330078125, -0.703399658203125, -0.6766204833984375, -0.64984130859375, -0.6230621337890625, -0.596282958984375, -0.5695037841796875, -0.542724609375, -0.5159454345703125, -0.489166259765625, -0.4623870849609375, -0.43560791015625, -0.4088287353515625, -0.382049560546875, -0.3552703857421875, -0.3284912109375, -0.3017120361328125, -0.274932861328125, -0.2481536865234375, -0.22137451171875, -0.1945953369140625, -0.167816162109375, -0.1410369873046875, -0.1142578125, -0.0874786376953125, -0.060699462890625, -0.0339202880859375, -0.00714111328125, 0.0196380615234375, 0.046417236328125, 0.0731964111328125, 0.0999755859375, 0.1267547607421875, 0.153533935546875, 0.1803131103515625, 0.20709228515625, 0.2338714599609375, 0.260650634765625, 0.2874298095703125, 0.314208984375, 0.3409881591796875, 0.367767333984375, 0.3945465087890625, 0.42132568359375, 0.4481048583984375, 0.474884033203125, 0.5016632080078125, 0.5284423828125, 0.5552215576171875, 0.582000732421875, 0.6087799072265625, 0.63555908203125, 0.6623382568359375, 0.689117431640625, 0.7158966064453125, 0.74267578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 3.0, 7.0, 7.0, 10.0, 13.0, 17.0, 17.0, 20.0, 40.0, 50.0, 64.0, 74.0, 79.0, 136.0, 176.0, 273.0, 418.0, 703.0, 1202.0, 2079.0, 4580.0, 13046.0, 71774.0, 3675089.0, 378065.0, 30918.0, 7894.0, 3268.0, 1637.0, 892.0, 520.0, 316.0, 230.0, 169.0, 119.0, 83.0, 63.0, 56.0, 40.0, 25.0, 21.0, 17.0, 17.0, 13.0, 10.0, 5.0, 9.0, 7.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5595703125, -1.5089111328125, -1.458251953125, -1.4075927734375, -1.35693359375, -1.3062744140625, -1.255615234375, -1.2049560546875, -1.154296875, -1.1036376953125, -1.052978515625, -1.0023193359375, -0.95166015625, -0.9010009765625, -0.850341796875, -0.7996826171875, -0.7490234375, -0.6983642578125, -0.647705078125, -0.5970458984375, -0.54638671875, -0.4957275390625, -0.445068359375, -0.3944091796875, -0.34375, -0.2930908203125, -0.242431640625, -0.1917724609375, -0.14111328125, -0.0904541015625, -0.039794921875, 0.0108642578125, 0.0615234375, 0.1121826171875, 0.162841796875, 0.2135009765625, 0.26416015625, 0.3148193359375, 0.365478515625, 0.4161376953125, 0.466796875, 0.5174560546875, 0.568115234375, 0.6187744140625, 0.66943359375, 0.7200927734375, 0.770751953125, 0.8214111328125, 0.8720703125, 0.9227294921875, 0.973388671875, 1.0240478515625, 1.07470703125, 1.1253662109375, 1.176025390625, 1.2266845703125, 1.27734375, 1.3280029296875, 1.378662109375, 1.4293212890625, 1.47998046875, 1.5306396484375, 1.581298828125, 1.6319580078125, 1.6826171875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 7.0, 1.0, 7.0, 8.0, 19.0, 26.0, 58.0, 107.0, 305.0, 2626.0, 576.0, 168.0, 53.0, 45.0, 19.0, 12.0, 8.0, 10.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.335693359375, -0.3215370178222656, -0.30738067626953125, -0.2932243347167969, -0.2790679931640625, -0.2649116516113281, -0.25075531005859375, -0.23659896850585938, -0.222442626953125, -0.20828628540039062, -0.19412994384765625, -0.17997360229492188, -0.1658172607421875, -0.15166091918945312, -0.13750457763671875, -0.12334823608398438, -0.10919189453125, -0.09503555297851562, -0.08087921142578125, -0.06672286987304688, -0.0525665283203125, -0.038410186767578125, -0.02425384521484375, -0.010097503662109375, 0.004058837890625, 0.018215179443359375, 0.03237152099609375, 0.046527862548828125, 0.0606842041015625, 0.07484054565429688, 0.08899688720703125, 0.10315322875976562, 0.1173095703125, 0.13146591186523438, 0.14562225341796875, 0.15977859497070312, 0.1739349365234375, 0.18809127807617188, 0.20224761962890625, 0.21640396118164062, 0.230560302734375, 0.24471664428710938, 0.25887298583984375, 0.2730293273925781, 0.2871856689453125, 0.3013420104980469, 0.31549835205078125, 0.3296546936035156, 0.34381103515625, 0.3579673767089844, 0.37212371826171875, 0.3862800598144531, 0.4004364013671875, 0.4145927429199219, 0.42874908447265625, 0.4429054260253906, 0.457061767578125, 0.4712181091308594, 0.48537445068359375, 0.4995307922363281, 0.5136871337890625, 0.5278434753417969, 0.5419998168945312, 0.5561561584472656, 0.5703125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 11.0, 36.0, 169.0, 378.0, 300.0, 84.0, 29.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7150459289550781, -1.5180264711380005, -1.3210068941116333, -1.1239874362945557, -0.9269679188728333, -0.7299484014511108, -0.5329289436340332, -0.335909366607666, -0.13888990879058838, 0.05812959372997284, 0.25514909625053406, 0.4521685838699341, 0.6491881012916565, 0.8462076187133789, 1.0432270765304565, 1.2402466535568237, 1.4372661113739014, 1.634285569190979, 1.8313051462173462, 2.028324604034424, 2.225344181060791, 2.422363758087158, 2.6193830966949463, 2.8164026737213135, 3.0134220123291016, 3.2104415893554688, 3.407460927963257, 3.604480504989624, 3.801500082015991, 3.9985194206237793, 4.1955389976501465, 4.392558574676514, 4.589578151702881, 4.786597728729248, 4.983617305755615, 5.180636405944824, 5.377655982971191, 5.574675559997559, 5.771695137023926, 5.968714714050293, 6.16573429107666, 6.362753868103027, 6.5597734451293945, 6.756793022155762, 6.953812122344971, 7.150831699371338, 7.347851276397705, 7.544870853424072, 7.741889953613281, 7.938909530639648, 8.135929107666016, 8.332948684692383, 8.52996826171875, 8.726987838745117, 8.924007415771484, 9.121026992797852, 9.318046569824219, 9.515066146850586, 9.712085723876953, 9.90910530090332, 10.106124877929688, 10.303144454956055, 10.500164031982422, 10.697183609008789, 10.89420223236084]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 3.0, 17.0, 14.0, 12.0, 23.0, 19.0, 26.0, 32.0, 25.0, 33.0, 39.0, 46.0, 54.0, 37.0, 50.0, 38.0, 50.0, 49.0, 48.0, 30.0, 48.0, 48.0, 31.0, 30.0, 21.0, 31.0, 17.0, 23.0, 20.0, 15.0, 11.0, 12.0, 8.0, 14.0, 8.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.041919469833374, -1.0097886323928833, -0.977657675743103, -0.9455268383026123, -0.9133959412574768, -0.8812650442123413, -0.8491342067718506, -0.8170033097267151, -0.7848724126815796, -0.7527415156364441, -0.7206106185913086, -0.6884797811508179, -0.6563488841056824, -0.6242179870605469, -0.5920871496200562, -0.5599562525749207, -0.5278253555297852, -0.49569445848464966, -0.46356359124183655, -0.43143272399902344, -0.39930182695388794, -0.36717092990875244, -0.33504006266593933, -0.3029091954231262, -0.2707782983779907, -0.23864741623401642, -0.20651653409004211, -0.1743856519460678, -0.1422547698020935, -0.1101238876581192, -0.0779930055141449, -0.04586212337017059, -0.013731122016906738, 0.018399760127067566, 0.05053064227104187, 0.08266152441501617, 0.11479240655899048, 0.14692328870296478, 0.1790541708469391, 0.2111850529909134, 0.2433159351348877, 0.2754468321800232, 0.3075776994228363, 0.3397085666656494, 0.3718394637107849, 0.4039703607559204, 0.4361012279987335, 0.46823209524154663, 0.5003629922866821, 0.5324938893318176, 0.5646247863769531, 0.5967556238174438, 0.6288865208625793, 0.6610174179077148, 0.6931482553482056, 0.7252791523933411, 0.7574100494384766, 0.7895409464836121, 0.8216718435287476, 0.8538026809692383, 0.8859335780143738, 0.9180644750595093, 0.9501953125, 0.9823262095451355, 1.014457106590271]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 4.0, 2.0, 8.0, 4.0, 10.0, 17.0, 20.0, 45.0, 56.0, 89.0, 143.0, 265.0, 453.0, 779.0, 1692.0, 3483.0, 8618.0, 24067.0, 76911.0, 258881.0, 410903.0, 180020.0, 52946.0, 17116.0, 6479.0, 2638.0, 1288.0, 683.0, 361.0, 222.0, 123.0, 66.0, 55.0, 39.0, 23.0, 16.0, 12.0, 13.0, 3.0, 5.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.017578125, -0.9816741943359375, -0.945770263671875, -0.9098663330078125, -0.87396240234375, -0.8380584716796875, -0.802154541015625, -0.7662506103515625, -0.7303466796875, -0.6944427490234375, -0.658538818359375, -0.6226348876953125, -0.58673095703125, -0.5508270263671875, -0.514923095703125, -0.4790191650390625, -0.443115234375, -0.4072113037109375, -0.371307373046875, -0.3354034423828125, -0.29949951171875, -0.2635955810546875, -0.227691650390625, -0.1917877197265625, -0.1558837890625, -0.1199798583984375, -0.084075927734375, -0.0481719970703125, -0.01226806640625, 0.0236358642578125, 0.059539794921875, 0.0954437255859375, 0.13134765625, 0.1672515869140625, 0.203155517578125, 0.2390594482421875, 0.27496337890625, 0.3108673095703125, 0.346771240234375, 0.3826751708984375, 0.4185791015625, 0.4544830322265625, 0.490386962890625, 0.5262908935546875, 0.56219482421875, 0.5980987548828125, 0.634002685546875, 0.6699066162109375, 0.705810546875, 0.7417144775390625, 0.777618408203125, 0.8135223388671875, 0.84942626953125, 0.8853302001953125, 0.921234130859375, 0.9571380615234375, 0.9930419921875, 1.0289459228515625, 1.064849853515625, 1.1007537841796875, 1.13665771484375, 1.1725616455078125, 1.208465576171875, 1.2443695068359375, 1.2802734375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 5.0, 7.0, 11.0, 17.0, 19.0, 25.0, 36.0, 41.0, 42.0, 57.0, 63.0, 70.0, 71.0, 75.0, 90.0, 72.0, 60.0, 49.0, 38.0, 37.0, 24.0, 31.0, 13.0, 8.0, 7.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9248046875, -0.8984756469726562, -0.8721466064453125, -0.8458175659179688, -0.819488525390625, -0.7931594848632812, -0.7668304443359375, -0.7405014038085938, -0.71417236328125, -0.6878433227539062, -0.6615142822265625, -0.6351852416992188, -0.608856201171875, -0.5825271606445312, -0.5561981201171875, -0.5298690795898438, -0.5035400390625, -0.47721099853515625, -0.4508819580078125, -0.42455291748046875, -0.398223876953125, -0.37189483642578125, -0.3455657958984375, -0.31923675537109375, -0.29290771484375, -0.26657867431640625, -0.2402496337890625, -0.21392059326171875, -0.187591552734375, -0.16126251220703125, -0.1349334716796875, -0.10860443115234375, -0.082275390625, -0.05594635009765625, -0.0296173095703125, -0.00328826904296875, 0.023040771484375, 0.04936981201171875, 0.0756988525390625, 0.10202789306640625, 0.12835693359375, 0.15468597412109375, 0.1810150146484375, 0.20734405517578125, 0.233673095703125, 0.26000213623046875, 0.2863311767578125, 0.31266021728515625, 0.3389892578125, 0.36531829833984375, 0.3916473388671875, 0.41797637939453125, 0.444305419921875, 0.47063446044921875, 0.4969635009765625, 0.5232925415039062, 0.54962158203125, 0.5759506225585938, 0.6022796630859375, 0.6286087036132812, 0.654937744140625, 0.6812667846679688, 0.7075958251953125, 0.7339248657226562, 0.76025390625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 6.0, 11.0, 19.0, 19.0, 22.0, 31.0, 57.0, 61.0, 77.0, 178.0, 237.0, 419.0, 812.0, 1662.0, 4442.0, 15611.0, 79802.0, 478853.0, 385268.0, 61212.0, 12810.0, 3704.0, 1452.0, 716.0, 350.0, 217.0, 151.0, 97.0, 65.0, 49.0, 30.0, 31.0, 24.0, 17.0, 11.0, 5.0, 3.0, 3.0, 1.0, 4.0, 4.0, 5.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-1.91796875, -1.8630523681640625, -1.808135986328125, -1.7532196044921875, -1.69830322265625, -1.6433868408203125, -1.588470458984375, -1.5335540771484375, -1.4786376953125, -1.4237213134765625, -1.368804931640625, -1.3138885498046875, -1.25897216796875, -1.2040557861328125, -1.149139404296875, -1.0942230224609375, -1.039306640625, -0.9843902587890625, -0.929473876953125, -0.8745574951171875, -0.81964111328125, -0.7647247314453125, -0.709808349609375, -0.6548919677734375, -0.5999755859375, -0.5450592041015625, -0.490142822265625, -0.4352264404296875, -0.38031005859375, -0.3253936767578125, -0.270477294921875, -0.2155609130859375, -0.16064453125, -0.1057281494140625, -0.050811767578125, 0.0041046142578125, 0.05902099609375, 0.1139373779296875, 0.168853759765625, 0.2237701416015625, 0.2786865234375, 0.3336029052734375, 0.388519287109375, 0.4434356689453125, 0.49835205078125, 0.5532684326171875, 0.608184814453125, 0.6631011962890625, 0.718017578125, 0.7729339599609375, 0.827850341796875, 0.8827667236328125, 0.93768310546875, 0.9925994873046875, 1.047515869140625, 1.1024322509765625, 1.1573486328125, 1.2122650146484375, 1.267181396484375, 1.3220977783203125, 1.37701416015625, 1.4319305419921875, 1.486846923828125, 1.5417633056640625, 1.5966796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 5.0, 5.0, 2.0, 8.0, 6.0, 12.0, 11.0, 10.0, 15.0, 23.0, 22.0, 34.0, 45.0, 23.0, 51.0, 57.0, 57.0, 55.0, 61.0, 39.0, 63.0, 68.0, 46.0, 42.0, 39.0, 37.0, 36.0, 30.0, 20.0, 24.0, 16.0, 9.0, 6.0, 11.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.70703125, -3.59857177734375, -3.4901123046875, -3.38165283203125, -3.273193359375, -3.16473388671875, -3.0562744140625, -2.94781494140625, -2.83935546875, -2.73089599609375, -2.6224365234375, -2.51397705078125, -2.405517578125, -2.29705810546875, -2.1885986328125, -2.08013916015625, -1.9716796875, -1.86322021484375, -1.7547607421875, -1.64630126953125, -1.537841796875, -1.42938232421875, -1.3209228515625, -1.21246337890625, -1.10400390625, -0.99554443359375, -0.8870849609375, -0.77862548828125, -0.670166015625, -0.56170654296875, -0.4532470703125, -0.34478759765625, -0.236328125, -0.12786865234375, -0.0194091796875, 0.08905029296875, 0.197509765625, 0.30596923828125, 0.4144287109375, 0.52288818359375, 0.63134765625, 0.73980712890625, 0.8482666015625, 0.95672607421875, 1.065185546875, 1.17364501953125, 1.2821044921875, 1.39056396484375, 1.4990234375, 1.60748291015625, 1.7159423828125, 1.82440185546875, 1.932861328125, 2.04132080078125, 2.1497802734375, 2.25823974609375, 2.36669921875, 2.47515869140625, 2.5836181640625, 2.69207763671875, 2.800537109375, 2.90899658203125, 3.0174560546875, 3.12591552734375, 3.234375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 15.0, 5.0, 15.0, 12.0, 21.0, 34.0, 58.0, 92.0, 128.0, 276.0, 588.0, 1890.0, 8206.0, 84436.0, 819506.0, 119452.0, 10252.0, 2102.0, 705.0, 315.0, 163.0, 87.0, 62.0, 41.0, 22.0, 16.0, 14.0, 13.0, 5.0, 5.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2919921875, -1.2497100830078125, -1.207427978515625, -1.1651458740234375, -1.12286376953125, -1.0805816650390625, -1.038299560546875, -0.9960174560546875, -0.9537353515625, -0.9114532470703125, -0.869171142578125, -0.8268890380859375, -0.78460693359375, -0.7423248291015625, -0.700042724609375, -0.6577606201171875, -0.615478515625, -0.5731964111328125, -0.530914306640625, -0.4886322021484375, -0.44635009765625, -0.4040679931640625, -0.361785888671875, -0.3195037841796875, -0.2772216796875, -0.2349395751953125, -0.192657470703125, -0.1503753662109375, -0.10809326171875, -0.0658111572265625, -0.023529052734375, 0.0187530517578125, 0.06103515625, 0.1033172607421875, 0.145599365234375, 0.1878814697265625, 0.23016357421875, 0.2724456787109375, 0.314727783203125, 0.3570098876953125, 0.3992919921875, 0.4415740966796875, 0.483856201171875, 0.5261383056640625, 0.56842041015625, 0.6107025146484375, 0.652984619140625, 0.6952667236328125, 0.737548828125, 0.7798309326171875, 0.822113037109375, 0.8643951416015625, 0.90667724609375, 0.9489593505859375, 0.991241455078125, 1.0335235595703125, 1.0758056640625, 1.1180877685546875, 1.160369873046875, 1.2026519775390625, 1.24493408203125, 1.2872161865234375, 1.329498291015625, 1.3717803955078125, 1.4140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 1.0, 7.0, 10.0, 13.0, 19.0, 32.0, 40.0, 72.0, 69.0, 65.0, 102.0, 84.0, 83.0, 87.0, 68.0, 61.0, 49.0, 34.0, 34.0, 17.0, 14.0, 12.0, 7.0, 7.0, 5.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.70823860168457e-05, -8.407700806856155e-05, -8.10716301202774e-05, -7.806625217199326e-05, -7.50608742237091e-05, -7.205549627542496e-05, -6.905011832714081e-05, -6.604474037885666e-05, -6.303936243057251e-05, -6.003398448228836e-05, -5.702860653400421e-05, -5.402322858572006e-05, -5.101785063743591e-05, -4.8012472689151764e-05, -4.5007094740867615e-05, -4.2001716792583466e-05, -3.8996338844299316e-05, -3.599096089601517e-05, -3.298558294773102e-05, -2.998020499944687e-05, -2.697482705116272e-05, -2.396944910287857e-05, -2.096407115459442e-05, -1.7958693206310272e-05, -1.4953315258026123e-05, -1.1947937309741974e-05, -8.942559361457825e-06, -5.9371814131736755e-06, -2.9318034648895264e-06, 7.35744833946228e-08, 3.078952431678772e-06, 6.084330379962921e-06, 9.08970832824707e-06, 1.209508627653122e-05, 1.5100464224815369e-05, 1.8105842173099518e-05, 2.1111220121383667e-05, 2.4116598069667816e-05, 2.7121976017951965e-05, 3.0127353966236115e-05, 3.3132731914520264e-05, 3.613810986280441e-05, 3.914348781108856e-05, 4.214886575937271e-05, 4.515424370765686e-05, 4.815962165594101e-05, 5.116499960422516e-05, 5.417037755250931e-05, 5.717575550079346e-05, 6.0181133449077606e-05, 6.318651139736176e-05, 6.61918893456459e-05, 6.919726729393005e-05, 7.22026452422142e-05, 7.520802319049835e-05, 7.82134011387825e-05, 8.121877908706665e-05, 8.42241570353508e-05, 8.722953498363495e-05, 9.02349129319191e-05, 9.324029088020325e-05, 9.62456688284874e-05, 9.925104677677155e-05, 0.0001022564247250557, 0.00010526180267333984]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 9.0, 4.0, 8.0, 12.0, 21.0, 39.0, 62.0, 116.0, 242.0, 527.0, 1452.0, 6547.0, 106498.0, 866727.0, 59412.0, 4802.0, 1181.0, 433.0, 196.0, 123.0, 61.0, 23.0, 18.0, 15.0, 4.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.7705078125, -1.72052001953125, -1.6705322265625, -1.62054443359375, -1.570556640625, -1.52056884765625, -1.4705810546875, -1.42059326171875, -1.37060546875, -1.32061767578125, -1.2706298828125, -1.22064208984375, -1.170654296875, -1.12066650390625, -1.0706787109375, -1.02069091796875, -0.970703125, -0.92071533203125, -0.8707275390625, -0.82073974609375, -0.770751953125, -0.72076416015625, -0.6707763671875, -0.62078857421875, -0.57080078125, -0.52081298828125, -0.4708251953125, -0.42083740234375, -0.370849609375, -0.32086181640625, -0.2708740234375, -0.22088623046875, -0.1708984375, -0.12091064453125, -0.0709228515625, -0.02093505859375, 0.029052734375, 0.07904052734375, 0.1290283203125, 0.17901611328125, 0.22900390625, 0.27899169921875, 0.3289794921875, 0.37896728515625, 0.428955078125, 0.47894287109375, 0.5289306640625, 0.57891845703125, 0.62890625, 0.67889404296875, 0.7288818359375, 0.77886962890625, 0.828857421875, 0.87884521484375, 0.9288330078125, 0.97882080078125, 1.02880859375, 1.07879638671875, 1.1287841796875, 1.17877197265625, 1.228759765625, 1.27874755859375, 1.3287353515625, 1.37872314453125, 1.4287109375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 5.0, 8.0, 27.0, 34.0, 75.0, 140.0, 231.0, 225.0, 146.0, 55.0, 29.0, 20.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4765625, -1.402099609375, -1.32763671875, -1.253173828125, -1.1787109375, -1.104248046875, -1.02978515625, -0.955322265625, -0.880859375, -0.806396484375, -0.73193359375, -0.657470703125, -0.5830078125, -0.508544921875, -0.43408203125, -0.359619140625, -0.28515625, -0.210693359375, -0.13623046875, -0.061767578125, 0.0126953125, 0.087158203125, 0.16162109375, 0.236083984375, 0.310546875, 0.385009765625, 0.45947265625, 0.533935546875, 0.6083984375, 0.682861328125, 0.75732421875, 0.831787109375, 0.90625, 0.980712890625, 1.05517578125, 1.129638671875, 1.2041015625, 1.278564453125, 1.35302734375, 1.427490234375, 1.501953125, 1.576416015625, 1.65087890625, 1.725341796875, 1.7998046875, 1.874267578125, 1.94873046875, 2.023193359375, 2.09765625, 2.172119140625, 2.24658203125, 2.321044921875, 2.3955078125, 2.469970703125, 2.54443359375, 2.618896484375, 2.693359375, 2.767822265625, 2.84228515625, 2.916748046875, 2.9912109375, 3.065673828125, 3.14013671875, 3.214599609375, 3.2890625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 17.0, 71.0, 192.0, 333.0, 250.0, 97.0, 33.0, 10.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.74045181274414, -15.592982292175293, -14.445512771606445, -13.298044204711914, -12.150574684143066, -11.003105163574219, -9.855636596679688, -8.70816707611084, -7.560697555541992, -6.4132280349731445, -5.265758991241455, -4.118289947509766, -2.970820426940918, -1.8233509063720703, -0.6758818626403809, 0.4715871810913086, 1.6190567016601562, 2.766525983810425, 3.9139952659606934, 5.061464309692383, 6.2089338302612305, 7.356403350830078, 8.50387191772461, 9.651341438293457, 10.798810958862305, 11.946280479431152, 13.09375, 14.241218566894531, 15.388688087463379, 16.536157608032227, 17.683626174926758, 18.831096649169922, 19.978561401367188, 21.12602996826172, 22.273500442504883, 23.420969009399414, 24.568439483642578, 25.71590805053711, 26.86337661743164, 28.010845184326172, 29.158315658569336, 30.305784225463867, 31.45325469970703, 32.60072326660156, 33.748191833496094, 34.895660400390625, 36.04313278198242, 37.19060134887695, 38.338069915771484, 39.485538482666016, 40.63300704956055, 41.780479431152344, 42.927947998046875, 44.075416564941406, 45.22288513183594, 46.37035369873047, 47.517822265625, 48.66529083251953, 49.81275939941406, 50.96023178100586, 52.10770034790039, 53.25516891479492, 54.40263748168945, 55.550106048583984, 56.69757843017578]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 11.0, 10.0, 8.0, 18.0, 13.0, 18.0, 36.0, 35.0, 38.0, 37.0, 50.0, 60.0, 66.0, 57.0, 61.0, 66.0, 52.0, 49.0, 50.0, 50.0, 34.0, 30.0, 30.0, 21.0, 19.0, 12.0, 11.0, 15.0, 9.0, 3.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-19.07120132446289, -18.54913902282715, -18.027076721191406, -17.50501251220703, -16.98295021057129, -16.460887908935547, -15.938824653625488, -15.41676139831543, -14.894699096679688, -14.372636795043945, -13.850573539733887, -13.328510284423828, -12.806447982788086, -12.284385681152344, -11.762322425842285, -11.240259170532227, -10.718196868896484, -10.196134567260742, -9.674071311950684, -9.152008056640625, -8.629945755004883, -8.10788345336914, -7.585820198059082, -7.063757419586182, -6.541694641113281, -6.019631862640381, -5.4975690841674805, -4.97550630569458, -4.45344352722168, -3.9313807487487793, -3.409317970275879, -2.8872551918029785, -2.365192413330078, -1.8431296348571777, -1.3210668563842773, -0.799004077911377, -0.27694129943847656, 0.24512147903442383, 0.7671842575073242, 1.2892470359802246, 1.811309814453125, 2.3333725929260254, 2.855435371398926, 3.377498149871826, 3.8995609283447266, 4.421623706817627, 4.943686485290527, 5.465749263763428, 5.987812042236328, 6.5098748207092285, 7.031937599182129, 7.554000377655029, 8.07606315612793, 8.598125457763672, 9.12018871307373, 9.642251968383789, 10.164314270019531, 10.686376571655273, 11.208439826965332, 11.73050308227539, 12.252565383911133, 12.774627685546875, 13.296690940856934, 13.818754196166992, 14.340816497802734]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 13.0, 10.0, 26.0, 36.0, 63.0, 91.0, 146.0, 271.0, 489.0, 1168.0, 3939.0, 25557.0, 4033510.0, 116220.0, 9073.0, 2084.0, 717.0, 366.0, 191.0, 101.0, 81.0, 41.0, 26.0, 14.0, 11.0, 13.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.021484375, -1.951171875, -1.880859375, -1.810546875, -1.740234375, -1.669921875, -1.599609375, -1.529296875, -1.458984375, -1.388671875, -1.318359375, -1.248046875, -1.177734375, -1.107421875, -1.037109375, -0.966796875, -0.896484375, -0.826171875, -0.755859375, -0.685546875, -0.615234375, -0.544921875, -0.474609375, -0.404296875, -0.333984375, -0.263671875, -0.193359375, -0.123046875, -0.052734375, 0.017578125, 0.087890625, 0.158203125, 0.228515625, 0.298828125, 0.369140625, 0.439453125, 0.509765625, 0.580078125, 0.650390625, 0.720703125, 0.791015625, 0.861328125, 0.931640625, 1.001953125, 1.072265625, 1.142578125, 1.212890625, 1.283203125, 1.353515625, 1.423828125, 1.494140625, 1.564453125, 1.634765625, 1.705078125, 1.775390625, 1.845703125, 1.916015625, 1.986328125, 2.056640625, 2.126953125, 2.197265625, 2.267578125, 2.337890625, 2.408203125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 2.0, 11.0, 17.0, 33.0, 26.0, 21.0, 46.0, 42.0, 66.0, 61.0, 64.0, 80.0, 81.0, 75.0, 57.0, 58.0, 60.0, 49.0, 35.0, 36.0, 15.0, 14.0, 11.0, 8.0, 8.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.015625, -0.9903106689453125, -0.964996337890625, -0.9396820068359375, -0.91436767578125, -0.8890533447265625, -0.863739013671875, -0.8384246826171875, -0.8131103515625, -0.7877960205078125, -0.762481689453125, -0.7371673583984375, -0.71185302734375, -0.6865386962890625, -0.661224365234375, -0.6359100341796875, -0.610595703125, -0.5852813720703125, -0.559967041015625, -0.5346527099609375, -0.50933837890625, -0.4840240478515625, -0.458709716796875, -0.4333953857421875, -0.4080810546875, -0.3827667236328125, -0.357452392578125, -0.3321380615234375, -0.30682373046875, -0.2815093994140625, -0.256195068359375, -0.2308807373046875, -0.20556640625, -0.1802520751953125, -0.154937744140625, -0.1296234130859375, -0.10430908203125, -0.0789947509765625, -0.053680419921875, -0.0283660888671875, -0.0030517578125, 0.0222625732421875, 0.047576904296875, 0.0728912353515625, 0.09820556640625, 0.1235198974609375, 0.148834228515625, 0.1741485595703125, 0.199462890625, 0.2247772216796875, 0.250091552734375, 0.2754058837890625, 0.30072021484375, 0.3260345458984375, 0.351348876953125, 0.3766632080078125, 0.4019775390625, 0.4272918701171875, 0.452606201171875, 0.4779205322265625, 0.50323486328125, 0.5285491943359375, 0.553863525390625, 0.5791778564453125, 0.6044921875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 4.0, 0.0, 6.0, 8.0, 16.0, 20.0, 30.0, 38.0, 47.0, 68.0, 89.0, 110.0, 143.0, 217.0, 303.0, 446.0, 704.0, 1110.0, 1868.0, 3411.0, 7386.0, 20880.0, 83733.0, 3701124.0, 304799.0, 42616.0, 13040.0, 5209.0, 2572.0, 1435.0, 841.0, 593.0, 412.0, 241.0, 229.0, 149.0, 97.0, 80.0, 48.0, 41.0, 26.0, 26.0, 18.0, 12.0, 11.0, 4.0, 10.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.966796875, -0.9363784790039062, -0.9059600830078125, -0.8755416870117188, -0.845123291015625, -0.8147048950195312, -0.7842864990234375, -0.7538681030273438, -0.72344970703125, -0.6930313110351562, -0.6626129150390625, -0.6321945190429688, -0.601776123046875, -0.5713577270507812, -0.5409393310546875, -0.5105209350585938, -0.4801025390625, -0.44968414306640625, -0.4192657470703125, -0.38884735107421875, -0.358428955078125, -0.32801055908203125, -0.2975921630859375, -0.26717376708984375, -0.23675537109375, -0.20633697509765625, -0.1759185791015625, -0.14550018310546875, -0.115081787109375, -0.08466339111328125, -0.0542449951171875, -0.02382659912109375, 0.006591796875, 0.03701019287109375, 0.0674285888671875, 0.09784698486328125, 0.128265380859375, 0.15868377685546875, 0.1891021728515625, 0.21952056884765625, 0.24993896484375, 0.28035736083984375, 0.3107757568359375, 0.34119415283203125, 0.371612548828125, 0.40203094482421875, 0.4324493408203125, 0.46286773681640625, 0.4932861328125, 0.5237045288085938, 0.5541229248046875, 0.5845413208007812, 0.614959716796875, 0.6453781127929688, 0.6757965087890625, 0.7062149047851562, 0.73663330078125, 0.7670516967773438, 0.7974700927734375, 0.8278884887695312, 0.858306884765625, 0.8887252807617188, 0.9191436767578125, 0.9495620727539062, 0.97998046875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 9.0, 9.0, 8.0, 32.0, 56.0, 122.0, 897.0, 2628.0, 143.0, 65.0, 40.0, 26.0, 11.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30126953125, -0.288726806640625, -0.27618408203125, -0.263641357421875, -0.2510986328125, -0.238555908203125, -0.22601318359375, -0.213470458984375, -0.200927734375, -0.188385009765625, -0.17584228515625, -0.163299560546875, -0.1507568359375, -0.138214111328125, -0.12567138671875, -0.113128662109375, -0.1005859375, -0.088043212890625, -0.07550048828125, -0.062957763671875, -0.0504150390625, -0.037872314453125, -0.02532958984375, -0.012786865234375, -0.000244140625, 0.012298583984375, 0.02484130859375, 0.037384033203125, 0.0499267578125, 0.062469482421875, 0.07501220703125, 0.087554931640625, 0.10009765625, 0.112640380859375, 0.12518310546875, 0.137725830078125, 0.1502685546875, 0.162811279296875, 0.17535400390625, 0.187896728515625, 0.200439453125, 0.212982177734375, 0.22552490234375, 0.238067626953125, 0.2506103515625, 0.263153076171875, 0.27569580078125, 0.288238525390625, 0.30078125, 0.313323974609375, 0.32586669921875, 0.338409423828125, 0.3509521484375, 0.363494873046875, 0.37603759765625, 0.388580322265625, 0.401123046875, 0.413665771484375, 0.42620849609375, 0.438751220703125, 0.4512939453125, 0.463836669921875, 0.47637939453125, 0.488922119140625, 0.50146484375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 10.0, 86.0, 401.0, 391.0, 99.0, 11.0, 10.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9110536575317383, -3.7307472229003906, -3.550441026687622, -3.3701345920562744, -3.189828395843506, -3.009521961212158, -2.8292155265808105, -2.648909091949463, -2.4686028957366943, -2.2882964611053467, -2.107990264892578, -1.9276838302612305, -1.7473775148391724, -1.5670711994171143, -1.3867647647857666, -1.2064584493637085, -1.0261521339416504, -0.8458458185195923, -0.6655394434928894, -0.4852330684661865, -0.3049267530441284, -0.12462043762207031, 0.055685997009277344, 0.23599231243133545, 0.41629862785339355, 0.5966049432754517, 0.7769113183021545, 0.9572176933288574, 1.1375240087509155, 1.3178303241729736, 1.4981367588043213, 1.6784430742263794, 1.8587498664855957, 2.0390563011169434, 2.219362497329712, 2.3996689319610596, 2.579975128173828, 2.760281562805176, 2.9405879974365234, 3.120894432067871, 3.3012006282806396, 3.4815070629119873, 3.661813259124756, 3.8421196937561035, 4.022426128387451, 4.202732086181641, 4.383038520812988, 4.563344955444336, 4.743651390075684, 4.923957824707031, 5.104264259338379, 5.284570693969727, 5.464876651763916, 5.645183086395264, 5.825489521026611, 6.005795955657959, 6.186101913452148, 6.366408348083496, 6.546714782714844, 6.727021217346191, 6.907327175140381, 7.0876336097717285, 7.267940044403076, 7.448246479034424, 7.6285529136657715]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 7.0, 8.0, 10.0, 19.0, 19.0, 31.0, 31.0, 32.0, 23.0, 32.0, 42.0, 49.0, 55.0, 57.0, 43.0, 45.0, 46.0, 51.0, 48.0, 51.0, 39.0, 38.0, 34.0, 30.0, 21.0, 34.0, 24.0, 26.0, 13.0, 6.0, 11.0, 4.0, 4.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9647848010063171, -0.9303900003433228, -0.8959951400756836, -0.8616003394126892, -0.82720547914505, -0.7928106784820557, -0.7584158182144165, -0.7240210175514221, -0.6896262168884277, -0.6552314162254333, -0.6208365559577942, -0.5864417552947998, -0.5520468950271606, -0.5176520943641663, -0.4832572638988495, -0.4488624334335327, -0.41446757316589355, -0.3800727427005768, -0.34567791223526, -0.3112831115722656, -0.27688825130462646, -0.2424934357404709, -0.2080986201763153, -0.17370378971099854, -0.13930895924568176, -0.10491412878036499, -0.07051930576562881, -0.03612448275089264, -0.0017296522855758667, 0.032665178179740906, 0.06705999374389648, 0.10145482420921326, 0.13584959506988525, 0.17024442553520203, 0.2046392560005188, 0.23903407156467438, 0.27342891693115234, 0.30782371759414673, 0.3422185480594635, 0.3766133785247803, 0.41100820899009705, 0.4454030394554138, 0.4797978699207306, 0.5141927003860474, 0.5485875010490417, 0.5829823613166809, 0.6173771619796753, 0.6517720222473145, 0.6861668229103088, 0.7205616235733032, 0.7549564838409424, 0.7893512845039368, 0.8237461447715759, 0.8581409454345703, 0.8925358057022095, 0.9269306063652039, 0.9613254070281982, 0.9957202076911926, 1.030115008354187, 1.0645098686218262, 1.0989047288894653, 1.1332995891571045, 1.167694330215454, 1.2020891904830933, 1.2364840507507324]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 9.0, 10.0, 16.0, 21.0, 32.0, 38.0, 64.0, 106.0, 186.0, 300.0, 557.0, 1025.0, 2121.0, 4837.0, 11332.0, 29631.0, 83136.0, 235892.0, 373186.0, 196185.0, 68125.0, 24148.0, 9482.0, 4038.0, 1936.0, 904.0, 483.0, 268.0, 186.0, 91.0, 57.0, 49.0, 26.0, 24.0, 14.0, 11.0, 3.0, 3.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86181640625, -0.8343734741210938, -0.8069305419921875, -0.7794876098632812, -0.752044677734375, -0.7246017456054688, -0.6971588134765625, -0.6697158813476562, -0.64227294921875, -0.6148300170898438, -0.5873870849609375, -0.5599441528320312, -0.532501220703125, -0.5050582885742188, -0.4776153564453125, -0.45017242431640625, -0.4227294921875, -0.39528656005859375, -0.3678436279296875, -0.34040069580078125, -0.312957763671875, -0.28551483154296875, -0.2580718994140625, -0.23062896728515625, -0.20318603515625, -0.17574310302734375, -0.1483001708984375, -0.12085723876953125, -0.093414306640625, -0.06597137451171875, -0.0385284423828125, -0.01108551025390625, 0.016357421875, 0.04380035400390625, 0.0712432861328125, 0.09868621826171875, 0.126129150390625, 0.15357208251953125, 0.1810150146484375, 0.20845794677734375, 0.23590087890625, 0.26334381103515625, 0.2907867431640625, 0.31822967529296875, 0.345672607421875, 0.37311553955078125, 0.4005584716796875, 0.42800140380859375, 0.4554443359375, 0.48288726806640625, 0.5103302001953125, 0.5377731323242188, 0.565216064453125, 0.5926589965820312, 0.6201019287109375, 0.6475448608398438, 0.67498779296875, 0.7024307250976562, 0.7298736572265625, 0.7573165893554688, 0.784759521484375, 0.8122024536132812, 0.8396453857421875, 0.8670883178710938, 0.89453125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 2.0, 10.0, 9.0, 9.0, 13.0, 27.0, 28.0, 42.0, 43.0, 50.0, 67.0, 80.0, 76.0, 74.0, 73.0, 69.0, 71.0, 61.0, 43.0, 33.0, 31.0, 21.0, 18.0, 13.0, 11.0, 7.0, 3.0, 8.0, 3.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.078125, -1.0515289306640625, -1.024932861328125, -0.9983367919921875, -0.97174072265625, -0.9451446533203125, -0.918548583984375, -0.8919525146484375, -0.8653564453125, -0.8387603759765625, -0.812164306640625, -0.7855682373046875, -0.75897216796875, -0.7323760986328125, -0.705780029296875, -0.6791839599609375, -0.652587890625, -0.6259918212890625, -0.599395751953125, -0.5727996826171875, -0.54620361328125, -0.5196075439453125, -0.493011474609375, -0.4664154052734375, -0.4398193359375, -0.4132232666015625, -0.386627197265625, -0.3600311279296875, -0.33343505859375, -0.3068389892578125, -0.280242919921875, -0.2536468505859375, -0.22705078125, -0.2004547119140625, -0.173858642578125, -0.1472625732421875, -0.12066650390625, -0.0940704345703125, -0.067474365234375, -0.0408782958984375, -0.0142822265625, 0.0123138427734375, 0.038909912109375, 0.0655059814453125, 0.09210205078125, 0.1186981201171875, 0.145294189453125, 0.1718902587890625, 0.198486328125, 0.2250823974609375, 0.251678466796875, 0.2782745361328125, 0.30487060546875, 0.3314666748046875, 0.358062744140625, 0.3846588134765625, 0.4112548828125, 0.4378509521484375, 0.464447021484375, 0.4910430908203125, 0.51763916015625, 0.5442352294921875, 0.570831298828125, 0.5974273681640625, 0.6240234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 2.0, 5.0, 9.0, 8.0, 13.0, 27.0, 31.0, 40.0, 72.0, 113.0, 195.0, 349.0, 715.0, 1816.0, 6356.0, 36163.0, 406411.0, 537181.0, 47405.0, 7862.0, 2081.0, 786.0, 377.0, 180.0, 126.0, 62.0, 48.0, 32.0, 18.0, 16.0, 12.0, 14.0, 6.0, 11.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-2.625, -2.55780029296875, -2.4906005859375, -2.42340087890625, -2.356201171875, -2.28900146484375, -2.2218017578125, -2.15460205078125, -2.08740234375, -2.02020263671875, -1.9530029296875, -1.88580322265625, -1.818603515625, -1.75140380859375, -1.6842041015625, -1.61700439453125, -1.5498046875, -1.48260498046875, -1.4154052734375, -1.34820556640625, -1.281005859375, -1.21380615234375, -1.1466064453125, -1.07940673828125, -1.01220703125, -0.94500732421875, -0.8778076171875, -0.81060791015625, -0.743408203125, -0.67620849609375, -0.6090087890625, -0.54180908203125, -0.474609375, -0.40740966796875, -0.3402099609375, -0.27301025390625, -0.205810546875, -0.13861083984375, -0.0714111328125, -0.00421142578125, 0.06298828125, 0.13018798828125, 0.1973876953125, 0.26458740234375, 0.331787109375, 0.39898681640625, 0.4661865234375, 0.53338623046875, 0.6005859375, 0.66778564453125, 0.7349853515625, 0.80218505859375, 0.869384765625, 0.93658447265625, 1.0037841796875, 1.07098388671875, 1.13818359375, 1.20538330078125, 1.2725830078125, 1.33978271484375, 1.406982421875, 1.47418212890625, 1.5413818359375, 1.60858154296875, 1.67578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 10.0, 5.0, 6.0, 10.0, 17.0, 16.0, 25.0, 27.0, 29.0, 26.0, 37.0, 33.0, 34.0, 37.0, 47.0, 49.0, 45.0, 41.0, 43.0, 52.0, 44.0, 38.0, 46.0, 35.0, 40.0, 30.0, 32.0, 27.0, 22.0, 18.0, 14.0, 13.0, 16.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.435546875, -2.342620849609375, -2.24969482421875, -2.156768798828125, -2.0638427734375, -1.970916748046875, -1.87799072265625, -1.785064697265625, -1.692138671875, -1.599212646484375, -1.50628662109375, -1.413360595703125, -1.3204345703125, -1.227508544921875, -1.13458251953125, -1.041656494140625, -0.94873046875, -0.855804443359375, -0.76287841796875, -0.669952392578125, -0.5770263671875, -0.484100341796875, -0.39117431640625, -0.298248291015625, -0.205322265625, -0.112396240234375, -0.01947021484375, 0.073455810546875, 0.1663818359375, 0.259307861328125, 0.35223388671875, 0.445159912109375, 0.5380859375, 0.631011962890625, 0.72393798828125, 0.816864013671875, 0.9097900390625, 1.002716064453125, 1.09564208984375, 1.188568115234375, 1.281494140625, 1.374420166015625, 1.46734619140625, 1.560272216796875, 1.6531982421875, 1.746124267578125, 1.83905029296875, 1.931976318359375, 2.02490234375, 2.117828369140625, 2.21075439453125, 2.303680419921875, 2.3966064453125, 2.489532470703125, 2.58245849609375, 2.675384521484375, 2.768310546875, 2.861236572265625, 2.95416259765625, 3.047088623046875, 3.1400146484375, 3.232940673828125, 3.32586669921875, 3.418792724609375, 3.51171875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 8.0, 11.0, 12.0, 17.0, 23.0, 40.0, 57.0, 103.0, 196.0, 416.0, 1093.0, 4141.0, 32172.0, 767149.0, 227315.0, 12228.0, 2174.0, 693.0, 287.0, 140.0, 94.0, 42.0, 44.0, 24.0, 17.0, 7.0, 5.0, 9.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.388671875, -1.3475799560546875, -1.306488037109375, -1.2653961181640625, -1.22430419921875, -1.1832122802734375, -1.142120361328125, -1.1010284423828125, -1.0599365234375, -1.0188446044921875, -0.977752685546875, -0.9366607666015625, -0.89556884765625, -0.8544769287109375, -0.813385009765625, -0.7722930908203125, -0.731201171875, -0.6901092529296875, -0.649017333984375, -0.6079254150390625, -0.56683349609375, -0.5257415771484375, -0.484649658203125, -0.4435577392578125, -0.4024658203125, -0.3613739013671875, -0.320281982421875, -0.2791900634765625, -0.23809814453125, -0.1970062255859375, -0.155914306640625, -0.1148223876953125, -0.07373046875, -0.0326385498046875, 0.008453369140625, 0.0495452880859375, 0.09063720703125, 0.1317291259765625, 0.172821044921875, 0.2139129638671875, 0.2550048828125, 0.2960968017578125, 0.337188720703125, 0.3782806396484375, 0.41937255859375, 0.4604644775390625, 0.501556396484375, 0.5426483154296875, 0.583740234375, 0.6248321533203125, 0.665924072265625, 0.7070159912109375, 0.74810791015625, 0.7891998291015625, 0.830291748046875, 0.8713836669921875, 0.9124755859375, 0.9535675048828125, 0.994659423828125, 1.0357513427734375, 1.07684326171875, 1.1179351806640625, 1.159027099609375, 1.2001190185546875, 1.2412109375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 10.0, 10.0, 14.0, 8.0, 9.0, 11.0, 20.0, 26.0, 35.0, 47.0, 45.0, 55.0, 64.0, 87.0, 77.0, 102.0, 71.0, 43.0, 50.0, 38.0, 34.0, 24.0, 30.0, 22.0, 19.0, 9.0, 12.0, 7.0, 9.0, 9.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.413459777832031e-05, -6.21061772108078e-05, -6.007775664329529e-05, -5.8049336075782776e-05, -5.6020915508270264e-05, -5.399249494075775e-05, -5.196407437324524e-05, -4.993565380573273e-05, -4.7907233238220215e-05, -4.58788126707077e-05, -4.385039210319519e-05, -4.182197153568268e-05, -3.9793550968170166e-05, -3.7765130400657654e-05, -3.573670983314514e-05, -3.370828926563263e-05, -3.167986869812012e-05, -2.9651448130607605e-05, -2.7623027563095093e-05, -2.559460699558258e-05, -2.356618642807007e-05, -2.1537765860557556e-05, -1.9509345293045044e-05, -1.7480924725532532e-05, -1.545250415802002e-05, -1.3424083590507507e-05, -1.1395663022994995e-05, -9.367242455482483e-06, -7.338821887969971e-06, -5.3104013204574585e-06, -3.2819807529449463e-06, -1.253560185432434e-06, 7.748603820800781e-07, 2.8032809495925903e-06, 4.8317015171051025e-06, 6.860122084617615e-06, 8.888542652130127e-06, 1.091696321964264e-05, 1.2945383787155151e-05, 1.4973804354667664e-05, 1.7002224922180176e-05, 1.9030645489692688e-05, 2.10590660572052e-05, 2.3087486624717712e-05, 2.5115907192230225e-05, 2.7144327759742737e-05, 2.917274832725525e-05, 3.120116889476776e-05, 3.3229589462280273e-05, 3.5258010029792786e-05, 3.72864305973053e-05, 3.931485116481781e-05, 4.134327173233032e-05, 4.3371692299842834e-05, 4.540011286735535e-05, 4.742853343486786e-05, 4.945695400238037e-05, 5.148537456989288e-05, 5.3513795137405396e-05, 5.554221570491791e-05, 5.757063627243042e-05, 5.959905683994293e-05, 6.162747740745544e-05, 6.365589797496796e-05, 6.568431854248047e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 7.0, 8.0, 8.0, 10.0, 13.0, 9.0, 27.0, 24.0, 52.0, 53.0, 90.0, 153.0, 297.0, 622.0, 1304.0, 3327.0, 11058.0, 58951.0, 564557.0, 356841.0, 38078.0, 8199.0, 2530.0, 1060.0, 535.0, 275.0, 162.0, 94.0, 55.0, 36.0, 28.0, 25.0, 11.0, 10.0, 16.0, 9.0, 1.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.919921875, -0.8935546875, -0.8671875, -0.8408203125, -0.814453125, -0.7880859375, -0.76171875, -0.7353515625, -0.708984375, -0.6826171875, -0.65625, -0.6298828125, -0.603515625, -0.5771484375, -0.55078125, -0.5244140625, -0.498046875, -0.4716796875, -0.4453125, -0.4189453125, -0.392578125, -0.3662109375, -0.33984375, -0.3134765625, -0.287109375, -0.2607421875, -0.234375, -0.2080078125, -0.181640625, -0.1552734375, -0.12890625, -0.1025390625, -0.076171875, -0.0498046875, -0.0234375, 0.0029296875, 0.029296875, 0.0556640625, 0.08203125, 0.1083984375, 0.134765625, 0.1611328125, 0.1875, 0.2138671875, 0.240234375, 0.2666015625, 0.29296875, 0.3193359375, 0.345703125, 0.3720703125, 0.3984375, 0.4248046875, 0.451171875, 0.4775390625, 0.50390625, 0.5302734375, 0.556640625, 0.5830078125, 0.609375, 0.6357421875, 0.662109375, 0.6884765625, 0.71484375, 0.7412109375, 0.767578125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 11.0, 6.0, 11.0, 10.0, 20.0, 28.0, 28.0, 45.0, 54.0, 59.0, 72.0, 102.0, 84.0, 93.0, 79.0, 58.0, 46.0, 45.0, 25.0, 28.0, 19.0, 16.0, 14.0, 12.0, 12.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.77734375, -0.7519760131835938, -0.7266082763671875, -0.7012405395507812, -0.675872802734375, -0.6505050659179688, -0.6251373291015625, -0.5997695922851562, -0.57440185546875, -0.5490341186523438, -0.5236663818359375, -0.49829864501953125, -0.472930908203125, -0.44756317138671875, -0.4221954345703125, -0.39682769775390625, -0.3714599609375, -0.34609222412109375, -0.3207244873046875, -0.29535675048828125, -0.269989013671875, -0.24462127685546875, -0.2192535400390625, -0.19388580322265625, -0.16851806640625, -0.14315032958984375, -0.1177825927734375, -0.09241485595703125, -0.067047119140625, -0.04167938232421875, -0.0163116455078125, 0.00905609130859375, 0.034423828125, 0.05979156494140625, 0.0851593017578125, 0.11052703857421875, 0.135894775390625, 0.16126251220703125, 0.1866302490234375, 0.21199798583984375, 0.23736572265625, 0.26273345947265625, 0.2881011962890625, 0.31346893310546875, 0.338836669921875, 0.36420440673828125, 0.3895721435546875, 0.41493988037109375, 0.4403076171875, 0.46567535400390625, 0.4910430908203125, 0.5164108276367188, 0.541778564453125, 0.5671463012695312, 0.5925140380859375, 0.6178817749023438, 0.64324951171875, 0.6686172485351562, 0.6939849853515625, 0.7193527221679688, 0.744720458984375, 0.7700881958007812, 0.7954559326171875, 0.8208236694335938, 0.84619140625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 12.0, 47.0, 158.0, 349.0, 304.0, 103.0, 27.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.73371887207031, -40.66122817993164, -39.58873748779297, -38.5162467956543, -37.443756103515625, -36.37126541137695, -35.29877471923828, -34.22628402709961, -33.15379333496094, -32.081302642822266, -31.008811950683594, -29.936321258544922, -28.86383056640625, -27.791339874267578, -26.718849182128906, -25.646358489990234, -24.57386589050293, -23.501375198364258, -22.428884506225586, -21.356393814086914, -20.283903121948242, -19.21141242980957, -18.138919830322266, -17.066429138183594, -15.993939399719238, -14.921448707580566, -13.848958015441895, -12.776466369628906, -11.703975677490234, -10.631484985351562, -9.55899429321289, -8.486503601074219, -7.414012908935547, -6.341522216796875, -5.269031524658203, -4.196540355682373, -3.124049663543701, -2.0515589714050293, -0.9790678024291992, 0.09342288970947266, 1.1659135818481445, 2.2384042739868164, 3.3108952045440674, 4.383386135101318, 5.45587682723999, 6.528367519378662, 7.600858688354492, 8.673349380493164, 9.745840072631836, 10.818330764770508, 11.89082145690918, 12.963312149047852, 14.035802841186523, 15.108293533325195, 16.1807861328125, 17.253276824951172, 18.325767517089844, 19.398258209228516, 20.470748901367188, 21.54323959350586, 22.61573028564453, 23.688220977783203, 24.760711669921875, 25.833202362060547, 26.90569305419922]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 1.0, 8.0, 11.0, 12.0, 15.0, 16.0, 13.0, 18.0, 19.0, 27.0, 27.0, 24.0, 32.0, 40.0, 38.0, 31.0, 60.0, 43.0, 59.0, 53.0, 52.0, 55.0, 31.0, 48.0, 43.0, 36.0, 23.0, 30.0, 17.0, 19.0, 20.0, 13.0, 15.0, 9.0, 6.0, 5.0, 5.0, 8.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-14.279024124145508, -13.877289772033691, -13.475554466247559, -13.073820114135742, -12.67208480834961, -12.270350456237793, -11.868616104125977, -11.466880798339844, -11.065145492553711, -10.663411140441895, -10.261675834655762, -9.859941482543945, -9.458206176757812, -9.056471824645996, -8.65473747253418, -8.253002166748047, -7.8512678146362305, -7.449532985687256, -7.047798156738281, -6.646063804626465, -6.244328498840332, -5.842594146728516, -5.440859317779541, -5.039124488830566, -4.637389659881592, -4.235654830932617, -3.8339200019836426, -3.432185411453247, -3.0304505825042725, -2.628715753555298, -2.2269811630249023, -1.8252463340759277, -1.4235115051269531, -1.0217766761779785, -0.6200419664382935, -0.2183072566986084, 0.1834275722503662, 0.5851624011993408, 0.9868969917297363, 1.388631820678711, 1.7903666496276855, 2.19210147857666, 2.5938363075256348, 2.9955708980560303, 3.397305727005005, 3.7990405559539795, 4.200775146484375, 4.60250997543335, 5.004244804382324, 5.405979633331299, 5.807714462280273, 6.20944881439209, 6.611184120178223, 7.012918472290039, 7.414653301239014, 7.816388130187988, 8.218122482299805, 8.619856834411621, 9.021592140197754, 9.42332649230957, 9.825061798095703, 10.22679615020752, 10.628530502319336, 11.030265808105469, 11.432001113891602]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 19.0, 18.0, 41.0, 68.0, 98.0, 164.0, 268.0, 479.0, 813.0, 1557.0, 3472.0, 11456.0, 82968.0, 3961594.0, 110587.0, 13200.0, 3847.0, 1631.0, 839.0, 482.0, 275.0, 163.0, 93.0, 57.0, 29.0, 15.0, 15.0, 7.0, 2.0, 7.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1533203125, -1.1063385009765625, -1.059356689453125, -1.0123748779296875, -0.96539306640625, -0.9184112548828125, -0.871429443359375, -0.8244476318359375, -0.7774658203125, -0.7304840087890625, -0.683502197265625, -0.6365203857421875, -0.58953857421875, -0.5425567626953125, -0.495574951171875, -0.4485931396484375, -0.401611328125, -0.3546295166015625, -0.307647705078125, -0.2606658935546875, -0.21368408203125, -0.1667022705078125, -0.119720458984375, -0.0727386474609375, -0.0257568359375, 0.0212249755859375, 0.068206787109375, 0.1151885986328125, 0.16217041015625, 0.2091522216796875, 0.256134033203125, 0.3031158447265625, 0.35009765625, 0.3970794677734375, 0.444061279296875, 0.4910430908203125, 0.53802490234375, 0.5850067138671875, 0.631988525390625, 0.6789703369140625, 0.7259521484375, 0.7729339599609375, 0.819915771484375, 0.8668975830078125, 0.91387939453125, 0.9608612060546875, 1.007843017578125, 1.0548248291015625, 1.101806640625, 1.1487884521484375, 1.195770263671875, 1.2427520751953125, 1.28973388671875, 1.3367156982421875, 1.383697509765625, 1.4306793212890625, 1.4776611328125, 1.5246429443359375, 1.571624755859375, 1.6186065673828125, 1.66558837890625, 1.7125701904296875, 1.759552001953125, 1.8065338134765625, 1.853515625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 14.0, 18.0, 27.0, 29.0, 40.0, 52.0, 49.0, 83.0, 70.0, 82.0, 83.0, 96.0, 83.0, 62.0, 46.0, 40.0, 29.0, 13.0, 19.0, 15.0, 13.0, 6.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.951171875, -0.9238662719726562, -0.8965606689453125, -0.8692550659179688, -0.841949462890625, -0.8146438598632812, -0.7873382568359375, -0.7600326538085938, -0.73272705078125, -0.7054214477539062, -0.6781158447265625, -0.6508102416992188, -0.623504638671875, -0.5961990356445312, -0.5688934326171875, -0.5415878295898438, -0.5142822265625, -0.48697662353515625, -0.4596710205078125, -0.43236541748046875, -0.405059814453125, -0.37775421142578125, -0.3504486083984375, -0.32314300537109375, -0.29583740234375, -0.26853179931640625, -0.2412261962890625, -0.21392059326171875, -0.186614990234375, -0.15930938720703125, -0.1320037841796875, -0.10469818115234375, -0.077392578125, -0.05008697509765625, -0.0227813720703125, 0.00452423095703125, 0.031829833984375, 0.05913543701171875, 0.0864410400390625, 0.11374664306640625, 0.14105224609375, 0.16835784912109375, 0.1956634521484375, 0.22296905517578125, 0.250274658203125, 0.27758026123046875, 0.3048858642578125, 0.33219146728515625, 0.3594970703125, 0.38680267333984375, 0.4141082763671875, 0.44141387939453125, 0.468719482421875, 0.49602508544921875, 0.5233306884765625, 0.5506362915039062, 0.57794189453125, 0.6052474975585938, 0.6325531005859375, 0.6598587036132812, 0.687164306640625, 0.7144699096679688, 0.7417755126953125, 0.7690811157226562, 0.79638671875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 7.0, 5.0, 7.0, 14.0, 16.0, 17.0, 19.0, 24.0, 33.0, 34.0, 41.0, 61.0, 110.0, 326.0, 1057.0, 4016.0, 35525.0, 4107394.0, 39305.0, 4335.0, 1127.0, 333.0, 142.0, 58.0, 56.0, 37.0, 41.0, 32.0, 17.0, 21.0, 22.0, 8.0, 6.0, 10.0, 4.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.78515625, -2.683929443359375, -2.58270263671875, -2.481475830078125, -2.3802490234375, -2.279022216796875, -2.17779541015625, -2.076568603515625, -1.975341796875, -1.874114990234375, -1.77288818359375, -1.671661376953125, -1.5704345703125, -1.469207763671875, -1.36798095703125, -1.266754150390625, -1.16552734375, -1.064300537109375, -0.96307373046875, -0.861846923828125, -0.7606201171875, -0.659393310546875, -0.55816650390625, -0.456939697265625, -0.355712890625, -0.254486083984375, -0.15325927734375, -0.052032470703125, 0.0491943359375, 0.150421142578125, 0.25164794921875, 0.352874755859375, 0.4541015625, 0.555328369140625, 0.65655517578125, 0.757781982421875, 0.8590087890625, 0.960235595703125, 1.06146240234375, 1.162689208984375, 1.263916015625, 1.365142822265625, 1.46636962890625, 1.567596435546875, 1.6688232421875, 1.770050048828125, 1.87127685546875, 1.972503662109375, 2.07373046875, 2.174957275390625, 2.27618408203125, 2.377410888671875, 2.4786376953125, 2.579864501953125, 2.68109130859375, 2.782318115234375, 2.883544921875, 2.984771728515625, 3.08599853515625, 3.187225341796875, 3.2884521484375, 3.389678955078125, 3.49090576171875, 3.592132568359375, 3.693359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 7.0, 15.0, 42.0, 263.0, 3442.0, 243.0, 42.0, 10.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52490234375, -0.46955108642578125, -0.4141998291015625, -0.35884857177734375, -0.303497314453125, -0.24814605712890625, -0.1927947998046875, -0.13744354248046875, -0.08209228515625, -0.02674102783203125, 0.0286102294921875, 0.08396148681640625, 0.139312744140625, 0.19466400146484375, 0.2500152587890625, 0.30536651611328125, 0.3607177734375, 0.41606903076171875, 0.4714202880859375, 0.5267715454101562, 0.582122802734375, 0.6374740600585938, 0.6928253173828125, 0.7481765747070312, 0.80352783203125, 0.8588790893554688, 0.9142303466796875, 0.9695816040039062, 1.024932861328125, 1.0802841186523438, 1.1356353759765625, 1.1909866333007812, 1.246337890625, 1.3016891479492188, 1.3570404052734375, 1.4123916625976562, 1.467742919921875, 1.5230941772460938, 1.5784454345703125, 1.6337966918945312, 1.68914794921875, 1.7444992065429688, 1.7998504638671875, 1.8552017211914062, 1.910552978515625, 1.9659042358398438, 2.0212554931640625, 2.0766067504882812, 2.1319580078125, 2.1873092651367188, 2.2426605224609375, 2.2980117797851562, 2.353363037109375, 2.4087142944335938, 2.4640655517578125, 2.5194168090820312, 2.57476806640625, 2.6301193237304688, 2.6854705810546875, 2.7408218383789062, 2.796173095703125, 2.8515243530273438, 2.9068756103515625, 2.9622268676757812, 3.017578125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 18.0, 40.0, 111.0, 212.0, 270.0, 215.0, 88.0, 25.0, 16.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.746006488800049, -2.5556764602661133, -2.3653464317321777, -2.175016403198242, -1.9846864938735962, -1.7943564653396606, -1.6040265560150146, -1.413696527481079, -1.2233664989471436, -1.033036470413208, -0.8427065014839172, -0.6523765325546265, -0.4620465040206909, -0.27171647548675537, -0.08138656616210938, 0.10894346237182617, 0.2992734909057617, 0.4896034896373749, 0.679933488368988, 0.8702634572982788, 1.0605934858322144, 1.25092351436615, 1.441253423690796, 1.6315834522247314, 1.821913480758667, 2.0122435092926025, 2.202573537826538, 2.3929033279418945, 2.58323335647583, 2.7735633850097656, 2.963893413543701, 3.1542234420776367, 3.344552993774414, 3.5348830223083496, 3.725213050842285, 3.9155430793762207, 4.105873107910156, 4.296203136444092, 4.486533164978027, 4.676862716674805, 4.867193222045898, 5.057523250579834, 5.2478532791137695, 5.438183307647705, 5.628513336181641, 5.818843364715576, 6.009173393249512, 6.199502944946289, 6.389832973480225, 6.58016300201416, 6.770493030548096, 6.960823059082031, 7.151153087615967, 7.341483116149902, 7.53181266784668, 7.722143173217773, 7.912472724914551, 8.102802276611328, 8.293132781982422, 8.4834623336792, 8.673792839050293, 8.86412239074707, 9.054452896118164, 9.244782447814941, 9.435112953186035]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 10.0, 10.0, 27.0, 31.0, 54.0, 59.0, 94.0, 96.0, 103.0, 135.0, 100.0, 95.0, 58.0, 50.0, 35.0, 21.0, 11.0, 6.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.381100177764893, -5.222248077392578, -5.0633955001831055, -4.904543399810791, -4.745690822601318, -4.586838722229004, -4.427986145019531, -4.269134044647217, -4.110281944274902, -3.951429605484009, -3.7925772666931152, -3.6337249279022217, -3.474872589111328, -3.3160204887390137, -3.15716814994812, -2.9983158111572266, -2.839463233947754, -2.6806108951568604, -2.521758556365967, -2.3629062175750732, -2.2040538787841797, -2.0452017784118652, -1.8863494396209717, -1.7274971008300781, -1.5686447620391846, -1.409792423248291, -1.2509400844573975, -1.0920878648757935, -0.9332355260848999, -0.7743831872940063, -0.6155309081077576, -0.4566786289215088, -0.29782581329345703, -0.13897350430488586, 0.019878804683685303, 0.17873111367225647, 0.33758342266082764, 0.4964357614517212, 0.65528804063797, 0.8141403198242188, 0.9729926586151123, 1.1318449974060059, 1.2906973361968994, 1.4495495557785034, 1.608401894569397, 1.7672542333602905, 1.9261064529418945, 2.084958791732788, 2.2438111305236816, 2.402663469314575, 2.5615158081054688, 2.7203681468963623, 2.879220485687256, 3.0380725860595703, 3.196924924850464, 3.3557772636413574, 3.514629602432251, 3.6734819412231445, 3.832334280014038, 3.9911866188049316, 4.150038719177246, 4.308891296386719, 4.467743396759033, 4.626595497131348, 4.78544807434082]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 9.0, 9.0, 14.0, 26.0, 60.0, 131.0, 343.0, 1564.0, 14120.0, 447422.0, 564706.0, 17710.0, 1787.0, 420.0, 118.0, 58.0, 22.0, 17.0, 14.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.1640625, -4.054595947265625, -3.94512939453125, -3.835662841796875, -3.7261962890625, -3.616729736328125, -3.50726318359375, -3.397796630859375, -3.288330078125, -3.178863525390625, -3.06939697265625, -2.959930419921875, -2.8504638671875, -2.740997314453125, -2.63153076171875, -2.522064208984375, -2.41259765625, -2.303131103515625, -2.19366455078125, -2.084197998046875, -1.9747314453125, -1.865264892578125, -1.75579833984375, -1.646331787109375, -1.536865234375, -1.427398681640625, -1.31793212890625, -1.208465576171875, -1.0989990234375, -0.989532470703125, -0.88006591796875, -0.770599365234375, -0.6611328125, -0.551666259765625, -0.44219970703125, -0.332733154296875, -0.2232666015625, -0.113800048828125, -0.00433349609375, 0.105133056640625, 0.214599609375, 0.324066162109375, 0.43353271484375, 0.542999267578125, 0.6524658203125, 0.761932373046875, 0.87139892578125, 0.980865478515625, 1.09033203125, 1.199798583984375, 1.30926513671875, 1.418731689453125, 1.5281982421875, 1.637664794921875, 1.74713134765625, 1.856597900390625, 1.966064453125, 2.075531005859375, 2.18499755859375, 2.294464111328125, 2.4039306640625, 2.513397216796875, 2.62286376953125, 2.732330322265625, 2.841796875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 10.0, 6.0, 13.0, 13.0, 21.0, 28.0, 41.0, 51.0, 66.0, 68.0, 67.0, 92.0, 93.0, 80.0, 81.0, 70.0, 53.0, 37.0, 25.0, 23.0, 15.0, 16.0, 12.0, 6.0, 8.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0048828125, -0.9745407104492188, -0.9441986083984375, -0.9138565063476562, -0.883514404296875, -0.8531723022460938, -0.8228302001953125, -0.7924880981445312, -0.76214599609375, -0.7318038940429688, -0.7014617919921875, -0.6711196899414062, -0.640777587890625, -0.6104354858398438, -0.5800933837890625, -0.5497512817382812, -0.5194091796875, -0.48906707763671875, -0.4587249755859375, -0.42838287353515625, -0.398040771484375, -0.36769866943359375, -0.3373565673828125, -0.30701446533203125, -0.27667236328125, -0.24633026123046875, -0.2159881591796875, -0.18564605712890625, -0.155303955078125, -0.12496185302734375, -0.0946197509765625, -0.06427764892578125, -0.033935546875, -0.00359344482421875, 0.0267486572265625, 0.05709075927734375, 0.087432861328125, 0.11777496337890625, 0.1481170654296875, 0.17845916748046875, 0.20880126953125, 0.23914337158203125, 0.2694854736328125, 0.29982757568359375, 0.330169677734375, 0.36051177978515625, 0.3908538818359375, 0.42119598388671875, 0.4515380859375, 0.48188018798828125, 0.5122222900390625, 0.5425643920898438, 0.572906494140625, 0.6032485961914062, 0.6335906982421875, 0.6639328002929688, 0.69427490234375, 0.7246170043945312, 0.7549591064453125, 0.7853012084960938, 0.815643310546875, 0.8459854125976562, 0.8763275146484375, 0.9066696166992188, 0.93701171875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 6.0, 3.0, 7.0, 18.0, 41.0, 59.0, 130.0, 274.0, 721.0, 2363.0, 25647.0, 914883.0, 98372.0, 4324.0, 1015.0, 373.0, 147.0, 75.0, 31.0, 24.0, 23.0, 3.0, 7.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41015625, -4.275146484375, -4.14013671875, -4.005126953125, -3.8701171875, -3.735107421875, -3.60009765625, -3.465087890625, -3.330078125, -3.195068359375, -3.06005859375, -2.925048828125, -2.7900390625, -2.655029296875, -2.52001953125, -2.385009765625, -2.25, -2.114990234375, -1.97998046875, -1.844970703125, -1.7099609375, -1.574951171875, -1.43994140625, -1.304931640625, -1.169921875, -1.034912109375, -0.89990234375, -0.764892578125, -0.6298828125, -0.494873046875, -0.35986328125, -0.224853515625, -0.08984375, 0.045166015625, 0.18017578125, 0.315185546875, 0.4501953125, 0.585205078125, 0.72021484375, 0.855224609375, 0.990234375, 1.125244140625, 1.26025390625, 1.395263671875, 1.5302734375, 1.665283203125, 1.80029296875, 1.935302734375, 2.0703125, 2.205322265625, 2.34033203125, 2.475341796875, 2.6103515625, 2.745361328125, 2.88037109375, 3.015380859375, 3.150390625, 3.285400390625, 3.42041015625, 3.555419921875, 3.6904296875, 3.825439453125, 3.96044921875, 4.095458984375, 4.23046875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 4.0, 11.0, 17.0, 15.0, 30.0, 60.0, 75.0, 117.0, 126.0, 137.0, 118.0, 101.0, 76.0, 46.0, 44.0, 18.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5078125, -6.29974365234375, -6.0916748046875, -5.88360595703125, -5.675537109375, -5.46746826171875, -5.2593994140625, -5.05133056640625, -4.84326171875, -4.63519287109375, -4.4271240234375, -4.21905517578125, -4.010986328125, -3.80291748046875, -3.5948486328125, -3.38677978515625, -3.1787109375, -2.97064208984375, -2.7625732421875, -2.55450439453125, -2.346435546875, -2.13836669921875, -1.9302978515625, -1.72222900390625, -1.51416015625, -1.30609130859375, -1.0980224609375, -0.88995361328125, -0.681884765625, -0.47381591796875, -0.2657470703125, -0.05767822265625, 0.150390625, 0.35845947265625, 0.5665283203125, 0.77459716796875, 0.982666015625, 1.19073486328125, 1.3988037109375, 1.60687255859375, 1.81494140625, 2.02301025390625, 2.2310791015625, 2.43914794921875, 2.647216796875, 2.85528564453125, 3.0633544921875, 3.27142333984375, 3.4794921875, 3.68756103515625, 3.8956298828125, 4.10369873046875, 4.311767578125, 4.51983642578125, 4.7279052734375, 4.93597412109375, 5.14404296875, 5.35211181640625, 5.5601806640625, 5.76824951171875, 5.976318359375, 6.18438720703125, 6.3924560546875, 6.60052490234375, 6.80859375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 9.0, 12.0, 14.0, 41.0, 49.0, 93.0, 198.0, 517.0, 2303.0, 25219.0, 841549.0, 170369.0, 6403.0, 1115.0, 334.0, 146.0, 75.0, 31.0, 22.0, 16.0, 11.0, 7.0, 2.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0654296875, -1.02703857421875, -0.9886474609375, -0.95025634765625, -0.911865234375, -0.87347412109375, -0.8350830078125, -0.79669189453125, -0.75830078125, -0.71990966796875, -0.6815185546875, -0.64312744140625, -0.604736328125, -0.56634521484375, -0.5279541015625, -0.48956298828125, -0.451171875, -0.41278076171875, -0.3743896484375, -0.33599853515625, -0.297607421875, -0.25921630859375, -0.2208251953125, -0.18243408203125, -0.14404296875, -0.10565185546875, -0.0672607421875, -0.02886962890625, 0.009521484375, 0.04791259765625, 0.0863037109375, 0.12469482421875, 0.1630859375, 0.20147705078125, 0.2398681640625, 0.27825927734375, 0.316650390625, 0.35504150390625, 0.3934326171875, 0.43182373046875, 0.47021484375, 0.50860595703125, 0.5469970703125, 0.58538818359375, 0.623779296875, 0.66217041015625, 0.7005615234375, 0.73895263671875, 0.77734375, 0.81573486328125, 0.8541259765625, 0.89251708984375, 0.930908203125, 0.96929931640625, 1.0076904296875, 1.04608154296875, 1.08447265625, 1.12286376953125, 1.1612548828125, 1.19964599609375, 1.238037109375, 1.27642822265625, 1.3148193359375, 1.35321044921875, 1.3916015625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 0.0, 4.0, 4.0, 4.0, 6.0, 11.0, 12.0, 18.0, 16.0, 22.0, 21.0, 23.0, 35.0, 35.0, 39.0, 49.0, 51.0, 81.0, 82.0, 64.0, 63.0, 68.0, 36.0, 42.0, 37.0, 20.0, 22.0, 27.0, 19.0, 8.0, 12.0, 10.0, 3.0, 6.0, 15.0, 9.0, 1.0, 7.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.46574592590332e-05, -5.282741039991379e-05, -5.099736154079437e-05, -4.916731268167496e-05, -4.733726382255554e-05, -4.550721496343613e-05, -4.367716610431671e-05, -4.1847117245197296e-05, -4.001706838607788e-05, -3.8187019526958466e-05, -3.635697066783905e-05, -3.4526921808719635e-05, -3.269687294960022e-05, -3.0866824090480804e-05, -2.903677523136139e-05, -2.7206726372241974e-05, -2.537667751312256e-05, -2.3546628654003143e-05, -2.1716579794883728e-05, -1.9886530935764313e-05, -1.8056482076644897e-05, -1.6226433217525482e-05, -1.4396384358406067e-05, -1.2566335499286652e-05, -1.0736286640167236e-05, -8.906237781047821e-06, -7.076188921928406e-06, -5.2461400628089905e-06, -3.416091203689575e-06, -1.58604234457016e-06, 2.4400651454925537e-07, 2.0740553736686707e-06, 3.904104232788086e-06, 5.734153091907501e-06, 7.5642019510269165e-06, 9.394250810146332e-06, 1.1224299669265747e-05, 1.3054348528385162e-05, 1.4884397387504578e-05, 1.6714446246623993e-05, 1.8544495105743408e-05, 2.0374543964862823e-05, 2.220459282398224e-05, 2.4034641683101654e-05, 2.586469054222107e-05, 2.7694739401340485e-05, 2.95247882604599e-05, 3.1354837119579315e-05, 3.318488597869873e-05, 3.5014934837818146e-05, 3.684498369693756e-05, 3.8675032556056976e-05, 4.050508141517639e-05, 4.233513027429581e-05, 4.416517913341522e-05, 4.599522799253464e-05, 4.782527685165405e-05, 4.965532571077347e-05, 5.148537456989288e-05, 5.33154234290123e-05, 5.5145472288131714e-05, 5.697552114725113e-05, 5.8805570006370544e-05, 6.063561886548996e-05, 6.246566772460938e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 20.0, 18.0, 37.0, 81.0, 174.0, 559.0, 2432.0, 32467.0, 944288.0, 63905.0, 3421.0, 698.0, 236.0, 98.0, 59.0, 30.0, 13.0, 9.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8779296875, -1.82659912109375, -1.7752685546875, -1.72393798828125, -1.672607421875, -1.62127685546875, -1.5699462890625, -1.51861572265625, -1.46728515625, -1.41595458984375, -1.3646240234375, -1.31329345703125, -1.261962890625, -1.21063232421875, -1.1593017578125, -1.10797119140625, -1.056640625, -1.00531005859375, -0.9539794921875, -0.90264892578125, -0.851318359375, -0.79998779296875, -0.7486572265625, -0.69732666015625, -0.64599609375, -0.59466552734375, -0.5433349609375, -0.49200439453125, -0.440673828125, -0.38934326171875, -0.3380126953125, -0.28668212890625, -0.2353515625, -0.18402099609375, -0.1326904296875, -0.08135986328125, -0.030029296875, 0.02130126953125, 0.0726318359375, 0.12396240234375, 0.17529296875, 0.22662353515625, 0.2779541015625, 0.32928466796875, 0.380615234375, 0.43194580078125, 0.4832763671875, 0.53460693359375, 0.5859375, 0.63726806640625, 0.6885986328125, 0.73992919921875, 0.791259765625, 0.84259033203125, 0.8939208984375, 0.94525146484375, 0.99658203125, 1.04791259765625, 1.0992431640625, 1.15057373046875, 1.201904296875, 1.25323486328125, 1.3045654296875, 1.35589599609375, 1.4072265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 19.0, 25.0, 43.0, 56.0, 93.0, 117.0, 140.0, 161.0, 130.0, 78.0, 46.0, 37.0, 23.0, 12.0, 6.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2255859375, -1.185882568359375, -1.14617919921875, -1.106475830078125, -1.0667724609375, -1.027069091796875, -0.98736572265625, -0.947662353515625, -0.907958984375, -0.868255615234375, -0.82855224609375, -0.788848876953125, -0.7491455078125, -0.709442138671875, -0.66973876953125, -0.630035400390625, -0.59033203125, -0.550628662109375, -0.51092529296875, -0.471221923828125, -0.4315185546875, -0.391815185546875, -0.35211181640625, -0.312408447265625, -0.272705078125, -0.233001708984375, -0.19329833984375, -0.153594970703125, -0.1138916015625, -0.074188232421875, -0.03448486328125, 0.005218505859375, 0.044921875, 0.084625244140625, 0.12432861328125, 0.164031982421875, 0.2037353515625, 0.243438720703125, 0.28314208984375, 0.322845458984375, 0.362548828125, 0.402252197265625, 0.44195556640625, 0.481658935546875, 0.5213623046875, 0.561065673828125, 0.60076904296875, 0.640472412109375, 0.68017578125, 0.719879150390625, 0.75958251953125, 0.799285888671875, 0.8389892578125, 0.878692626953125, 0.91839599609375, 0.958099365234375, 0.997802734375, 1.037506103515625, 1.07720947265625, 1.116912841796875, 1.1566162109375, 1.196319580078125, 1.23602294921875, 1.275726318359375, 1.3154296875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 16.0, 69.0, 261.0, 365.0, 202.0, 58.0, 22.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.632320404052734, -32.52117156982422, -31.41002655029297, -30.298879623413086, -29.187732696533203, -28.076583862304688, -26.965436935424805, -25.854290008544922, -24.74314308166504, -23.631996154785156, -22.520849227905273, -21.40970230102539, -20.298553466796875, -19.187408447265625, -18.07625961303711, -16.965112686157227, -15.853965759277344, -14.742818832397461, -13.631671905517578, -12.520524024963379, -11.409377098083496, -10.298230171203613, -9.187082290649414, -8.075935363769531, -6.964788436889648, -5.853641510009766, -4.742494106292725, -3.6313469409942627, -2.520199775695801, -1.409052848815918, -0.29790544509887695, 0.8132419586181641, 1.9243927001953125, 3.0355398654937744, 4.146687030792236, 5.257834434509277, 6.36898136138916, 7.480128288269043, 8.591276168823242, 9.702423095703125, 10.813570022583008, 11.92471694946289, 13.035863876342773, 14.147011756896973, 15.258158683776855, 16.369304656982422, 17.480453491210938, 18.59160041809082, 19.702747344970703, 20.813894271850586, 21.92504119873047, 23.03618812561035, 24.147335052490234, 25.25848388671875, 26.369630813598633, 27.480777740478516, 28.5919246673584, 29.70307159423828, 30.814218521118164, 31.925365447998047, 33.03651428222656, 34.14765930175781, 35.25880813598633, 36.369956970214844, 37.481101989746094]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 0.0, 7.0, 5.0, 7.0, 14.0, 18.0, 18.0, 12.0, 18.0, 33.0, 33.0, 43.0, 51.0, 47.0, 58.0, 54.0, 79.0, 64.0, 66.0, 54.0, 48.0, 40.0, 54.0, 39.0, 26.0, 16.0, 18.0, 11.0, 13.0, 15.0, 8.0, 6.0, 7.0, 7.0, 3.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.184054374694824, -10.738739013671875, -10.29342269897461, -9.84810733795166, -9.402791976928711, -8.957475662231445, -8.512160301208496, -8.066844940185547, -7.621528625488281, -7.176212787628174, -6.730896949768066, -6.285581588745117, -5.84026575088501, -5.394949913024902, -4.949634552001953, -4.504318714141846, -4.059002876281738, -3.613687038421631, -3.1683714389801025, -2.723055839538574, -2.277740001678467, -1.8324241638183594, -1.387108564376831, -0.9417929649353027, -0.4964771270751953, -0.05116140842437744, 0.39415431022644043, 0.8394700288772583, 1.2847857475280762, 1.7301015853881836, 2.175417184829712, 2.6207327842712402, 3.0660476684570312, 3.5113635063171387, 3.956679105758667, 4.401994705200195, 4.847310543060303, 5.29262638092041, 5.737941741943359, 6.183257579803467, 6.628573417663574, 7.073889255523682, 7.519205093383789, 7.964520454406738, 8.409835815429688, 8.855152130126953, 9.300467491149902, 9.745782852172852, 10.191099166870117, 10.636414527893066, 11.081730842590332, 11.527046203613281, 11.972362518310547, 12.417677879333496, 12.862993240356445, 13.308309555053711, 13.75362491607666, 14.19894027709961, 14.644256591796875, 15.089571952819824, 15.534887313842773, 15.980203628540039, 16.425519943237305, 16.870834350585938, 17.316150665283203]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 7.0, 5.0, 6.0, 12.0, 13.0, 16.0, 28.0, 43.0, 69.0, 125.0, 235.0, 507.0, 1299.0, 4754.0, 27953.0, 2946476.0, 1185392.0, 21250.0, 3943.0, 1150.0, 457.0, 217.0, 102.0, 83.0, 37.0, 21.0, 23.0, 12.0, 12.0, 9.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.732421875, -2.658447265625, -2.58447265625, -2.510498046875, -2.4365234375, -2.362548828125, -2.28857421875, -2.214599609375, -2.140625, -2.066650390625, -1.99267578125, -1.918701171875, -1.8447265625, -1.770751953125, -1.69677734375, -1.622802734375, -1.548828125, -1.474853515625, -1.40087890625, -1.326904296875, -1.2529296875, -1.178955078125, -1.10498046875, -1.031005859375, -0.95703125, -0.883056640625, -0.80908203125, -0.735107421875, -0.6611328125, -0.587158203125, -0.51318359375, -0.439208984375, -0.365234375, -0.291259765625, -0.21728515625, -0.143310546875, -0.0693359375, 0.004638671875, 0.07861328125, 0.152587890625, 0.2265625, 0.300537109375, 0.37451171875, 0.448486328125, 0.5224609375, 0.596435546875, 0.67041015625, 0.744384765625, 0.818359375, 0.892333984375, 0.96630859375, 1.040283203125, 1.1142578125, 1.188232421875, 1.26220703125, 1.336181640625, 1.41015625, 1.484130859375, 1.55810546875, 1.632080078125, 1.7060546875, 1.780029296875, 1.85400390625, 1.927978515625, 2.001953125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 8.0, 5.0, 5.0, 10.0, 8.0, 21.0, 22.0, 28.0, 28.0, 32.0, 47.0, 51.0, 59.0, 70.0, 69.0, 45.0, 73.0, 60.0, 74.0, 43.0, 43.0, 52.0, 31.0, 18.0, 19.0, 22.0, 17.0, 15.0, 5.0, 6.0, 5.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65673828125, -0.636627197265625, -0.61651611328125, -0.596405029296875, -0.5762939453125, -0.556182861328125, -0.53607177734375, -0.515960693359375, -0.495849609375, -0.475738525390625, -0.45562744140625, -0.435516357421875, -0.4154052734375, -0.395294189453125, -0.37518310546875, -0.355072021484375, -0.3349609375, -0.314849853515625, -0.29473876953125, -0.274627685546875, -0.2545166015625, -0.234405517578125, -0.21429443359375, -0.194183349609375, -0.174072265625, -0.153961181640625, -0.13385009765625, -0.113739013671875, -0.0936279296875, -0.073516845703125, -0.05340576171875, -0.033294677734375, -0.01318359375, 0.006927490234375, 0.02703857421875, 0.047149658203125, 0.0672607421875, 0.087371826171875, 0.10748291015625, 0.127593994140625, 0.147705078125, 0.167816162109375, 0.18792724609375, 0.208038330078125, 0.2281494140625, 0.248260498046875, 0.26837158203125, 0.288482666015625, 0.30859375, 0.328704833984375, 0.34881591796875, 0.368927001953125, 0.3890380859375, 0.409149169921875, 0.42926025390625, 0.449371337890625, 0.469482421875, 0.489593505859375, 0.50970458984375, 0.529815673828125, 0.5499267578125, 0.570037841796875, 0.59014892578125, 0.610260009765625, 0.63037109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 3.0, 8.0, 13.0, 19.0, 28.0, 74.0, 189.0, 481.0, 2055.0, 20451.0, 3387966.0, 767694.0, 13045.0, 1567.0, 408.0, 126.0, 62.0, 27.0, 15.0, 14.0, 10.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.625, -3.52679443359375, -3.4285888671875, -3.33038330078125, -3.232177734375, -3.13397216796875, -3.0357666015625, -2.93756103515625, -2.83935546875, -2.74114990234375, -2.6429443359375, -2.54473876953125, -2.446533203125, -2.34832763671875, -2.2501220703125, -2.15191650390625, -2.0537109375, -1.95550537109375, -1.8572998046875, -1.75909423828125, -1.660888671875, -1.56268310546875, -1.4644775390625, -1.36627197265625, -1.26806640625, -1.16986083984375, -1.0716552734375, -0.97344970703125, -0.875244140625, -0.77703857421875, -0.6788330078125, -0.58062744140625, -0.482421875, -0.38421630859375, -0.2860107421875, -0.18780517578125, -0.089599609375, 0.00860595703125, 0.1068115234375, 0.20501708984375, 0.30322265625, 0.40142822265625, 0.4996337890625, 0.59783935546875, 0.696044921875, 0.79425048828125, 0.8924560546875, 0.99066162109375, 1.0888671875, 1.18707275390625, 1.2852783203125, 1.38348388671875, 1.481689453125, 1.57989501953125, 1.6781005859375, 1.77630615234375, 1.87451171875, 1.97271728515625, 2.0709228515625, 2.16912841796875, 2.267333984375, 2.36553955078125, 2.4637451171875, 2.56195068359375, 2.66015625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 7.0, 13.0, 8.0, 17.0, 37.0, 47.0, 125.0, 325.0, 1138.0, 1598.0, 469.0, 128.0, 65.0, 32.0, 16.0, 9.0, 9.0, 8.0, 8.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9873046875, -1.9192047119140625, -1.851104736328125, -1.7830047607421875, -1.71490478515625, -1.6468048095703125, -1.578704833984375, -1.5106048583984375, -1.4425048828125, -1.3744049072265625, -1.306304931640625, -1.2382049560546875, -1.17010498046875, -1.1020050048828125, -1.033905029296875, -0.9658050537109375, -0.897705078125, -0.8296051025390625, -0.761505126953125, -0.6934051513671875, -0.62530517578125, -0.5572052001953125, -0.489105224609375, -0.4210052490234375, -0.3529052734375, -0.2848052978515625, -0.216705322265625, -0.1486053466796875, -0.08050537109375, -0.0124053955078125, 0.055694580078125, 0.1237945556640625, 0.19189453125, 0.2599945068359375, 0.328094482421875, 0.3961944580078125, 0.46429443359375, 0.5323944091796875, 0.600494384765625, 0.6685943603515625, 0.7366943359375, 0.8047943115234375, 0.872894287109375, 0.9409942626953125, 1.00909423828125, 1.0771942138671875, 1.145294189453125, 1.2133941650390625, 1.281494140625, 1.3495941162109375, 1.417694091796875, 1.4857940673828125, 1.55389404296875, 1.6219940185546875, 1.690093994140625, 1.7581939697265625, 1.8262939453125, 1.8943939208984375, 1.962493896484375, 2.0305938720703125, 2.09869384765625, 2.1667938232421875, 2.234893798828125, 2.3029937744140625, 2.37109375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 4.0, 6.0, 6.0, 6.0, 13.0, 30.0, 39.0, 61.0, 69.0, 97.0, 99.0, 116.0, 96.0, 103.0, 88.0, 64.0, 29.0, 22.0, 14.0, 6.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.21129035949707, -8.979612350463867, -8.747934341430664, -8.516256332397461, -8.284577369689941, -8.052899360656738, -7.821221351623535, -7.589543342590332, -7.357865333557129, -7.126187324523926, -6.8945088386535645, -6.662830829620361, -6.431152820587158, -6.199474334716797, -5.967796325683594, -5.736118316650391, -5.5044403076171875, -5.272762298583984, -5.041083812713623, -4.80940580368042, -4.577727794647217, -4.3460493087768555, -4.114371299743652, -3.882693290710449, -3.651014804840088, -3.4193365573883057, -3.1876585483551025, -2.9559803009033203, -2.724302291870117, -2.492624044418335, -2.2609457969665527, -2.0292677879333496, -1.7975897789001465, -1.5659116506576538, -1.3342335224151611, -1.102555274963379, -0.870877206325531, -0.6391990184783936, -0.4075208902359009, -0.1758427619934082, 0.05583536624908447, 0.28751349449157715, 0.5191916227340698, 0.7508698105812073, 0.9825479388237, 1.2142261266708374, 1.44590425491333, 1.6775823831558228, 1.9092605113983154, 2.1409387588500977, 2.372616767883301, 2.604295015335083, 2.835973024368286, 3.0676512718200684, 3.2993292808532715, 3.5310075283050537, 3.762685775756836, 3.994364023208618, 4.2260422706604, 4.4577202796936035, 4.689398288726807, 4.921076774597168, 5.152754783630371, 5.384432792663574, 5.616110801696777]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 13.0, 10.0, 8.0, 14.0, 19.0, 29.0, 22.0, 35.0, 40.0, 53.0, 59.0, 82.0, 55.0, 66.0, 55.0, 63.0, 53.0, 50.0, 53.0, 49.0, 39.0, 36.0, 22.0, 19.0, 17.0, 12.0, 2.0, 9.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.703622817993164, -8.451614379882812, -8.199605941772461, -7.947597980499268, -7.695590019226074, -7.443581581115723, -7.191573143005371, -6.9395647048950195, -6.687556743621826, -6.435548305511475, -6.183540344238281, -5.93153190612793, -5.679523468017578, -5.427515506744385, -5.175507068634033, -4.92349910736084, -4.671490669250488, -4.419482231140137, -4.167474269866943, -3.915465831756592, -3.6634576320648193, -3.411449432373047, -3.1594409942626953, -2.907432794570923, -2.6554245948791504, -2.403416395187378, -2.1514081954956055, -1.899399757385254, -1.6473915576934814, -1.395383358001709, -1.143375039100647, -0.891366720199585, -0.6393594741821289, -0.38735121488571167, -0.13534295558929443, 0.1166653037071228, 0.36867356300354004, 0.6206817626953125, 0.8726900815963745, 1.1246984004974365, 1.376706600189209, 1.6287147998809814, 1.8807231187820435, 2.1327314376831055, 2.384739637374878, 2.6367478370666504, 2.888756275177002, 3.1407644748687744, 3.392772674560547, 3.6447808742523193, 3.896789073944092, 4.148797512054443, 4.400805473327637, 4.652813911437988, 4.90482234954834, 5.156830787658691, 5.408838748931885, 5.660847187042236, 5.91285514831543, 6.164863586425781, 6.416872024536133, 6.668879985809326, 6.920888423919678, 7.172896385192871, 7.424904823303223]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 10.0, 15.0, 13.0, 18.0, 26.0, 42.0, 67.0, 120.0, 209.0, 292.0, 568.0, 1117.0, 2067.0, 4117.0, 8470.0, 17952.0, 39884.0, 89688.0, 199192.0, 312376.0, 203607.0, 91940.0, 40830.0, 18445.0, 8713.0, 4100.0, 2070.0, 1140.0, 637.0, 349.0, 183.0, 94.0, 82.0, 33.0, 26.0, 24.0, 11.0, 9.0, 6.0, 3.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.75537109375, -0.7321395874023438, -0.7089080810546875, -0.6856765747070312, -0.662445068359375, -0.6392135620117188, -0.6159820556640625, -0.5927505493164062, -0.56951904296875, -0.5462875366210938, -0.5230560302734375, -0.49982452392578125, -0.476593017578125, -0.45336151123046875, -0.4301300048828125, -0.40689849853515625, -0.3836669921875, -0.36043548583984375, -0.3372039794921875, -0.31397247314453125, -0.290740966796875, -0.26750946044921875, -0.2442779541015625, -0.22104644775390625, -0.19781494140625, -0.17458343505859375, -0.1513519287109375, -0.12812042236328125, -0.104888916015625, -0.08165740966796875, -0.0584259033203125, -0.03519439697265625, -0.011962890625, 0.01126861572265625, 0.0345001220703125, 0.05773162841796875, 0.080963134765625, 0.10419464111328125, 0.1274261474609375, 0.15065765380859375, 0.17388916015625, 0.19712066650390625, 0.2203521728515625, 0.24358367919921875, 0.266815185546875, 0.29004669189453125, 0.3132781982421875, 0.33650970458984375, 0.3597412109375, 0.38297271728515625, 0.4062042236328125, 0.42943572998046875, 0.452667236328125, 0.47589874267578125, 0.4991302490234375, 0.5223617553710938, 0.54559326171875, 0.5688247680664062, 0.5920562744140625, 0.6152877807617188, 0.638519287109375, 0.6617507934570312, 0.6849822998046875, 0.7082138061523438, 0.7314453125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 3.0, 5.0, 5.0, 7.0, 2.0, 15.0, 10.0, 14.0, 16.0, 27.0, 24.0, 30.0, 20.0, 58.0, 35.0, 30.0, 39.0, 55.0, 47.0, 39.0, 55.0, 42.0, 53.0, 54.0, 30.0, 39.0, 26.0, 37.0, 26.0, 28.0, 22.0, 15.0, 15.0, 16.0, 12.0, 14.0, 10.0, 8.0, 4.0, 3.0, 7.0, 1.0, 5.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.54345703125, -0.528900146484375, -0.51434326171875, -0.499786376953125, -0.4852294921875, -0.470672607421875, -0.45611572265625, -0.441558837890625, -0.427001953125, -0.412445068359375, -0.39788818359375, -0.383331298828125, -0.3687744140625, -0.354217529296875, -0.33966064453125, -0.325103759765625, -0.310546875, -0.295989990234375, -0.28143310546875, -0.266876220703125, -0.2523193359375, -0.237762451171875, -0.22320556640625, -0.208648681640625, -0.194091796875, -0.179534912109375, -0.16497802734375, -0.150421142578125, -0.1358642578125, -0.121307373046875, -0.10675048828125, -0.092193603515625, -0.07763671875, -0.063079833984375, -0.04852294921875, -0.033966064453125, -0.0194091796875, -0.004852294921875, 0.00970458984375, 0.024261474609375, 0.038818359375, 0.053375244140625, 0.06793212890625, 0.082489013671875, 0.0970458984375, 0.111602783203125, 0.12615966796875, 0.140716552734375, 0.1552734375, 0.169830322265625, 0.18438720703125, 0.198944091796875, 0.2135009765625, 0.228057861328125, 0.24261474609375, 0.257171630859375, 0.271728515625, 0.286285400390625, 0.30084228515625, 0.315399169921875, 0.3299560546875, 0.344512939453125, 0.35906982421875, 0.373626708984375, 0.38818359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 6.0, 6.0, 6.0, 4.0, 13.0, 18.0, 15.0, 34.0, 34.0, 71.0, 109.0, 180.0, 334.0, 655.0, 1584.0, 5198.0, 39403.0, 758284.0, 223763.0, 13833.0, 2819.0, 1053.0, 458.0, 280.0, 130.0, 84.0, 69.0, 29.0, 14.0, 16.0, 16.0, 11.0, 6.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.75, -2.666107177734375, -2.58221435546875, -2.498321533203125, -2.4144287109375, -2.330535888671875, -2.24664306640625, -2.162750244140625, -2.078857421875, -1.994964599609375, -1.91107177734375, -1.827178955078125, -1.7432861328125, -1.659393310546875, -1.57550048828125, -1.491607666015625, -1.40771484375, -1.323822021484375, -1.23992919921875, -1.156036376953125, -1.0721435546875, -0.988250732421875, -0.90435791015625, -0.820465087890625, -0.736572265625, -0.652679443359375, -0.56878662109375, -0.484893798828125, -0.4010009765625, -0.317108154296875, -0.23321533203125, -0.149322509765625, -0.0654296875, 0.018463134765625, 0.10235595703125, 0.186248779296875, 0.2701416015625, 0.354034423828125, 0.43792724609375, 0.521820068359375, 0.605712890625, 0.689605712890625, 0.77349853515625, 0.857391357421875, 0.9412841796875, 1.025177001953125, 1.10906982421875, 1.192962646484375, 1.27685546875, 1.360748291015625, 1.44464111328125, 1.528533935546875, 1.6124267578125, 1.696319580078125, 1.78021240234375, 1.864105224609375, 1.947998046875, 2.031890869140625, 2.11578369140625, 2.199676513671875, 2.2835693359375, 2.367462158203125, 2.45135498046875, 2.535247802734375, 2.619140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 10.0, 7.0, 6.0, 8.0, 7.0, 12.0, 26.0, 19.0, 30.0, 38.0, 37.0, 36.0, 45.0, 56.0, 51.0, 59.0, 39.0, 57.0, 54.0, 49.0, 52.0, 53.0, 34.0, 44.0, 27.0, 29.0, 24.0, 26.0, 10.0, 15.0, 13.0, 5.0, 8.0, 4.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2890625, -2.215179443359375, -2.14129638671875, -2.067413330078125, -1.9935302734375, -1.919647216796875, -1.84576416015625, -1.771881103515625, -1.697998046875, -1.624114990234375, -1.55023193359375, -1.476348876953125, -1.4024658203125, -1.328582763671875, -1.25469970703125, -1.180816650390625, -1.10693359375, -1.033050537109375, -0.95916748046875, -0.885284423828125, -0.8114013671875, -0.737518310546875, -0.66363525390625, -0.589752197265625, -0.515869140625, -0.441986083984375, -0.36810302734375, -0.294219970703125, -0.2203369140625, -0.146453857421875, -0.07257080078125, 0.001312255859375, 0.0751953125, 0.149078369140625, 0.22296142578125, 0.296844482421875, 0.3707275390625, 0.444610595703125, 0.51849365234375, 0.592376708984375, 0.666259765625, 0.740142822265625, 0.81402587890625, 0.887908935546875, 0.9617919921875, 1.035675048828125, 1.10955810546875, 1.183441162109375, 1.25732421875, 1.331207275390625, 1.40509033203125, 1.478973388671875, 1.5528564453125, 1.626739501953125, 1.70062255859375, 1.774505615234375, 1.848388671875, 1.922271728515625, 1.99615478515625, 2.070037841796875, 2.1439208984375, 2.217803955078125, 2.29168701171875, 2.365570068359375, 2.439453125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 7.0, 7.0, 14.0, 5.0, 19.0, 21.0, 39.0, 70.0, 115.0, 219.0, 497.0, 1310.0, 5234.0, 40462.0, 814456.0, 169865.0, 12238.0, 2509.0, 743.0, 300.0, 144.0, 102.0, 45.0, 30.0, 28.0, 15.0, 11.0, 11.0, 7.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.103515625, -1.06640625, -1.029296875, -0.9921875, -0.955078125, -0.91796875, -0.880859375, -0.84375, -0.806640625, -0.76953125, -0.732421875, -0.6953125, -0.658203125, -0.62109375, -0.583984375, -0.546875, -0.509765625, -0.47265625, -0.435546875, -0.3984375, -0.361328125, -0.32421875, -0.287109375, -0.25, -0.212890625, -0.17578125, -0.138671875, -0.1015625, -0.064453125, -0.02734375, 0.009765625, 0.046875, 0.083984375, 0.12109375, 0.158203125, 0.1953125, 0.232421875, 0.26953125, 0.306640625, 0.34375, 0.380859375, 0.41796875, 0.455078125, 0.4921875, 0.529296875, 0.56640625, 0.603515625, 0.640625, 0.677734375, 0.71484375, 0.751953125, 0.7890625, 0.826171875, 0.86328125, 0.900390625, 0.9375, 0.974609375, 1.01171875, 1.048828125, 1.0859375, 1.123046875, 1.16015625, 1.197265625, 1.234375, 1.271484375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 5.0, 4.0, 7.0, 9.0, 12.0, 19.0, 14.0, 21.0, 26.0, 44.0, 44.0, 56.0, 97.0, 116.0, 142.0, 97.0, 69.0, 41.0, 35.0, 23.0, 17.0, 21.0, 16.0, 11.0, 12.0, 6.0, 9.0, 1.0, 4.0, 5.0, 0.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001316070556640625, -0.00012813881039619446, -0.00012467056512832642, -0.00012120231986045837, -0.00011773407459259033, -0.00011426582932472229, -0.00011079758405685425, -0.0001073293387889862, -0.00010386109352111816, -0.00010039284825325012, -9.692460298538208e-05, -9.345635771751404e-05, -8.9988112449646e-05, -8.651986718177795e-05, -8.305162191390991e-05, -7.958337664604187e-05, -7.611513137817383e-05, -7.264688611030579e-05, -6.917864084243774e-05, -6.57103955745697e-05, -6.224215030670166e-05, -5.877390503883362e-05, -5.5305659770965576e-05, -5.1837414503097534e-05, -4.836916923522949e-05, -4.490092396736145e-05, -4.143267869949341e-05, -3.7964433431625366e-05, -3.4496188163757324e-05, -3.102794289588928e-05, -2.755969762802124e-05, -2.4091452360153198e-05, -2.0623207092285156e-05, -1.7154961824417114e-05, -1.3686716556549072e-05, -1.021847128868103e-05, -6.750226020812988e-06, -3.2819807529449463e-06, 1.862645149230957e-07, 3.6545097827911377e-06, 7.12275505065918e-06, 1.0591000318527222e-05, 1.4059245586395264e-05, 1.7527490854263306e-05, 2.0995736122131348e-05, 2.446398138999939e-05, 2.793222665786743e-05, 3.1400471925735474e-05, 3.4868717193603516e-05, 3.833696246147156e-05, 4.18052077293396e-05, 4.527345299720764e-05, 4.8741698265075684e-05, 5.2209943532943726e-05, 5.567818880081177e-05, 5.914643406867981e-05, 6.261467933654785e-05, 6.60829246044159e-05, 6.955116987228394e-05, 7.301941514015198e-05, 7.648766040802002e-05, 7.995590567588806e-05, 8.34241509437561e-05, 8.689239621162415e-05, 9.036064147949219e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 8.0, 16.0, 13.0, 28.0, 31.0, 59.0, 60.0, 132.0, 206.0, 424.0, 747.0, 1639.0, 4677.0, 17975.0, 133073.0, 774533.0, 93612.0, 14217.0, 3961.0, 1508.0, 695.0, 338.0, 223.0, 114.0, 88.0, 48.0, 25.0, 29.0, 19.0, 10.0, 6.0, 7.0, 4.0, 3.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.1025390625, -1.0730819702148438, -1.0436248779296875, -1.0141677856445312, -0.984710693359375, -0.9552536010742188, -0.9257965087890625, -0.8963394165039062, -0.86688232421875, -0.8374252319335938, -0.8079681396484375, -0.7785110473632812, -0.749053955078125, -0.7195968627929688, -0.6901397705078125, -0.6606826782226562, -0.6312255859375, -0.6017684936523438, -0.5723114013671875, -0.5428543090820312, -0.513397216796875, -0.48394012451171875, -0.4544830322265625, -0.42502593994140625, -0.39556884765625, -0.36611175537109375, -0.3366546630859375, -0.30719757080078125, -0.277740478515625, -0.24828338623046875, -0.2188262939453125, -0.18936920166015625, -0.159912109375, -0.13045501708984375, -0.1009979248046875, -0.07154083251953125, -0.042083740234375, -0.01262664794921875, 0.0168304443359375, 0.04628753662109375, 0.07574462890625, 0.10520172119140625, 0.1346588134765625, 0.16411590576171875, 0.193572998046875, 0.22303009033203125, 0.2524871826171875, 0.28194427490234375, 0.3114013671875, 0.34085845947265625, 0.3703155517578125, 0.39977264404296875, 0.429229736328125, 0.45868682861328125, 0.4881439208984375, 0.5176010131835938, 0.54705810546875, 0.5765151977539062, 0.6059722900390625, 0.6354293823242188, 0.664886474609375, 0.6943435668945312, 0.7238006591796875, 0.7532577514648438, 0.78271484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 4.0, 7.0, 3.0, 1.0, 3.0, 4.0, 15.0, 16.0, 14.0, 21.0, 25.0, 44.0, 52.0, 57.0, 76.0, 91.0, 93.0, 95.0, 86.0, 79.0, 63.0, 33.0, 33.0, 22.0, 20.0, 10.0, 11.0, 4.0, 6.0, 4.0, 3.0, 6.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.71923828125, -0.69720458984375, -0.6751708984375, -0.65313720703125, -0.631103515625, -0.60906982421875, -0.5870361328125, -0.56500244140625, -0.54296875, -0.52093505859375, -0.4989013671875, -0.47686767578125, -0.454833984375, -0.43280029296875, -0.4107666015625, -0.38873291015625, -0.36669921875, -0.34466552734375, -0.3226318359375, -0.30059814453125, -0.278564453125, -0.25653076171875, -0.2344970703125, -0.21246337890625, -0.1904296875, -0.16839599609375, -0.1463623046875, -0.12432861328125, -0.102294921875, -0.08026123046875, -0.0582275390625, -0.03619384765625, -0.01416015625, 0.00787353515625, 0.0299072265625, 0.05194091796875, 0.073974609375, 0.09600830078125, 0.1180419921875, 0.14007568359375, 0.162109375, 0.18414306640625, 0.2061767578125, 0.22821044921875, 0.250244140625, 0.27227783203125, 0.2943115234375, 0.31634521484375, 0.33837890625, 0.36041259765625, 0.3824462890625, 0.40447998046875, 0.426513671875, 0.44854736328125, 0.4705810546875, 0.49261474609375, 0.5146484375, 0.53668212890625, 0.5587158203125, 0.58074951171875, 0.602783203125, 0.62481689453125, 0.6468505859375, 0.66888427734375, 0.69091796875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 7.0, 11.0, 26.0, 240.0, 494.0, 180.0, 37.0, 13.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.13744354248047, -42.923370361328125, -41.70929718017578, -40.4952278137207, -39.28115463256836, -38.067081451416016, -36.85301208496094, -35.638938903808594, -34.42486572265625, -33.210792541503906, -31.996721267700195, -30.782649993896484, -29.56857681274414, -28.354503631591797, -27.140432357788086, -25.926361083984375, -24.71228790283203, -23.498214721679688, -22.284143447875977, -21.070072174072266, -19.855998992919922, -18.641925811767578, -17.427854537963867, -16.213783264160156, -14.999710083007812, -13.785637855529785, -12.571565628051758, -11.35749340057373, -10.143421173095703, -8.929348945617676, -7.715276718139648, -6.501204490661621, -5.287128448486328, -4.073056221008301, -2.8589839935302734, -1.644911766052246, -0.43083953857421875, 0.7832326889038086, 1.997304916381836, 3.2113771438598633, 4.425449371337891, 5.639521598815918, 6.853593826293945, 8.067666053771973, 9.28173828125, 10.495810508728027, 11.709882736206055, 12.923954963684082, 14.13802719116211, 15.352099418640137, 16.566171646118164, 17.780242919921875, 18.99431610107422, 20.208389282226562, 21.422460556030273, 22.636531829833984, 23.850605010986328, 25.064678192138672, 26.278749465942383, 27.492820739746094, 28.706893920898438, 29.92096710205078, 31.135038375854492, 32.3491096496582, 33.56318283081055]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 7.0, 10.0, 11.0, 7.0, 10.0, 7.0, 19.0, 23.0, 16.0, 16.0, 22.0, 23.0, 41.0, 44.0, 32.0, 43.0, 32.0, 64.0, 54.0, 54.0, 47.0, 40.0, 39.0, 43.0, 39.0, 34.0, 25.0, 33.0, 29.0, 20.0, 15.0, 21.0, 6.0, 18.0, 13.0, 9.0, 12.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.848972797393799, -7.584721565246582, -7.320470333099365, -7.056219100952148, -6.791967868804932, -6.527716636657715, -6.26346492767334, -5.999214172363281, -5.734962463378906, -5.4707112312316895, -5.206459999084473, -4.942208766937256, -4.677957534790039, -4.413706302642822, -4.1494550704956055, -3.8852035999298096, -3.620952606201172, -3.356701374053955, -3.0924501419067383, -2.8281989097595215, -2.5639476776123047, -2.299696445465088, -2.035444974899292, -1.7711937427520752, -1.5069425106048584, -1.2426912784576416, -0.97843998670578, -0.7141886949539185, -0.44993746280670166, -0.18568623065948486, 0.07856512069702148, 0.3428163528442383, 0.6070671081542969, 0.8713183403015137, 1.1355695724487305, 1.3998209238052368, 1.6640721559524536, 1.9283233880996704, 2.1925747394561768, 2.4568259716033936, 2.7210772037506104, 2.985328435897827, 3.249579668045044, 3.51383113861084, 3.7780823707580566, 4.042333602905273, 4.30658483505249, 4.570836067199707, 4.835087299346924, 5.099338531494141, 5.363589763641357, 5.627840995788574, 5.892092227935791, 6.156343460083008, 6.420595169067383, 6.684845924377441, 6.949097633361816, 7.213348865509033, 7.47760009765625, 7.741851329803467, 8.006102561950684, 8.270354270935059, 8.534605026245117, 8.798856735229492, 9.06310749053955]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 7.0, 3.0, 18.0, 18.0, 23.0, 38.0, 47.0, 73.0, 106.0, 177.0, 255.0, 438.0, 754.0, 1387.0, 2869.0, 6127.0, 16019.0, 61508.0, 689009.0, 3132298.0, 228154.0, 34930.0, 10851.0, 4459.0, 1989.0, 1102.0, 569.0, 343.0, 236.0, 149.0, 109.0, 64.0, 49.0, 18.0, 22.0, 16.0, 8.0, 14.0, 9.0, 4.0, 0.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.912109375, -0.88201904296875, -0.8519287109375, -0.82183837890625, -0.791748046875, -0.76165771484375, -0.7315673828125, -0.70147705078125, -0.67138671875, -0.64129638671875, -0.6112060546875, -0.58111572265625, -0.551025390625, -0.52093505859375, -0.4908447265625, -0.46075439453125, -0.4306640625, -0.40057373046875, -0.3704833984375, -0.34039306640625, -0.310302734375, -0.28021240234375, -0.2501220703125, -0.22003173828125, -0.18994140625, -0.15985107421875, -0.1297607421875, -0.09967041015625, -0.069580078125, -0.03948974609375, -0.0093994140625, 0.02069091796875, 0.05078125, 0.08087158203125, 0.1109619140625, 0.14105224609375, 0.171142578125, 0.20123291015625, 0.2313232421875, 0.26141357421875, 0.29150390625, 0.32159423828125, 0.3516845703125, 0.38177490234375, 0.411865234375, 0.44195556640625, 0.4720458984375, 0.50213623046875, 0.5322265625, 0.56231689453125, 0.5924072265625, 0.62249755859375, 0.652587890625, 0.68267822265625, 0.7127685546875, 0.74285888671875, 0.77294921875, 0.80303955078125, 0.8331298828125, 0.86322021484375, 0.893310546875, 0.92340087890625, 0.9534912109375, 0.98358154296875, 1.013671875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 10.0, 10.0, 30.0, 21.0, 36.0, 42.0, 56.0, 56.0, 60.0, 64.0, 72.0, 74.0, 82.0, 77.0, 66.0, 46.0, 57.0, 30.0, 24.0, 19.0, 19.0, 13.0, 8.0, 8.0, 5.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74755859375, -0.725799560546875, -0.70404052734375, -0.682281494140625, -0.6605224609375, -0.638763427734375, -0.61700439453125, -0.595245361328125, -0.573486328125, -0.551727294921875, -0.52996826171875, -0.508209228515625, -0.4864501953125, -0.464691162109375, -0.44293212890625, -0.421173095703125, -0.3994140625, -0.377655029296875, -0.35589599609375, -0.334136962890625, -0.3123779296875, -0.290618896484375, -0.26885986328125, -0.247100830078125, -0.225341796875, -0.203582763671875, -0.18182373046875, -0.160064697265625, -0.1383056640625, -0.116546630859375, -0.09478759765625, -0.073028564453125, -0.05126953125, -0.029510498046875, -0.00775146484375, 0.014007568359375, 0.0357666015625, 0.057525634765625, 0.07928466796875, 0.101043701171875, 0.122802734375, 0.144561767578125, 0.16632080078125, 0.188079833984375, 0.2098388671875, 0.231597900390625, 0.25335693359375, 0.275115966796875, 0.296875, 0.318634033203125, 0.34039306640625, 0.362152099609375, 0.3839111328125, 0.405670166015625, 0.42742919921875, 0.449188232421875, 0.470947265625, 0.492706298828125, 0.51446533203125, 0.536224365234375, 0.5579833984375, 0.579742431640625, 0.60150146484375, 0.623260498046875, 0.64501953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 6.0, 10.0, 11.0, 36.0, 86.0, 223.0, 674.0, 2056.0, 7839.0, 38619.0, 903612.0, 3152373.0, 72970.0, 11534.0, 2899.0, 800.0, 276.0, 115.0, 52.0, 31.0, 22.0, 5.0, 6.0, 4.0, 8.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3642578125, -1.3120880126953125, -1.259918212890625, -1.2077484130859375, -1.15557861328125, -1.1034088134765625, -1.051239013671875, -0.9990692138671875, -0.9468994140625, -0.8947296142578125, -0.842559814453125, -0.7903900146484375, -0.73822021484375, -0.6860504150390625, -0.633880615234375, -0.5817108154296875, -0.529541015625, -0.4773712158203125, -0.425201416015625, -0.3730316162109375, -0.32086181640625, -0.2686920166015625, -0.216522216796875, -0.1643524169921875, -0.1121826171875, -0.0600128173828125, -0.007843017578125, 0.0443267822265625, 0.09649658203125, 0.1486663818359375, 0.200836181640625, 0.2530059814453125, 0.30517578125, 0.3573455810546875, 0.409515380859375, 0.4616851806640625, 0.51385498046875, 0.5660247802734375, 0.618194580078125, 0.6703643798828125, 0.7225341796875, 0.7747039794921875, 0.826873779296875, 0.8790435791015625, 0.93121337890625, 0.9833831787109375, 1.035552978515625, 1.0877227783203125, 1.139892578125, 1.1920623779296875, 1.244232177734375, 1.2964019775390625, 1.34857177734375, 1.4007415771484375, 1.452911376953125, 1.5050811767578125, 1.5572509765625, 1.6094207763671875, 1.661590576171875, 1.7137603759765625, 1.76593017578125, 1.8180999755859375, 1.870269775390625, 1.9224395751953125, 1.974609375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 1.0, 2.0, 8.0, 6.0, 9.0, 12.0, 13.0, 21.0, 22.0, 41.0, 37.0, 81.0, 155.0, 301.0, 556.0, 861.0, 803.0, 479.0, 241.0, 131.0, 92.0, 57.0, 45.0, 25.0, 12.0, 13.0, 7.0, 3.0, 14.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.015625, -0.98382568359375, -0.9520263671875, -0.92022705078125, -0.888427734375, -0.85662841796875, -0.8248291015625, -0.79302978515625, -0.76123046875, -0.72943115234375, -0.6976318359375, -0.66583251953125, -0.634033203125, -0.60223388671875, -0.5704345703125, -0.53863525390625, -0.5068359375, -0.47503662109375, -0.4432373046875, -0.41143798828125, -0.379638671875, -0.34783935546875, -0.3160400390625, -0.28424072265625, -0.25244140625, -0.22064208984375, -0.1888427734375, -0.15704345703125, -0.125244140625, -0.09344482421875, -0.0616455078125, -0.02984619140625, 0.001953125, 0.03375244140625, 0.0655517578125, 0.09735107421875, 0.129150390625, 0.16094970703125, 0.1927490234375, 0.22454833984375, 0.25634765625, 0.28814697265625, 0.3199462890625, 0.35174560546875, 0.383544921875, 0.41534423828125, 0.4471435546875, 0.47894287109375, 0.5107421875, 0.54254150390625, 0.5743408203125, 0.60614013671875, 0.637939453125, 0.66973876953125, 0.7015380859375, 0.73333740234375, 0.76513671875, 0.79693603515625, 0.8287353515625, 0.86053466796875, 0.892333984375, 0.92413330078125, 0.9559326171875, 0.98773193359375, 1.01953125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 10.0, 39.0, 137.0, 332.0, 299.0, 130.0, 28.0, 14.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.897869110107422, -11.264400482177734, -10.630931854248047, -9.99746322631836, -9.363994598388672, -8.730525970458984, -8.097058296203613, -7.463589668273926, -6.830121040344238, -6.196652412414551, -5.563183784484863, -4.929715633392334, -4.2962470054626465, -3.662778377532959, -3.0293099880218506, -2.395841598510742, -1.7623729705810547, -1.1289044618606567, -0.4954359531402588, 0.13803255558013916, 0.7715010643005371, 1.4049696922302246, 2.038438081741333, 2.6719064712524414, 3.305375099182129, 3.9388437271118164, 4.572312355041504, 5.205780506134033, 5.839249134063721, 6.472717761993408, 7.1061859130859375, 7.739654541015625, 8.37312126159668, 9.006589889526367, 9.640058517456055, 10.273527145385742, 10.90699577331543, 11.540464401245117, 12.173932075500488, 12.807400703430176, 13.440869331359863, 14.07433795928955, 14.707806587219238, 15.341275215148926, 15.974742889404297, 16.608211517333984, 17.241680145263672, 17.87514877319336, 18.508617401123047, 19.142086029052734, 19.775554656982422, 20.40902328491211, 21.042491912841797, 21.675960540771484, 22.309429168701172, 22.94289779663086, 23.576366424560547, 24.209835052490234, 24.843303680419922, 25.47677230834961, 26.110240936279297, 26.743709564208984, 27.377178192138672, 28.01064682006836, 28.644113540649414]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 11.0, 11.0, 20.0, 26.0, 27.0, 33.0, 32.0, 39.0, 49.0, 48.0, 62.0, 71.0, 66.0, 60.0, 69.0, 44.0, 52.0, 53.0, 56.0, 33.0, 26.0, 30.0, 14.0, 17.0, 8.0, 14.0, 7.0, 5.0, 7.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3191022872924805, -5.1202616691589355, -4.921421051025391, -4.722580432891846, -4.523739814758301, -4.324899196624756, -4.126058578491211, -3.927217721939087, -3.728377103805542, -3.529536485671997, -3.330695867538452, -3.131855010986328, -2.933014392852783, -2.7341737747192383, -2.5353331565856934, -2.3364925384521484, -2.1376519203186035, -1.9388113021850586, -1.7399706840515137, -1.5411299467086792, -1.3422893285751343, -1.1434487104415894, -0.9446079730987549, -0.74576735496521, -0.546926736831665, -0.34808608889579773, -0.14924544095993042, 0.04959523677825928, 0.2484358549118042, 0.4472764730453491, 0.6461172103881836, 0.8449578285217285, 1.0437984466552734, 1.2426390647888184, 1.4414796829223633, 1.6403204202651978, 1.8391610383987427, 2.038001537322998, 2.236842393875122, 2.435683012008667, 2.634523630142212, 2.833364248275757, 3.0322048664093018, 3.231045722961426, 3.4298863410949707, 3.6287269592285156, 3.8275675773620605, 4.0264081954956055, 4.22524881362915, 4.424089431762695, 4.62293004989624, 4.821770668029785, 5.02061128616333, 5.219451904296875, 5.418292999267578, 5.617133140563965, 5.815974235534668, 6.014814853668213, 6.213655471801758, 6.412496089935303, 6.611336708068848, 6.810177326202393, 7.0090179443359375, 7.207859039306641, 7.406699180603027]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 9.0, 21.0, 24.0, 41.0, 59.0, 109.0, 166.0, 287.0, 525.0, 972.0, 1793.0, 3726.0, 7829.0, 17715.0, 41417.0, 101023.0, 245950.0, 342077.0, 166233.0, 67134.0, 28246.0, 12113.0, 5460.0, 2564.0, 1376.0, 695.0, 394.0, 242.0, 130.0, 78.0, 49.0, 37.0, 23.0, 13.0, 9.0, 7.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8349609375, -0.8090896606445312, -0.7832183837890625, -0.7573471069335938, -0.731475830078125, -0.7056045532226562, -0.6797332763671875, -0.6538619995117188, -0.62799072265625, -0.6021194458007812, -0.5762481689453125, -0.5503768920898438, -0.524505615234375, -0.49863433837890625, -0.4727630615234375, -0.44689178466796875, -0.4210205078125, -0.39514923095703125, -0.3692779541015625, -0.34340667724609375, -0.317535400390625, -0.29166412353515625, -0.2657928466796875, -0.23992156982421875, -0.21405029296875, -0.18817901611328125, -0.1623077392578125, -0.13643646240234375, -0.110565185546875, -0.08469390869140625, -0.0588226318359375, -0.03295135498046875, -0.007080078125, 0.01879119873046875, 0.0446624755859375, 0.07053375244140625, 0.096405029296875, 0.12227630615234375, 0.1481475830078125, 0.17401885986328125, 0.19989013671875, 0.22576141357421875, 0.2516326904296875, 0.27750396728515625, 0.303375244140625, 0.32924652099609375, 0.3551177978515625, 0.38098907470703125, 0.4068603515625, 0.43273162841796875, 0.4586029052734375, 0.48447418212890625, 0.510345458984375, 0.5362167358398438, 0.5620880126953125, 0.5879592895507812, 0.61383056640625, 0.6397018432617188, 0.6655731201171875, 0.6914443969726562, 0.717315673828125, 0.7431869506835938, 0.7690582275390625, 0.7949295043945312, 0.82080078125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 4.0, 5.0, 8.0, 3.0, 10.0, 10.0, 23.0, 13.0, 23.0, 23.0, 27.0, 36.0, 39.0, 48.0, 50.0, 44.0, 44.0, 54.0, 55.0, 50.0, 51.0, 53.0, 41.0, 41.0, 41.0, 34.0, 34.0, 30.0, 18.0, 22.0, 17.0, 16.0, 7.0, 7.0, 4.0, 6.0, 5.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40771484375, -0.39180755615234375, -0.3759002685546875, -0.35999298095703125, -0.344085693359375, -0.32817840576171875, -0.3122711181640625, -0.29636383056640625, -0.28045654296875, -0.26454925537109375, -0.2486419677734375, -0.23273468017578125, -0.216827392578125, -0.20092010498046875, -0.1850128173828125, -0.16910552978515625, -0.1531982421875, -0.13729095458984375, -0.1213836669921875, -0.10547637939453125, -0.089569091796875, -0.07366180419921875, -0.0577545166015625, -0.04184722900390625, -0.02593994140625, -0.01003265380859375, 0.0058746337890625, 0.02178192138671875, 0.037689208984375, 0.05359649658203125, 0.0695037841796875, 0.08541107177734375, 0.101318359375, 0.11722564697265625, 0.1331329345703125, 0.14904022216796875, 0.164947509765625, 0.18085479736328125, 0.1967620849609375, 0.21266937255859375, 0.22857666015625, 0.24448394775390625, 0.2603912353515625, 0.27629852294921875, 0.292205810546875, 0.30811309814453125, 0.3240203857421875, 0.33992767333984375, 0.3558349609375, 0.37174224853515625, 0.3876495361328125, 0.40355682373046875, 0.419464111328125, 0.43537139892578125, 0.4512786865234375, 0.46718597412109375, 0.48309326171875, 0.49900054931640625, 0.5149078369140625, 0.5308151245117188, 0.546722412109375, 0.5626296997070312, 0.5785369873046875, 0.5944442749023438, 0.6103515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 8.0, 11.0, 9.0, 17.0, 20.0, 24.0, 44.0, 56.0, 105.0, 136.0, 212.0, 326.0, 576.0, 1410.0, 4207.0, 18071.0, 125449.0, 713098.0, 155479.0, 21287.0, 4748.0, 1515.0, 707.0, 370.0, 202.0, 147.0, 91.0, 52.0, 53.0, 23.0, 22.0, 21.0, 16.0, 12.0, 6.0, 5.0, 3.0, 1.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-2.009765625, -1.949859619140625, -1.88995361328125, -1.830047607421875, -1.7701416015625, -1.710235595703125, -1.65032958984375, -1.590423583984375, -1.530517578125, -1.470611572265625, -1.41070556640625, -1.350799560546875, -1.2908935546875, -1.230987548828125, -1.17108154296875, -1.111175537109375, -1.05126953125, -0.991363525390625, -0.93145751953125, -0.871551513671875, -0.8116455078125, -0.751739501953125, -0.69183349609375, -0.631927490234375, -0.572021484375, -0.512115478515625, -0.45220947265625, -0.392303466796875, -0.3323974609375, -0.272491455078125, -0.21258544921875, -0.152679443359375, -0.0927734375, -0.032867431640625, 0.02703857421875, 0.086944580078125, 0.1468505859375, 0.206756591796875, 0.26666259765625, 0.326568603515625, 0.386474609375, 0.446380615234375, 0.50628662109375, 0.566192626953125, 0.6260986328125, 0.686004638671875, 0.74591064453125, 0.805816650390625, 0.86572265625, 0.925628662109375, 0.98553466796875, 1.045440673828125, 1.1053466796875, 1.165252685546875, 1.22515869140625, 1.285064697265625, 1.344970703125, 1.404876708984375, 1.46478271484375, 1.524688720703125, 1.5845947265625, 1.644500732421875, 1.70440673828125, 1.764312744140625, 1.82421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 10.0, 12.0, 7.0, 16.0, 12.0, 16.0, 20.0, 28.0, 36.0, 33.0, 36.0, 44.0, 55.0, 46.0, 49.0, 32.0, 48.0, 49.0, 63.0, 43.0, 39.0, 37.0, 39.0, 23.0, 30.0, 33.0, 24.0, 29.0, 15.0, 15.0, 16.0, 9.0, 8.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8037109375, -1.7448883056640625, -1.686065673828125, -1.6272430419921875, -1.56842041015625, -1.5095977783203125, -1.450775146484375, -1.3919525146484375, -1.3331298828125, -1.2743072509765625, -1.215484619140625, -1.1566619873046875, -1.09783935546875, -1.0390167236328125, -0.980194091796875, -0.9213714599609375, -0.862548828125, -0.8037261962890625, -0.744903564453125, -0.6860809326171875, -0.62725830078125, -0.5684356689453125, -0.509613037109375, -0.4507904052734375, -0.3919677734375, -0.3331451416015625, -0.274322509765625, -0.2154998779296875, -0.15667724609375, -0.0978546142578125, -0.039031982421875, 0.0197906494140625, 0.07861328125, 0.1374359130859375, 0.196258544921875, 0.2550811767578125, 0.31390380859375, 0.3727264404296875, 0.431549072265625, 0.4903717041015625, 0.5491943359375, 0.6080169677734375, 0.666839599609375, 0.7256622314453125, 0.78448486328125, 0.8433074951171875, 0.902130126953125, 0.9609527587890625, 1.019775390625, 1.0785980224609375, 1.137420654296875, 1.1962432861328125, 1.25506591796875, 1.3138885498046875, 1.372711181640625, 1.4315338134765625, 1.4903564453125, 1.5491790771484375, 1.608001708984375, 1.6668243408203125, 1.72564697265625, 1.7844696044921875, 1.843292236328125, 1.9021148681640625, 1.9609375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 9.0, 8.0, 10.0, 13.0, 22.0, 41.0, 78.0, 156.0, 406.0, 1802.0, 17051.0, 893673.0, 129498.0, 4446.0, 823.0, 261.0, 103.0, 43.0, 36.0, 17.0, 10.0, 5.0, 11.0, 5.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5595703125, -1.50714111328125, -1.4547119140625, -1.40228271484375, -1.349853515625, -1.29742431640625, -1.2449951171875, -1.19256591796875, -1.14013671875, -1.08770751953125, -1.0352783203125, -0.98284912109375, -0.930419921875, -0.87799072265625, -0.8255615234375, -0.77313232421875, -0.720703125, -0.66827392578125, -0.6158447265625, -0.56341552734375, -0.510986328125, -0.45855712890625, -0.4061279296875, -0.35369873046875, -0.30126953125, -0.24884033203125, -0.1964111328125, -0.14398193359375, -0.091552734375, -0.03912353515625, 0.0133056640625, 0.06573486328125, 0.1181640625, 0.17059326171875, 0.2230224609375, 0.27545166015625, 0.327880859375, 0.38031005859375, 0.4327392578125, 0.48516845703125, 0.53759765625, 0.59002685546875, 0.6424560546875, 0.69488525390625, 0.747314453125, 0.79974365234375, 0.8521728515625, 0.90460205078125, 0.95703125, 1.00946044921875, 1.0618896484375, 1.11431884765625, 1.166748046875, 1.21917724609375, 1.2716064453125, 1.32403564453125, 1.37646484375, 1.42889404296875, 1.4813232421875, 1.53375244140625, 1.586181640625, 1.63861083984375, 1.6910400390625, 1.74346923828125, 1.7958984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 5.0, 7.0, 12.0, 3.0, 3.0, 20.0, 26.0, 30.0, 35.0, 55.0, 72.0, 78.0, 117.0, 131.0, 104.0, 74.0, 53.0, 48.0, 29.0, 24.0, 14.0, 19.0, 11.0, 6.0, 5.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011324882507324219, -0.00010940432548522949, -0.0001055598258972168, -0.0001017153263092041, -9.78708267211914e-05, -9.402632713317871e-05, -9.018182754516602e-05, -8.633732795715332e-05, -8.249282836914062e-05, -7.864832878112793e-05, -7.480382919311523e-05, -7.095932960510254e-05, -6.711483001708984e-05, -6.327033042907715e-05, -5.942583084106445e-05, -5.558133125305176e-05, -5.173683166503906e-05, -4.789233207702637e-05, -4.404783248901367e-05, -4.0203332901000977e-05, -3.635883331298828e-05, -3.2514333724975586e-05, -2.866983413696289e-05, -2.4825334548950195e-05, -2.09808349609375e-05, -1.7136335372924805e-05, -1.329183578491211e-05, -9.447336196899414e-06, -5.602836608886719e-06, -1.7583370208740234e-06, 2.086162567138672e-06, 5.930662155151367e-06, 9.775161743164062e-06, 1.3619661331176758e-05, 1.7464160919189453e-05, 2.130866050720215e-05, 2.5153160095214844e-05, 2.899765968322754e-05, 3.2842159271240234e-05, 3.668665885925293e-05, 4.0531158447265625e-05, 4.437565803527832e-05, 4.8220157623291016e-05, 5.206465721130371e-05, 5.5909156799316406e-05, 5.97536563873291e-05, 6.35981559753418e-05, 6.744265556335449e-05, 7.128715515136719e-05, 7.513165473937988e-05, 7.897615432739258e-05, 8.282065391540527e-05, 8.666515350341797e-05, 9.050965309143066e-05, 9.435415267944336e-05, 9.819865226745605e-05, 0.00010204315185546875, 0.00010588765144348145, 0.00010973215103149414, 0.00011357665061950684, 0.00011742115020751953, 0.00012126564979553223, 0.00012511014938354492, 0.00012895464897155762, 0.0001327991485595703]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 4.0, 8.0, 12.0, 12.0, 19.0, 19.0, 42.0, 57.0, 76.0, 140.0, 259.0, 542.0, 1118.0, 2978.0, 10661.0, 61410.0, 653952.0, 277554.0, 29417.0, 6404.0, 2079.0, 850.0, 405.0, 202.0, 126.0, 70.0, 41.0, 25.0, 16.0, 19.0, 9.0, 11.0, 7.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66796875, -0.6430587768554688, -0.6181488037109375, -0.5932388305664062, -0.568328857421875, -0.5434188842773438, -0.5185089111328125, -0.49359893798828125, -0.46868896484375, -0.44377899169921875, -0.4188690185546875, -0.39395904541015625, -0.369049072265625, -0.34413909912109375, -0.3192291259765625, -0.29431915283203125, -0.2694091796875, -0.24449920654296875, -0.2195892333984375, -0.19467926025390625, -0.169769287109375, -0.14485931396484375, -0.1199493408203125, -0.09503936767578125, -0.07012939453125, -0.04521942138671875, -0.0203094482421875, 0.00460052490234375, 0.029510498046875, 0.05442047119140625, 0.0793304443359375, 0.10424041748046875, 0.129150390625, 0.15406036376953125, 0.1789703369140625, 0.20388031005859375, 0.228790283203125, 0.25370025634765625, 0.2786102294921875, 0.30352020263671875, 0.32843017578125, 0.35334014892578125, 0.3782501220703125, 0.40316009521484375, 0.428070068359375, 0.45298004150390625, 0.4778900146484375, 0.5027999877929688, 0.5277099609375, 0.5526199340820312, 0.5775299072265625, 0.6024398803710938, 0.627349853515625, 0.6522598266601562, 0.6771697998046875, 0.7020797729492188, 0.72698974609375, 0.7518997192382812, 0.7768096923828125, 0.8017196655273438, 0.826629638671875, 0.8515396118164062, 0.8764495849609375, 0.9013595581054688, 0.92626953125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 5.0, 3.0, 12.0, 13.0, 21.0, 11.0, 27.0, 30.0, 36.0, 44.0, 77.0, 79.0, 82.0, 85.0, 69.0, 59.0, 74.0, 52.0, 47.0, 27.0, 34.0, 28.0, 17.0, 12.0, 13.0, 6.0, 6.0, 3.0, 7.0, 3.0, 6.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.53076171875, -0.5150794982910156, -0.49939727783203125, -0.4837150573730469, -0.4680328369140625, -0.4523506164550781, -0.43666839599609375, -0.4209861755371094, -0.405303955078125, -0.3896217346191406, -0.37393951416015625, -0.3582572937011719, -0.3425750732421875, -0.3268928527832031, -0.31121063232421875, -0.2955284118652344, -0.27984619140625, -0.2641639709472656, -0.24848175048828125, -0.23279953002929688, -0.2171173095703125, -0.20143508911132812, -0.18575286865234375, -0.17007064819335938, -0.154388427734375, -0.13870620727539062, -0.12302398681640625, -0.10734176635742188, -0.0916595458984375, -0.07597732543945312, -0.06029510498046875, -0.044612884521484375, -0.0289306640625, -0.013248443603515625, 0.00243377685546875, 0.018115997314453125, 0.0337982177734375, 0.049480438232421875, 0.06516265869140625, 0.08084487915039062, 0.096527099609375, 0.11220932006835938, 0.12789154052734375, 0.14357376098632812, 0.1592559814453125, 0.17493820190429688, 0.19062042236328125, 0.20630264282226562, 0.22198486328125, 0.23766708374023438, 0.25334930419921875, 0.2690315246582031, 0.2847137451171875, 0.3003959655761719, 0.31607818603515625, 0.3317604064941406, 0.347442626953125, 0.3631248474121094, 0.37880706787109375, 0.3944892883300781, 0.4101715087890625, 0.4258537292480469, 0.44153594970703125, 0.4572181701660156, 0.472900390625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 16.0, 46.0, 176.0, 394.0, 249.0, 75.0, 24.0, 7.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.123693466186523, -28.303258895874023, -27.482824325561523, -26.66238784790039, -25.84195327758789, -25.02151870727539, -24.20108413696289, -23.38064956665039, -22.560213088989258, -21.739778518676758, -20.919343948364258, -20.098907470703125, -19.278472900390625, -18.458038330078125, -17.637603759765625, -16.817169189453125, -15.996733665466309, -15.176299095153809, -14.355863571166992, -13.535429000854492, -12.714993476867676, -11.894558906555176, -11.07412338256836, -10.25368881225586, -9.43325424194336, -8.61281967163086, -7.792384147644043, -6.971949577331543, -6.151514053344727, -5.331079483032227, -4.510644435882568, -3.69020938873291, -2.8697738647460938, -2.0493388175964355, -1.228903889656067, -0.40846896171569824, 0.41196608543395996, 1.232400894165039, 2.0528359413146973, 2.8732709884643555, 3.6937060356140137, 4.514141082763672, 5.33457612991333, 6.155011177062988, 6.975445747375488, 7.7958807945251465, 8.616315841674805, 9.436750411987305, 10.257185935974121, 11.077620506286621, 11.898056030273438, 12.718490600585938, 13.538926124572754, 14.359360694885254, 15.17979621887207, 16.00023078918457, 16.82066535949707, 17.64109992980957, 18.46153450012207, 19.281970977783203, 20.102405548095703, 20.922840118408203, 21.743274688720703, 22.563709259033203, 23.384145736694336]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 3.0, 5.0, 2.0, 10.0, 9.0, 17.0, 21.0, 17.0, 19.0, 21.0, 17.0, 21.0, 22.0, 28.0, 30.0, 39.0, 33.0, 38.0, 50.0, 40.0, 68.0, 48.0, 62.0, 46.0, 35.0, 26.0, 31.0, 32.0, 33.0, 19.0, 25.0, 14.0, 14.0, 13.0, 13.0, 9.0, 13.0, 9.0, 14.0, 4.0, 5.0, 6.0, 3.0, 1.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.330990791320801, -6.11978006362915, -5.908569812774658, -5.697359085083008, -5.486148357391357, -5.274937629699707, -5.063727378845215, -4.8525166511535645, -4.641305923461914, -4.430095195770264, -4.2188849449157715, -4.007674217224121, -3.7964634895324707, -3.5852530002593994, -3.374042510986328, -3.1628317832946777, -2.9516215324401855, -2.7404110431671143, -2.529200315475464, -2.3179898262023926, -2.106779098510742, -1.895568609237671, -1.6843581199645996, -1.4731475114822388, -1.261936902999878, -1.050726294517517, -0.839515745639801, -0.628305196762085, -0.4170945882797241, -0.20588397979736328, 0.005326509475708008, 0.21653711795806885, 0.4277472496032715, 0.6389578580856323, 0.8501684069633484, 1.0613789558410645, 1.2725895643234253, 1.4838001728057861, 1.6950106620788574, 1.9062212705612183, 2.117431879043579, 2.3286423683166504, 2.539853096008301, 2.751063585281372, 2.9622740745544434, 3.1734848022460938, 3.384695291519165, 3.5959057807922363, 3.8071165084838867, 4.018327236175537, 4.229537487030029, 4.44074821472168, 4.65195894241333, 4.8631696701049805, 5.074379920959473, 5.285590648651123, 5.496801376342773, 5.708012104034424, 5.919222354888916, 6.130433082580566, 6.341643810272217, 6.552854537963867, 6.764064788818359, 6.97527551651001, 7.186485767364502]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 6.0, 4.0, 6.0, 14.0, 15.0, 32.0, 47.0, 75.0, 135.0, 220.0, 360.0, 717.0, 1470.0, 3503.0, 9493.0, 33026.0, 186631.0, 2316764.0, 1480763.0, 123499.0, 24642.0, 7493.0, 2714.0, 1219.0, 606.0, 331.0, 176.0, 111.0, 77.0, 43.0, 26.0, 16.0, 14.0, 7.0, 11.0, 5.0, 5.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6611328125, -0.6334686279296875, -0.605804443359375, -0.5781402587890625, -0.55047607421875, -0.5228118896484375, -0.495147705078125, -0.4674835205078125, -0.4398193359375, -0.4121551513671875, -0.384490966796875, -0.3568267822265625, -0.32916259765625, -0.3014984130859375, -0.273834228515625, -0.2461700439453125, -0.218505859375, -0.1908416748046875, -0.163177490234375, -0.1355133056640625, -0.10784912109375, -0.0801849365234375, -0.052520751953125, -0.0248565673828125, 0.0028076171875, 0.0304718017578125, 0.058135986328125, 0.0858001708984375, 0.11346435546875, 0.1411285400390625, 0.168792724609375, 0.1964569091796875, 0.22412109375, 0.2517852783203125, 0.279449462890625, 0.3071136474609375, 0.33477783203125, 0.3624420166015625, 0.390106201171875, 0.4177703857421875, 0.4454345703125, 0.4730987548828125, 0.500762939453125, 0.5284271240234375, 0.55609130859375, 0.5837554931640625, 0.611419677734375, 0.6390838623046875, 0.666748046875, 0.6944122314453125, 0.722076416015625, 0.7497406005859375, 0.77740478515625, 0.8050689697265625, 0.832733154296875, 0.8603973388671875, 0.8880615234375, 0.9157257080078125, 0.943389892578125, 0.9710540771484375, 0.99871826171875, 1.0263824462890625, 1.054046630859375, 1.0817108154296875, 1.109375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 8.0, 7.0, 8.0, 16.0, 6.0, 18.0, 13.0, 23.0, 32.0, 25.0, 34.0, 35.0, 57.0, 44.0, 61.0, 47.0, 48.0, 57.0, 41.0, 56.0, 46.0, 39.0, 40.0, 35.0, 39.0, 30.0, 24.0, 23.0, 20.0, 21.0, 14.0, 6.0, 9.0, 7.0, 4.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389892578125, -0.3762359619140625, -0.362579345703125, -0.3489227294921875, -0.33526611328125, -0.3216094970703125, -0.307952880859375, -0.2942962646484375, -0.2806396484375, -0.2669830322265625, -0.253326416015625, -0.2396697998046875, -0.22601318359375, -0.2123565673828125, -0.198699951171875, -0.1850433349609375, -0.17138671875, -0.1577301025390625, -0.144073486328125, -0.1304168701171875, -0.11676025390625, -0.1031036376953125, -0.089447021484375, -0.0757904052734375, -0.0621337890625, -0.0484771728515625, -0.034820556640625, -0.0211639404296875, -0.00750732421875, 0.0061492919921875, 0.019805908203125, 0.0334625244140625, 0.047119140625, 0.0607757568359375, 0.074432373046875, 0.0880889892578125, 0.10174560546875, 0.1154022216796875, 0.129058837890625, 0.1427154541015625, 0.1563720703125, 0.1700286865234375, 0.183685302734375, 0.1973419189453125, 0.21099853515625, 0.2246551513671875, 0.238311767578125, 0.2519683837890625, 0.265625, 0.2792816162109375, 0.292938232421875, 0.3065948486328125, 0.32025146484375, 0.3339080810546875, 0.347564697265625, 0.3612213134765625, 0.3748779296875, 0.3885345458984375, 0.402191162109375, 0.4158477783203125, 0.42950439453125, 0.4431610107421875, 0.456817626953125, 0.4704742431640625, 0.484130859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 4.0, 9.0, 11.0, 17.0, 22.0, 33.0, 49.0, 74.0, 146.0, 304.0, 660.0, 1683.0, 5368.0, 24288.0, 179869.0, 3285940.0, 637145.0, 47069.0, 8248.0, 2088.0, 673.0, 259.0, 112.0, 71.0, 35.0, 30.0, 20.0, 13.0, 9.0, 7.0, 8.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.646484375, -1.6039581298828125, -1.561431884765625, -1.5189056396484375, -1.47637939453125, -1.4338531494140625, -1.391326904296875, -1.3488006591796875, -1.3062744140625, -1.2637481689453125, -1.221221923828125, -1.1786956787109375, -1.13616943359375, -1.0936431884765625, -1.051116943359375, -1.0085906982421875, -0.966064453125, -0.9235382080078125, -0.881011962890625, -0.8384857177734375, -0.79595947265625, -0.7534332275390625, -0.710906982421875, -0.6683807373046875, -0.6258544921875, -0.5833282470703125, -0.540802001953125, -0.4982757568359375, -0.45574951171875, -0.4132232666015625, -0.370697021484375, -0.3281707763671875, -0.28564453125, -0.2431182861328125, -0.200592041015625, -0.1580657958984375, -0.11553955078125, -0.0730133056640625, -0.030487060546875, 0.0120391845703125, 0.0545654296875, 0.0970916748046875, 0.139617919921875, 0.1821441650390625, 0.22467041015625, 0.2671966552734375, 0.309722900390625, 0.3522491455078125, 0.394775390625, 0.4373016357421875, 0.479827880859375, 0.5223541259765625, 0.56488037109375, 0.6074066162109375, 0.649932861328125, 0.6924591064453125, 0.7349853515625, 0.7775115966796875, 0.820037841796875, 0.8625640869140625, 0.90509033203125, 0.9476165771484375, 0.990142822265625, 1.0326690673828125, 1.0751953125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 4.0, 5.0, 6.0, 6.0, 8.0, 17.0, 32.0, 37.0, 53.0, 92.0, 104.0, 183.0, 319.0, 612.0, 938.0, 738.0, 373.0, 214.0, 128.0, 69.0, 43.0, 24.0, 19.0, 22.0, 6.0, 5.0, 3.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.58984375, -1.54864501953125, -1.5074462890625, -1.46624755859375, -1.425048828125, -1.38385009765625, -1.3426513671875, -1.30145263671875, -1.26025390625, -1.21905517578125, -1.1778564453125, -1.13665771484375, -1.095458984375, -1.05426025390625, -1.0130615234375, -0.97186279296875, -0.9306640625, -0.88946533203125, -0.8482666015625, -0.80706787109375, -0.765869140625, -0.72467041015625, -0.6834716796875, -0.64227294921875, -0.60107421875, -0.55987548828125, -0.5186767578125, -0.47747802734375, -0.436279296875, -0.39508056640625, -0.3538818359375, -0.31268310546875, -0.271484375, -0.23028564453125, -0.1890869140625, -0.14788818359375, -0.106689453125, -0.06549072265625, -0.0242919921875, 0.01690673828125, 0.05810546875, 0.09930419921875, 0.1405029296875, 0.18170166015625, 0.222900390625, 0.26409912109375, 0.3052978515625, 0.34649658203125, 0.3876953125, 0.42889404296875, 0.4700927734375, 0.51129150390625, 0.552490234375, 0.59368896484375, 0.6348876953125, 0.67608642578125, 0.71728515625, 0.75848388671875, 0.7996826171875, 0.84088134765625, 0.882080078125, 0.92327880859375, 0.9644775390625, 1.00567626953125, 1.046875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 21.0, 45.0, 69.0, 142.0, 188.0, 192.0, 150.0, 75.0, 47.0, 14.0, 10.0, 8.0, 1.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.025124549865723, -14.634866714477539, -14.244609832763672, -13.854352951049805, -13.464095115661621, -13.073837280273438, -12.68358039855957, -12.293323516845703, -11.90306568145752, -11.512807846069336, -11.122550964355469, -10.732294082641602, -10.342036247253418, -9.951778411865234, -9.561521530151367, -9.1712646484375, -8.781006813049316, -8.390748977661133, -8.000492095947266, -7.61023473739624, -7.219977378845215, -6.8297200202941895, -6.439462661743164, -6.049205303192139, -5.658947944641113, -5.268690586090088, -4.8784332275390625, -4.488175868988037, -4.097918510437012, -3.7076611518859863, -3.317403793334961, -2.9271464347839355, -2.5368881225585938, -2.1466307640075684, -1.756373405456543, -1.3661160469055176, -0.9758586883544922, -0.5856013298034668, -0.1953439712524414, 0.19491338729858398, 0.5851707458496094, 0.9754281044006348, 1.3656854629516602, 1.7559428215026855, 2.146200180053711, 2.5364575386047363, 2.9267148971557617, 3.316972255706787, 3.7072296142578125, 4.097486972808838, 4.487744331359863, 4.878001689910889, 5.268259048461914, 5.6585164070129395, 6.048773765563965, 6.43903112411499, 6.829288482666016, 7.219545841217041, 7.609803199768066, 8.00006103515625, 8.390317916870117, 8.780574798583984, 9.170832633972168, 9.561090469360352, 9.951347351074219]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 7.0, 12.0, 9.0, 7.0, 10.0, 15.0, 19.0, 21.0, 28.0, 24.0, 31.0, 37.0, 41.0, 46.0, 38.0, 39.0, 39.0, 48.0, 39.0, 61.0, 40.0, 33.0, 42.0, 38.0, 37.0, 33.0, 34.0, 29.0, 23.0, 19.0, 19.0, 16.0, 15.0, 10.0, 11.0, 4.0, 7.0, 4.0, 1.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.922654151916504, -4.765636920928955, -4.608619689941406, -4.451601982116699, -4.29458475112915, -4.137567520141602, -3.9805500507354736, -3.8235325813293457, -3.666515350341797, -3.509498119354248, -3.35248064994812, -3.195463180541992, -3.0384459495544434, -2.8814287185668945, -2.7244112491607666, -2.5673937797546387, -2.41037654876709, -2.253359317779541, -2.096341848373413, -1.9393244981765747, -1.7823071479797363, -1.625289797782898, -1.4682724475860596, -1.3112550973892212, -1.1542377471923828, -0.9972203969955444, -0.840203046798706, -0.6831856966018677, -0.5261683464050293, -0.3691509962081909, -0.21213364601135254, -0.05511629581451416, 0.10190105438232422, 0.2589184045791626, 0.415935754776001, 0.5729531049728394, 0.7299704551696777, 0.8869878053665161, 1.0440051555633545, 1.2010225057601929, 1.3580398559570312, 1.5150572061538696, 1.672074556350708, 1.8290919065475464, 1.9861092567443848, 2.1431264877319336, 2.3001439571380615, 2.4571614265441895, 2.6141786575317383, 2.771195888519287, 2.928213357925415, 3.085230827331543, 3.242248058319092, 3.3992652893066406, 3.5562827587127686, 3.7133002281188965, 3.8703174591064453, 4.027334690093994, 4.184351921081543, 4.34136962890625, 4.498386859893799, 4.655404090881348, 4.812421798706055, 4.9694390296936035, 5.126456260681152]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 7.0, 9.0, 8.0, 10.0, 20.0, 37.0, 65.0, 90.0, 131.0, 246.0, 430.0, 983.0, 2110.0, 5652.0, 17501.0, 56199.0, 178475.0, 407428.0, 256547.0, 83468.0, 25369.0, 8296.0, 2887.0, 1265.0, 577.0, 310.0, 173.0, 101.0, 56.0, 40.0, 29.0, 13.0, 10.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.2236328125, -1.1902618408203125, -1.156890869140625, -1.1235198974609375, -1.09014892578125, -1.0567779541015625, -1.023406982421875, -0.9900360107421875, -0.9566650390625, -0.9232940673828125, -0.889923095703125, -0.8565521240234375, -0.82318115234375, -0.7898101806640625, -0.756439208984375, -0.7230682373046875, -0.689697265625, -0.6563262939453125, -0.622955322265625, -0.5895843505859375, -0.55621337890625, -0.5228424072265625, -0.489471435546875, -0.4561004638671875, -0.4227294921875, -0.3893585205078125, -0.355987548828125, -0.3226165771484375, -0.28924560546875, -0.2558746337890625, -0.222503662109375, -0.1891326904296875, -0.15576171875, -0.1223907470703125, -0.089019775390625, -0.0556488037109375, -0.02227783203125, 0.0110931396484375, 0.044464111328125, 0.0778350830078125, 0.1112060546875, 0.1445770263671875, 0.177947998046875, 0.2113189697265625, 0.24468994140625, 0.2780609130859375, 0.311431884765625, 0.3448028564453125, 0.378173828125, 0.4115447998046875, 0.444915771484375, 0.4782867431640625, 0.51165771484375, 0.5450286865234375, 0.578399658203125, 0.6117706298828125, 0.6451416015625, 0.6785125732421875, 0.711883544921875, 0.7452545166015625, 0.77862548828125, 0.8119964599609375, 0.845367431640625, 0.8787384033203125, 0.912109375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 6.0, 12.0, 11.0, 16.0, 18.0, 21.0, 19.0, 31.0, 33.0, 31.0, 26.0, 35.0, 51.0, 30.0, 42.0, 55.0, 48.0, 43.0, 43.0, 30.0, 41.0, 45.0, 48.0, 30.0, 37.0, 31.0, 27.0, 29.0, 12.0, 15.0, 12.0, 16.0, 13.0, 9.0, 10.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.41064453125, -0.3987236022949219, -0.38680267333984375, -0.3748817443847656, -0.3629608154296875, -0.3510398864746094, -0.33911895751953125, -0.3271980285644531, -0.315277099609375, -0.3033561706542969, -0.29143524169921875, -0.2795143127441406, -0.2675933837890625, -0.2556724548339844, -0.24375152587890625, -0.23183059692382812, -0.21990966796875, -0.20798873901367188, -0.19606781005859375, -0.18414688110351562, -0.1722259521484375, -0.16030502319335938, -0.14838409423828125, -0.13646316528320312, -0.124542236328125, -0.11262130737304688, -0.10070037841796875, -0.08877944946289062, -0.0768585205078125, -0.06493759155273438, -0.05301666259765625, -0.041095733642578125, -0.0291748046875, -0.017253875732421875, -0.00533294677734375, 0.006587982177734375, 0.0185089111328125, 0.030429840087890625, 0.04235076904296875, 0.054271697998046875, 0.066192626953125, 0.07811355590820312, 0.09003448486328125, 0.10195541381835938, 0.1138763427734375, 0.12579727172851562, 0.13771820068359375, 0.14963912963867188, 0.16156005859375, 0.17348098754882812, 0.18540191650390625, 0.19732284545898438, 0.2092437744140625, 0.22116470336914062, 0.23308563232421875, 0.24500656127929688, 0.256927490234375, 0.2688484191894531, 0.28076934814453125, 0.2926902770996094, 0.3046112060546875, 0.3165321350097656, 0.32845306396484375, 0.3403739929199219, 0.352294921875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 7.0, 12.0, 9.0, 13.0, 18.0, 24.0, 35.0, 63.0, 84.0, 100.0, 159.0, 221.0, 357.0, 547.0, 895.0, 1734.0, 3955.0, 14268.0, 110463.0, 739092.0, 149609.0, 17739.0, 4479.0, 1896.0, 999.0, 599.0, 367.0, 225.0, 170.0, 121.0, 69.0, 50.0, 40.0, 32.0, 22.0, 19.0, 18.0, 8.0, 8.0, 7.0, 10.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.998046875, -1.9366912841796875, -1.875335693359375, -1.8139801025390625, -1.75262451171875, -1.6912689208984375, -1.629913330078125, -1.5685577392578125, -1.5072021484375, -1.4458465576171875, -1.384490966796875, -1.3231353759765625, -1.26177978515625, -1.2004241943359375, -1.139068603515625, -1.0777130126953125, -1.016357421875, -0.9550018310546875, -0.893646240234375, -0.8322906494140625, -0.77093505859375, -0.7095794677734375, -0.648223876953125, -0.5868682861328125, -0.5255126953125, -0.4641571044921875, -0.402801513671875, -0.3414459228515625, -0.28009033203125, -0.2187347412109375, -0.157379150390625, -0.0960235595703125, -0.03466796875, 0.0266876220703125, 0.088043212890625, 0.1493988037109375, 0.21075439453125, 0.2721099853515625, 0.333465576171875, 0.3948211669921875, 0.4561767578125, 0.5175323486328125, 0.578887939453125, 0.6402435302734375, 0.70159912109375, 0.7629547119140625, 0.824310302734375, 0.8856658935546875, 0.947021484375, 1.0083770751953125, 1.069732666015625, 1.1310882568359375, 1.19244384765625, 1.2537994384765625, 1.315155029296875, 1.3765106201171875, 1.4378662109375, 1.4992218017578125, 1.560577392578125, 1.6219329833984375, 1.68328857421875, 1.7446441650390625, 1.805999755859375, 1.8673553466796875, 1.9287109375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 5.0, 7.0, 7.0, 7.0, 18.0, 12.0, 18.0, 28.0, 20.0, 32.0, 25.0, 29.0, 52.0, 44.0, 51.0, 40.0, 51.0, 45.0, 45.0, 52.0, 40.0, 49.0, 49.0, 49.0, 39.0, 30.0, 28.0, 18.0, 30.0, 19.0, 16.0, 11.0, 10.0, 10.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.869140625, -1.812255859375, -1.75537109375, -1.698486328125, -1.6416015625, -1.584716796875, -1.52783203125, -1.470947265625, -1.4140625, -1.357177734375, -1.30029296875, -1.243408203125, -1.1865234375, -1.129638671875, -1.07275390625, -1.015869140625, -0.958984375, -0.902099609375, -0.84521484375, -0.788330078125, -0.7314453125, -0.674560546875, -0.61767578125, -0.560791015625, -0.50390625, -0.447021484375, -0.39013671875, -0.333251953125, -0.2763671875, -0.219482421875, -0.16259765625, -0.105712890625, -0.048828125, 0.008056640625, 0.06494140625, 0.121826171875, 0.1787109375, 0.235595703125, 0.29248046875, 0.349365234375, 0.40625, 0.463134765625, 0.52001953125, 0.576904296875, 0.6337890625, 0.690673828125, 0.74755859375, 0.804443359375, 0.861328125, 0.918212890625, 0.97509765625, 1.031982421875, 1.0888671875, 1.145751953125, 1.20263671875, 1.259521484375, 1.31640625, 1.373291015625, 1.43017578125, 1.487060546875, 1.5439453125, 1.600830078125, 1.65771484375, 1.714599609375, 1.771484375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 12.0, 3.0, 6.0, 10.0, 17.0, 12.0, 26.0, 31.0, 49.0, 62.0, 109.0, 133.0, 266.0, 493.0, 1261.0, 4821.0, 31269.0, 586000.0, 390137.0, 27191.0, 4242.0, 1171.0, 490.0, 259.0, 147.0, 95.0, 54.0, 49.0, 33.0, 22.0, 21.0, 13.0, 5.0, 14.0, 8.0, 4.0, 3.0, 2.0, 7.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7734375, -0.7476272583007812, -0.7218170166015625, -0.6960067749023438, -0.670196533203125, -0.6443862915039062, -0.6185760498046875, -0.5927658081054688, -0.56695556640625, -0.5411453247070312, -0.5153350830078125, -0.48952484130859375, -0.463714599609375, -0.43790435791015625, -0.4120941162109375, -0.38628387451171875, -0.3604736328125, -0.33466339111328125, -0.3088531494140625, -0.28304290771484375, -0.257232666015625, -0.23142242431640625, -0.2056121826171875, -0.17980194091796875, -0.15399169921875, -0.12818145751953125, -0.1023712158203125, -0.07656097412109375, -0.050750732421875, -0.02494049072265625, 0.0008697509765625, 0.02667999267578125, 0.052490234375, 0.07830047607421875, 0.1041107177734375, 0.12992095947265625, 0.155731201171875, 0.18154144287109375, 0.2073516845703125, 0.23316192626953125, 0.25897216796875, 0.28478240966796875, 0.3105926513671875, 0.33640289306640625, 0.362213134765625, 0.38802337646484375, 0.4138336181640625, 0.43964385986328125, 0.4654541015625, 0.49126434326171875, 0.5170745849609375, 0.5428848266601562, 0.568695068359375, 0.5945053100585938, 0.6203155517578125, 0.6461257934570312, 0.67193603515625, 0.6977462768554688, 0.7235565185546875, 0.7493667602539062, 0.775177001953125, 0.8009872436523438, 0.8267974853515625, 0.8526077270507812, 0.87841796875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 11.0, 9.0, 7.0, 13.0, 15.0, 18.0, 19.0, 28.0, 40.0, 40.0, 57.0, 69.0, 94.0, 106.0, 113.0, 92.0, 45.0, 41.0, 42.0, 31.0, 26.0, 19.0, 14.0, 18.0, 6.0, 8.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001480579376220703, -0.00014398153871297836, -0.00013990513980388641, -0.00013582874089479446, -0.00013175234198570251, -0.00012767594307661057, -0.00012359954416751862, -0.00011952314525842667, -0.00011544674634933472, -0.00011137034744024277, -0.00010729394853115082, -0.00010321754962205887, -9.914115071296692e-05, -9.506475180387497e-05, -9.098835289478302e-05, -8.691195398569107e-05, -8.283555507659912e-05, -7.875915616750717e-05, -7.468275725841522e-05, -7.060635834932327e-05, -6.652995944023132e-05, -6.245356053113937e-05, -5.8377161622047424e-05, -5.4300762712955475e-05, -5.0224363803863525e-05, -4.6147964894771576e-05, -4.2071565985679626e-05, -3.799516707658768e-05, -3.391876816749573e-05, -2.9842369258403778e-05, -2.576597034931183e-05, -2.168957144021988e-05, -1.761317253112793e-05, -1.353677362203598e-05, -9.46037471294403e-06, -5.383975803852081e-06, -1.3075768947601318e-06, 2.7688220143318176e-06, 6.845220923423767e-06, 1.0921619832515717e-05, 1.4998018741607666e-05, 1.9074417650699615e-05, 2.3150816559791565e-05, 2.7227215468883514e-05, 3.1303614377975464e-05, 3.538001328706741e-05, 3.945641219615936e-05, 4.353281110525131e-05, 4.760921001434326e-05, 5.168560892343521e-05, 5.576200783252716e-05, 5.983840674161911e-05, 6.391480565071106e-05, 6.799120455980301e-05, 7.206760346889496e-05, 7.614400237798691e-05, 8.022040128707886e-05, 8.429680019617081e-05, 8.837319910526276e-05, 9.24495980143547e-05, 9.652599692344666e-05, 0.0001006023958325386, 0.00010467879474163055, 0.0001087551936507225, 0.00011283159255981445]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 13.0, 11.0, 6.0, 23.0, 29.0, 60.0, 93.0, 157.0, 306.0, 572.0, 1334.0, 3991.0, 17319.0, 226745.0, 753153.0, 34774.0, 6426.0, 1971.0, 764.0, 341.0, 165.0, 116.0, 62.0, 39.0, 27.0, 11.0, 13.0, 11.0, 9.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9375, -0.90643310546875, -0.8753662109375, -0.84429931640625, -0.813232421875, -0.78216552734375, -0.7510986328125, -0.72003173828125, -0.68896484375, -0.65789794921875, -0.6268310546875, -0.59576416015625, -0.564697265625, -0.53363037109375, -0.5025634765625, -0.47149658203125, -0.4404296875, -0.40936279296875, -0.3782958984375, -0.34722900390625, -0.316162109375, -0.28509521484375, -0.2540283203125, -0.22296142578125, -0.19189453125, -0.16082763671875, -0.1297607421875, -0.09869384765625, -0.067626953125, -0.03656005859375, -0.0054931640625, 0.02557373046875, 0.056640625, 0.08770751953125, 0.1187744140625, 0.14984130859375, 0.180908203125, 0.21197509765625, 0.2430419921875, 0.27410888671875, 0.30517578125, 0.33624267578125, 0.3673095703125, 0.39837646484375, 0.429443359375, 0.46051025390625, 0.4915771484375, 0.52264404296875, 0.5537109375, 0.58477783203125, 0.6158447265625, 0.64691162109375, 0.677978515625, 0.70904541015625, 0.7401123046875, 0.77117919921875, 0.80224609375, 0.83331298828125, 0.8643798828125, 0.89544677734375, 0.926513671875, 0.95758056640625, 0.9886474609375, 1.01971435546875, 1.05078125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 7.0, 6.0, 3.0, 6.0, 14.0, 19.0, 33.0, 44.0, 68.0, 86.0, 131.0, 121.0, 112.0, 107.0, 74.0, 57.0, 33.0, 24.0, 15.0, 16.0, 8.0, 8.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7607421875, -0.7374954223632812, -0.7142486572265625, -0.6910018920898438, -0.667755126953125, -0.6445083618164062, -0.6212615966796875, -0.5980148315429688, -0.57476806640625, -0.5515213012695312, -0.5282745361328125, -0.5050277709960938, -0.481781005859375, -0.45853424072265625, -0.4352874755859375, -0.41204071044921875, -0.3887939453125, -0.36554718017578125, -0.3423004150390625, -0.31905364990234375, -0.295806884765625, -0.27256011962890625, -0.2493133544921875, -0.22606658935546875, -0.20281982421875, -0.17957305908203125, -0.1563262939453125, -0.13307952880859375, -0.109832763671875, -0.08658599853515625, -0.0633392333984375, -0.04009246826171875, -0.016845703125, 0.00640106201171875, 0.0296478271484375, 0.05289459228515625, 0.076141357421875, 0.09938812255859375, 0.1226348876953125, 0.14588165283203125, 0.16912841796875, 0.19237518310546875, 0.2156219482421875, 0.23886871337890625, 0.262115478515625, 0.28536224365234375, 0.3086090087890625, 0.33185577392578125, 0.3551025390625, 0.37834930419921875, 0.4015960693359375, 0.42484283447265625, 0.448089599609375, 0.47133636474609375, 0.4945831298828125, 0.5178298950195312, 0.54107666015625, 0.5643234252929688, 0.5875701904296875, 0.6108169555664062, 0.634063720703125, 0.6573104858398438, 0.6805572509765625, 0.7038040161132812, 0.72705078125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 5.0, 23.0, 30.0, 64.0, 101.0, 155.0, 195.0, 152.0, 97.0, 72.0, 39.0, 24.0, 12.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.00645637512207, -6.683718204498291, -6.360980033874512, -6.038241863250732, -5.715503692626953, -5.392765998840332, -5.070027828216553, -4.747289657592773, -4.424551486968994, -4.101813316345215, -3.7790751457214355, -3.4563372135162354, -3.133599042892456, -2.8108608722686768, -2.4881229400634766, -2.1653847694396973, -1.842646598815918, -1.5199084281921387, -1.197170376777649, -0.8744322657585144, -0.5516941547393799, -0.22895598411560059, 0.09378206729888916, 0.4165201187133789, 0.7392582893371582, 1.0619964599609375, 1.3847345113754272, 1.707472562789917, 2.0302107334136963, 2.3529489040374756, 2.675686836242676, 2.998425006866455, 3.3211631774902344, 3.6439013481140137, 3.966639518737793, 4.289377689361572, 4.612115859985352, 4.934853553771973, 5.257591724395752, 5.580329895019531, 5.9030680656433105, 6.22580623626709, 6.548544406890869, 6.871282577514648, 7.1940202713012695, 7.516758918762207, 7.839496612548828, 8.162235260009766, 8.484972953796387, 8.807710647583008, 9.130449295043945, 9.453186988830566, 9.775925636291504, 10.098663330078125, 10.421401977539062, 10.744139671325684, 11.066877365112305, 11.389615058898926, 11.712353706359863, 12.035091400146484, 12.357830047607422, 12.680567741394043, 13.00330638885498, 13.326044082641602, 13.648782730102539]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 1.0, 4.0, 6.0, 11.0, 6.0, 8.0, 9.0, 7.0, 16.0, 14.0, 12.0, 17.0, 20.0, 18.0, 26.0, 42.0, 33.0, 32.0, 42.0, 47.0, 43.0, 61.0, 50.0, 64.0, 34.0, 42.0, 46.0, 34.0, 31.0, 26.0, 20.0, 21.0, 24.0, 19.0, 19.0, 20.0, 16.0, 12.0, 5.0, 8.0, 6.0, 2.0, 4.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.158337593078613, -5.9691162109375, -5.7798943519592285, -5.590672969818115, -5.401451110839844, -5.2122297286987305, -5.023008346557617, -4.833786487579346, -4.644564628601074, -4.455343246459961, -4.2661213874816895, -4.076900005340576, -3.8876781463623047, -3.6984567642211914, -3.509235143661499, -3.3200135231018066, -3.1307921409606934, -2.941570520401001, -2.7523488998413086, -2.5631275177001953, -2.373905658721924, -2.1846842765808105, -1.9954626560211182, -1.8062410354614258, -1.6170194149017334, -1.427797794342041, -1.2385761737823486, -1.0493546724319458, -0.8601330518722534, -0.670911431312561, -0.4816899299621582, -0.2924683094024658, -0.10324716567993164, 0.08597442507743835, 0.27519601583480835, 0.46441757678985596, 0.6536391973495483, 0.8428608179092407, 1.0320823192596436, 1.221303939819336, 1.4105255603790283, 1.5997471809387207, 1.788968801498413, 1.978190302848816, 2.1674118041992188, 2.3566336631774902, 2.5458550453186035, 2.735076665878296, 2.9242982864379883, 3.1135199069976807, 3.302741527557373, 3.4919629096984863, 3.681184768676758, 3.870406150817871, 4.059627532958984, 4.248849391937256, 4.438071250915527, 4.627292633056641, 4.816514492034912, 5.005735874176025, 5.194957733154297, 5.38417911529541, 5.573400497436523, 5.762622356414795, 5.951843738555908]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 9.0, 15.0, 15.0, 31.0, 47.0, 91.0, 174.0, 332.0, 671.0, 1426.0, 3717.0, 12603.0, 58887.0, 727017.0, 3083710.0, 258102.0, 34330.0, 8495.0, 2657.0, 1046.0, 440.0, 224.0, 104.0, 51.0, 28.0, 27.0, 15.0, 10.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1533203125, -1.123992919921875, -1.09466552734375, -1.065338134765625, -1.0360107421875, -1.006683349609375, -0.97735595703125, -0.948028564453125, -0.918701171875, -0.889373779296875, -0.86004638671875, -0.830718994140625, -0.8013916015625, -0.772064208984375, -0.74273681640625, -0.713409423828125, -0.68408203125, -0.654754638671875, -0.62542724609375, -0.596099853515625, -0.5667724609375, -0.537445068359375, -0.50811767578125, -0.478790283203125, -0.449462890625, -0.420135498046875, -0.39080810546875, -0.361480712890625, -0.3321533203125, -0.302825927734375, -0.27349853515625, -0.244171142578125, -0.21484375, -0.185516357421875, -0.15618896484375, -0.126861572265625, -0.0975341796875, -0.068206787109375, -0.03887939453125, -0.009552001953125, 0.019775390625, 0.049102783203125, 0.07843017578125, 0.107757568359375, 0.1370849609375, 0.166412353515625, 0.19573974609375, 0.225067138671875, 0.25439453125, 0.283721923828125, 0.31304931640625, 0.342376708984375, 0.3717041015625, 0.401031494140625, 0.43035888671875, 0.459686279296875, 0.489013671875, 0.518341064453125, 0.54766845703125, 0.576995849609375, 0.6063232421875, 0.635650634765625, 0.66497802734375, 0.694305419921875, 0.7236328125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 1.0, 4.0, 4.0, 4.0, 3.0, 7.0, 10.0, 15.0, 21.0, 18.0, 23.0, 21.0, 37.0, 38.0, 41.0, 53.0, 52.0, 48.0, 65.0, 62.0, 58.0, 55.0, 57.0, 45.0, 46.0, 40.0, 30.0, 29.0, 22.0, 25.0, 14.0, 15.0, 13.0, 9.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.591796875, -0.5767669677734375, -0.561737060546875, -0.5467071533203125, -0.53167724609375, -0.5166473388671875, -0.501617431640625, -0.4865875244140625, -0.4715576171875, -0.4565277099609375, -0.441497802734375, -0.4264678955078125, -0.41143798828125, -0.3964080810546875, -0.381378173828125, -0.3663482666015625, -0.351318359375, -0.3362884521484375, -0.321258544921875, -0.3062286376953125, -0.29119873046875, -0.2761688232421875, -0.261138916015625, -0.2461090087890625, -0.2310791015625, -0.2160491943359375, -0.201019287109375, -0.1859893798828125, -0.17095947265625, -0.1559295654296875, -0.140899658203125, -0.1258697509765625, -0.11083984375, -0.0958099365234375, -0.080780029296875, -0.0657501220703125, -0.05072021484375, -0.0356903076171875, -0.020660400390625, -0.0056304931640625, 0.0093994140625, 0.0244293212890625, 0.039459228515625, 0.0544891357421875, 0.06951904296875, 0.0845489501953125, 0.099578857421875, 0.1146087646484375, 0.129638671875, 0.1446685791015625, 0.159698486328125, 0.1747283935546875, 0.18975830078125, 0.2047882080078125, 0.219818115234375, 0.2348480224609375, 0.2498779296875, 0.2649078369140625, 0.279937744140625, 0.2949676513671875, 0.30999755859375, 0.3250274658203125, 0.340057373046875, 0.3550872802734375, 0.3701171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 7.0, 10.0, 9.0, 14.0, 30.0, 39.0, 92.0, 187.0, 440.0, 961.0, 2650.0, 10865.0, 88261.0, 3025467.0, 1013444.0, 41895.0, 6847.0, 1841.0, 626.0, 301.0, 138.0, 75.0, 29.0, 24.0, 9.0, 10.0, 3.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5068359375, -1.45953369140625, -1.4122314453125, -1.36492919921875, -1.317626953125, -1.27032470703125, -1.2230224609375, -1.17572021484375, -1.12841796875, -1.08111572265625, -1.0338134765625, -0.98651123046875, -0.939208984375, -0.89190673828125, -0.8446044921875, -0.79730224609375, -0.75, -0.70269775390625, -0.6553955078125, -0.60809326171875, -0.560791015625, -0.51348876953125, -0.4661865234375, -0.41888427734375, -0.37158203125, -0.32427978515625, -0.2769775390625, -0.22967529296875, -0.182373046875, -0.13507080078125, -0.0877685546875, -0.04046630859375, 0.0068359375, 0.05413818359375, 0.1014404296875, 0.14874267578125, 0.196044921875, 0.24334716796875, 0.2906494140625, 0.33795166015625, 0.38525390625, 0.43255615234375, 0.4798583984375, 0.52716064453125, 0.574462890625, 0.62176513671875, 0.6690673828125, 0.71636962890625, 0.763671875, 0.81097412109375, 0.8582763671875, 0.90557861328125, 0.952880859375, 1.00018310546875, 1.0474853515625, 1.09478759765625, 1.14208984375, 1.18939208984375, 1.2366943359375, 1.28399658203125, 1.331298828125, 1.37860107421875, 1.4259033203125, 1.47320556640625, 1.5205078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 7.0, 9.0, 14.0, 21.0, 25.0, 41.0, 73.0, 103.0, 181.0, 402.0, 720.0, 939.0, 752.0, 361.0, 174.0, 99.0, 38.0, 32.0, 25.0, 11.0, 15.0, 9.0, 10.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2890625, -1.2469024658203125, -1.204742431640625, -1.1625823974609375, -1.12042236328125, -1.0782623291015625, -1.036102294921875, -0.9939422607421875, -0.9517822265625, -0.9096221923828125, -0.867462158203125, -0.8253021240234375, -0.78314208984375, -0.7409820556640625, -0.698822021484375, -0.6566619873046875, -0.614501953125, -0.5723419189453125, -0.530181884765625, -0.4880218505859375, -0.44586181640625, -0.4037017822265625, -0.361541748046875, -0.3193817138671875, -0.2772216796875, -0.2350616455078125, -0.192901611328125, -0.1507415771484375, -0.10858154296875, -0.0664215087890625, -0.024261474609375, 0.0178985595703125, 0.06005859375, 0.1022186279296875, 0.144378662109375, 0.1865386962890625, 0.22869873046875, 0.2708587646484375, 0.313018798828125, 0.3551788330078125, 0.3973388671875, 0.4394989013671875, 0.481658935546875, 0.5238189697265625, 0.56597900390625, 0.6081390380859375, 0.650299072265625, 0.6924591064453125, 0.734619140625, 0.7767791748046875, 0.818939208984375, 0.8610992431640625, 0.90325927734375, 0.9454193115234375, 0.987579345703125, 1.0297393798828125, 1.0718994140625, 1.1140594482421875, 1.156219482421875, 1.1983795166015625, 1.24053955078125, 1.2826995849609375, 1.324859619140625, 1.3670196533203125, 1.4091796875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 14.0, 19.0, 43.0, 154.0, 255.0, 302.0, 148.0, 41.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.28385353088379, -22.676546096801758, -22.069236755371094, -21.461929321289062, -20.85462188720703, -20.247314453125, -19.640005111694336, -19.032697677612305, -18.425390243530273, -17.818082809448242, -17.210773468017578, -16.603466033935547, -15.996158599853516, -15.388850212097168, -14.78154182434082, -14.174234390258789, -13.566926002502441, -12.959617614746094, -12.352310180664062, -11.745001792907715, -11.137694358825684, -10.530385971069336, -9.923078536987305, -9.315770149230957, -8.70846176147461, -8.101153373718262, -7.4938459396362305, -6.886537551879883, -6.279230117797852, -5.671921730041504, -5.0646138191223145, -4.457305908203125, -3.8499975204467773, -3.242689609527588, -2.6353816986083984, -2.02807354927063, -1.4207656383514404, -0.813457727432251, -0.20614957809448242, 0.40115833282470703, 1.0084662437438965, 1.615774154663086, 2.2230820655822754, 2.830390214920044, 3.4376981258392334, 4.045005798339844, 4.652314186096191, 5.259622097015381, 5.86693000793457, 6.47423791885376, 7.081545829772949, 7.688854217529297, 8.296161651611328, 8.903470039367676, 9.510778427124023, 10.118085861206055, 10.725393295288086, 11.332701683044434, 11.940009117126465, 12.547317504882812, 13.154624938964844, 13.761933326721191, 14.369241714477539, 14.97654914855957, 15.583857536315918]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 2.0, 4.0, 9.0, 7.0, 9.0, 10.0, 23.0, 20.0, 16.0, 18.0, 19.0, 25.0, 33.0, 30.0, 35.0, 42.0, 37.0, 54.0, 45.0, 56.0, 38.0, 57.0, 46.0, 53.0, 48.0, 48.0, 39.0, 24.0, 40.0, 23.0, 13.0, 17.0, 11.0, 11.0, 6.0, 5.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.232562065124512, -4.072485446929932, -3.9124088287353516, -3.7523319721221924, -3.5922553539276123, -3.4321787357330322, -3.272101879119873, -3.112025260925293, -2.951948642730713, -2.791872024536133, -2.6317954063415527, -2.4717185497283936, -2.3116419315338135, -2.1515653133392334, -1.9914885759353638, -1.8314118385314941, -1.671335220336914, -1.511258602142334, -1.3511818647384644, -1.1911051273345947, -1.0310285091400146, -0.8709518313407898, -0.7108751535415649, -0.5507984161376953, -0.39072179794311523, -0.23064512014389038, -0.07056844234466553, 0.08950823545455933, 0.24958491325378418, 0.40966159105300903, 0.5697382688522339, 0.7298150062561035, 0.8898916244506836, 1.0499682426452637, 1.2100449800491333, 1.370121717453003, 1.530198335647583, 1.690274953842163, 1.8503516912460327, 2.0104284286499023, 2.1705050468444824, 2.3305816650390625, 2.4906582832336426, 2.6507351398468018, 2.810811758041382, 2.970888376235962, 3.130965232849121, 3.291041851043701, 3.4511184692382812, 3.6111950874328613, 3.7712717056274414, 3.9313485622406006, 4.091424942016602, 4.25150203704834, 4.41157865524292, 4.5716552734375, 4.73173189163208, 4.89180850982666, 5.05188512802124, 5.21196174621582, 5.372038841247559, 5.532115459442139, 5.692192077636719, 5.852268695831299, 6.012345314025879]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 10.0, 4.0, 9.0, 11.0, 16.0, 17.0, 29.0, 39.0, 51.0, 84.0, 154.0, 256.0, 471.0, 890.0, 1694.0, 4096.0, 10850.0, 31811.0, 100088.0, 308407.0, 382150.0, 138887.0, 43979.0, 14759.0, 5224.0, 2212.0, 1014.0, 552.0, 284.0, 167.0, 119.0, 79.0, 39.0, 24.0, 16.0, 14.0, 14.0, 7.0, 6.0, 6.0, 7.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.09375, -1.0617141723632812, -1.0296783447265625, -0.9976425170898438, -0.965606689453125, -0.9335708618164062, -0.9015350341796875, -0.8694992065429688, -0.83746337890625, -0.8054275512695312, -0.7733917236328125, -0.7413558959960938, -0.709320068359375, -0.6772842407226562, -0.6452484130859375, -0.6132125854492188, -0.5811767578125, -0.5491409301757812, -0.5171051025390625, -0.48506927490234375, -0.453033447265625, -0.42099761962890625, -0.3889617919921875, -0.35692596435546875, -0.32489013671875, -0.29285430908203125, -0.2608184814453125, -0.22878265380859375, -0.196746826171875, -0.16471099853515625, -0.1326751708984375, -0.10063934326171875, -0.068603515625, -0.03656768798828125, -0.0045318603515625, 0.02750396728515625, 0.059539794921875, 0.09157562255859375, 0.1236114501953125, 0.15564727783203125, 0.18768310546875, 0.21971893310546875, 0.2517547607421875, 0.28379058837890625, 0.315826416015625, 0.34786224365234375, 0.3798980712890625, 0.41193389892578125, 0.4439697265625, 0.47600555419921875, 0.5080413818359375, 0.5400772094726562, 0.572113037109375, 0.6041488647460938, 0.6361846923828125, 0.6682205200195312, 0.70025634765625, 0.7322921752929688, 0.7643280029296875, 0.7963638305664062, 0.828399658203125, 0.8604354858398438, 0.8924713134765625, 0.9245071411132812, 0.95654296875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 11.0, 8.0, 15.0, 14.0, 13.0, 19.0, 22.0, 34.0, 31.0, 28.0, 47.0, 50.0, 46.0, 50.0, 50.0, 49.0, 45.0, 48.0, 55.0, 43.0, 52.0, 48.0, 31.0, 37.0, 29.0, 25.0, 16.0, 22.0, 8.0, 13.0, 7.0, 7.0, 5.0, 3.0, 5.0, 0.0, 3.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.5048828125, -0.49083709716796875, -0.4767913818359375, -0.46274566650390625, -0.448699951171875, -0.43465423583984375, -0.4206085205078125, -0.40656280517578125, -0.39251708984375, -0.37847137451171875, -0.3644256591796875, -0.35037994384765625, -0.336334228515625, -0.32228851318359375, -0.3082427978515625, -0.29419708251953125, -0.2801513671875, -0.26610565185546875, -0.2520599365234375, -0.23801422119140625, -0.223968505859375, -0.20992279052734375, -0.1958770751953125, -0.18183135986328125, -0.16778564453125, -0.15373992919921875, -0.1396942138671875, -0.12564849853515625, -0.111602783203125, -0.09755706787109375, -0.0835113525390625, -0.06946563720703125, -0.055419921875, -0.04137420654296875, -0.0273284912109375, -0.01328277587890625, 0.000762939453125, 0.01480865478515625, 0.0288543701171875, 0.04290008544921875, 0.05694580078125, 0.07099151611328125, 0.0850372314453125, 0.09908294677734375, 0.113128662109375, 0.12717437744140625, 0.1412200927734375, 0.15526580810546875, 0.1693115234375, 0.18335723876953125, 0.1974029541015625, 0.21144866943359375, 0.225494384765625, 0.23954010009765625, 0.2535858154296875, 0.26763153076171875, 0.28167724609375, 0.29572296142578125, 0.3097686767578125, 0.32381439208984375, 0.337860107421875, 0.35190582275390625, 0.3659515380859375, 0.37999725341796875, 0.39404296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 11.0, 10.0, 12.0, 14.0, 31.0, 35.0, 69.0, 91.0, 157.0, 236.0, 483.0, 894.0, 2027.0, 6667.0, 46183.0, 738140.0, 228326.0, 18506.0, 3791.0, 1333.0, 651.0, 337.0, 204.0, 122.0, 78.0, 56.0, 29.0, 18.0, 18.0, 6.0, 10.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.095703125, -2.017486572265625, -1.93927001953125, -1.861053466796875, -1.7828369140625, -1.704620361328125, -1.62640380859375, -1.548187255859375, -1.469970703125, -1.391754150390625, -1.31353759765625, -1.235321044921875, -1.1571044921875, -1.078887939453125, -1.00067138671875, -0.922454833984375, -0.84423828125, -0.766021728515625, -0.68780517578125, -0.609588623046875, -0.5313720703125, -0.453155517578125, -0.37493896484375, -0.296722412109375, -0.218505859375, -0.140289306640625, -0.06207275390625, 0.016143798828125, 0.0943603515625, 0.172576904296875, 0.25079345703125, 0.329010009765625, 0.4072265625, 0.485443115234375, 0.56365966796875, 0.641876220703125, 0.7200927734375, 0.798309326171875, 0.87652587890625, 0.954742431640625, 1.032958984375, 1.111175537109375, 1.18939208984375, 1.267608642578125, 1.3458251953125, 1.424041748046875, 1.50225830078125, 1.580474853515625, 1.65869140625, 1.736907958984375, 1.81512451171875, 1.893341064453125, 1.9715576171875, 2.049774169921875, 2.12799072265625, 2.206207275390625, 2.284423828125, 2.362640380859375, 2.44085693359375, 2.519073486328125, 2.5972900390625, 2.675506591796875, 2.75372314453125, 2.831939697265625, 2.91015625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 6.0, 1.0, 6.0, 15.0, 14.0, 26.0, 31.0, 33.0, 24.0, 32.0, 47.0, 47.0, 70.0, 49.0, 55.0, 71.0, 63.0, 49.0, 55.0, 50.0, 54.0, 47.0, 28.0, 22.0, 26.0, 16.0, 15.0, 14.0, 10.0, 12.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.83984375, -1.7762451171875, -1.712646484375, -1.6490478515625, -1.58544921875, -1.5218505859375, -1.458251953125, -1.3946533203125, -1.3310546875, -1.2674560546875, -1.203857421875, -1.1402587890625, -1.07666015625, -1.0130615234375, -0.949462890625, -0.8858642578125, -0.822265625, -0.7586669921875, -0.695068359375, -0.6314697265625, -0.56787109375, -0.5042724609375, -0.440673828125, -0.3770751953125, -0.3134765625, -0.2498779296875, -0.186279296875, -0.1226806640625, -0.05908203125, 0.0045166015625, 0.068115234375, 0.1317138671875, 0.1953125, 0.2589111328125, 0.322509765625, 0.3861083984375, 0.44970703125, 0.5133056640625, 0.576904296875, 0.6405029296875, 0.7041015625, 0.7677001953125, 0.831298828125, 0.8948974609375, 0.95849609375, 1.0220947265625, 1.085693359375, 1.1492919921875, 1.212890625, 1.2764892578125, 1.340087890625, 1.4036865234375, 1.46728515625, 1.5308837890625, 1.594482421875, 1.6580810546875, 1.7216796875, 1.7852783203125, 1.848876953125, 1.9124755859375, 1.97607421875, 2.0396728515625, 2.103271484375, 2.1668701171875, 2.23046875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 11.0, 21.0, 19.0, 23.0, 45.0, 67.0, 141.0, 242.0, 829.0, 4360.0, 69246.0, 930318.0, 38671.0, 3259.0, 712.0, 235.0, 117.0, 68.0, 47.0, 28.0, 25.0, 16.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 5.0, 0.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.32421875, -1.2845916748046875, -1.244964599609375, -1.2053375244140625, -1.16571044921875, -1.1260833740234375, -1.086456298828125, -1.0468292236328125, -1.0072021484375, -0.9675750732421875, -0.927947998046875, -0.8883209228515625, -0.84869384765625, -0.8090667724609375, -0.769439697265625, -0.7298126220703125, -0.690185546875, -0.6505584716796875, -0.610931396484375, -0.5713043212890625, -0.53167724609375, -0.4920501708984375, -0.452423095703125, -0.4127960205078125, -0.3731689453125, -0.3335418701171875, -0.293914794921875, -0.2542877197265625, -0.21466064453125, -0.1750335693359375, -0.135406494140625, -0.0957794189453125, -0.05615234375, -0.0165252685546875, 0.023101806640625, 0.0627288818359375, 0.10235595703125, 0.1419830322265625, 0.181610107421875, 0.2212371826171875, 0.2608642578125, 0.3004913330078125, 0.340118408203125, 0.3797454833984375, 0.41937255859375, 0.4589996337890625, 0.498626708984375, 0.5382537841796875, 0.577880859375, 0.6175079345703125, 0.657135009765625, 0.6967620849609375, 0.73638916015625, 0.7760162353515625, 0.815643310546875, 0.8552703857421875, 0.8948974609375, 0.9345245361328125, 0.974151611328125, 1.0137786865234375, 1.05340576171875, 1.0930328369140625, 1.132659912109375, 1.1722869873046875, 1.2119140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 1.0, 3.0, 6.0, 4.0, 11.0, 8.0, 4.0, 9.0, 8.0, 7.0, 24.0, 16.0, 27.0, 23.0, 23.0, 38.0, 68.0, 102.0, 110.0, 97.0, 102.0, 66.0, 57.0, 43.0, 30.0, 20.0, 18.0, 12.0, 8.0, 13.0, 11.0, 7.0, 5.0, 3.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010007619857788086, -9.64989885687828e-05, -9.292177855968475e-05, -8.93445685505867e-05, -8.576735854148865e-05, -8.21901485323906e-05, -7.861293852329254e-05, -7.503572851419449e-05, -7.145851850509644e-05, -6.788130849599838e-05, -6.430409848690033e-05, -6.0726888477802277e-05, -5.7149678468704224e-05, -5.357246845960617e-05, -4.999525845050812e-05, -4.6418048441410065e-05, -4.284083843231201e-05, -3.926362842321396e-05, -3.5686418414115906e-05, -3.210920840501785e-05, -2.85319983959198e-05, -2.4954788386821747e-05, -2.1377578377723694e-05, -1.780036836862564e-05, -1.4223158359527588e-05, -1.0645948350429535e-05, -7.068738341331482e-06, -3.491528332233429e-06, 8.568167686462402e-08, 3.662891685962677e-06, 7.24010169506073e-06, 1.0817311704158783e-05, 1.4394521713256836e-05, 1.797173172235489e-05, 2.1548941731452942e-05, 2.5126151740550995e-05, 2.8703361749649048e-05, 3.22805717587471e-05, 3.5857781767845154e-05, 3.943499177694321e-05, 4.301220178604126e-05, 4.658941179513931e-05, 5.0166621804237366e-05, 5.374383181333542e-05, 5.732104182243347e-05, 6.0898251831531525e-05, 6.447546184062958e-05, 6.805267184972763e-05, 7.162988185882568e-05, 7.520709186792374e-05, 7.878430187702179e-05, 8.236151188611984e-05, 8.59387218952179e-05, 8.951593190431595e-05, 9.3093141913414e-05, 9.667035192251205e-05, 0.00010024756193161011, 0.00010382477194070816, 0.00010740198194980621, 0.00011097919195890427, 0.00011455640196800232, 0.00011813361197710037, 0.00012171082198619843, 0.00012528803199529648, 0.00012886524200439453]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 12.0, 9.0, 12.0, 14.0, 28.0, 33.0, 44.0, 69.0, 97.0, 144.0, 238.0, 369.0, 664.0, 1356.0, 3010.0, 7649.0, 24460.0, 130287.0, 690566.0, 148073.0, 26813.0, 8183.0, 3157.0, 1428.0, 711.0, 399.0, 222.0, 153.0, 99.0, 67.0, 58.0, 34.0, 24.0, 20.0, 12.0, 12.0, 5.0, 9.0, 6.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.56005859375, -0.5442962646484375, -0.528533935546875, -0.5127716064453125, -0.49700927734375, -0.4812469482421875, -0.465484619140625, -0.4497222900390625, -0.4339599609375, -0.4181976318359375, -0.402435302734375, -0.3866729736328125, -0.37091064453125, -0.3551483154296875, -0.339385986328125, -0.3236236572265625, -0.307861328125, -0.2920989990234375, -0.276336669921875, -0.2605743408203125, -0.24481201171875, -0.2290496826171875, -0.213287353515625, -0.1975250244140625, -0.1817626953125, -0.1660003662109375, -0.150238037109375, -0.1344757080078125, -0.11871337890625, -0.1029510498046875, -0.087188720703125, -0.0714263916015625, -0.0556640625, -0.0399017333984375, -0.024139404296875, -0.0083770751953125, 0.00738525390625, 0.0231475830078125, 0.038909912109375, 0.0546722412109375, 0.0704345703125, 0.0861968994140625, 0.101959228515625, 0.1177215576171875, 0.13348388671875, 0.1492462158203125, 0.165008544921875, 0.1807708740234375, 0.196533203125, 0.2122955322265625, 0.228057861328125, 0.2438201904296875, 0.25958251953125, 0.2753448486328125, 0.291107177734375, 0.3068695068359375, 0.3226318359375, 0.3383941650390625, 0.354156494140625, 0.3699188232421875, 0.38568115234375, 0.4014434814453125, 0.417205810546875, 0.4329681396484375, 0.44873046875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 6.0, 6.0, 6.0, 4.0, 7.0, 8.0, 15.0, 20.0, 18.0, 51.0, 56.0, 74.0, 98.0, 111.0, 130.0, 109.0, 80.0, 60.0, 37.0, 30.0, 17.0, 16.0, 11.0, 4.0, 4.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6962890625, -0.6774749755859375, -0.658660888671875, -0.6398468017578125, -0.62103271484375, -0.6022186279296875, -0.583404541015625, -0.5645904541015625, -0.5457763671875, -0.5269622802734375, -0.508148193359375, -0.4893341064453125, -0.47052001953125, -0.4517059326171875, -0.432891845703125, -0.4140777587890625, -0.395263671875, -0.3764495849609375, -0.357635498046875, -0.3388214111328125, -0.32000732421875, -0.3011932373046875, -0.282379150390625, -0.2635650634765625, -0.2447509765625, -0.2259368896484375, -0.207122802734375, -0.1883087158203125, -0.16949462890625, -0.1506805419921875, -0.131866455078125, -0.1130523681640625, -0.09423828125, -0.0754241943359375, -0.056610107421875, -0.0377960205078125, -0.01898193359375, -0.0001678466796875, 0.018646240234375, 0.0374603271484375, 0.0562744140625, 0.0750885009765625, 0.093902587890625, 0.1127166748046875, 0.13153076171875, 0.1503448486328125, 0.169158935546875, 0.1879730224609375, 0.206787109375, 0.2256011962890625, 0.244415283203125, 0.2632293701171875, 0.28204345703125, 0.3008575439453125, 0.319671630859375, 0.3384857177734375, 0.3572998046875, 0.3761138916015625, 0.394927978515625, 0.4137420654296875, 0.43255615234375, 0.4513702392578125, 0.470184326171875, 0.4889984130859375, 0.5078125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 13.0, 29.0, 84.0, 195.0, 361.0, 198.0, 72.0, 23.0, 8.0, 2.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-27.933807373046875, -27.320947647094727, -26.708086013793945, -26.095226287841797, -25.482364654541016, -24.869504928588867, -24.25664520263672, -23.643783569335938, -23.03092384338379, -22.41806411743164, -21.80520248413086, -21.19234275817871, -20.579483032226562, -19.96662139892578, -19.353761672973633, -18.740901947021484, -18.128040313720703, -17.515180587768555, -16.902318954467773, -16.289459228515625, -15.67659854888916, -15.063737869262695, -14.450878143310547, -13.838017463684082, -13.225156784057617, -12.612296104431152, -11.999435424804688, -11.386575698852539, -10.773715019226074, -10.16085433959961, -9.547994613647461, -8.935133934020996, -8.322274208068848, -7.709413528442383, -7.096553325653076, -6.4836931228637695, -5.870832443237305, -5.25797176361084, -4.645111560821533, -4.032251358032227, -3.4193906784057617, -2.806530237197876, -2.1936697959899902, -1.5808093547821045, -0.9679489135742188, -0.355088472366333, 0.25777196884155273, 0.8706321716308594, 1.4834928512573242, 2.09635329246521, 2.7092137336730957, 3.3220741748809814, 3.934934616088867, 4.547795295715332, 5.160655498504639, 5.773515701293945, 6.38637638092041, 6.999237060546875, 7.612097263336182, 8.224957466125488, 8.837818145751953, 9.450678825378418, 10.063539505004883, 10.676399230957031, 11.289259910583496]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 4.0, 5.0, 10.0, 6.0, 12.0, 15.0, 16.0, 19.0, 22.0, 18.0, 16.0, 25.0, 17.0, 37.0, 28.0, 31.0, 32.0, 54.0, 61.0, 61.0, 62.0, 61.0, 51.0, 34.0, 42.0, 43.0, 32.0, 20.0, 21.0, 13.0, 16.0, 20.0, 15.0, 11.0, 11.0, 15.0, 9.0, 7.0, 6.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.408458709716797, -6.203574180603027, -5.9986891746521, -5.79380464553833, -5.5889201164245605, -5.384035110473633, -5.179150581359863, -4.974266052246094, -4.769381046295166, -4.5644965171813965, -4.359611511230469, -4.154726982116699, -3.9498422145843506, -3.744957447052002, -3.5400729179382324, -3.335188150405884, -3.1303036212921143, -2.9254188537597656, -2.720534324645996, -2.5156495571136475, -2.310764789581299, -2.1058802604675293, -1.9009954929351807, -1.696110725402832, -1.491226077079773, -1.2863414287567139, -1.0814566612243652, -0.8765720129013062, -0.6716873049736023, -0.46680259704589844, -0.26191794872283936, -0.05703318119049072, 0.14785146713256836, 0.3527361750602722, 0.5576208829879761, 0.7625055313110352, 0.967390239238739, 1.1722749471664429, 1.377159595489502, 1.5820443630218506, 1.7869290113449097, 1.9918136596679688, 2.1966984272003174, 2.401583194732666, 2.6064677238464355, 2.811352491378784, 3.016237258911133, 3.2211217880249023, 3.426006555557251, 3.6308913230895996, 3.835775852203369, 4.040660858154297, 4.245545387268066, 4.450429916381836, 4.6553144454956055, 4.860199451446533, 5.065083980560303, 5.269968509674072, 5.474853515625, 5.6797380447387695, 5.884622573852539, 6.089507579803467, 6.294392108917236, 6.499277114868164, 6.704161643981934]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 10.0, 11.0, 13.0, 28.0, 35.0, 36.0, 81.0, 121.0, 244.0, 463.0, 999.0, 2794.0, 10529.0, 77769.0, 2818607.0, 1226050.0, 44809.0, 7782.0, 2241.0, 863.0, 390.0, 174.0, 94.0, 73.0, 25.0, 12.0, 9.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1376953125, -1.1008453369140625, -1.063995361328125, -1.0271453857421875, -0.99029541015625, -0.9534454345703125, -0.916595458984375, -0.8797454833984375, -0.8428955078125, -0.8060455322265625, -0.769195556640625, -0.7323455810546875, -0.69549560546875, -0.6586456298828125, -0.621795654296875, -0.5849456787109375, -0.548095703125, -0.5112457275390625, -0.474395751953125, -0.4375457763671875, -0.40069580078125, -0.3638458251953125, -0.326995849609375, -0.2901458740234375, -0.2532958984375, -0.2164459228515625, -0.179595947265625, -0.1427459716796875, -0.10589599609375, -0.0690460205078125, -0.032196044921875, 0.0046539306640625, 0.04150390625, 0.0783538818359375, 0.115203857421875, 0.1520538330078125, 0.18890380859375, 0.2257537841796875, 0.262603759765625, 0.2994537353515625, 0.3363037109375, 0.3731536865234375, 0.410003662109375, 0.4468536376953125, 0.48370361328125, 0.5205535888671875, 0.557403564453125, 0.5942535400390625, 0.631103515625, 0.6679534912109375, 0.704803466796875, 0.7416534423828125, 0.77850341796875, 0.8153533935546875, 0.852203369140625, 0.8890533447265625, 0.9259033203125, 0.9627532958984375, 0.999603271484375, 1.0364532470703125, 1.07330322265625, 1.1101531982421875, 1.147003173828125, 1.1838531494140625, 1.220703125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 9.0, 10.0, 8.0, 20.0, 29.0, 24.0, 29.0, 49.0, 41.0, 41.0, 58.0, 53.0, 58.0, 70.0, 66.0, 60.0, 56.0, 54.0, 44.0, 39.0, 32.0, 28.0, 32.0, 22.0, 17.0, 7.0, 7.0, 13.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.66162109375, -0.6453170776367188, -0.6290130615234375, -0.6127090454101562, -0.596405029296875, -0.5801010131835938, -0.5637969970703125, -0.5474929809570312, -0.53118896484375, -0.5148849487304688, -0.4985809326171875, -0.48227691650390625, -0.465972900390625, -0.44966888427734375, -0.4333648681640625, -0.41706085205078125, -0.4007568359375, -0.38445281982421875, -0.3681488037109375, -0.35184478759765625, -0.335540771484375, -0.31923675537109375, -0.3029327392578125, -0.28662872314453125, -0.27032470703125, -0.25402069091796875, -0.2377166748046875, -0.22141265869140625, -0.205108642578125, -0.18880462646484375, -0.1725006103515625, -0.15619659423828125, -0.139892578125, -0.12358856201171875, -0.1072845458984375, -0.09098052978515625, -0.074676513671875, -0.05837249755859375, -0.0420684814453125, -0.02576446533203125, -0.00946044921875, 0.00684356689453125, 0.0231475830078125, 0.03945159912109375, 0.055755615234375, 0.07205963134765625, 0.0883636474609375, 0.10466766357421875, 0.1209716796875, 0.13727569580078125, 0.1535797119140625, 0.16988372802734375, 0.186187744140625, 0.20249176025390625, 0.2187957763671875, 0.23509979248046875, 0.25140380859375, 0.26770782470703125, 0.2840118408203125, 0.30031585693359375, 0.316619873046875, 0.33292388916015625, 0.3492279052734375, 0.36553192138671875, 0.3818359375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 20.0, 29.0, 35.0, 57.0, 141.0, 251.0, 613.0, 1335.0, 3705.0, 17080.0, 470641.0, 3632147.0, 57346.0, 7291.0, 2023.0, 743.0, 376.0, 187.0, 102.0, 60.0, 20.0, 24.0, 11.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.115234375, -2.0551910400390625, -1.995147705078125, -1.9351043701171875, -1.87506103515625, -1.8150177001953125, -1.754974365234375, -1.6949310302734375, -1.6348876953125, -1.5748443603515625, -1.514801025390625, -1.4547576904296875, -1.39471435546875, -1.3346710205078125, -1.274627685546875, -1.2145843505859375, -1.154541015625, -1.0944976806640625, -1.034454345703125, -0.9744110107421875, -0.91436767578125, -0.8543243408203125, -0.794281005859375, -0.7342376708984375, -0.6741943359375, -0.6141510009765625, -0.554107666015625, -0.4940643310546875, -0.43402099609375, -0.3739776611328125, -0.313934326171875, -0.2538909912109375, -0.19384765625, -0.1338043212890625, -0.073760986328125, -0.0137176513671875, 0.04632568359375, 0.1063690185546875, 0.166412353515625, 0.2264556884765625, 0.2864990234375, 0.3465423583984375, 0.406585693359375, 0.4666290283203125, 0.52667236328125, 0.5867156982421875, 0.646759033203125, 0.7068023681640625, 0.766845703125, 0.8268890380859375, 0.886932373046875, 0.9469757080078125, 1.00701904296875, 1.0670623779296875, 1.127105712890625, 1.1871490478515625, 1.2471923828125, 1.3072357177734375, 1.367279052734375, 1.4273223876953125, 1.48736572265625, 1.5474090576171875, 1.607452392578125, 1.6674957275390625, 1.7275390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 11.0, 20.0, 34.0, 48.0, 113.0, 286.0, 777.0, 1269.0, 840.0, 318.0, 137.0, 79.0, 45.0, 22.0, 17.0, 15.0, 12.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.57421875, -1.5226898193359375, -1.471160888671875, -1.4196319580078125, -1.36810302734375, -1.3165740966796875, -1.265045166015625, -1.2135162353515625, -1.1619873046875, -1.1104583740234375, -1.058929443359375, -1.0074005126953125, -0.95587158203125, -0.9043426513671875, -0.852813720703125, -0.8012847900390625, -0.749755859375, -0.6982269287109375, -0.646697998046875, -0.5951690673828125, -0.54364013671875, -0.4921112060546875, -0.440582275390625, -0.3890533447265625, -0.3375244140625, -0.2859954833984375, -0.234466552734375, -0.1829376220703125, -0.13140869140625, -0.0798797607421875, -0.028350830078125, 0.0231781005859375, 0.07470703125, 0.1262359619140625, 0.177764892578125, 0.2292938232421875, 0.28082275390625, 0.3323516845703125, 0.383880615234375, 0.4354095458984375, 0.4869384765625, 0.5384674072265625, 0.589996337890625, 0.6415252685546875, 0.69305419921875, 0.7445831298828125, 0.796112060546875, 0.8476409912109375, 0.899169921875, 0.9506988525390625, 1.002227783203125, 1.0537567138671875, 1.10528564453125, 1.1568145751953125, 1.208343505859375, 1.2598724365234375, 1.3114013671875, 1.3629302978515625, 1.414459228515625, 1.4659881591796875, 1.51751708984375, 1.5690460205078125, 1.620574951171875, 1.6721038818359375, 1.7236328125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 8.0, 11.0, 43.0, 170.0, 366.0, 293.0, 72.0, 16.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.587276458740234, -15.914616584777832, -15.24195671081543, -14.569295883178711, -13.896636009216309, -13.223976135253906, -12.551315307617188, -11.878655433654785, -11.205995559692383, -10.53333568572998, -9.860675811767578, -9.18801498413086, -8.515355110168457, -7.842695236206055, -7.170034885406494, -6.497374534606934, -5.824714660644531, -5.152054786682129, -4.479394435882568, -3.806734323501587, -3.1340742111206055, -2.461414098739624, -1.7887539863586426, -1.116093635559082, -0.4434337615966797, 0.22922635078430176, 0.9018864631652832, 1.5745465755462646, 2.247206687927246, 2.9198668003082275, 3.592526912689209, 4.2651872634887695, 4.937849044799805, 5.610508918762207, 6.283169269561768, 6.955829620361328, 7.6284894943237305, 8.301149368286133, 8.973810195922852, 9.646470069885254, 10.319129943847656, 10.991789817810059, 11.664449691772461, 12.33711051940918, 13.009770393371582, 13.682430267333984, 14.355091094970703, 15.027750968933105, 15.700410842895508, 16.373071670532227, 17.045730590820312, 17.71839141845703, 18.39105224609375, 19.063711166381836, 19.736371994018555, 20.40903091430664, 21.08169174194336, 21.754352569580078, 22.427011489868164, 23.099672317504883, 23.77233123779297, 24.444992065429688, 25.117652893066406, 25.790313720703125, 26.46297264099121]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 7.0, 6.0, 10.0, 18.0, 27.0, 33.0, 51.0, 85.0, 112.0, 114.0, 113.0, 113.0, 79.0, 77.0, 48.0, 52.0, 23.0, 16.0, 6.0, 8.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.131828308105469, -11.812901496887207, -11.493973731994629, -11.175046920776367, -10.856120109558105, -10.537193298339844, -10.218265533447266, -9.899338722229004, -9.580411911010742, -9.26148509979248, -8.942557334899902, -8.62363052368164, -8.304703712463379, -7.985776424407959, -7.666849136352539, -7.347922325134277, -7.028995037078857, -6.7100677490234375, -6.391140937805176, -6.072213649749756, -5.753286838531494, -5.434359550476074, -5.1154327392578125, -4.796505451202393, -4.477578163146973, -4.158650875091553, -3.839724063873291, -3.520796775817871, -3.2018699645996094, -2.8829426765441895, -2.5640156269073486, -2.245088577270508, -1.926161766052246, -1.6072347164154053, -1.2883076667785645, -0.9693804979324341, -0.6504534482955933, -0.33152639865875244, -0.01259922981262207, 0.30632781982421875, 0.6252548694610596, 0.9441819190979004, 1.2631089687347412, 1.5820361375808716, 1.9009631872177124, 2.2198901176452637, 2.5388174057006836, 2.8577444553375244, 3.1766715049743652, 3.495598554611206, 3.814525604248047, 4.133452892303467, 4.4523797035217285, 4.771306991577148, 5.09023380279541, 5.40916109085083, 5.72808837890625, 6.04701566696167, 6.365942478179932, 6.684869766235352, 7.003796577453613, 7.322723865509033, 7.641651153564453, 7.960577964782715, 8.279504776000977]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 8.0, 6.0, 10.0, 7.0, 18.0, 12.0, 22.0, 43.0, 50.0, 80.0, 115.0, 152.0, 404.0, 747.0, 1763.0, 5268.0, 18451.0, 83410.0, 355060.0, 430912.0, 116107.0, 25089.0, 6640.0, 2177.0, 966.0, 408.0, 209.0, 127.0, 76.0, 60.0, 40.0, 24.0, 23.0, 19.0, 13.0, 18.0, 4.0, 3.0, 3.0, 4.0, 5.0, 2.0, 0.0, 2.0], "bins": [-1.365234375, -1.330322265625, -1.29541015625, -1.260498046875, -1.2255859375, -1.190673828125, -1.15576171875, -1.120849609375, -1.0859375, -1.051025390625, -1.01611328125, -0.981201171875, -0.9462890625, -0.911376953125, -0.87646484375, -0.841552734375, -0.806640625, -0.771728515625, -0.73681640625, -0.701904296875, -0.6669921875, -0.632080078125, -0.59716796875, -0.562255859375, -0.52734375, -0.492431640625, -0.45751953125, -0.422607421875, -0.3876953125, -0.352783203125, -0.31787109375, -0.282958984375, -0.248046875, -0.213134765625, -0.17822265625, -0.143310546875, -0.1083984375, -0.073486328125, -0.03857421875, -0.003662109375, 0.03125, 0.066162109375, 0.10107421875, 0.135986328125, 0.1708984375, 0.205810546875, 0.24072265625, 0.275634765625, 0.310546875, 0.345458984375, 0.38037109375, 0.415283203125, 0.4501953125, 0.485107421875, 0.52001953125, 0.554931640625, 0.58984375, 0.624755859375, 0.65966796875, 0.694580078125, 0.7294921875, 0.764404296875, 0.79931640625, 0.834228515625, 0.869140625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 9.0, 11.0, 25.0, 13.0, 24.0, 28.0, 51.0, 52.0, 53.0, 59.0, 72.0, 66.0, 74.0, 73.0, 67.0, 58.0, 51.0, 49.0, 29.0, 39.0, 27.0, 23.0, 12.0, 13.0, 6.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75390625, -0.7346534729003906, -0.7154006958007812, -0.6961479187011719, -0.6768951416015625, -0.6576423645019531, -0.6383895874023438, -0.6191368103027344, -0.599884033203125, -0.5806312561035156, -0.5613784790039062, -0.5421257019042969, -0.5228729248046875, -0.5036201477050781, -0.48436737060546875, -0.4651145935058594, -0.44586181640625, -0.4266090393066406, -0.40735626220703125, -0.3881034851074219, -0.3688507080078125, -0.3495979309082031, -0.33034515380859375, -0.3110923767089844, -0.291839599609375, -0.2725868225097656, -0.25333404541015625, -0.23408126831054688, -0.2148284912109375, -0.19557571411132812, -0.17632293701171875, -0.15707015991210938, -0.1378173828125, -0.11856460571289062, -0.09931182861328125, -0.08005905151367188, -0.0608062744140625, -0.041553497314453125, -0.02230072021484375, -0.003047943115234375, 0.016204833984375, 0.035457611083984375, 0.05471038818359375, 0.07396316528320312, 0.0932159423828125, 0.11246871948242188, 0.13172149658203125, 0.15097427368164062, 0.17022705078125, 0.18947982788085938, 0.20873260498046875, 0.22798538208007812, 0.2472381591796875, 0.2664909362792969, 0.28574371337890625, 0.3049964904785156, 0.324249267578125, 0.3435020446777344, 0.36275482177734375, 0.3820075988769531, 0.4012603759765625, 0.4205131530761719, 0.43976593017578125, 0.4590187072753906, 0.478271484375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 1.0, 1.0, 6.0, 5.0, 13.0, 14.0, 29.0, 33.0, 42.0, 65.0, 113.0, 177.0, 463.0, 1034.0, 3394.0, 15076.0, 100422.0, 687392.0, 204988.0, 27204.0, 5356.0, 1528.0, 569.0, 247.0, 127.0, 76.0, 55.0, 36.0, 20.0, 13.0, 8.0, 18.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2099609375, -1.1628265380859375, -1.115692138671875, -1.0685577392578125, -1.02142333984375, -0.9742889404296875, -0.927154541015625, -0.8800201416015625, -0.8328857421875, -0.7857513427734375, -0.738616943359375, -0.6914825439453125, -0.64434814453125, -0.5972137451171875, -0.550079345703125, -0.5029449462890625, -0.455810546875, -0.4086761474609375, -0.361541748046875, -0.3144073486328125, -0.26727294921875, -0.2201385498046875, -0.173004150390625, -0.1258697509765625, -0.0787353515625, -0.0316009521484375, 0.015533447265625, 0.0626678466796875, 0.10980224609375, 0.1569366455078125, 0.204071044921875, 0.2512054443359375, 0.29833984375, 0.3454742431640625, 0.392608642578125, 0.4397430419921875, 0.48687744140625, 0.5340118408203125, 0.581146240234375, 0.6282806396484375, 0.6754150390625, 0.7225494384765625, 0.769683837890625, 0.8168182373046875, 0.86395263671875, 0.9110870361328125, 0.958221435546875, 1.0053558349609375, 1.052490234375, 1.0996246337890625, 1.146759033203125, 1.1938934326171875, 1.24102783203125, 1.2881622314453125, 1.335296630859375, 1.3824310302734375, 1.4295654296875, 1.4766998291015625, 1.523834228515625, 1.5709686279296875, 1.61810302734375, 1.6652374267578125, 1.712371826171875, 1.7595062255859375, 1.806640625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 9.0, 4.0, 8.0, 7.0, 12.0, 10.0, 19.0, 14.0, 23.0, 20.0, 19.0, 28.0, 30.0, 49.0, 40.0, 49.0, 62.0, 53.0, 60.0, 56.0, 49.0, 44.0, 49.0, 46.0, 37.0, 41.0, 31.0, 15.0, 22.0, 24.0, 19.0, 13.0, 12.0, 8.0, 3.0, 8.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3701171875, -1.3206024169921875, -1.271087646484375, -1.2215728759765625, -1.17205810546875, -1.1225433349609375, -1.073028564453125, -1.0235137939453125, -0.9739990234375, -0.9244842529296875, -0.874969482421875, -0.8254547119140625, -0.77593994140625, -0.7264251708984375, -0.676910400390625, -0.6273956298828125, -0.577880859375, -0.5283660888671875, -0.478851318359375, -0.4293365478515625, -0.37982177734375, -0.3303070068359375, -0.280792236328125, -0.2312774658203125, -0.1817626953125, -0.1322479248046875, -0.082733154296875, -0.0332183837890625, 0.01629638671875, 0.0658111572265625, 0.115325927734375, 0.1648406982421875, 0.21435546875, 0.2638702392578125, 0.313385009765625, 0.3628997802734375, 0.41241455078125, 0.4619293212890625, 0.511444091796875, 0.5609588623046875, 0.6104736328125, 0.6599884033203125, 0.709503173828125, 0.7590179443359375, 0.80853271484375, 0.8580474853515625, 0.907562255859375, 0.9570770263671875, 1.006591796875, 1.0561065673828125, 1.105621337890625, 1.1551361083984375, 1.20465087890625, 1.2541656494140625, 1.303680419921875, 1.3531951904296875, 1.4027099609375, 1.4522247314453125, 1.501739501953125, 1.5512542724609375, 1.60076904296875, 1.6502838134765625, 1.699798583984375, 1.7493133544921875, 1.798828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 10.0, 15.0, 18.0, 28.0, 49.0, 82.0, 139.0, 268.0, 618.0, 1546.0, 4512.0, 15612.0, 61801.0, 290919.0, 555563.0, 86863.0, 21044.0, 5927.0, 2041.0, 744.0, 320.0, 168.0, 100.0, 47.0, 45.0, 18.0, 11.0, 7.0, 7.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.387939453125, -0.377197265625, -0.366455078125, -0.355712890625, -0.344970703125, -0.334228515625, -0.323486328125, -0.312744140625, -0.302001953125, -0.291259765625, -0.280517578125, -0.269775390625, -0.259033203125, -0.248291015625, -0.237548828125, -0.226806640625, -0.216064453125, -0.205322265625, -0.194580078125, -0.183837890625, -0.173095703125, -0.162353515625, -0.151611328125, -0.140869140625, -0.130126953125, -0.119384765625, -0.108642578125, -0.097900390625, -0.087158203125, -0.076416015625, -0.065673828125, -0.054931640625, -0.044189453125, -0.033447265625, -0.022705078125, -0.011962890625, -0.001220703125, 0.009521484375, 0.020263671875, 0.031005859375, 0.041748046875, 0.052490234375, 0.063232421875, 0.073974609375, 0.084716796875, 0.095458984375, 0.106201171875, 0.116943359375, 0.127685546875, 0.138427734375, 0.149169921875, 0.159912109375, 0.170654296875, 0.181396484375, 0.192138671875, 0.202880859375, 0.213623046875, 0.224365234375, 0.235107421875, 0.245849609375, 0.256591796875, 0.267333984375, 0.278076171875, 0.288818359375, 0.299560546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 1.0, 6.0, 8.0, 5.0, 9.0, 10.0, 13.0, 10.0, 18.0, 23.0, 17.0, 33.0, 36.0, 51.0, 63.0, 73.0, 77.0, 83.0, 90.0, 68.0, 63.0, 53.0, 31.0, 34.0, 29.0, 19.0, 17.0, 9.0, 10.0, 6.0, 5.0, 4.0, 9.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.236003875732422e-05, -7.019378244876862e-05, -6.802752614021301e-05, -6.586126983165741e-05, -6.36950135231018e-05, -6.15287572145462e-05, -5.93625009059906e-05, -5.7196244597435e-05, -5.5029988288879395e-05, -5.286373198032379e-05, -5.069747567176819e-05, -4.8531219363212585e-05, -4.636496305465698e-05, -4.419870674610138e-05, -4.2032450437545776e-05, -3.986619412899017e-05, -3.769993782043457e-05, -3.553368151187897e-05, -3.3367425203323364e-05, -3.120116889476776e-05, -2.9034912586212158e-05, -2.6868656277656555e-05, -2.4702399969100952e-05, -2.253614366054535e-05, -2.0369887351989746e-05, -1.8203631043434143e-05, -1.603737473487854e-05, -1.3871118426322937e-05, -1.1704862117767334e-05, -9.538605809211731e-06, -7.372349500656128e-06, -5.206093192100525e-06, -3.039836883544922e-06, -8.735805749893188e-07, 1.2926757335662842e-06, 3.458932042121887e-06, 5.62518835067749e-06, 7.791444659233093e-06, 9.957700967788696e-06, 1.21239572763443e-05, 1.4290213584899902e-05, 1.6456469893455505e-05, 1.862272620201111e-05, 2.078898251056671e-05, 2.2955238819122314e-05, 2.5121495127677917e-05, 2.728775143623352e-05, 2.9454007744789124e-05, 3.1620264053344727e-05, 3.378652036190033e-05, 3.595277667045593e-05, 3.8119032979011536e-05, 4.028528928756714e-05, 4.245154559612274e-05, 4.4617801904678345e-05, 4.678405821323395e-05, 4.895031452178955e-05, 5.1116570830345154e-05, 5.328282713890076e-05, 5.544908344745636e-05, 5.761533975601196e-05, 5.9781596064567566e-05, 6.194785237312317e-05, 6.411410868167877e-05, 6.628036499023438e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 8.0, 16.0, 33.0, 42.0, 110.0, 276.0, 664.0, 2234.0, 9471.0, 62369.0, 658875.0, 275215.0, 31255.0, 5564.0, 1574.0, 455.0, 197.0, 71.0, 47.0, 27.0, 17.0, 6.0, 12.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5673828125, -0.5510940551757812, -0.5348052978515625, -0.5185165405273438, -0.502227783203125, -0.48593902587890625, -0.4696502685546875, -0.45336151123046875, -0.43707275390625, -0.42078399658203125, -0.4044952392578125, -0.38820648193359375, -0.371917724609375, -0.35562896728515625, -0.3393402099609375, -0.32305145263671875, -0.3067626953125, -0.29047393798828125, -0.2741851806640625, -0.25789642333984375, -0.241607666015625, -0.22531890869140625, -0.2090301513671875, -0.19274139404296875, -0.17645263671875, -0.16016387939453125, -0.1438751220703125, -0.12758636474609375, -0.111297607421875, -0.09500885009765625, -0.0787200927734375, -0.06243133544921875, -0.046142578125, -0.02985382080078125, -0.0135650634765625, 0.00272369384765625, 0.019012451171875, 0.03530120849609375, 0.0515899658203125, 0.06787872314453125, 0.08416748046875, 0.10045623779296875, 0.1167449951171875, 0.13303375244140625, 0.149322509765625, 0.16561126708984375, 0.1819000244140625, 0.19818878173828125, 0.2144775390625, 0.23076629638671875, 0.2470550537109375, 0.26334381103515625, 0.279632568359375, 0.29592132568359375, 0.3122100830078125, 0.32849884033203125, 0.34478759765625, 0.36107635498046875, 0.3773651123046875, 0.39365386962890625, 0.409942626953125, 0.42623138427734375, 0.4425201416015625, 0.45880889892578125, 0.47509765625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 8.0, 8.0, 13.0, 14.0, 24.0, 34.0, 50.0, 66.0, 78.0, 91.0, 95.0, 98.0, 96.0, 71.0, 79.0, 53.0, 23.0, 26.0, 16.0, 9.0, 11.0, 8.0, 6.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.421875, -0.4088325500488281, -0.39579010009765625, -0.3827476501464844, -0.3697052001953125, -0.3566627502441406, -0.34362030029296875, -0.3305778503417969, -0.317535400390625, -0.3044929504394531, -0.29145050048828125, -0.2784080505371094, -0.2653656005859375, -0.2523231506347656, -0.23928070068359375, -0.22623825073242188, -0.21319580078125, -0.20015335083007812, -0.18711090087890625, -0.17406845092773438, -0.1610260009765625, -0.14798355102539062, -0.13494110107421875, -0.12189865112304688, -0.108856201171875, -0.09581375122070312, -0.08277130126953125, -0.06972885131835938, -0.0566864013671875, -0.043643951416015625, -0.03060150146484375, -0.017559051513671875, -0.0045166015625, 0.008525848388671875, 0.02156829833984375, 0.034610748291015625, 0.0476531982421875, 0.060695648193359375, 0.07373809814453125, 0.08678054809570312, 0.099822998046875, 0.11286544799804688, 0.12590789794921875, 0.13895034790039062, 0.1519927978515625, 0.16503524780273438, 0.17807769775390625, 0.19112014770507812, 0.20416259765625, 0.21720504760742188, 0.23024749755859375, 0.24328994750976562, 0.2563323974609375, 0.2693748474121094, 0.28241729736328125, 0.2954597473144531, 0.308502197265625, 0.3215446472167969, 0.33458709716796875, 0.3476295471191406, 0.3606719970703125, 0.3737144470214844, 0.38675689697265625, 0.3997993469238281, 0.412841796875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 7.0, 14.0, 32.0, 42.0, 100.0, 137.0, 262.0, 177.0, 106.0, 53.0, 35.0, 10.0, 4.0, 1.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.354994773864746, -12.025959968566895, -11.696925163269043, -11.367890357971191, -11.038856506347656, -10.709821701049805, -10.380786895751953, -10.051752090454102, -9.72271728515625, -9.393682479858398, -9.064647674560547, -8.735612869262695, -8.406578063964844, -8.077544212341309, -7.748509407043457, -7.4194746017456055, -7.090439796447754, -6.761404991149902, -6.432370185852051, -6.103335857391357, -5.774301052093506, -5.445266246795654, -5.116231918334961, -4.787197113037109, -4.458162307739258, -4.129127502441406, -3.800092935562134, -3.4710583686828613, -3.1420235633850098, -2.812988758087158, -2.4839541912078857, -2.1549196243286133, -1.8258857727050781, -1.4968510866165161, -1.167816400527954, -0.8387817144393921, -0.5097470283508301, -0.18071234226226807, 0.14832234382629395, 0.4773569107055664, 0.806391716003418, 1.13542640209198, 1.464461088180542, 1.793495774269104, 2.122530460357666, 2.4515652656555176, 2.78059983253479, 3.1096343994140625, 3.438669204711914, 3.7677040100097656, 4.096738815307617, 4.4257731437683105, 4.754807949066162, 5.083842754364014, 5.412877082824707, 5.741911888122559, 6.07094669342041, 6.399981498718262, 6.729016304016113, 7.058050632476807, 7.387085437774658, 7.71612024307251, 8.045154571533203, 8.374189376831055, 8.703224182128906]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 9.0, 11.0, 7.0, 11.0, 13.0, 10.0, 13.0, 19.0, 21.0, 30.0, 20.0, 28.0, 37.0, 44.0, 49.0, 49.0, 55.0, 82.0, 82.0, 55.0, 48.0, 49.0, 39.0, 29.0, 27.0, 26.0, 14.0, 14.0, 16.0, 25.0, 13.0, 8.0, 5.0, 9.0, 9.0, 4.0, 6.0, 4.0, 1.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.281209468841553, -6.097168922424316, -5.91312837600708, -5.729087829589844, -5.545047283172607, -5.361006736755371, -5.176965713500977, -4.99292516708374, -4.808884620666504, -4.624844074249268, -4.440803527832031, -4.256762981414795, -4.072722434997559, -3.888681650161743, -3.704641103744507, -3.5206003189086914, -3.336560010910034, -3.152519464492798, -2.9684789180755615, -2.784438133239746, -2.6003975868225098, -2.4163570404052734, -2.232316493988037, -2.048275947570801, -1.864235281944275, -1.6801947355270386, -1.4961540699005127, -1.3121135234832764, -1.12807297706604, -0.9440323114395142, -0.7599917650222778, -0.575951099395752, -0.3919105529785156, -0.20786996185779572, -0.023829370737075806, 0.1602112054824829, 0.344251811504364, 0.5282924175262451, 0.7123329639434814, 0.8963736295700073, 1.0804141759872437, 1.26445472240448, 1.4484953880310059, 1.6325359344482422, 1.8165764808654785, 2.000617027282715, 2.184657573699951, 2.3686983585357666, 2.552738904953003, 2.7367794513702393, 2.9208199977874756, 3.104860782623291, 3.2889013290405273, 3.4729418754577637, 3.656982421875, 3.8410229682922363, 4.025063514709473, 4.209104061126709, 4.393144607543945, 4.577185153961182, 4.761225700378418, 4.9452667236328125, 5.129306793212891, 5.313347816467285, 5.4973883628845215]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 10.0, 10.0, 14.0, 19.0, 25.0, 37.0, 68.0, 98.0, 161.0, 268.0, 472.0, 929.0, 1869.0, 4622.0, 14504.0, 71649.0, 753253.0, 2914212.0, 367876.0, 45644.0, 11165.0, 3858.0, 1707.0, 817.0, 395.0, 240.0, 113.0, 92.0, 47.0, 37.0, 15.0, 13.0, 10.0, 7.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.796875, -0.77496337890625, -0.7530517578125, -0.73114013671875, -0.709228515625, -0.68731689453125, -0.6654052734375, -0.64349365234375, -0.62158203125, -0.59967041015625, -0.5777587890625, -0.55584716796875, -0.533935546875, -0.51202392578125, -0.4901123046875, -0.46820068359375, -0.4462890625, -0.42437744140625, -0.4024658203125, -0.38055419921875, -0.358642578125, -0.33673095703125, -0.3148193359375, -0.29290771484375, -0.27099609375, -0.24908447265625, -0.2271728515625, -0.20526123046875, -0.183349609375, -0.16143798828125, -0.1395263671875, -0.11761474609375, -0.095703125, -0.07379150390625, -0.0518798828125, -0.02996826171875, -0.008056640625, 0.01385498046875, 0.0357666015625, 0.05767822265625, 0.07958984375, 0.10150146484375, 0.1234130859375, 0.14532470703125, 0.167236328125, 0.18914794921875, 0.2110595703125, 0.23297119140625, 0.2548828125, 0.27679443359375, 0.2987060546875, 0.32061767578125, 0.342529296875, 0.36444091796875, 0.3863525390625, 0.40826416015625, 0.43017578125, 0.45208740234375, 0.4739990234375, 0.49591064453125, 0.517822265625, 0.53973388671875, 0.5616455078125, 0.58355712890625, 0.60546875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 11.0, 10.0, 15.0, 19.0, 23.0, 24.0, 39.0, 45.0, 52.0, 61.0, 62.0, 66.0, 71.0, 79.0, 72.0, 64.0, 49.0, 45.0, 45.0, 28.0, 34.0, 22.0, 18.0, 15.0, 8.0, 7.0, 3.0, 2.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.71728515625, -0.6993064880371094, -0.6813278198242188, -0.6633491516113281, -0.6453704833984375, -0.6273918151855469, -0.6094131469726562, -0.5914344787597656, -0.573455810546875, -0.5554771423339844, -0.5374984741210938, -0.5195198059082031, -0.5015411376953125, -0.4835624694824219, -0.46558380126953125, -0.4476051330566406, -0.42962646484375, -0.4116477966308594, -0.39366912841796875, -0.3756904602050781, -0.3577117919921875, -0.3397331237792969, -0.32175445556640625, -0.3037757873535156, -0.285797119140625, -0.2678184509277344, -0.24983978271484375, -0.23186111450195312, -0.2138824462890625, -0.19590377807617188, -0.17792510986328125, -0.15994644165039062, -0.1419677734375, -0.12398910522460938, -0.10601043701171875, -0.08803176879882812, -0.0700531005859375, -0.052074432373046875, -0.03409576416015625, -0.016117095947265625, 0.001861572265625, 0.019840240478515625, 0.03781890869140625, 0.055797576904296875, 0.0737762451171875, 0.09175491333007812, 0.10973358154296875, 0.12771224975585938, 0.14569091796875, 0.16366958618164062, 0.18164825439453125, 0.19962692260742188, 0.2176055908203125, 0.23558425903320312, 0.25356292724609375, 0.2715415954589844, 0.289520263671875, 0.3074989318847656, 0.32547760009765625, 0.3434562683105469, 0.3614349365234375, 0.3794136047363281, 0.39739227294921875, 0.4153709411621094, 0.433349609375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 8.0, 3.0, 14.0, 26.0, 32.0, 62.0, 122.0, 231.0, 582.0, 2167.0, 12807.0, 304873.0, 3770991.0, 92902.0, 7141.0, 1396.0, 460.0, 212.0, 113.0, 58.0, 25.0, 20.0, 9.0, 8.0, 7.0, 6.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.75390625, -1.705657958984375, -1.65740966796875, -1.609161376953125, -1.5609130859375, -1.512664794921875, -1.46441650390625, -1.416168212890625, -1.367919921875, -1.319671630859375, -1.27142333984375, -1.223175048828125, -1.1749267578125, -1.126678466796875, -1.07843017578125, -1.030181884765625, -0.98193359375, -0.933685302734375, -0.88543701171875, -0.837188720703125, -0.7889404296875, -0.740692138671875, -0.69244384765625, -0.644195556640625, -0.595947265625, -0.547698974609375, -0.49945068359375, -0.451202392578125, -0.4029541015625, -0.354705810546875, -0.30645751953125, -0.258209228515625, -0.2099609375, -0.161712646484375, -0.11346435546875, -0.065216064453125, -0.0169677734375, 0.031280517578125, 0.07952880859375, 0.127777099609375, 0.176025390625, 0.224273681640625, 0.27252197265625, 0.320770263671875, 0.3690185546875, 0.417266845703125, 0.46551513671875, 0.513763427734375, 0.56201171875, 0.610260009765625, 0.65850830078125, 0.706756591796875, 0.7550048828125, 0.803253173828125, 0.85150146484375, 0.899749755859375, 0.947998046875, 0.996246337890625, 1.04449462890625, 1.092742919921875, 1.1409912109375, 1.189239501953125, 1.23748779296875, 1.285736083984375, 1.333984375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 6.0, 5.0, 15.0, 17.0, 25.0, 44.0, 82.0, 167.0, 290.0, 543.0, 825.0, 887.0, 518.0, 258.0, 152.0, 87.0, 58.0, 36.0, 25.0, 13.0, 8.0, 10.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6435546875, -0.6096038818359375, -0.575653076171875, -0.5417022705078125, -0.50775146484375, -0.4738006591796875, -0.439849853515625, -0.4058990478515625, -0.3719482421875, -0.3379974365234375, -0.304046630859375, -0.2700958251953125, -0.23614501953125, -0.2021942138671875, -0.168243408203125, -0.1342926025390625, -0.100341796875, -0.0663909912109375, -0.032440185546875, 0.0015106201171875, 0.03546142578125, 0.0694122314453125, 0.103363037109375, 0.1373138427734375, 0.1712646484375, 0.2052154541015625, 0.239166259765625, 0.2731170654296875, 0.30706787109375, 0.3410186767578125, 0.374969482421875, 0.4089202880859375, 0.44287109375, 0.4768218994140625, 0.510772705078125, 0.5447235107421875, 0.57867431640625, 0.6126251220703125, 0.646575927734375, 0.6805267333984375, 0.7144775390625, 0.7484283447265625, 0.782379150390625, 0.8163299560546875, 0.85028076171875, 0.8842315673828125, 0.918182373046875, 0.9521331787109375, 0.986083984375, 1.0200347900390625, 1.053985595703125, 1.0879364013671875, 1.12188720703125, 1.1558380126953125, 1.189788818359375, 1.2237396240234375, 1.2576904296875, 1.2916412353515625, 1.325592041015625, 1.3595428466796875, 1.39349365234375, 1.4274444580078125, 1.461395263671875, 1.4953460693359375, 1.529296875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 25.0, 52.0, 130.0, 246.0, 240.0, 158.0, 81.0, 34.0, 12.0, 9.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.039699554443359, -5.663516998291016, -5.287333965301514, -4.91115140914917, -4.534968852996826, -4.158785820007324, -3.7826032638549805, -3.4064207077026367, -3.030237913131714, -2.654055118560791, -2.2778725624084473, -1.9016897678375244, -1.5255070924758911, -1.1493244171142578, -0.773141622543335, -0.3969590663909912, -0.02077627182006836, 0.35540643334388733, 0.731589138507843, 1.107771873474121, 1.4839545488357544, 1.8601372241973877, 2.2363200187683105, 2.6125025749206543, 2.988685369491577, 3.3648681640625, 3.7410507202148438, 4.1172332763671875, 4.4934163093566895, 4.869598865509033, 5.245781898498535, 5.621964454650879, 5.998147010803223, 6.374329566955566, 6.750512599945068, 7.126695156097412, 7.502877712249756, 7.879060745239258, 8.255243301391602, 8.631425857543945, 9.007608413696289, 9.383790969848633, 9.759973526000977, 10.13615608215332, 10.51233959197998, 10.888522148132324, 11.264704704284668, 11.640887260437012, 12.017070770263672, 12.393253326416016, 12.76943588256836, 13.145618438720703, 13.521801948547363, 13.897984504699707, 14.27416706085205, 14.650349617004395, 15.026532173156738, 15.402714729309082, 15.778897285461426, 16.155080795288086, 16.53126335144043, 16.907445907592773, 17.283628463745117, 17.65981101989746, 18.035993576049805]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 4.0, 7.0, 8.0, 7.0, 6.0, 12.0, 10.0, 29.0, 12.0, 17.0, 26.0, 35.0, 32.0, 34.0, 40.0, 32.0, 36.0, 35.0, 48.0, 49.0, 47.0, 41.0, 43.0, 35.0, 35.0, 36.0, 29.0, 42.0, 37.0, 18.0, 21.0, 27.0, 25.0, 14.0, 13.0, 11.0, 15.0, 5.0, 6.0, 5.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.1443800926208496, -3.0447545051574707, -2.945128917694092, -2.845503330230713, -2.745877981185913, -2.646252393722534, -2.5466268062591553, -2.4470012187957764, -2.3473758697509766, -2.2477502822875977, -2.1481246948242188, -2.04849910736084, -1.94887375831604, -1.8492481708526611, -1.7496225833892822, -1.6499969959259033, -1.5503714084625244, -1.4507458209991455, -1.3511203527450562, -1.2514947652816772, -1.151869297027588, -1.052243709564209, -0.9526181221008301, -0.852992594242096, -0.7533670663833618, -0.6537415385246277, -0.5541160106658936, -0.45449042320251465, -0.3548648953437805, -0.2552393674850464, -0.15561378002166748, -0.05598825216293335, 0.04363751411437988, 0.1432630568742752, 0.24288859963417053, 0.34251415729522705, 0.4421396851539612, 0.5417652130126953, 0.6413908004760742, 0.7410163283348083, 0.8406418561935425, 0.9402673840522766, 1.0398929119110107, 1.1395184993743896, 1.2391440868377686, 1.338769555091858, 1.4383951425552368, 1.5380206108093262, 1.637646198272705, 1.737271785736084, 1.8368972539901733, 1.9365228414535522, 2.0361483097076416, 2.1357738971710205, 2.2353994846343994, 2.3350250720977783, 2.434650421142578, 2.534276008605957, 2.633901596069336, 2.733527183532715, 2.8331525325775146, 2.9327781200408936, 3.0324037075042725, 3.1320292949676514, 3.2316548824310303]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 8.0, 7.0, 13.0, 10.0, 26.0, 20.0, 45.0, 56.0, 92.0, 192.0, 321.0, 724.0, 1633.0, 4212.0, 12713.0, 44998.0, 177279.0, 461509.0, 252659.0, 64735.0, 17789.0, 5646.0, 2026.0, 882.0, 409.0, 205.0, 119.0, 85.0, 54.0, 30.0, 13.0, 14.0, 8.0, 9.0, 7.0, 5.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.97216796875, -0.9440994262695312, -0.9160308837890625, -0.8879623413085938, -0.859893798828125, -0.8318252563476562, -0.8037567138671875, -0.7756881713867188, -0.74761962890625, -0.7195510864257812, -0.6914825439453125, -0.6634140014648438, -0.635345458984375, -0.6072769165039062, -0.5792083740234375, -0.5511398315429688, -0.5230712890625, -0.49500274658203125, -0.4669342041015625, -0.43886566162109375, -0.410797119140625, -0.38272857666015625, -0.3546600341796875, -0.32659149169921875, -0.29852294921875, -0.27045440673828125, -0.2423858642578125, -0.21431732177734375, -0.186248779296875, -0.15818023681640625, -0.1301116943359375, -0.10204315185546875, -0.073974609375, -0.04590606689453125, -0.0178375244140625, 0.01023101806640625, 0.038299560546875, 0.06636810302734375, 0.0944366455078125, 0.12250518798828125, 0.15057373046875, 0.17864227294921875, 0.2067108154296875, 0.23477935791015625, 0.262847900390625, 0.29091644287109375, 0.3189849853515625, 0.34705352783203125, 0.3751220703125, 0.40319061279296875, 0.4312591552734375, 0.45932769775390625, 0.487396240234375, 0.5154647827148438, 0.5435333251953125, 0.5716018676757812, 0.59967041015625, 0.6277389526367188, 0.6558074951171875, 0.6838760375976562, 0.711944580078125, 0.7400131225585938, 0.7680816650390625, 0.7961502075195312, 0.82421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 9.0, 4.0, 11.0, 20.0, 15.0, 14.0, 28.0, 30.0, 47.0, 41.0, 58.0, 71.0, 73.0, 67.0, 55.0, 65.0, 65.0, 50.0, 76.0, 40.0, 41.0, 31.0, 15.0, 21.0, 16.0, 14.0, 10.0, 8.0, 3.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.7216796875, -0.7037773132324219, -0.6858749389648438, -0.6679725646972656, -0.6500701904296875, -0.6321678161621094, -0.6142654418945312, -0.5963630676269531, -0.578460693359375, -0.5605583190917969, -0.5426559448242188, -0.5247535705566406, -0.5068511962890625, -0.4889488220214844, -0.47104644775390625, -0.4531440734863281, -0.43524169921875, -0.4173393249511719, -0.39943695068359375, -0.3815345764160156, -0.3636322021484375, -0.3457298278808594, -0.32782745361328125, -0.3099250793457031, -0.292022705078125, -0.2741203308105469, -0.25621795654296875, -0.23831558227539062, -0.2204132080078125, -0.20251083374023438, -0.18460845947265625, -0.16670608520507812, -0.1488037109375, -0.13090133666992188, -0.11299896240234375, -0.09509658813476562, -0.0771942138671875, -0.059291839599609375, -0.04138946533203125, -0.023487091064453125, -0.005584716796875, 0.012317657470703125, 0.03022003173828125, 0.048122406005859375, 0.0660247802734375, 0.08392715454101562, 0.10182952880859375, 0.11973190307617188, 0.13763427734375, 0.15553665161132812, 0.17343902587890625, 0.19134140014648438, 0.2092437744140625, 0.22714614868164062, 0.24504852294921875, 0.2629508972167969, 0.280853271484375, 0.2987556457519531, 0.31665802001953125, 0.3345603942871094, 0.3524627685546875, 0.3703651428222656, 0.38826751708984375, 0.4061698913574219, 0.424072265625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 13.0, 14.0, 22.0, 28.0, 34.0, 52.0, 69.0, 85.0, 118.0, 177.0, 264.0, 446.0, 728.0, 1601.0, 3910.0, 12117.0, 48850.0, 242575.0, 608017.0, 96621.0, 21390.0, 6250.0, 2390.0, 1028.0, 592.0, 350.0, 219.0, 168.0, 112.0, 67.0, 56.0, 37.0, 32.0, 28.0, 18.0, 16.0, 10.0, 7.0, 6.0, 3.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0615234375, -1.0295639038085938, -0.9976043701171875, -0.9656448364257812, -0.933685302734375, -0.9017257690429688, -0.8697662353515625, -0.8378067016601562, -0.80584716796875, -0.7738876342773438, -0.7419281005859375, -0.7099685668945312, -0.678009033203125, -0.6460494995117188, -0.6140899658203125, -0.5821304321289062, -0.5501708984375, -0.5182113647460938, -0.4862518310546875, -0.45429229736328125, -0.422332763671875, -0.39037322998046875, -0.3584136962890625, -0.32645416259765625, -0.29449462890625, -0.26253509521484375, -0.2305755615234375, -0.19861602783203125, -0.166656494140625, -0.13469696044921875, -0.1027374267578125, -0.07077789306640625, -0.038818359375, -0.00685882568359375, 0.0251007080078125, 0.05706024169921875, 0.089019775390625, 0.12097930908203125, 0.1529388427734375, 0.18489837646484375, 0.21685791015625, 0.24881744384765625, 0.2807769775390625, 0.31273651123046875, 0.344696044921875, 0.37665557861328125, 0.4086151123046875, 0.44057464599609375, 0.4725341796875, 0.5044937133789062, 0.5364532470703125, 0.5684127807617188, 0.600372314453125, 0.6323318481445312, 0.6642913818359375, 0.6962509155273438, 0.72821044921875, 0.7601699829101562, 0.7921295166015625, 0.8240890502929688, 0.856048583984375, 0.8880081176757812, 0.9199676513671875, 0.9519271850585938, 0.98388671875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 8.0, 9.0, 8.0, 12.0, 23.0, 20.0, 25.0, 36.0, 31.0, 54.0, 60.0, 54.0, 51.0, 60.0, 63.0, 71.0, 62.0, 50.0, 43.0, 50.0, 29.0, 32.0, 35.0, 24.0, 23.0, 18.0, 7.0, 8.0, 10.0, 2.0, 4.0, 8.0, 2.0, 4.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8427734375, -1.7877960205078125, -1.732818603515625, -1.6778411865234375, -1.62286376953125, -1.5678863525390625, -1.512908935546875, -1.4579315185546875, -1.4029541015625, -1.3479766845703125, -1.292999267578125, -1.2380218505859375, -1.18304443359375, -1.1280670166015625, -1.073089599609375, -1.0181121826171875, -0.963134765625, -0.9081573486328125, -0.853179931640625, -0.7982025146484375, -0.74322509765625, -0.6882476806640625, -0.633270263671875, -0.5782928466796875, -0.5233154296875, -0.4683380126953125, -0.413360595703125, -0.3583831787109375, -0.30340576171875, -0.2484283447265625, -0.193450927734375, -0.1384735107421875, -0.08349609375, -0.0285186767578125, 0.026458740234375, 0.0814361572265625, 0.13641357421875, 0.1913909912109375, 0.246368408203125, 0.3013458251953125, 0.3563232421875, 0.4113006591796875, 0.466278076171875, 0.5212554931640625, 0.57623291015625, 0.6312103271484375, 0.686187744140625, 0.7411651611328125, 0.796142578125, 0.8511199951171875, 0.906097412109375, 0.9610748291015625, 1.01605224609375, 1.0710296630859375, 1.126007080078125, 1.1809844970703125, 1.2359619140625, 1.2909393310546875, 1.345916748046875, 1.4008941650390625, 1.45587158203125, 1.5108489990234375, 1.565826416015625, 1.6208038330078125, 1.67578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 3.0, 17.0, 15.0, 16.0, 26.0, 50.0, 83.0, 118.0, 210.0, 426.0, 925.0, 2199.0, 6381.0, 21665.0, 90984.0, 713862.0, 163602.0, 33079.0, 9396.0, 3064.0, 1243.0, 537.0, 264.0, 137.0, 76.0, 55.0, 31.0, 29.0, 14.0, 8.0, 8.0, 6.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.365966796875, -0.35509490966796875, -0.3442230224609375, -0.33335113525390625, -0.322479248046875, -0.31160736083984375, -0.3007354736328125, -0.28986358642578125, -0.27899169921875, -0.26811981201171875, -0.2572479248046875, -0.24637603759765625, -0.235504150390625, -0.22463226318359375, -0.2137603759765625, -0.20288848876953125, -0.1920166015625, -0.18114471435546875, -0.1702728271484375, -0.15940093994140625, -0.148529052734375, -0.13765716552734375, -0.1267852783203125, -0.11591339111328125, -0.10504150390625, -0.09416961669921875, -0.0832977294921875, -0.07242584228515625, -0.061553955078125, -0.05068206787109375, -0.0398101806640625, -0.02893829345703125, -0.01806640625, -0.00719451904296875, 0.0036773681640625, 0.01454925537109375, 0.025421142578125, 0.03629302978515625, 0.0471649169921875, 0.05803680419921875, 0.06890869140625, 0.07978057861328125, 0.0906524658203125, 0.10152435302734375, 0.112396240234375, 0.12326812744140625, 0.1341400146484375, 0.14501190185546875, 0.1558837890625, 0.16675567626953125, 0.1776275634765625, 0.18849945068359375, 0.199371337890625, 0.21024322509765625, 0.2211151123046875, 0.23198699951171875, 0.24285888671875, 0.25373077392578125, 0.2646026611328125, 0.27547454833984375, 0.286346435546875, 0.29721832275390625, 0.3080902099609375, 0.31896209716796875, 0.329833984375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 4.0, 4.0, 6.0, 7.0, 14.0, 13.0, 16.0, 24.0, 33.0, 38.0, 44.0, 67.0, 72.0, 90.0, 100.0, 99.0, 60.0, 50.0, 40.0, 34.0, 41.0, 25.0, 13.0, 18.0, 14.0, 9.0, 9.0, 9.0, 4.0, 6.0, 2.0, 2.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.288290023803711e-05, -6.093643605709076e-05, -5.898997187614441e-05, -5.704350769519806e-05, -5.509704351425171e-05, -5.315057933330536e-05, -5.120411515235901e-05, -4.925765097141266e-05, -4.731118679046631e-05, -4.536472260951996e-05, -4.341825842857361e-05, -4.147179424762726e-05, -3.952533006668091e-05, -3.757886588573456e-05, -3.563240170478821e-05, -3.368593752384186e-05, -3.173947334289551e-05, -2.9793009161949158e-05, -2.7846544981002808e-05, -2.5900080800056458e-05, -2.3953616619110107e-05, -2.2007152438163757e-05, -2.0060688257217407e-05, -1.8114224076271057e-05, -1.6167759895324707e-05, -1.4221295714378357e-05, -1.2274831533432007e-05, -1.0328367352485657e-05, -8.381903171539307e-06, -6.4354389905929565e-06, -4.4889748096466064e-06, -2.5425106287002563e-06, -5.960464477539062e-07, 1.3504177331924438e-06, 3.296881914138794e-06, 5.243346095085144e-06, 7.189810276031494e-06, 9.136274456977844e-06, 1.1082738637924194e-05, 1.3029202818870544e-05, 1.4975666999816895e-05, 1.6922131180763245e-05, 1.8868595361709595e-05, 2.0815059542655945e-05, 2.2761523723602295e-05, 2.4707987904548645e-05, 2.6654452085494995e-05, 2.8600916266441345e-05, 3.0547380447387695e-05, 3.2493844628334045e-05, 3.4440308809280396e-05, 3.6386772990226746e-05, 3.8333237171173096e-05, 4.0279701352119446e-05, 4.2226165533065796e-05, 4.4172629714012146e-05, 4.6119093894958496e-05, 4.8065558075904846e-05, 5.0012022256851196e-05, 5.1958486437797546e-05, 5.3904950618743896e-05, 5.5851414799690247e-05, 5.77978789806366e-05, 5.974434316158295e-05, 6.16908073425293e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 2.0, 2.0, 9.0, 10.0, 16.0, 26.0, 38.0, 65.0, 84.0, 120.0, 205.0, 331.0, 574.0, 1094.0, 2435.0, 5712.0, 15472.0, 49339.0, 210132.0, 623015.0, 96859.0, 26931.0, 9026.0, 3573.0, 1577.0, 819.0, 397.0, 235.0, 143.0, 93.0, 70.0, 42.0, 27.0, 26.0, 19.0, 12.0, 8.0, 3.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.343017578125, -0.3340492248535156, -0.32508087158203125, -0.3161125183105469, -0.3071441650390625, -0.2981758117675781, -0.28920745849609375, -0.2802391052246094, -0.271270751953125, -0.2623023986816406, -0.25333404541015625, -0.24436569213867188, -0.2353973388671875, -0.22642898559570312, -0.21746063232421875, -0.20849227905273438, -0.19952392578125, -0.19055557250976562, -0.18158721923828125, -0.17261886596679688, -0.1636505126953125, -0.15468215942382812, -0.14571380615234375, -0.13674545288085938, -0.127777099609375, -0.11880874633789062, -0.10984039306640625, -0.10087203979492188, -0.0919036865234375, -0.08293533325195312, -0.07396697998046875, -0.06499862670898438, -0.0560302734375, -0.047061920166015625, -0.03809356689453125, -0.029125213623046875, -0.0201568603515625, -0.011188507080078125, -0.00222015380859375, 0.006748199462890625, 0.015716552734375, 0.024684906005859375, 0.03365325927734375, 0.042621612548828125, 0.0515899658203125, 0.060558319091796875, 0.06952667236328125, 0.07849502563476562, 0.08746337890625, 0.09643173217773438, 0.10540008544921875, 0.11436843872070312, 0.1233367919921875, 0.13230514526367188, 0.14127349853515625, 0.15024185180664062, 0.159210205078125, 0.16817855834960938, 0.17714691162109375, 0.18611526489257812, 0.1950836181640625, 0.20405197143554688, 0.21302032470703125, 0.22198867797851562, 0.23095703125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 4.0, 1.0, 5.0, 4.0, 7.0, 6.0, 11.0, 9.0, 16.0, 20.0, 21.0, 28.0, 30.0, 42.0, 48.0, 51.0, 77.0, 74.0, 93.0, 82.0, 74.0, 65.0, 45.0, 24.0, 23.0, 29.0, 24.0, 15.0, 7.0, 14.0, 6.0, 7.0, 9.0, 9.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24169921875, -0.23376083374023438, -0.22582244873046875, -0.21788406372070312, -0.2099456787109375, -0.20200729370117188, -0.19406890869140625, -0.18613052368164062, -0.178192138671875, -0.17025375366210938, -0.16231536865234375, -0.15437698364257812, -0.1464385986328125, -0.13850021362304688, -0.13056182861328125, -0.12262344360351562, -0.11468505859375, -0.10674667358398438, -0.09880828857421875, -0.09086990356445312, -0.0829315185546875, -0.07499313354492188, -0.06705474853515625, -0.059116363525390625, -0.051177978515625, -0.043239593505859375, -0.03530120849609375, -0.027362823486328125, -0.0194244384765625, -0.011486053466796875, -0.00354766845703125, 0.004390716552734375, 0.0123291015625, 0.020267486572265625, 0.02820587158203125, 0.036144256591796875, 0.0440826416015625, 0.052021026611328125, 0.05995941162109375, 0.06789779663085938, 0.075836181640625, 0.08377456665039062, 0.09171295166015625, 0.09965133666992188, 0.1075897216796875, 0.11552810668945312, 0.12346649169921875, 0.13140487670898438, 0.13934326171875, 0.14728164672851562, 0.15522003173828125, 0.16315841674804688, 0.1710968017578125, 0.17903518676757812, 0.18697357177734375, 0.19491195678710938, 0.202850341796875, 0.21078872680664062, 0.21872711181640625, 0.22666549682617188, 0.2346038818359375, 0.24254226684570312, 0.25048065185546875, 0.2584190368652344, 0.266357421875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 6.0, 13.0, 26.0, 39.0, 56.0, 120.0, 206.0, 220.0, 115.0, 71.0, 36.0, 27.0, 17.0, 12.0, 11.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.064403057098389, -3.8263871669769287, -3.5883710384368896, -3.3503551483154297, -3.1123390197753906, -2.8743231296539307, -2.6363072395324707, -2.3982911109924316, -2.1602752208709717, -1.9222592115402222, -1.6842432022094727, -1.4462273120880127, -1.2082113027572632, -0.9701952934265137, -0.7321794033050537, -0.4941633939743042, -0.2561473846435547, -0.018131405115127563, 0.21988457441329956, 0.4579005241394043, 0.6959165334701538, 0.9339325428009033, 1.1719484329223633, 1.4099644422531128, 1.6479804515838623, 1.8859964609146118, 2.1240124702453613, 2.3620283603668213, 2.6000442504882812, 2.8380603790283203, 3.0760762691497803, 3.3140921592712402, 3.5521087646484375, 3.7901246547698975, 4.028140544891357, 4.2661566734313965, 4.5041728019714355, 4.742188453674316, 4.9802045822143555, 5.2182207107543945, 5.456236839294434, 5.694252967834473, 5.9322686195373535, 6.170284748077393, 6.408300876617432, 6.6463165283203125, 6.884332656860352, 7.122348785400391, 7.3603644371032715, 7.5983805656433105, 7.836396217346191, 8.07441234588623, 8.31242847442627, 8.550444602966309, 8.788459777832031, 9.02647590637207, 9.26449203491211, 9.502508163452148, 9.740524291992188, 9.978540420532227, 10.21655559539795, 10.454571723937988, 10.692587852478027, 10.930603981018066, 11.168620109558105]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 4.0, 7.0, 8.0, 7.0, 9.0, 20.0, 23.0, 17.0, 22.0, 28.0, 33.0, 38.0, 33.0, 33.0, 44.0, 99.0, 103.0, 91.0, 55.0, 46.0, 28.0, 39.0, 23.0, 27.0, 22.0, 35.0, 17.0, 18.0, 13.0, 0.0, 11.0, 7.0, 4.0, 9.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.554224967956543, -5.378848075866699, -5.203471660614014, -5.028095245361328, -4.852718353271484, -4.677341461181641, -4.501965045928955, -4.3265886306762695, -4.151211738586426, -3.975835084915161, -3.8004584312438965, -3.625081777572632, -3.449705123901367, -3.2743284702301025, -3.098951816558838, -2.9235751628875732, -2.7481985092163086, -2.572821855545044, -2.3974452018737793, -2.2220685482025146, -2.04669189453125, -1.8713152408599854, -1.6959385871887207, -1.520561933517456, -1.3451852798461914, -1.1698086261749268, -0.9944319725036621, -0.8190553188323975, -0.6436786651611328, -0.46830201148986816, -0.2929253578186035, -0.11754870414733887, 0.05782794952392578, 0.23320460319519043, 0.4085812568664551, 0.5839579105377197, 0.7593345642089844, 0.934711217880249, 1.1100878715515137, 1.2854645252227783, 1.460841178894043, 1.6362178325653076, 1.8115944862365723, 1.986971139907837, 2.1623477935791016, 2.337724447250366, 2.513101100921631, 2.6884777545928955, 2.86385440826416, 3.039231061935425, 3.2146077156066895, 3.389984369277954, 3.5653610229492188, 3.7407376766204834, 3.916114330291748, 4.091490745544434, 4.266867637634277, 4.442244529724121, 4.617620944976807, 4.792997360229492, 4.968374252319336, 5.14375114440918, 5.319127559661865, 5.494503974914551, 5.6698808670043945]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 12.0, 20.0, 13.0, 20.0, 39.0, 69.0, 83.0, 126.0, 238.0, 445.0, 769.0, 1595.0, 3760.0, 11425.0, 58023.0, 729596.0, 3006143.0, 331740.0, 35846.0, 8545.0, 2969.0, 1291.0, 657.0, 349.0, 200.0, 108.0, 75.0, 37.0, 28.0, 26.0, 7.0, 10.0, 7.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7275390625, -0.7009506225585938, -0.6743621826171875, -0.6477737426757812, -0.621185302734375, -0.5945968627929688, -0.5680084228515625, -0.5414199829101562, -0.51483154296875, -0.48824310302734375, -0.4616546630859375, -0.43506622314453125, -0.408477783203125, -0.38188934326171875, -0.3553009033203125, -0.32871246337890625, -0.3021240234375, -0.27553558349609375, -0.2489471435546875, -0.22235870361328125, -0.195770263671875, -0.16918182373046875, -0.1425933837890625, -0.11600494384765625, -0.08941650390625, -0.06282806396484375, -0.0362396240234375, -0.00965118408203125, 0.016937255859375, 0.04352569580078125, 0.0701141357421875, 0.09670257568359375, 0.123291015625, 0.14987945556640625, 0.1764678955078125, 0.20305633544921875, 0.229644775390625, 0.25623321533203125, 0.2828216552734375, 0.30941009521484375, 0.33599853515625, 0.36258697509765625, 0.3891754150390625, 0.41576385498046875, 0.442352294921875, 0.46894073486328125, 0.4955291748046875, 0.5221176147460938, 0.5487060546875, 0.5752944946289062, 0.6018829345703125, 0.6284713745117188, 0.655059814453125, 0.6816482543945312, 0.7082366943359375, 0.7348251342773438, 0.76141357421875, 0.7880020141601562, 0.8145904541015625, 0.8411788940429688, 0.867767333984375, 0.8943557739257812, 0.9209442138671875, 0.9475326538085938, 0.97412109375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 10.0, 10.0, 8.0, 14.0, 11.0, 16.0, 26.0, 42.0, 38.0, 50.0, 32.0, 50.0, 58.0, 44.0, 61.0, 65.0, 47.0, 40.0, 49.0, 37.0, 41.0, 46.0, 40.0, 24.0, 37.0, 25.0, 13.0, 17.0, 8.0, 13.0, 8.0, 11.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.52685546875, -0.512847900390625, -0.49884033203125, -0.484832763671875, -0.4708251953125, -0.456817626953125, -0.44281005859375, -0.428802490234375, -0.414794921875, -0.400787353515625, -0.38677978515625, -0.372772216796875, -0.3587646484375, -0.344757080078125, -0.33074951171875, -0.316741943359375, -0.302734375, -0.288726806640625, -0.27471923828125, -0.260711669921875, -0.2467041015625, -0.232696533203125, -0.21868896484375, -0.204681396484375, -0.190673828125, -0.176666259765625, -0.16265869140625, -0.148651123046875, -0.1346435546875, -0.120635986328125, -0.10662841796875, -0.092620849609375, -0.07861328125, -0.064605712890625, -0.05059814453125, -0.036590576171875, -0.0225830078125, -0.008575439453125, 0.00543212890625, 0.019439697265625, 0.033447265625, 0.047454833984375, 0.06146240234375, 0.075469970703125, 0.0894775390625, 0.103485107421875, 0.11749267578125, 0.131500244140625, 0.1455078125, 0.159515380859375, 0.17352294921875, 0.187530517578125, 0.2015380859375, 0.215545654296875, 0.22955322265625, 0.243560791015625, 0.257568359375, 0.271575927734375, 0.28558349609375, 0.299591064453125, 0.3135986328125, 0.327606201171875, 0.34161376953125, 0.355621337890625, 0.36962890625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 6.0, 1.0, 7.0, 7.0, 11.0, 22.0, 22.0, 40.0, 50.0, 99.0, 199.0, 403.0, 1034.0, 3331.0, 19067.0, 294660.0, 3643321.0, 212170.0, 15627.0, 2658.0, 813.0, 320.0, 161.0, 86.0, 56.0, 33.0, 25.0, 17.0, 11.0, 11.0, 6.0, 1.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1630859375, -1.1248931884765625, -1.086700439453125, -1.0485076904296875, -1.01031494140625, -0.9721221923828125, -0.933929443359375, -0.8957366943359375, -0.8575439453125, -0.8193511962890625, -0.781158447265625, -0.7429656982421875, -0.70477294921875, -0.6665802001953125, -0.628387451171875, -0.5901947021484375, -0.552001953125, -0.5138092041015625, -0.475616455078125, -0.4374237060546875, -0.39923095703125, -0.3610382080078125, -0.322845458984375, -0.2846527099609375, -0.2464599609375, -0.2082672119140625, -0.170074462890625, -0.1318817138671875, -0.09368896484375, -0.0554962158203125, -0.017303466796875, 0.0208892822265625, 0.05908203125, 0.0972747802734375, 0.135467529296875, 0.1736602783203125, 0.21185302734375, 0.2500457763671875, 0.288238525390625, 0.3264312744140625, 0.3646240234375, 0.4028167724609375, 0.441009521484375, 0.4792022705078125, 0.51739501953125, 0.5555877685546875, 0.593780517578125, 0.6319732666015625, 0.670166015625, 0.7083587646484375, 0.746551513671875, 0.7847442626953125, 0.82293701171875, 0.8611297607421875, 0.899322509765625, 0.9375152587890625, 0.9757080078125, 1.0139007568359375, 1.052093505859375, 1.0902862548828125, 1.12847900390625, 1.1666717529296875, 1.204864501953125, 1.2430572509765625, 1.28125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 8.0, 8.0, 16.0, 17.0, 24.0, 42.0, 56.0, 115.0, 173.0, 236.0, 398.0, 646.0, 705.0, 572.0, 391.0, 221.0, 131.0, 101.0, 68.0, 37.0, 32.0, 20.0, 15.0, 12.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.2529296875, -1.2240524291992188, -1.1951751708984375, -1.1662979125976562, -1.137420654296875, -1.1085433959960938, -1.0796661376953125, -1.0507888793945312, -1.02191162109375, -0.9930343627929688, -0.9641571044921875, -0.9352798461914062, -0.906402587890625, -0.8775253295898438, -0.8486480712890625, -0.8197708129882812, -0.7908935546875, -0.7620162963867188, -0.7331390380859375, -0.7042617797851562, -0.675384521484375, -0.6465072631835938, -0.6176300048828125, -0.5887527465820312, -0.55987548828125, -0.5309982299804688, -0.5021209716796875, -0.47324371337890625, -0.444366455078125, -0.41548919677734375, -0.3866119384765625, -0.35773468017578125, -0.328857421875, -0.29998016357421875, -0.2711029052734375, -0.24222564697265625, -0.213348388671875, -0.18447113037109375, -0.1555938720703125, -0.12671661376953125, -0.09783935546875, -0.06896209716796875, -0.0400848388671875, -0.01120758056640625, 0.017669677734375, 0.04654693603515625, 0.0754241943359375, 0.10430145263671875, 0.1331787109375, 0.16205596923828125, 0.1909332275390625, 0.21981048583984375, 0.248687744140625, 0.27756500244140625, 0.3064422607421875, 0.33531951904296875, 0.36419677734375, 0.39307403564453125, 0.4219512939453125, 0.45082855224609375, 0.479705810546875, 0.5085830688476562, 0.5374603271484375, 0.5663375854492188, 0.59521484375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 8.0, 10.0, 17.0, 30.0, 48.0, 62.0, 126.0, 154.0, 179.0, 147.0, 94.0, 61.0, 30.0, 14.0, 12.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.818429946899414, -8.582716941833496, -8.347002983093262, -8.111289978027344, -7.875576496124268, -7.639863014221191, -7.404149532318115, -7.168436050415039, -6.932723045349121, -6.697009563446045, -6.461296081542969, -6.225583076477051, -5.989869594573975, -5.754156112670898, -5.518442630767822, -5.282729148864746, -5.04701566696167, -4.811302185058594, -4.575588703155518, -4.339875221252441, -4.104162216186523, -3.8684487342834473, -3.632735252380371, -3.397021770477295, -3.161308526992798, -2.9255950450897217, -2.6898818016052246, -2.4541683197021484, -2.2184548377990723, -1.9827415943145752, -1.747028112411499, -1.5113147497177124, -1.2756013870239258, -1.0398880243301392, -0.8041746020317078, -0.5684611797332764, -0.33274781703948975, -0.09703445434570312, 0.13867902755737305, 0.37439239025115967, 0.6101057529449463, 0.8458191156387329, 1.0815324783325195, 1.3172459602355957, 1.5529593229293823, 1.788672685623169, 2.024386167526245, 2.260099411010742, 2.4958128929138184, 2.7315263748168945, 2.9672396183013916, 3.2029531002044678, 3.438666343688965, 3.674379825592041, 3.910093307495117, 4.145806789398193, 4.3815202713012695, 4.617233753204346, 4.852947235107422, 5.08866024017334, 5.324373722076416, 5.560087203979492, 5.795800685882568, 6.0315141677856445, 6.2672271728515625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 1.0, 4.0, 6.0, 8.0, 11.0, 18.0, 12.0, 13.0, 17.0, 23.0, 24.0, 20.0, 28.0, 32.0, 33.0, 39.0, 45.0, 50.0, 70.0, 72.0, 61.0, 48.0, 53.0, 39.0, 41.0, 35.0, 29.0, 22.0, 26.0, 19.0, 20.0, 19.0, 17.0, 16.0, 9.0, 4.0, 8.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.362426280975342, -4.2425456047058105, -4.122664928436279, -4.002784252166748, -3.8829033374786377, -3.7630226612091064, -3.643141984939575, -3.523261308670044, -3.4033803939819336, -3.2834997177124023, -3.163619041442871, -3.04373836517334, -2.9238574504852295, -2.8039767742156982, -2.684096097946167, -2.5642154216766357, -2.4443347454071045, -2.3244540691375732, -2.204573392868042, -2.0846924781799316, -1.9648118019104004, -1.8449311256408691, -1.725050449371338, -1.6051697731018066, -1.4852889776229858, -1.3654083013534546, -1.2455275058746338, -1.1256468296051025, -1.0057661533355713, -0.8858853578567505, -0.7660046815872192, -0.6461239457130432, -0.5262432098388672, -0.40636247396469116, -0.2864817678928375, -0.1666010618209839, -0.04672032594680786, 0.07316040992736816, 0.19304108619689941, 0.31292182207107544, 0.43280255794525146, 0.5526832938194275, 0.6725640296936035, 0.7924447059631348, 0.9123254418373108, 1.0322061777114868, 1.152086853981018, 1.2719676494598389, 1.3918483257293701, 1.5117290019989014, 1.6316097974777222, 1.7514904737472534, 1.8713712692260742, 1.9912519454956055, 2.1111326217651367, 2.231013298034668, 2.350893974304199, 2.4707746505737305, 2.5906553268432617, 2.710536003112793, 2.8304169178009033, 2.9502975940704346, 3.070178270339966, 3.190058946609497, 3.3099398612976074]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 9.0, 14.0, 28.0, 36.0, 53.0, 85.0, 136.0, 215.0, 341.0, 588.0, 1150.0, 2255.0, 4841.0, 11164.0, 26879.0, 70052.0, 202999.0, 409270.0, 201734.0, 69623.0, 26419.0, 10899.0, 4856.0, 2241.0, 1118.0, 618.0, 348.0, 203.0, 131.0, 70.0, 64.0, 35.0, 28.0, 17.0, 9.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6650390625, -0.6417007446289062, -0.6183624267578125, -0.5950241088867188, -0.571685791015625, -0.5483474731445312, -0.5250091552734375, -0.5016708374023438, -0.47833251953125, -0.45499420166015625, -0.4316558837890625, -0.40831756591796875, -0.384979248046875, -0.36164093017578125, -0.3383026123046875, -0.31496429443359375, -0.2916259765625, -0.26828765869140625, -0.2449493408203125, -0.22161102294921875, -0.198272705078125, -0.17493438720703125, -0.1515960693359375, -0.12825775146484375, -0.10491943359375, -0.08158111572265625, -0.0582427978515625, -0.03490447998046875, -0.011566162109375, 0.01177215576171875, 0.0351104736328125, 0.05844879150390625, 0.081787109375, 0.10512542724609375, 0.1284637451171875, 0.15180206298828125, 0.175140380859375, 0.19847869873046875, 0.2218170166015625, 0.24515533447265625, 0.26849365234375, 0.29183197021484375, 0.3151702880859375, 0.33850860595703125, 0.361846923828125, 0.38518524169921875, 0.4085235595703125, 0.43186187744140625, 0.4552001953125, 0.47853851318359375, 0.5018768310546875, 0.5252151489257812, 0.548553466796875, 0.5718917846679688, 0.5952301025390625, 0.6185684204101562, 0.64190673828125, 0.6652450561523438, 0.6885833740234375, 0.7119216918945312, 0.735260009765625, 0.7585983276367188, 0.7819366455078125, 0.8052749633789062, 0.82861328125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 9.0, 11.0, 10.0, 13.0, 11.0, 21.0, 21.0, 29.0, 28.0, 32.0, 34.0, 48.0, 46.0, 47.0, 44.0, 56.0, 56.0, 45.0, 54.0, 41.0, 48.0, 36.0, 41.0, 35.0, 28.0, 32.0, 22.0, 23.0, 24.0, 17.0, 10.0, 7.0, 5.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.52978515625, -0.5157623291015625, -0.501739501953125, -0.4877166748046875, -0.47369384765625, -0.4596710205078125, -0.445648193359375, -0.4316253662109375, -0.4176025390625, -0.4035797119140625, -0.389556884765625, -0.3755340576171875, -0.36151123046875, -0.3474884033203125, -0.333465576171875, -0.3194427490234375, -0.305419921875, -0.2913970947265625, -0.277374267578125, -0.2633514404296875, -0.24932861328125, -0.2353057861328125, -0.221282958984375, -0.2072601318359375, -0.1932373046875, -0.1792144775390625, -0.165191650390625, -0.1511688232421875, -0.13714599609375, -0.1231231689453125, -0.109100341796875, -0.0950775146484375, -0.0810546875, -0.0670318603515625, -0.053009033203125, -0.0389862060546875, -0.02496337890625, -0.0109405517578125, 0.003082275390625, 0.0171051025390625, 0.0311279296875, 0.0451507568359375, 0.059173583984375, 0.0731964111328125, 0.08721923828125, 0.1012420654296875, 0.115264892578125, 0.1292877197265625, 0.143310546875, 0.1573333740234375, 0.171356201171875, 0.1853790283203125, 0.19940185546875, 0.2134246826171875, 0.227447509765625, 0.2414703369140625, 0.2554931640625, 0.2695159912109375, 0.283538818359375, 0.2975616455078125, 0.31158447265625, 0.3256072998046875, 0.339630126953125, 0.3536529541015625, 0.36767578125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 14.0, 21.0, 16.0, 17.0, 38.0, 53.0, 64.0, 90.0, 140.0, 223.0, 302.0, 494.0, 759.0, 1479.0, 3296.0, 11892.0, 76198.0, 773562.0, 150938.0, 19894.0, 4734.0, 1819.0, 880.0, 486.0, 351.0, 222.0, 164.0, 117.0, 74.0, 52.0, 43.0, 28.0, 30.0, 14.0, 10.0, 6.0, 7.0, 7.0, 6.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.396484375, -1.3537139892578125, -1.310943603515625, -1.2681732177734375, -1.22540283203125, -1.1826324462890625, -1.139862060546875, -1.0970916748046875, -1.0543212890625, -1.0115509033203125, -0.968780517578125, -0.9260101318359375, -0.88323974609375, -0.8404693603515625, -0.797698974609375, -0.7549285888671875, -0.712158203125, -0.6693878173828125, -0.626617431640625, -0.5838470458984375, -0.54107666015625, -0.4983062744140625, -0.455535888671875, -0.4127655029296875, -0.3699951171875, -0.3272247314453125, -0.284454345703125, -0.2416839599609375, -0.19891357421875, -0.1561431884765625, -0.113372802734375, -0.0706024169921875, -0.02783203125, 0.0149383544921875, 0.057708740234375, 0.1004791259765625, 0.14324951171875, 0.1860198974609375, 0.228790283203125, 0.2715606689453125, 0.3143310546875, 0.3571014404296875, 0.399871826171875, 0.4426422119140625, 0.48541259765625, 0.5281829833984375, 0.570953369140625, 0.6137237548828125, 0.656494140625, 0.6992645263671875, 0.742034912109375, 0.7848052978515625, 0.82757568359375, 0.8703460693359375, 0.913116455078125, 0.9558868408203125, 0.9986572265625, 1.0414276123046875, 1.084197998046875, 1.1269683837890625, 1.16973876953125, 1.2125091552734375, 1.255279541015625, 1.2980499267578125, 1.3408203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 4.0, 7.0, 7.0, 14.0, 13.0, 9.0, 17.0, 22.0, 21.0, 31.0, 16.0, 43.0, 38.0, 37.0, 45.0, 57.0, 62.0, 61.0, 55.0, 48.0, 47.0, 46.0, 52.0, 30.0, 32.0, 31.0, 27.0, 22.0, 17.0, 18.0, 17.0, 6.0, 5.0, 5.0, 6.0, 7.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.458984375, -1.4106903076171875, -1.362396240234375, -1.3141021728515625, -1.26580810546875, -1.2175140380859375, -1.169219970703125, -1.1209259033203125, -1.0726318359375, -1.0243377685546875, -0.976043701171875, -0.9277496337890625, -0.87945556640625, -0.8311614990234375, -0.782867431640625, -0.7345733642578125, -0.686279296875, -0.6379852294921875, -0.589691162109375, -0.5413970947265625, -0.49310302734375, -0.4448089599609375, -0.396514892578125, -0.3482208251953125, -0.2999267578125, -0.2516326904296875, -0.203338623046875, -0.1550445556640625, -0.10675048828125, -0.0584564208984375, -0.010162353515625, 0.0381317138671875, 0.08642578125, 0.1347198486328125, 0.183013916015625, 0.2313079833984375, 0.27960205078125, 0.3278961181640625, 0.376190185546875, 0.4244842529296875, 0.4727783203125, 0.5210723876953125, 0.569366455078125, 0.6176605224609375, 0.66595458984375, 0.7142486572265625, 0.762542724609375, 0.8108367919921875, 0.859130859375, 0.9074249267578125, 0.955718994140625, 1.0040130615234375, 1.05230712890625, 1.1006011962890625, 1.148895263671875, 1.1971893310546875, 1.2454833984375, 1.2937774658203125, 1.342071533203125, 1.3903656005859375, 1.43865966796875, 1.4869537353515625, 1.535247802734375, 1.5835418701171875, 1.6318359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 6.0, 4.0, 2.0, 11.0, 5.0, 10.0, 21.0, 16.0, 25.0, 29.0, 38.0, 40.0, 68.0, 85.0, 118.0, 188.0, 414.0, 820.0, 1868.0, 5050.0, 21892.0, 214776.0, 752087.0, 38609.0, 7538.0, 2486.0, 1025.0, 466.0, 288.0, 180.0, 97.0, 73.0, 45.0, 38.0, 29.0, 19.0, 19.0, 17.0, 17.0, 7.0, 6.0, 5.0, 4.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40771484375, -0.395416259765625, -0.38311767578125, -0.370819091796875, -0.3585205078125, -0.346221923828125, -0.33392333984375, -0.321624755859375, -0.309326171875, -0.297027587890625, -0.28472900390625, -0.272430419921875, -0.2601318359375, -0.247833251953125, -0.23553466796875, -0.223236083984375, -0.2109375, -0.198638916015625, -0.18634033203125, -0.174041748046875, -0.1617431640625, -0.149444580078125, -0.13714599609375, -0.124847412109375, -0.112548828125, -0.100250244140625, -0.08795166015625, -0.075653076171875, -0.0633544921875, -0.051055908203125, -0.03875732421875, -0.026458740234375, -0.01416015625, -0.001861572265625, 0.01043701171875, 0.022735595703125, 0.0350341796875, 0.047332763671875, 0.05963134765625, 0.071929931640625, 0.084228515625, 0.096527099609375, 0.10882568359375, 0.121124267578125, 0.1334228515625, 0.145721435546875, 0.15802001953125, 0.170318603515625, 0.1826171875, 0.194915771484375, 0.20721435546875, 0.219512939453125, 0.2318115234375, 0.244110107421875, 0.25640869140625, 0.268707275390625, 0.281005859375, 0.293304443359375, 0.30560302734375, 0.317901611328125, 0.3302001953125, 0.342498779296875, 0.35479736328125, 0.367095947265625, 0.37939453125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 6.0, 6.0, 11.0, 10.0, 15.0, 21.0, 24.0, 35.0, 58.0, 86.0, 130.0, 168.0, 129.0, 80.0, 55.0, 37.0, 27.0, 28.0, 10.0, 10.0, 10.0, 7.0, 7.0, 4.0, 1.0, 6.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.314847946166992e-05, -8.051563054323196e-05, -7.7882781624794e-05, -7.524993270635605e-05, -7.261708378791809e-05, -6.998423486948013e-05, -6.735138595104218e-05, -6.471853703260422e-05, -6.208568811416626e-05, -5.94528391957283e-05, -5.6819990277290344e-05, -5.4187141358852386e-05, -5.155429244041443e-05, -4.892144352197647e-05, -4.628859460353851e-05, -4.3655745685100555e-05, -4.10228967666626e-05, -3.839004784822464e-05, -3.575719892978668e-05, -3.3124350011348724e-05, -3.0491501092910767e-05, -2.785865217447281e-05, -2.522580325603485e-05, -2.2592954337596893e-05, -1.9960105419158936e-05, -1.7327256500720978e-05, -1.469440758228302e-05, -1.2061558663845062e-05, -9.428709745407104e-06, -6.795860826969147e-06, -4.163011908531189e-06, -1.5301629900932312e-06, 1.1026859283447266e-06, 3.7355348467826843e-06, 6.368383765220642e-06, 9.0012326836586e-06, 1.1634081602096558e-05, 1.4266930520534515e-05, 1.6899779438972473e-05, 1.953262835741043e-05, 2.216547727584839e-05, 2.4798326194286346e-05, 2.7431175112724304e-05, 3.0064024031162262e-05, 3.269687294960022e-05, 3.532972186803818e-05, 3.7962570786476135e-05, 4.059541970491409e-05, 4.322826862335205e-05, 4.586111754179001e-05, 4.8493966460227966e-05, 5.1126815378665924e-05, 5.375966429710388e-05, 5.639251321554184e-05, 5.90253621339798e-05, 6.165821105241776e-05, 6.429105997085571e-05, 6.692390888929367e-05, 6.955675780773163e-05, 7.218960672616959e-05, 7.482245564460754e-05, 7.74553045630455e-05, 8.008815348148346e-05, 8.272100239992142e-05, 8.535385131835938e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 7.0, 15.0, 12.0, 30.0, 32.0, 42.0, 58.0, 86.0, 151.0, 225.0, 395.0, 758.0, 1451.0, 3293.0, 8797.0, 35291.0, 262514.0, 663926.0, 52002.0, 11707.0, 3933.0, 1770.0, 834.0, 471.0, 264.0, 164.0, 105.0, 70.0, 43.0, 24.0, 28.0, 12.0, 13.0, 10.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2445068359375, -0.2347698211669922, -0.22503280639648438, -0.21529579162597656, -0.20555877685546875, -0.19582176208496094, -0.18608474731445312, -0.1763477325439453, -0.1666107177734375, -0.1568737030029297, -0.14713668823242188, -0.13739967346191406, -0.12766265869140625, -0.11792564392089844, -0.10818862915039062, -0.09845161437988281, -0.088714599609375, -0.07897758483886719, -0.06924057006835938, -0.05950355529785156, -0.04976654052734375, -0.04002952575683594, -0.030292510986328125, -0.020555496215820312, -0.0108184814453125, -0.0010814666748046875, 0.008655548095703125, 0.018392562866210938, 0.02812957763671875, 0.03786659240722656, 0.047603607177734375, 0.05734062194824219, 0.06707763671875, 0.07681465148925781, 0.08655166625976562, 0.09628868103027344, 0.10602569580078125, 0.11576271057128906, 0.12549972534179688, 0.1352367401123047, 0.1449737548828125, 0.1547107696533203, 0.16444778442382812, 0.17418479919433594, 0.18392181396484375, 0.19365882873535156, 0.20339584350585938, 0.2131328582763672, 0.222869873046875, 0.2326068878173828, 0.24234390258789062, 0.25208091735839844, 0.26181793212890625, 0.27155494689941406, 0.2812919616699219, 0.2910289764404297, 0.3007659912109375, 0.3105030059814453, 0.3202400207519531, 0.32997703552246094, 0.33971405029296875, 0.34945106506347656, 0.3591880798339844, 0.3689250946044922, 0.378662109375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 4.0, 3.0, 5.0, 7.0, 7.0, 8.0, 7.0, 16.0, 13.0, 13.0, 19.0, 13.0, 34.0, 41.0, 56.0, 68.0, 69.0, 91.0, 78.0, 77.0, 73.0, 64.0, 39.0, 36.0, 32.0, 28.0, 24.0, 14.0, 6.0, 10.0, 6.0, 5.0, 7.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.266357421875, -0.258056640625, -0.249755859375, -0.241455078125, -0.233154296875, -0.224853515625, -0.216552734375, -0.208251953125, -0.199951171875, -0.191650390625, -0.183349609375, -0.175048828125, -0.166748046875, -0.158447265625, -0.150146484375, -0.141845703125, -0.133544921875, -0.125244140625, -0.116943359375, -0.108642578125, -0.100341796875, -0.092041015625, -0.083740234375, -0.075439453125, -0.067138671875, -0.058837890625, -0.050537109375, -0.042236328125, -0.033935546875, -0.025634765625, -0.017333984375, -0.009033203125, -0.000732421875, 0.007568359375, 0.015869140625, 0.024169921875, 0.032470703125, 0.040771484375, 0.049072265625, 0.057373046875, 0.065673828125, 0.073974609375, 0.082275390625, 0.090576171875, 0.098876953125, 0.107177734375, 0.115478515625, 0.123779296875, 0.132080078125, 0.140380859375, 0.148681640625, 0.156982421875, 0.165283203125, 0.173583984375, 0.181884765625, 0.190185546875, 0.198486328125, 0.206787109375, 0.215087890625, 0.223388671875, 0.231689453125, 0.239990234375, 0.248291015625, 0.256591796875, 0.264892578125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 7.0, 17.0, 26.0, 48.0, 96.0, 214.0, 363.0, 113.0, 55.0, 23.0, 9.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.465110778808594, -10.140054702758789, -9.814998626708984, -9.48994255065918, -9.164886474609375, -8.83983039855957, -8.514774322509766, -8.189718246459961, -7.864662170410156, -7.539606094360352, -7.214550018310547, -6.889493942260742, -6.5644378662109375, -6.239381790161133, -5.914325714111328, -5.589269638061523, -5.264213562011719, -4.939157485961914, -4.614101409912109, -4.289045333862305, -3.9639892578125, -3.6389331817626953, -3.3138771057128906, -2.988821029663086, -2.6637649536132812, -2.3387088775634766, -2.013652801513672, -1.6885967254638672, -1.3635406494140625, -1.0384845733642578, -0.7134284973144531, -0.38837242126464844, -0.06331729888916016, 0.26173877716064453, 0.5867948532104492, 0.9118509292602539, 1.2369070053100586, 1.5619630813598633, 1.887019157409668, 2.2120752334594727, 2.5371313095092773, 2.862187385559082, 3.1872434616088867, 3.5122995376586914, 3.837355613708496, 4.162411689758301, 4.4874677658081055, 4.81252384185791, 5.137579917907715, 5.4626359939575195, 5.787692070007324, 6.112748146057129, 6.437804222106934, 6.762860298156738, 7.087916374206543, 7.412972450256348, 7.738028526306152, 8.063084602355957, 8.388140678405762, 8.713196754455566, 9.038252830505371, 9.363308906555176, 9.68836498260498, 10.013421058654785, 10.33847713470459]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 6.0, 12.0, 20.0, 15.0, 16.0, 18.0, 14.0, 9.0, 31.0, 24.0, 25.0, 25.0, 25.0, 32.0, 64.0, 100.0, 145.0, 86.0, 54.0, 40.0, 31.0, 21.0, 21.0, 18.0, 20.0, 19.0, 13.0, 14.0, 13.0, 9.0, 10.0, 5.0, 8.0, 7.0, 8.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.8092498779296875, -6.626408100128174, -6.443565845489502, -6.260724067687988, -6.077882289886475, -5.895040512084961, -5.712198257446289, -5.529356479644775, -5.346514701843262, -5.163672924041748, -4.980830669403076, -4.7979888916015625, -4.615147113800049, -4.432305335998535, -4.249463081359863, -4.06662130355835, -3.8837790489196777, -3.700937032699585, -3.5180952548980713, -3.3352532386779785, -3.152411460876465, -2.969569444656372, -2.7867274284362793, -2.6038856506347656, -2.421043634414673, -2.23820161819458, -2.0553598403930664, -1.8725178241729736, -1.6896759271621704, -1.5068340301513672, -1.3239920139312744, -1.1411501169204712, -0.958308219909668, -0.7754663228988647, -0.5926243662834167, -0.40978240966796875, -0.22694051265716553, -0.044098615646362305, 0.13874340057373047, 0.3215852975845337, 0.5044271945953369, 0.6872690916061401, 0.8701110482215881, 1.0529530048370361, 1.2357949018478394, 1.4186367988586426, 1.6014788150787354, 1.7843207120895386, 1.9671626091003418, 2.1500046253204346, 2.3328464031219482, 2.515688419342041, 2.6985301971435547, 2.8813722133636475, 3.0642142295837402, 3.247056007385254, 3.4298980236053467, 3.6127400398254395, 3.795581817626953, 3.978423833847046, 4.161265850067139, 4.344107627868652, 4.526949882507324, 4.709791660308838, 4.892633438110352]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 8.0, 7.0, 9.0, 11.0, 21.0, 30.0, 48.0, 60.0, 102.0, 163.0, 280.0, 401.0, 755.0, 1367.0, 2606.0, 5273.0, 13367.0, 47802.0, 268769.0, 1423382.0, 1890469.0, 431973.0, 74425.0, 18942.0, 7030.0, 3274.0, 1615.0, 834.0, 509.0, 274.0, 181.0, 106.0, 61.0, 50.0, 27.0, 10.0, 8.0, 8.0, 5.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.734375, -0.713470458984375, -0.69256591796875, -0.671661376953125, -0.6507568359375, -0.629852294921875, -0.60894775390625, -0.588043212890625, -0.567138671875, -0.546234130859375, -0.52532958984375, -0.504425048828125, -0.4835205078125, -0.462615966796875, -0.44171142578125, -0.420806884765625, -0.39990234375, -0.378997802734375, -0.35809326171875, -0.337188720703125, -0.3162841796875, -0.295379638671875, -0.27447509765625, -0.253570556640625, -0.232666015625, -0.211761474609375, -0.19085693359375, -0.169952392578125, -0.1490478515625, -0.128143310546875, -0.10723876953125, -0.086334228515625, -0.0654296875, -0.044525146484375, -0.02362060546875, -0.002716064453125, 0.0181884765625, 0.039093017578125, 0.05999755859375, 0.080902099609375, 0.101806640625, 0.122711181640625, 0.14361572265625, 0.164520263671875, 0.1854248046875, 0.206329345703125, 0.22723388671875, 0.248138427734375, 0.26904296875, 0.289947509765625, 0.31085205078125, 0.331756591796875, 0.3526611328125, 0.373565673828125, 0.39447021484375, 0.415374755859375, 0.436279296875, 0.457183837890625, 0.47808837890625, 0.498992919921875, 0.5198974609375, 0.540802001953125, 0.56170654296875, 0.582611083984375, 0.603515625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 7.0, 7.0, 11.0, 7.0, 12.0, 19.0, 18.0, 30.0, 25.0, 23.0, 42.0, 45.0, 54.0, 57.0, 59.0, 47.0, 57.0, 47.0, 53.0, 45.0, 45.0, 51.0, 43.0, 33.0, 30.0, 34.0, 21.0, 17.0, 16.0, 13.0, 10.0, 6.0, 2.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.51806640625, -0.5046157836914062, -0.4911651611328125, -0.47771453857421875, -0.464263916015625, -0.45081329345703125, -0.4373626708984375, -0.42391204833984375, -0.41046142578125, -0.39701080322265625, -0.3835601806640625, -0.37010955810546875, -0.356658935546875, -0.34320831298828125, -0.3297576904296875, -0.31630706787109375, -0.3028564453125, -0.28940582275390625, -0.2759552001953125, -0.26250457763671875, -0.249053955078125, -0.23560333251953125, -0.2221527099609375, -0.20870208740234375, -0.19525146484375, -0.18180084228515625, -0.1683502197265625, -0.15489959716796875, -0.141448974609375, -0.12799835205078125, -0.1145477294921875, -0.10109710693359375, -0.087646484375, -0.07419586181640625, -0.0607452392578125, -0.04729461669921875, -0.033843994140625, -0.02039337158203125, -0.0069427490234375, 0.00650787353515625, 0.01995849609375, 0.03340911865234375, 0.0468597412109375, 0.06031036376953125, 0.073760986328125, 0.08721160888671875, 0.1006622314453125, 0.11411285400390625, 0.1275634765625, 0.14101409912109375, 0.1544647216796875, 0.16791534423828125, 0.181365966796875, 0.19481658935546875, 0.2082672119140625, 0.22171783447265625, 0.23516845703125, 0.24861907958984375, 0.2620697021484375, 0.27552032470703125, 0.288970947265625, 0.30242156982421875, 0.3158721923828125, 0.32932281494140625, 0.3427734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 6.0, 8.0, 17.0, 28.0, 81.0, 123.0, 276.0, 625.0, 1787.0, 6419.0, 158708.0, 3991789.0, 28639.0, 3582.0, 1256.0, 501.0, 206.0, 112.0, 44.0, 31.0, 17.0, 5.0, 5.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.6796875, -2.596771240234375, -2.51385498046875, -2.430938720703125, -2.3480224609375, -2.265106201171875, -2.18218994140625, -2.099273681640625, -2.016357421875, -1.933441162109375, -1.85052490234375, -1.767608642578125, -1.6846923828125, -1.601776123046875, -1.51885986328125, -1.435943603515625, -1.35302734375, -1.270111083984375, -1.18719482421875, -1.104278564453125, -1.0213623046875, -0.938446044921875, -0.85552978515625, -0.772613525390625, -0.689697265625, -0.606781005859375, -0.52386474609375, -0.440948486328125, -0.3580322265625, -0.275115966796875, -0.19219970703125, -0.109283447265625, -0.0263671875, 0.056549072265625, 0.13946533203125, 0.222381591796875, 0.3052978515625, 0.388214111328125, 0.47113037109375, 0.554046630859375, 0.636962890625, 0.719879150390625, 0.80279541015625, 0.885711669921875, 0.9686279296875, 1.051544189453125, 1.13446044921875, 1.217376708984375, 1.30029296875, 1.383209228515625, 1.46612548828125, 1.549041748046875, 1.6319580078125, 1.714874267578125, 1.79779052734375, 1.880706787109375, 1.963623046875, 2.046539306640625, 2.12945556640625, 2.212371826171875, 2.2952880859375, 2.378204345703125, 2.46112060546875, 2.544036865234375, 2.626953125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 5.0, 9.0, 15.0, 29.0, 31.0, 70.0, 134.0, 247.0, 386.0, 578.0, 847.0, 681.0, 440.0, 238.0, 139.0, 98.0, 52.0, 29.0, 19.0, 9.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6396484375, -1.5879669189453125, -1.536285400390625, -1.4846038818359375, -1.43292236328125, -1.3812408447265625, -1.329559326171875, -1.2778778076171875, -1.2261962890625, -1.1745147705078125, -1.122833251953125, -1.0711517333984375, -1.01947021484375, -0.9677886962890625, -0.916107177734375, -0.8644256591796875, -0.812744140625, -0.7610626220703125, -0.709381103515625, -0.6576995849609375, -0.60601806640625, -0.5543365478515625, -0.502655029296875, -0.4509735107421875, -0.3992919921875, -0.3476104736328125, -0.295928955078125, -0.2442474365234375, -0.19256591796875, -0.1408843994140625, -0.089202880859375, -0.0375213623046875, 0.01416015625, 0.0658416748046875, 0.117523193359375, 0.1692047119140625, 0.22088623046875, 0.2725677490234375, 0.324249267578125, 0.3759307861328125, 0.4276123046875, 0.4792938232421875, 0.530975341796875, 0.5826568603515625, 0.63433837890625, 0.6860198974609375, 0.737701416015625, 0.7893829345703125, 0.841064453125, 0.8927459716796875, 0.944427490234375, 0.9961090087890625, 1.04779052734375, 1.0994720458984375, 1.151153564453125, 1.2028350830078125, 1.2545166015625, 1.3061981201171875, 1.357879638671875, 1.4095611572265625, 1.46124267578125, 1.5129241943359375, 1.564605712890625, 1.6162872314453125, 1.66796875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 4.0, 3.0, 7.0, 6.0, 14.0, 31.0, 39.0, 72.0, 97.0, 174.0, 184.0, 138.0, 86.0, 49.0, 36.0, 18.0, 10.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.121706008911133, -15.749980926513672, -15.378256797790527, -15.006531715393066, -14.634807586669922, -14.263082504272461, -13.891358375549316, -13.519633293151855, -13.147909164428711, -12.77618408203125, -12.404459953308105, -12.032734870910645, -11.6610107421875, -11.289285659790039, -10.917561531066895, -10.545836448669434, -10.174112319946289, -9.802387237548828, -9.430663108825684, -9.058938026428223, -8.687213897705078, -8.315488815307617, -7.943764686584473, -7.572039604187012, -7.200314521789551, -6.828589916229248, -6.456865310668945, -6.085140705108643, -5.71341609954834, -5.341691493988037, -4.969966888427734, -4.598241806030273, -4.226518154144287, -3.8547935485839844, -3.4830689430236816, -3.111344337463379, -2.739619731903076, -2.3678951263427734, -1.9961702823638916, -1.6244456768035889, -1.2527210712432861, -0.8809964656829834, -0.5092718005180359, -0.13754713535308838, 0.23417747020721436, 0.6059020757675171, 0.9776268005371094, 1.349351406097412, 1.7210760116577148, 2.0928006172180176, 2.4645252227783203, 2.836249828338623, 3.207974433898926, 3.5796990394592285, 3.9514238834381104, 4.323148727416992, 4.694872856140137, 5.0665974617004395, 5.438322067260742, 5.810046672821045, 6.181771278381348, 6.55349588394165, 6.925220489501953, 7.296945571899414, 7.668670177459717]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 6.0, 7.0, 12.0, 14.0, 15.0, 17.0, 23.0, 32.0, 27.0, 37.0, 34.0, 32.0, 41.0, 59.0, 80.0, 67.0, 68.0, 57.0, 41.0, 55.0, 55.0, 47.0, 34.0, 30.0, 19.0, 14.0, 21.0, 17.0, 13.0, 10.0, 2.0, 5.0, 2.0, 0.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.063162326812744, -5.852816581726074, -5.642470836639404, -5.432125091552734, -5.2217793464660645, -5.0114336013793945, -4.801088333129883, -4.590742111206055, -4.380396842956543, -4.170051097869873, -3.959705352783203, -3.749359607696533, -3.5390138626098633, -3.3286681175231934, -3.1183226108551025, -2.9079768657684326, -2.6976308822631836, -2.4872851371765137, -2.2769393920898438, -2.066593647003174, -1.8562480211257935, -1.6459022760391235, -1.4355566501617432, -1.2252109050750732, -1.0148651599884033, -0.8045194149017334, -0.5941737294197083, -0.3838280439376831, -0.17348229885101318, 0.03686344623565674, 0.2472090721130371, 0.45755481719970703, 0.667900562286377, 0.8782463073730469, 1.0885920524597168, 1.2989376783370972, 1.509283423423767, 1.719629168510437, 1.9299747943878174, 2.1403205394744873, 2.3506662845611572, 2.561012029647827, 2.771357774734497, 2.981703281402588, 3.192049026489258, 3.4023947715759277, 3.6127405166625977, 3.8230862617492676, 4.0334320068359375, 4.243777751922607, 4.454123497009277, 4.664469242095947, 4.874814987182617, 5.085160732269287, 5.295506477355957, 5.505851745605469, 5.716197967529297, 5.926543712615967, 6.136889457702637, 6.347235202789307, 6.557580947875977, 6.7679266929626465, 6.978272438049316, 7.188617706298828, 7.398963451385498]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 17.0, 11.0, 16.0, 35.0, 65.0, 81.0, 115.0, 218.0, 371.0, 721.0, 1359.0, 2846.0, 6563.0, 17086.0, 53040.0, 214036.0, 578929.0, 118492.0, 33745.0, 11609.0, 4654.0, 2124.0, 1061.0, 557.0, 313.0, 183.0, 129.0, 60.0, 36.0, 27.0, 16.0, 6.0, 10.0, 7.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.68505859375, -0.663177490234375, -0.64129638671875, -0.619415283203125, -0.5975341796875, -0.575653076171875, -0.55377197265625, -0.531890869140625, -0.510009765625, -0.488128662109375, -0.46624755859375, -0.444366455078125, -0.4224853515625, -0.400604248046875, -0.37872314453125, -0.356842041015625, -0.3349609375, -0.313079833984375, -0.29119873046875, -0.269317626953125, -0.2474365234375, -0.225555419921875, -0.20367431640625, -0.181793212890625, -0.159912109375, -0.138031005859375, -0.11614990234375, -0.094268798828125, -0.0723876953125, -0.050506591796875, -0.02862548828125, -0.006744384765625, 0.01513671875, 0.037017822265625, 0.05889892578125, 0.080780029296875, 0.1026611328125, 0.124542236328125, 0.14642333984375, 0.168304443359375, 0.190185546875, 0.212066650390625, 0.23394775390625, 0.255828857421875, 0.2777099609375, 0.299591064453125, 0.32147216796875, 0.343353271484375, 0.365234375, 0.387115478515625, 0.40899658203125, 0.430877685546875, 0.4527587890625, 0.474639892578125, 0.49652099609375, 0.518402099609375, 0.540283203125, 0.562164306640625, 0.58404541015625, 0.605926513671875, 0.6278076171875, 0.649688720703125, 0.67156982421875, 0.693450927734375, 0.71533203125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 10.0, 7.0, 6.0, 15.0, 25.0, 31.0, 32.0, 19.0, 38.0, 68.0, 42.0, 53.0, 55.0, 67.0, 55.0, 76.0, 60.0, 54.0, 53.0, 44.0, 34.0, 27.0, 33.0, 17.0, 18.0, 13.0, 13.0, 9.0, 6.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57568359375, -0.5592460632324219, -0.5428085327148438, -0.5263710021972656, -0.5099334716796875, -0.4934959411621094, -0.47705841064453125, -0.4606208801269531, -0.444183349609375, -0.4277458190917969, -0.41130828857421875, -0.3948707580566406, -0.3784332275390625, -0.3619956970214844, -0.34555816650390625, -0.3291206359863281, -0.31268310546875, -0.2962455749511719, -0.27980804443359375, -0.2633705139160156, -0.2469329833984375, -0.23049545288085938, -0.21405792236328125, -0.19762039184570312, -0.181182861328125, -0.16474533081054688, -0.14830780029296875, -0.13187026977539062, -0.1154327392578125, -0.09899520874023438, -0.08255767822265625, -0.06612014770507812, -0.0496826171875, -0.033245086669921875, -0.01680755615234375, -0.000370025634765625, 0.0160675048828125, 0.032505035400390625, 0.04894256591796875, 0.06538009643554688, 0.081817626953125, 0.09825515747070312, 0.11469268798828125, 0.13113021850585938, 0.1475677490234375, 0.16400527954101562, 0.18044281005859375, 0.19688034057617188, 0.21331787109375, 0.22975540161132812, 0.24619293212890625, 0.2626304626464844, 0.2790679931640625, 0.2955055236816406, 0.31194305419921875, 0.3283805847167969, 0.344818115234375, 0.3612556457519531, 0.37769317626953125, 0.3941307067871094, 0.4105682373046875, 0.4270057678222656, 0.44344329833984375, 0.4598808288574219, 0.476318359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 6.0, 8.0, 7.0, 21.0, 31.0, 53.0, 59.0, 91.0, 191.0, 258.0, 564.0, 1286.0, 5016.0, 59711.0, 941462.0, 33983.0, 3679.0, 1016.0, 484.0, 273.0, 132.0, 82.0, 37.0, 33.0, 21.0, 18.0, 13.0, 7.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.9833984375, -1.9387359619140625, -1.894073486328125, -1.8494110107421875, -1.80474853515625, -1.7600860595703125, -1.715423583984375, -1.6707611083984375, -1.6260986328125, -1.5814361572265625, -1.536773681640625, -1.4921112060546875, -1.44744873046875, -1.4027862548828125, -1.358123779296875, -1.3134613037109375, -1.268798828125, -1.2241363525390625, -1.179473876953125, -1.1348114013671875, -1.09014892578125, -1.0454864501953125, -1.000823974609375, -0.9561614990234375, -0.9114990234375, -0.8668365478515625, -0.822174072265625, -0.7775115966796875, -0.73284912109375, -0.6881866455078125, -0.643524169921875, -0.5988616943359375, -0.55419921875, -0.5095367431640625, -0.464874267578125, -0.4202117919921875, -0.37554931640625, -0.3308868408203125, -0.286224365234375, -0.2415618896484375, -0.1968994140625, -0.1522369384765625, -0.107574462890625, -0.0629119873046875, -0.01824951171875, 0.0264129638671875, 0.071075439453125, 0.1157379150390625, 0.160400390625, 0.2050628662109375, 0.249725341796875, 0.2943878173828125, 0.33905029296875, 0.3837127685546875, 0.428375244140625, 0.4730377197265625, 0.5177001953125, 0.5623626708984375, 0.607025146484375, 0.6516876220703125, 0.69635009765625, 0.7410125732421875, 0.785675048828125, 0.8303375244140625, 0.875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 4.0, 4.0, 5.0, 5.0, 10.0, 8.0, 10.0, 15.0, 12.0, 17.0, 24.0, 23.0, 31.0, 34.0, 63.0, 55.0, 68.0, 57.0, 72.0, 79.0, 61.0, 68.0, 50.0, 34.0, 34.0, 27.0, 16.0, 19.0, 18.0, 17.0, 9.0, 11.0, 13.0, 8.0, 4.0, 1.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.849609375, -1.7949981689453125, -1.740386962890625, -1.6857757568359375, -1.63116455078125, -1.5765533447265625, -1.521942138671875, -1.4673309326171875, -1.4127197265625, -1.3581085205078125, -1.303497314453125, -1.2488861083984375, -1.19427490234375, -1.1396636962890625, -1.085052490234375, -1.0304412841796875, -0.975830078125, -0.9212188720703125, -0.866607666015625, -0.8119964599609375, -0.75738525390625, -0.7027740478515625, -0.648162841796875, -0.5935516357421875, -0.5389404296875, -0.4843292236328125, -0.429718017578125, -0.3751068115234375, -0.32049560546875, -0.2658843994140625, -0.211273193359375, -0.1566619873046875, -0.10205078125, -0.0474395751953125, 0.007171630859375, 0.0617828369140625, 0.11639404296875, 0.1710052490234375, 0.225616455078125, 0.2802276611328125, 0.3348388671875, 0.3894500732421875, 0.444061279296875, 0.4986724853515625, 0.55328369140625, 0.6078948974609375, 0.662506103515625, 0.7171173095703125, 0.771728515625, 0.8263397216796875, 0.880950927734375, 0.9355621337890625, 0.99017333984375, 1.0447845458984375, 1.099395751953125, 1.1540069580078125, 1.2086181640625, 1.2632293701171875, 1.317840576171875, 1.3724517822265625, 1.42706298828125, 1.4816741943359375, 1.536285400390625, 1.5908966064453125, 1.6455078125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 10.0, 11.0, 20.0, 31.0, 26.0, 42.0, 62.0, 97.0, 140.0, 307.0, 648.0, 1672.0, 5121.0, 25068.0, 770468.0, 218406.0, 19584.0, 4237.0, 1327.0, 546.0, 282.0, 157.0, 87.0, 59.0, 42.0, 31.0, 22.0, 14.0, 11.0, 9.0, 4.0, 5.0, 1.0, 5.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1658935546875, -0.16069793701171875, -0.1555023193359375, -0.15030670166015625, -0.145111083984375, -0.13991546630859375, -0.1347198486328125, -0.12952423095703125, -0.12432861328125, -0.11913299560546875, -0.1139373779296875, -0.10874176025390625, -0.103546142578125, -0.09835052490234375, -0.0931549072265625, -0.08795928955078125, -0.082763671875, -0.07756805419921875, -0.0723724365234375, -0.06717681884765625, -0.061981201171875, -0.05678558349609375, -0.0515899658203125, -0.04639434814453125, -0.04119873046875, -0.03600311279296875, -0.0308074951171875, -0.02561187744140625, -0.020416259765625, -0.01522064208984375, -0.0100250244140625, -0.00482940673828125, 0.0003662109375, 0.00556182861328125, 0.0107574462890625, 0.01595306396484375, 0.021148681640625, 0.02634429931640625, 0.0315399169921875, 0.03673553466796875, 0.04193115234375, 0.04712677001953125, 0.0523223876953125, 0.05751800537109375, 0.062713623046875, 0.06790924072265625, 0.0731048583984375, 0.07830047607421875, 0.08349609375, 0.08869171142578125, 0.0938873291015625, 0.09908294677734375, 0.104278564453125, 0.10947418212890625, 0.1146697998046875, 0.11986541748046875, 0.12506103515625, 0.13025665283203125, 0.1354522705078125, 0.14064788818359375, 0.145843505859375, 0.15103912353515625, 0.1562347412109375, 0.16143035888671875, 0.1666259765625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 2.0, 7.0, 8.0, 9.0, 12.0, 13.0, 22.0, 20.0, 27.0, 48.0, 56.0, 68.0, 106.0, 109.0, 129.0, 94.0, 71.0, 56.0, 32.0, 18.0, 18.0, 19.0, 16.0, 6.0, 7.0, 5.0, 2.0, 3.0, 4.0, 2.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.457069396972656e-05, -3.3342279493808746e-05, -3.211386501789093e-05, -3.0885450541973114e-05, -2.9657036066055298e-05, -2.842862159013748e-05, -2.7200207114219666e-05, -2.597179263830185e-05, -2.4743378162384033e-05, -2.3514963686466217e-05, -2.22865492105484e-05, -2.1058134734630585e-05, -1.982972025871277e-05, -1.8601305782794952e-05, -1.7372891306877136e-05, -1.614447683095932e-05, -1.4916062355041504e-05, -1.3687647879123688e-05, -1.2459233403205872e-05, -1.1230818927288055e-05, -1.000240445137024e-05, -8.773989975452423e-06, -7.545575499534607e-06, -6.317161023616791e-06, -5.088746547698975e-06, -3.8603320717811584e-06, -2.6319175958633423e-06, -1.4035031199455261e-06, -1.7508864402770996e-07, 1.0533258318901062e-06, 2.2817403078079224e-06, 3.5101547837257385e-06, 4.738569259643555e-06, 5.966983735561371e-06, 7.195398211479187e-06, 8.423812687397003e-06, 9.65222716331482e-06, 1.0880641639232635e-05, 1.2109056115150452e-05, 1.3337470591068268e-05, 1.4565885066986084e-05, 1.57942995429039e-05, 1.7022714018821716e-05, 1.8251128494739532e-05, 1.947954297065735e-05, 2.0707957446575165e-05, 2.193637192249298e-05, 2.3164786398410797e-05, 2.4393200874328613e-05, 2.562161535024643e-05, 2.6850029826164246e-05, 2.8078444302082062e-05, 2.9306858777999878e-05, 3.0535273253917694e-05, 3.176368772983551e-05, 3.2992102205753326e-05, 3.422051668167114e-05, 3.544893115758896e-05, 3.6677345633506775e-05, 3.790576010942459e-05, 3.913417458534241e-05, 4.0362589061260223e-05, 4.159100353717804e-05, 4.2819418013095856e-05, 4.404783248901367e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 8.0, 7.0, 17.0, 16.0, 22.0, 27.0, 36.0, 64.0, 76.0, 136.0, 181.0, 331.0, 620.0, 1101.0, 2022.0, 4221.0, 9338.0, 25297.0, 96643.0, 769873.0, 95549.0, 24983.0, 9341.0, 4001.0, 2013.0, 1063.0, 579.0, 342.0, 227.0, 142.0, 87.0, 60.0, 35.0, 23.0, 14.0, 17.0, 12.0, 6.0, 6.0, 4.0, 3.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.10125732421875, -0.09832191467285156, -0.09538650512695312, -0.09245109558105469, -0.08951568603515625, -0.08658027648925781, -0.08364486694335938, -0.08070945739746094, -0.0777740478515625, -0.07483863830566406, -0.07190322875976562, -0.06896781921386719, -0.06603240966796875, -0.06309700012207031, -0.060161590576171875, -0.05722618103027344, -0.054290771484375, -0.05135536193847656, -0.048419952392578125, -0.04548454284667969, -0.04254913330078125, -0.03961372375488281, -0.036678314208984375, -0.03374290466308594, -0.0308074951171875, -0.027872085571289062, -0.024936676025390625, -0.022001266479492188, -0.01906585693359375, -0.016130447387695312, -0.013195037841796875, -0.010259628295898438, -0.00732421875, -0.0043888092041015625, -0.001453399658203125, 0.0014820098876953125, 0.00441741943359375, 0.0073528289794921875, 0.010288238525390625, 0.013223648071289062, 0.0161590576171875, 0.019094467163085938, 0.022029876708984375, 0.024965286254882812, 0.02790069580078125, 0.030836105346679688, 0.033771514892578125, 0.03670692443847656, 0.039642333984375, 0.04257774353027344, 0.045513153076171875, 0.04844856262207031, 0.05138397216796875, 0.05431938171386719, 0.057254791259765625, 0.06019020080566406, 0.0631256103515625, 0.06606101989746094, 0.06899642944335938, 0.07193183898925781, 0.07486724853515625, 0.07780265808105469, 0.08073806762695312, 0.08367347717285156, 0.08660888671875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 3.0, 1.0, 5.0, 5.0, 13.0, 9.0, 4.0, 9.0, 7.0, 6.0, 12.0, 16.0, 19.0, 22.0, 33.0, 47.0, 53.0, 58.0, 84.0, 94.0, 86.0, 74.0, 61.0, 50.0, 41.0, 43.0, 19.0, 22.0, 19.0, 14.0, 14.0, 5.0, 3.0, 5.0, 7.0, 7.0, 4.0, 7.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.1153564453125, -0.11177921295166016, -0.10820198059082031, -0.10462474822998047, -0.10104751586914062, -0.09747028350830078, -0.09389305114746094, -0.0903158187866211, -0.08673858642578125, -0.0831613540649414, -0.07958412170410156, -0.07600688934326172, -0.07242965698242188, -0.06885242462158203, -0.06527519226074219, -0.061697959899902344, -0.0581207275390625, -0.054543495178222656, -0.05096626281738281, -0.04738903045654297, -0.043811798095703125, -0.04023456573486328, -0.03665733337402344, -0.033080101013183594, -0.02950286865234375, -0.025925636291503906, -0.022348403930664062, -0.01877117156982422, -0.015193939208984375, -0.011616706848144531, -0.008039474487304688, -0.004462242126464844, -0.000885009765625, 0.0026922225952148438, 0.0062694549560546875, 0.009846687316894531, 0.013423919677734375, 0.01700115203857422, 0.020578384399414062, 0.024155616760253906, 0.02773284912109375, 0.031310081481933594, 0.03488731384277344, 0.03846454620361328, 0.042041778564453125, 0.04561901092529297, 0.04919624328613281, 0.052773475646972656, 0.0563507080078125, 0.059927940368652344, 0.06350517272949219, 0.06708240509033203, 0.07065963745117188, 0.07423686981201172, 0.07781410217285156, 0.0813913345336914, 0.08496856689453125, 0.0885457992553711, 0.09212303161621094, 0.09570026397705078, 0.09927749633789062, 0.10285472869873047, 0.10643196105957031, 0.11000919342041016, 0.11358642578125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 12.0, 19.0, 31.0, 49.0, 68.0, 339.0, 221.0, 83.0, 49.0, 28.0, 14.0, 20.0, 14.0, 7.0, 13.0, 6.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.383368492126465, -4.236753463745117, -4.0901384353637695, -3.943523645401001, -3.7969086170196533, -3.6502938270568848, -3.503678798675537, -3.3570637702941895, -3.210448741912842, -3.063833713531494, -2.9172189235687256, -2.770603895187378, -2.6239888668060303, -2.4773740768432617, -2.330759048461914, -2.1841440200805664, -2.037529230117798, -1.8909143209457397, -1.744299292564392, -1.597684383392334, -1.4510693550109863, -1.3044544458389282, -1.1578395366668701, -1.0112245082855225, -0.8646095991134644, -0.7179946303367615, -0.5713796615600586, -0.4247647523880005, -0.2781497836112976, -0.13153481483459473, 0.015080094337463379, 0.16169512271881104, 0.30831003189086914, 0.454925000667572, 0.6015399694442749, 0.748154878616333, 0.8947698473930359, 1.0413848161697388, 1.1879997253417969, 1.3346147537231445, 1.4812296628952026, 1.6278445720672607, 1.7744596004486084, 1.9210745096206665, 2.0676894187927246, 2.2143044471740723, 2.36091947555542, 2.5075345039367676, 2.654149293899536, 2.800764322280884, 2.9473791122436523, 3.093994140625, 3.2406091690063477, 3.3872241973876953, 3.533838987350464, 3.6804540157318115, 3.82706880569458, 3.9736838340759277, 4.120298862457275, 4.266913414001465, 4.4135284423828125, 4.56014347076416, 4.706758499145508, 4.8533735275268555, 4.999988555908203]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 8.0, 9.0, 20.0, 14.0, 21.0, 33.0, 32.0, 41.0, 40.0, 93.0, 360.0, 109.0, 48.0, 34.0, 29.0, 37.0, 14.0, 16.0, 21.0, 6.0, 11.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.447388648986816, -7.237386226654053, -7.027383804321289, -6.817381858825684, -6.60737943649292, -6.397377014160156, -6.187374591827393, -5.977372169494629, -5.767370223999023, -5.55736780166626, -5.347365379333496, -5.137363433837891, -4.927361011505127, -4.717358589172363, -4.5073561668396, -4.297353744506836, -4.087351322174072, -3.8773488998413086, -3.667346715927124, -3.4573442935943604, -3.247342109680176, -3.037339687347412, -2.8273372650146484, -2.6173348426818848, -2.4073326587677, -2.1973302364349365, -1.987328052520752, -1.7773256301879883, -1.5673233270645142, -1.35732102394104, -1.1473186016082764, -0.9373162984848022, -0.7273139953613281, -0.517311692237854, -0.3073093295097351, -0.09730696678161621, 0.11269533634185791, 0.32269763946533203, 0.5327000617980957, 0.7427023649215698, 0.952704668045044, 1.162706971168518, 1.3727092742919922, 1.5827116966247559, 1.79271399974823, 2.002716302871704, 2.2127187252044678, 2.4227209091186523, 2.632723331451416, 2.8427257537841797, 3.0527279376983643, 3.262730360031128, 3.4727325439453125, 3.682734966278076, 3.89273738861084, 4.1027398109436035, 4.312742233276367, 4.522744655609131, 4.7327470779418945, 4.9427490234375, 5.152751445770264, 5.362753868103027, 5.572756290435791, 5.782758712768555, 5.99276065826416]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 2.0, 4.0, 6.0, 9.0, 13.0, 9.0, 14.0, 20.0, 26.0, 18.0, 27.0, 31.0, 23.0, 34.0, 96.0, 249.0, 110.0, 53.0, 31.0, 26.0, 27.0, 23.0, 22.0, 19.0, 15.0, 18.0, 14.0, 4.0, 4.0, 14.0, 3.0, 6.0, 3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.42236328125, -0.4097709655761719, -0.39717864990234375, -0.3845863342285156, -0.3719940185546875, -0.3594017028808594, -0.34680938720703125, -0.3342170715332031, -0.321624755859375, -0.3090324401855469, -0.29644012451171875, -0.2838478088378906, -0.2712554931640625, -0.2586631774902344, -0.24607086181640625, -0.23347854614257812, -0.22088623046875, -0.20829391479492188, -0.19570159912109375, -0.18310928344726562, -0.1705169677734375, -0.15792465209960938, -0.14533233642578125, -0.13274002075195312, -0.120147705078125, -0.10755538940429688, -0.09496307373046875, -0.08237075805664062, -0.0697784423828125, -0.057186126708984375, -0.04459381103515625, -0.032001495361328125, -0.0194091796875, -0.006816864013671875, 0.00577545166015625, 0.018367767333984375, 0.0309600830078125, 0.043552398681640625, 0.05614471435546875, 0.06873703002929688, 0.081329345703125, 0.09392166137695312, 0.10651397705078125, 0.11910629272460938, 0.1316986083984375, 0.14429092407226562, 0.15688323974609375, 0.16947555541992188, 0.18206787109375, 0.19466018676757812, 0.20725250244140625, 0.21984481811523438, 0.2324371337890625, 0.24502944946289062, 0.25762176513671875, 0.2702140808105469, 0.282806396484375, 0.2953987121582031, 0.30799102783203125, 0.3205833435058594, 0.3331756591796875, 0.3457679748535156, 0.35836029052734375, 0.3709526062011719, 0.383544921875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 5.0, 4.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 3.0, 12.0, 20.0, 20.0, 50.0, 60.0, 116.0, 261.0, 1567.0, 20514.0, 8359533.0, 5204.0, 713.0, 228.0, 66.0, 49.0, 38.0, 21.0, 14.0, 24.0, 11.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0], "bins": [-8.410557746887207, -8.165172576904297, -7.919787406921387, -7.674402236938477, -7.429017066955566, -7.183631896972656, -6.938246726989746, -6.692861557006836, -6.447476387023926, -6.202091217041016, -5.9567060470581055, -5.711320877075195, -5.465935707092285, -5.220550537109375, -4.975165367126465, -4.729780197143555, -4.484394550323486, -4.239009380340576, -3.993624210357666, -3.748239040374756, -3.5028538703918457, -3.2574687004089355, -3.0120832920074463, -2.766698122024536, -2.521312952041626, -2.275927782058716, -2.0305426120758057, -1.785157322883606, -1.5397721529006958, -1.2943869829177856, -1.049001693725586, -0.8036165237426758, -0.5582318305969238, -0.3128466308116913, -0.06746143102645874, 0.1779237985610962, 0.42330896854400635, 0.6686941385269165, 0.9140794277191162, 1.1594645977020264, 1.4048497676849365, 1.6502349376678467, 1.8956201076507568, 2.141005516052246, 2.3863906860351562, 2.6317758560180664, 2.8771610260009766, 3.1225461959838867, 3.367931365966797, 3.613316535949707, 3.858701705932617, 4.104086875915527, 4.3494720458984375, 4.594857215881348, 4.840242385864258, 5.085627555847168, 5.331012725830078, 5.576397895812988, 5.821783065795898, 6.067168235778809, 6.312553405761719, 6.557938575744629, 6.803323745727539, 7.048708915710449, 7.294094562530518]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 2.0, 2.0, 3.0, 5.0, 9.0, 5.0, 5.0, 5.0, 6.0, 5.0, 4.0, 0.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.435504913330078, -7.155727386474609, -6.875950336456299, -6.59617280960083, -6.3163957595825195, -6.036618232727051, -5.756840705871582, -5.477063179016113, -5.197286128997803, -4.917508602142334, -4.637731552124023, -4.357954025268555, -4.078176498413086, -3.7983994483947754, -3.5186219215393066, -3.238844633102417, -2.9590673446655273, -2.6792900562286377, -2.399512767791748, -2.1197352409362793, -1.8399579524993896, -1.5601806640625, -1.2804032564163208, -1.0006258487701416, -0.720848560333252, -0.44107121229171753, -0.1612938642501831, 0.11848348379135132, 0.39826083183288574, 0.6780381202697754, 0.9578155279159546, 1.2375929355621338, 1.517369270324707, 1.7971465587615967, 2.0769238471984863, 2.356701374053955, 2.6364786624908447, 2.9162559509277344, 3.196033477783203, 3.4758107662200928, 3.7555880546569824, 4.035365581512451, 4.315142631530762, 4.5949201583862305, 4.874697685241699, 5.15447473526001, 5.4342522621154785, 5.714029312133789, 5.993806838989258, 6.273584365844727, 6.553361415863037, 6.833138942718506, 7.112915992736816, 7.392693519592285, 7.672471046447754, 7.952248573303223, 8.232025146484375, 8.511802673339844, 8.791580200195312, 9.071356773376465, 9.351134300231934, 9.630911827087402, 9.910689353942871, 10.19046688079834, 10.470244407653809]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 6.0, 7.0, 15.0, 7.0, 26.0, 36.0, 48.0, 52.0, 83.0, 129.0, 209.0, 367.0, 672.0, 1360.0, 3066.0, 7299.0, 18477.0, 49297.0, 127573.0, 176938.0, 85647.0, 31665.0, 12020.0, 4861.0, 2078.0, 993.0, 561.0, 282.0, 174.0, 102.0, 75.0, 42.0, 31.0, 28.0, 13.0, 11.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.58203125, -3.48846435546875, -3.3948974609375, -3.30133056640625, -3.207763671875, -3.11419677734375, -3.0206298828125, -2.92706298828125, -2.83349609375, -2.73992919921875, -2.6463623046875, -2.55279541015625, -2.459228515625, -2.36566162109375, -2.2720947265625, -2.17852783203125, -2.0849609375, -1.99139404296875, -1.8978271484375, -1.80426025390625, -1.710693359375, -1.61712646484375, -1.5235595703125, -1.42999267578125, -1.33642578125, -1.24285888671875, -1.1492919921875, -1.05572509765625, -0.962158203125, -0.86859130859375, -0.7750244140625, -0.68145751953125, -0.587890625, -0.49432373046875, -0.4007568359375, -0.30718994140625, -0.213623046875, -0.12005615234375, -0.0264892578125, 0.06707763671875, 0.16064453125, 0.25421142578125, 0.3477783203125, 0.44134521484375, 0.534912109375, 0.62847900390625, 0.7220458984375, 0.81561279296875, 0.9091796875, 1.00274658203125, 1.0963134765625, 1.18988037109375, 1.283447265625, 1.37701416015625, 1.4705810546875, 1.56414794921875, 1.65771484375, 1.75128173828125, 1.8448486328125, 1.93841552734375, 2.031982421875, 2.12554931640625, 2.2191162109375, 2.31268310546875, 2.40625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 6.0, 9.0, 9.0, 11.0, 15.0, 13.0, 22.0, 37.0, 42.0, 45.0, 60.0, 67.0, 66.0, 89.0, 100.0, 66.0, 55.0, 71.0, 38.0, 43.0, 28.0, 31.0, 23.0, 10.0, 11.0, 9.0, 11.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.55810546875, -0.5401611328125, -0.522216796875, -0.5042724609375, -0.486328125, -0.4683837890625, -0.450439453125, -0.4324951171875, -0.41455078125, -0.3966064453125, -0.378662109375, -0.3607177734375, -0.3427734375, -0.3248291015625, -0.306884765625, -0.2889404296875, -0.27099609375, -0.2530517578125, -0.235107421875, -0.2171630859375, -0.19921875, -0.1812744140625, -0.163330078125, -0.1453857421875, -0.12744140625, -0.1094970703125, -0.091552734375, -0.0736083984375, -0.0556640625, -0.0377197265625, -0.019775390625, -0.0018310546875, 0.01611328125, 0.0340576171875, 0.052001953125, 0.0699462890625, 0.087890625, 0.1058349609375, 0.123779296875, 0.1417236328125, 0.15966796875, 0.1776123046875, 0.195556640625, 0.2135009765625, 0.2314453125, 0.2493896484375, 0.267333984375, 0.2852783203125, 0.30322265625, 0.3211669921875, 0.339111328125, 0.3570556640625, 0.375, 0.3929443359375, 0.410888671875, 0.4288330078125, 0.44677734375, 0.4647216796875, 0.482666015625, 0.5006103515625, 0.5185546875, 0.5364990234375, 0.554443359375, 0.5723876953125, 0.59033203125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 10.0, 16.0, 14.0, 40.0, 67.0, 74.0, 96.0, 74.0, 36.0, 16.0, 7.0, 7.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9679598808288574, -2.834298610687256, -2.7006375789642334, -2.566976547241211, -2.4333152770996094, -2.299654006958008, -2.1659929752349854, -2.032331943511963, -1.8986706733703613, -1.7650095224380493, -1.6313483715057373, -1.4976872205734253, -1.3640260696411133, -1.2303649187088013, -1.0967037677764893, -0.9630426168441772, -0.8293814659118652, -0.6957203149795532, -0.5620591640472412, -0.4283980131149292, -0.2947368621826172, -0.16107571125030518, -0.027414560317993164, 0.10624659061431885, 0.23990774154663086, 0.37356889247894287, 0.5072300434112549, 0.6408911943435669, 0.7745523452758789, 0.9082134962081909, 1.041874647140503, 1.175535798072815, 1.3091964721679688, 1.4428576231002808, 1.5765187740325928, 1.7101799249649048, 1.8438410758972168, 1.9775022268295288, 2.111163377761841, 2.2448244094848633, 2.378485679626465, 2.5121469497680664, 2.645807981491089, 2.7794690132141113, 2.913130283355713, 3.0467915534973145, 3.180452585220337, 3.3141136169433594, 3.447774887084961, 3.5814361572265625, 3.715097188949585, 3.8487582206726074, 3.982419490814209, 4.1160807609558105, 4.249741554260254, 4.3834028244018555, 4.517064094543457, 4.650725364685059, 4.78438663482666, 4.9180474281311035, 5.051708698272705, 5.185369968414307, 5.31903076171875, 5.452692031860352, 5.586353302001953]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 3.0, 5.0, 5.0, 12.0, 19.0, 21.0, 31.0, 43.0, 49.0, 72.0, 48.0, 35.0, 34.0, 21.0, 14.0, 8.0, 6.0, 10.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4449899196624756, -1.3852702379226685, -1.3255505561828613, -1.2658308744430542, -1.206111192703247, -1.1463913917541504, -1.0866717100143433, -1.0269520282745361, -0.967232346534729, -0.9075126647949219, -0.8477929830551147, -0.7880732417106628, -0.7283535599708557, -0.6686338782310486, -0.6089141368865967, -0.5491944551467896, -0.4894747734069824, -0.4297550916671753, -0.3700353801250458, -0.31031566858291626, -0.25059598684310913, -0.190876305103302, -0.13115659356117249, -0.07143688201904297, -0.01171720027923584, 0.04800249636173248, 0.1077221930027008, 0.16744188964366913, 0.22716158628463745, 0.2868812680244446, 0.3466009795665741, 0.4063206911087036, 0.46604037284851074, 0.5257600545883179, 0.585479736328125, 0.6451994776725769, 0.704919159412384, 0.7646388411521912, 0.8243585824966431, 0.8840782642364502, 0.9437979459762573, 1.0035176277160645, 1.0632373094558716, 1.1229569911956787, 1.1826767921447754, 1.242396354675293, 1.3021161556243896, 1.3618358373641968, 1.421555519104004, 1.481275200843811, 1.5409948825836182, 1.6007145643234253, 1.6604342460632324, 1.720154047012329, 1.7798737287521362, 1.8395934104919434, 1.8993130922317505, 1.9590327739715576, 2.0187525749206543, 2.078472137451172, 2.1381919384002686, 2.197911500930786, 2.257631301879883, 2.3173508644104004, 2.377070665359497]}, "eval/loss": 12.739469528198242, "eval/wer": 2.0272040002381093, "eval/runtime": 953.2256, "eval/samples_per_second": 2.772, "eval/steps_per_second": 0.347, "train/train_runtime": 120295.663, "train/train_samples_per_second": 4.745, "train/train_steps_per_second": 0.148, "train/total_flos": 0.0, "train/train_loss": 6.376821394805951} \ No newline at end of file